diff --git a/annotations_filtered/n-5bVE4K2Ls_filtered.json b/annotations_filtered/n-5bVE4K2Ls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd4fec3842619c5b87d2fca1b435d49c6383dad1 --- /dev/null +++ b/annotations_filtered/n-5bVE4K2Ls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.23], [9.0, 16.58], [19.0, 19.36], [25.0, 25.57], [26.0, 29.52], [30.0, 31.82], [32.0, 34.52], [35.0, 36.64], [40.0, 43.68], [44.0, 44.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 99.95, 0.0, 0.0, 99.97, 0.0, 87.74, 0.0, 99.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [3.23, 7.58, 0.36, 0.57, 3.52, 1.82, 2.52, 1.64, 3.68, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/n-mpifTiPV4_filtered.json b/annotations_filtered/n-mpifTiPV4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bcf1501fa603f8773fc3a4e8fb63f687d796424 --- /dev/null +++ b/annotations_filtered/n-mpifTiPV4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.96], [14.0, 16.41], [17.0, 18.1], [18.0, 19.52], [21.0, 25.05], [26.0, 26.59], [28.0, 28.07], [34.0, 34.79], [37.0, 37.27], [42.0, 44.0], [46.0, 46.14], [50.0, 52.25], [53.0, 53.57], [61.0, 61.3], [66.0, 66.04], [66.0, 66.5], [73.0, 74.83], [82.0, 82.34], [84.0, 84.08], [85.0, 87.61], [88.0, 88.53], [95.0, 95.3], [96.0, 96.42], [100.0, 100.18], [102.0, 102.3], [106.0, 106.54], [107.0, 107.35], [107.0, 107.76], [109.0, 108.95], [109.0, 111.42], [119.0, 121.76], [125.0, 125.47], [127.0, 127.3]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 35.26, 0.0, 0.0, 59.15, 0.0, 0.0, 0.0, 0.0, 76.86, 0.0, 31.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.94, 43.93, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 21.96], ["mains hum", 21.32], ["sidetone", 11.87]], null, null, null, null, null, null, null, null, null, [["speech", 21.04], ["chirp tone", 10.42], ["sneeze", 8.94]], null, null, null, null, null, null, null, [["speech", 30.16], ["animal", 21.5], ["dog", 6.3]], null, null, null, null, null, null, null, null, null, [["fly, housefly", 24.63], ["hum", 16.92], ["mains hum", 10.41]], [["speech", 47.12], ["hum", 8.4], ["throbbing", 3.93]], null, null], "duration": [0.96, 2.41, 1.1, 1.52, 4.05, 0.59, 0.07, 0.79, 0.27, 2.0, 0.14, 2.25, 0.57, 0.3, 0.04, 0.5, 1.83, 0.34, 0.08, 2.61, 0.53, 0.3, 0.42, 0.18, 0.3, 0.54, 0.35, 0.76, -0.05, 2.42, 2.76, 0.47, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/n-omBTsCIDE_filtered.json b/annotations_filtered/n-omBTsCIDE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3b4bdfd7e1c6a38ac1204eaa15e3e85a0e9b2b9 --- /dev/null +++ b/annotations_filtered/n-omBTsCIDE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.83], [10.0, 10.61], [11.0, 11.47], [15.0, 15.16], [19.0, 23.18], [25.0, 25.08], [27.0, 27.13], [28.0, 29.91], [31.0, 31.11], [32.0, 37.4], [39.0, 39.06], [45.0, 45.12], [56.0, 59.68], [63.0, 63.19], [64.0, 64.91], [67.0, 67.07], [78.0, 78.93], [96.0, 96.69], [109.0, 109.98], [117.0, 119.33], [122.0, 122.98], [123.0, 123.97], [125.0, 125.41], [127.0, 128.68]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.61, 0.0, 0.0, 0.0, 44.43, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.17, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 13.01], ["hum", 11.37], ["bouncing", 7.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.83, 0.61, 0.47, 0.16, 4.18, 0.08, 0.13, 1.91, 0.11, 5.4, 0.06, 0.12, 3.68, 0.19, 0.91, 0.07, 0.93, 0.69, 0.98, 2.33, 0.98, 0.97, 0.41, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/n0Fz-ACCMHk_filtered.json b/annotations_filtered/n0Fz-ACCMHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc64f437329329a791b0e99d67e52b377b6756b2 --- /dev/null +++ b/annotations_filtered/n0Fz-ACCMHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.01], [24.0, 24.33], [26.0, 28.31], [29.0, 29.49], [33.0, 33.32], [36.0, 36.19], [39.0, 39.66], [40.0, 41.34], [42.0, 42.28], [46.0, 47.44], [48.0, 49.87], [51.0, 60.72], [61.0, 62.61], [64.0, 66.77], [68.0, 69.52], [70.0, 71.51], [72.0, 74.6], [75.0, 76.25], [78.0, 78.7], [79.0, 79.88], [83.0, 84.23], [85.0, 85.53], [89.0, 91.98], [96.0, 99.12], [101.0, 101.85], [102.0, 107.15], [107.0, 109.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.8, 35.8, 0.0, 59.42, 69.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["clang", 15.67], ["boing", 13.66], ["arrow", 13.61]], null, null, null], "duration": [0.01, 0.33, 2.31, 0.49, 0.32, 0.19, 0.66, 1.34, 0.28, 1.44, 1.87, 9.72, 1.61, 2.77, 1.52, 1.51, 2.6, 1.25, 0.7, 0.88, 1.23, 0.53, 2.98, 3.12, 0.85, 5.15, 2.27]} \ No newline at end of file diff --git a/annotations_filtered/n0QO2xOuqp0_filtered.json b/annotations_filtered/n0QO2xOuqp0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..deac3708f656a93b7c11ef5c6ad1388771e9ba0f --- /dev/null +++ b/annotations_filtered/n0QO2xOuqp0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.09], [13.0, 23.8], [26.0, 25.84], [28.0, 28.54], [34.0, 34.97], [40.0, 42.36], [44.0, 49.52], [54.0, 57.87], [63.0, 79.02], [83.0, 93.51], [97.0, 98.81], [105.0, 105.21], [110.0, 115.16], [126.0, 132.81], [145.0, 147.56], [154.0, 157.3], [158.0, 158.16], [159.0, 160.88], [162.0, 167.81]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [30.79, 29.02, 0.0, 0.0, 0.0, 28.97, 28.98, 29.49, 28.84, 29.21, 0.0, 0.0, 28.9, 28.81, 29.18, 29.53, 0.0, 0.0, 28.78], "audiomae_on_audioset": [[["music", 60.94], ["throbbing", 9.68], ["sidetone", 2.85]], [["smash, crash", 44.44], ["whack, thwack", 22.46], ["music", 22.03]], null, null, null, [["music", 23.22], ["speech", 16.01], ["cattle, bovinae", 8.83]], [["speech", 39.6], ["vehicle", 12.86], ["music", 9.58]], [["music", 56.91], ["speech", 30.17], ["sidetone", 2.35]], [["music", 78.33], ["speech", 3.14], ["whip", 1.98]], [["music", 52.14], ["cacophony", 8.1], ["throbbing", 7.43]], null, null, [["music", 64.81], ["speech", 14.85], ["boing", 5.07]], [["music", 71.59], ["speech", 5.9], ["musical instrument", 1.61]], [["music", 36.66], ["speech", 27.72], ["electronic music", 7.16]], [["music", 46.65], ["throbbing", 28.08], ["hum", 7.3]], null, null, [["throbbing", 56.65], ["music", 15.17], ["hum", 14.51]]], "duration": [2.09, 10.8, -0.16, 0.54, 0.97, 2.36, 5.52, 3.87, 16.02, 10.51, 1.81, 0.21, 5.16, 6.81, 2.56, 3.3, 0.16, 1.88, 5.81]} \ No newline at end of file diff --git a/annotations_filtered/n13FhFrtu_8_filtered.json b/annotations_filtered/n13FhFrtu_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35e56fc8d2f61775dc0da1495771325d8e68a805 --- /dev/null +++ b/annotations_filtered/n13FhFrtu_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.51], [14.0, 15.08], [15.0, 17.02], [19.0, 24.36], [26.0, 27.45], [30.0, 31.16], [33.0, 35.36], [39.0, 40.14], [43.0, 45.52], [50.0, 59.8], [63.0, 64.23], [66.0, 66.56], [68.0, 68.28], [70.0, 70.36], [72.0, 73.7], [79.0, 79.71], [80.0, 80.87], [82.0, 83.17], [85.0, 92.08], [96.0, 100.03], [101.0, 102.22], [107.0, 107.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.56, 47.78, 0.0, 0.0, 98.36, 0.0, 100.0, 64.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.31, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 56.64], ["sidetone", 12.66], ["telephone", 7.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 1.08, 2.02, 5.36, 1.45, 1.16, 2.36, 1.14, 2.52, 9.8, 1.23, 0.56, 0.28, 0.36, 1.7, 0.71, 0.87, 1.17, 7.08, 4.03, 1.22, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/n16wkJDq2VQ_filtered.json b/annotations_filtered/n16wkJDq2VQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8733f6024606dbd857f9afa2d4d47b73d0cf8a87 --- /dev/null +++ b/annotations_filtered/n16wkJDq2VQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.9], [11.0, 11.06], [23.0, 23.11], [24.0, 25.84], [26.0, 27.97], [31.0, 31.43], [36.0, 37.66], [38.0, 44.25], [45.0, 47.76], [48.0, 50.08], [51.0, 51.34], [53.0, 53.37], [54.0, 55.29], [58.0, 58.58], [63.0, 64.1], [68.0, 68.77], [70.0, 71.59], [76.0, 76.42], [77.0, 78.27], [81.0, 86.83], [91.0, 94.07], [97.0, 97.71], [99.0, 100.36], [101.0, 105.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 99.52, 76.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 37.93, 0.0, 0.0, 98.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 65.27], ["noise", 2.9], ["beatboxing", 2.48]], null, null, null], "duration": [-0.1, 0.06, 0.11, 1.84, 1.97, 0.43, 1.66, 6.25, 2.76, 2.08, 0.34, 0.37, 1.29, 0.58, 1.1, 0.77, 1.59, 0.42, 1.27, 5.83, 3.07, 0.71, 1.36, 4.54]} \ No newline at end of file diff --git a/annotations_filtered/n16wxs5pgvk_filtered.json b/annotations_filtered/n16wxs5pgvk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bd3a847dda53ed54b8a692b5d447e1a5da2ec2d --- /dev/null +++ b/annotations_filtered/n16wxs5pgvk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 18.67], [42.0, 42.58], [43.0, 45.64], [69.0, 69.43], [77.0, 80.89], [94.0, 95.07], [97.0, 101.11], [118.0, 118.96]], "keep_status": [false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 45.75, 0.0, 31.95, 0.0, 31.16, 0.0], "audiomae_on_audioset": [null, null, [["fart", 32.51], ["speech", 12.62], ["noise", 7.27]], null, [["speech", 77.2], ["fart", 4.37], ["noise", 4.13]], null, [["music", 54.81], ["trombone", 8.35], ["brass instrument", 5.45]], null], "duration": [-0.33, 0.58, 2.64, 0.43, 3.89, 1.07, 4.11, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/n1BXpNTsoB8_filtered.json b/annotations_filtered/n1BXpNTsoB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc4a85115c02570f1a553ccaeee3026a147c72ce --- /dev/null +++ b/annotations_filtered/n1BXpNTsoB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 30.16], [31.0, 32.63], [40.0, 40.51], [41.0, 42.16], [47.0, 47.19], [48.0, 50.14], [51.0, 52.88], [55.0, 57.96], [59.0, 60.32], [63.0, 65.26], [68.0, 69.03], [71.0, 71.29], [74.0, 77.94], [79.0, 79.57], [80.0, 81.82], [83.0, 83.12], [86.0, 86.26], [87.0, 86.95], [87.0, 87.89], [89.0, 89.85], [90.0, 91.79], [93.0, 94.36], [95.0, 95.98], [97.0, 98.63], [99.0, 100.87], [105.0, 106.15], [109.0, 110.05], [110.0, 111.35], [113.0, 113.53], [118.0, 118.69], [121.0, 124.07], [125.0, 125.9], [127.0, 128.75]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.54, 0.0, 60.32, 0.0, 45.78, 0.0, 0.0, 43.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.66, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 63.7], ["sine wave", 7.09], ["music", 4.74]], null, null, null, [["speech", 36.9], ["sidetone", 19.63], ["busy signal", 6.28]], null, null, [["speech", 71.66], ["dial tone", 8.55], ["busy signal", 2.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 1.63, 0.51, 1.16, 0.19, 2.14, 1.88, 2.96, 1.32, 2.26, 1.03, 0.29, 3.94, 0.57, 1.82, 0.12, 0.26, -0.05, 0.89, 0.85, 1.79, 1.36, 0.98, 1.63, 1.87, 1.15, 1.05, 1.35, 0.53, 0.69, 3.07, 0.9, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/n1GlWng3oOQ_filtered.json b/annotations_filtered/n1GlWng3oOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfe1485723b949724312e1117befd2976f27db3a --- /dev/null +++ b/annotations_filtered/n1GlWng3oOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 58.31], [59.0, 59.9], [60.0, 62.29], [63.0, 64.64], [66.0, 68.98], [70.0, 78.22], [79.0, 82.46], [84.0, 87.86], [89.0, 90.14], [91.0, 93.82], [95.0, 96.11], [97.0, 99.32], [100.0, 102.07], [103.0, 115.96], [116.0, 119.65], [120.0, 127.95], [131.0, 131.84], [133.0, 133.93], [135.0, 136.41], [138.0, 139.09], [140.0, 148.0], [149.0, 155.56], [156.0, 159.0], [160.0, 164.69], [165.0, 168.84], [170.0, 174.85], [176.0, 177.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [51.23, 0.0, 62.78, 0.0, 64.29, 58.38, 74.29, 85.9, 0.0, 98.36, 0.0, 92.97, 97.33, 58.47, 77.36, 62.99, 0.0, 0.0, 0.0, 0.0, 56.86, 56.86, 69.47, 73.67, 57.89, 53.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.31, 0.9, 2.29, 1.64, 2.98, 8.22, 3.46, 3.86, 1.14, 2.82, 1.11, 2.32, 2.07, 12.96, 3.65, 7.95, 0.84, 0.93, 1.41, 1.09, 8.0, 6.56, 3.0, 4.69, 3.84, 4.85, 1.96]} \ No newline at end of file diff --git a/annotations_filtered/n1TqCGEBdLw_filtered.json b/annotations_filtered/n1TqCGEBdLw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1b22bc5590bfeadba7e7dfaa38e2b3482bd3029 --- /dev/null +++ b/annotations_filtered/n1TqCGEBdLw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 54.99], [56.0, 70.29]], "keep_status": [false, false], "silence_prob": [0.0, 60.05], "audiomae_on_audioset": [null, null], "duration": [40.99, 14.29]} \ No newline at end of file diff --git a/annotations_filtered/n1VEmXiaFY4_filtered.json b/annotations_filtered/n1VEmXiaFY4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9eb77a736ce5b9c542afebc998cdf9f525b60f3 --- /dev/null +++ b/annotations_filtered/n1VEmXiaFY4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[86.0, 107.08], [108.0, 110.08], [117.0, 120.04], [122.0, 127.04], [129.0, 135.14], [137.0, 143.31], [143.0, 147.72], [148.0, 149.45], [153.0, 155.78], [162.0, 162.5]], "keep_status": [false, true, false, false, false, true, false, false, false, false], "silence_prob": [31.51, 46.68, 64.63, 53.84, 61.37, 48.95, 40.92, 0.0, 99.44, 0.0], "audiomae_on_audioset": [[["music", 61.4], ["hum", 10.88], ["throbbing", 7.79]], [["speech", 26.03], ["music", 20.1], ["hum", 14.09]], null, null, null, [["music", 29.49], ["gong", 13.49], ["singing bowl", 9.7]], [["speech", 67.48], ["music", 19.33], ["sidetone", 2.92]], null, null, null], "duration": [21.08, 2.08, 3.04, 5.04, 6.14, 6.31, 4.72, 1.45, 2.78, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/n1X2w0tinkg_filtered.json b/annotations_filtered/n1X2w0tinkg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d890f985dbecc971cfbacc87d27cad925145ce1 --- /dev/null +++ b/annotations_filtered/n1X2w0tinkg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.02], [14.0, 16.93], [22.0, 26.4], [29.0, 87.59], [90.0, 105.68], [106.0, 125.29]], "keep_status": [true, true, false, false, false, false], "silence_prob": [39.85, 43.58, 54.3, 0.0, 32.94, 37.35], "audiomae_on_audioset": [[["music", 57.55], ["didgeridoo", 8.15], ["synthesizer", 3.68]], [["music", 56.13], ["theremin", 8.61], ["musical instrument", 3.59]], null, null, [["music", 60.09], ["theremin", 14.39], ["ambient music", 6.25]], [["music", 70.8], ["foghorn", 7.37], ["didgeridoo", 4.55]]], "duration": [3.02, 2.93, 4.4, 58.59, 15.68, 19.29]} \ No newline at end of file diff --git a/annotations_filtered/n1lQR-GjWYw_filtered.json b/annotations_filtered/n1lQR-GjWYw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a28663e728ee9ab1f6700f74511333e0a5703bc --- /dev/null +++ b/annotations_filtered/n1lQR-GjWYw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 64.84], [66.0, 67.85], [69.0, 81.4], [85.0, 101.36], [105.0, 111.99], [113.0, 119.79], [121.0, 125.17]], "keep_status": [false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 30.02, 30.19, 29.35, 30.89, 29.99], "audiomae_on_audioset": [null, null, [["music", 43.79], ["groan", 7.15], ["whack, thwack", 6.87]], [["music", 33.3], ["speech", 22.24], ["fart", 10.8]], [["music", 74.79], ["theremin", 3.69], ["whack, thwack", 2.87]], [["music", 51.94], ["smash, crash", 26.8], ["whack, thwack", 8.78]], [["moo", 23.6], ["livestock, farm animals, working animals", 22.8], ["cattle, bovinae", 19.08]]], "duration": [33.84, 1.85, 12.4, 16.36, 6.99, 6.79, 4.17]} \ No newline at end of file diff --git a/annotations_filtered/n1lbpj6868o_filtered.json b/annotations_filtered/n1lbpj6868o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..997513d033fc9086091f767187af34d068e5c006 --- /dev/null +++ b/annotations_filtered/n1lbpj6868o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 39.41], [62.0, 62.51], [86.0, 87.47], [88.0, 88.72], [90.0, 90.86], [98.0, 100.75], [108.0, 109.81], [114.0, 115.52], [117.0, 118.89], [119.0, 119.74], [120.0, 121.44], [123.0, 126.28]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [66.27, 0.0, 0.0, 0.0, 0.0, 40.12, 0.0, 0.0, 0.0, 0.0, 0.0, 34.08], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 38.93], ["music", 19.81], ["sidetone", 10.94]], null, null, null, null, null, [["music", 36.53], ["speech", 32.84], ["whack, thwack", 2.31]]], "duration": [5.41, 0.51, 1.47, 0.72, 0.86, 2.75, 1.81, 1.52, 1.89, 0.74, 1.44, 3.28]} \ No newline at end of file diff --git a/annotations_filtered/n1pSObsJ_hk_filtered.json b/annotations_filtered/n1pSObsJ_hk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80968cd953203f4a58731698c92111b2e23bdf1a --- /dev/null +++ b/annotations_filtered/n1pSObsJ_hk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.71], [18.0, 18.35], [24.0, 28.58], [29.0, 29.98], [31.0, 32.51], [35.0, 35.6], [36.0, 36.61], [37.0, 58.73], [63.0, 65.97], [67.0, 68.05], [76.0, 78.98], [82.0, 99.42], [113.0, 114.99], [115.0, 115.03], [119.0, 120.31], [120.0, 120.43], [120.0, 120.48], [121.0, 121.95], [126.0, 131.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 41.34, 74.6, 0.0, 36.57, 50.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 66.15], ["radio", 3.24], ["explosion", 2.35]], null, null, [["speech", 60.15], ["fireworks", 4.27], ["noise", 2.92]], null, null, null, null, null, null, null, null], "duration": [2.71, 0.35, 4.58, 0.98, 1.51, 0.6, 0.61, 21.73, 2.97, 1.05, 2.98, 17.42, 1.99, 0.03, 1.31, 0.43, 0.48, 0.95, 5.77]} \ No newline at end of file diff --git a/annotations_filtered/n2A194yTWoQ_filtered.json b/annotations_filtered/n2A194yTWoQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ffea8365bae536901b6f1a7cae8128e481c2a61 --- /dev/null +++ b/annotations_filtered/n2A194yTWoQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.02], [7.0, 7.42], [10.0, 11.5], [12.0, 12.97], [15.0, 15.65], [28.0, 27.94], [29.0, 29.66], [37.0, 37.57], [43.0, 43.26], [48.0, 48.25], [51.0, 52.15], [55.0, 56.61], [60.0, 60.56], [62.0, 62.68], [67.0, 68.74], [72.0, 73.03], [77.0, 79.84], [81.0, 81.18], [84.0, 84.13], [87.0, 87.39], [91.0, 98.78], [99.0, 100.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.31, 0.0, 0.0, 0.0, 44.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 91.7], ["speech", 1.99], ["mains hum", 1.15]], null, null, null, [["hum", 26.15], ["sidetone", 15.45], ["mains hum", 14.17]], null], "duration": [1.02, 0.42, 1.5, 0.97, 0.65, -0.06, 0.66, 0.57, 0.26, 0.25, 1.15, 1.61, 0.56, 0.68, 1.74, 1.03, 2.84, 0.18, 0.13, 0.39, 7.78, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/n2YCseaZK0Q_filtered.json b/annotations_filtered/n2YCseaZK0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ae51eef1dfb54ae9d483bc0a3b1c3d9d971f3d6 --- /dev/null +++ b/annotations_filtered/n2YCseaZK0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.12], [7.0, 8.04], [15.0, 16.02], [19.0, 20.48], [24.0, 27.72], [29.0, 34.13], [35.0, 36.37], [38.0, 38.67], [40.0, 41.84], [43.0, 52.78], [57.0, 61.59], [63.0, 64.13], [70.0, 72.27], [75.0, 75.69], [76.0, 92.6], [94.0, 97.02], [103.0, 109.02], [109.0, 121.85], [122.0, 124.92], [126.0, 127.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 58.98, 51.99, 0.0, 0.0, 0.0, 53.91, 57.97, 0.0, 53.65, 0.0, 48.74, 49.18, 48.87, 40.16, 44.63, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 24.62], ["hum", 20.8], ["throbbing", 13.72]], [["throbbing", 36.44], ["hum", 21.45], ["music", 17.25]], [["throbbing", 45.32], ["hum", 25.45], ["mains hum", 5.77]], [["hum", 45.11], ["throbbing", 17.55], ["mains hum", 14.93]], [["throbbing", 28.32], ["hum", 28.0], ["music", 22.52]], null], "duration": [1.12, 1.04, 1.02, 1.48, 3.72, 5.13, 1.37, 0.67, 1.84, 9.78, 4.59, 1.13, 2.27, 0.69, 16.6, 3.02, 6.02, 12.85, 2.92, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/n2ZkOcq4vWU_filtered.json b/annotations_filtered/n2ZkOcq4vWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34eb190cb09122530831fd634287ba498c78342a --- /dev/null +++ b/annotations_filtered/n2ZkOcq4vWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.55], [5.0, 5.48], [7.0, 8.02], [8.0, 9.44], [10.0, 12.66], [13.0, 14.15], [16.0, 18.05], [19.0, 20.75], [23.0, 24.54], [26.0, 26.6]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.31, 0.0, 46.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 40.18], ["hum", 33.12], ["speech", 7.17]], null, [["speech", 22.18], ["hum", 12.21], ["mains hum", 11.44]], null, null, null], "duration": [0.55, 0.48, 1.02, 1.44, 2.66, 1.15, 2.05, 1.75, 1.54, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/n2lTpPptOWA_filtered.json b/annotations_filtered/n2lTpPptOWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5445474ddaee1e3a7a19c4fb94e7e9715e037f28 --- /dev/null +++ b/annotations_filtered/n2lTpPptOWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 18.99], [19.0, 19.23], [19.0, 28.8], [55.0, 55.36], [60.0, 62.21], [64.0, 69.74], [72.0, 77.16], [91.0, 92.3], [108.0, 107.96]], "keep_status": [false, false, true, false, false, true, false, false, false], "silence_prob": [44.52, 0.0, 37.57, 0.0, 99.93, 31.81, 32.05, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 39.75], ["snicker", 15.74], ["laughter", 14.79]], null, [["speech", 44.9], ["honk", 7.7], ["goose", 6.52]], null, null, [["screaming", 37.69], ["moo", 15.92], ["cattle, bovinae", 15.6]], [["speech", 66.57], ["fart", 20.57], ["noise", 3.33]], null, null], "duration": [8.99, 0.23, 9.8, 0.36, 2.21, 5.74, 5.16, 1.3, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/n3BgbwW6PXc_filtered.json b/annotations_filtered/n3BgbwW6PXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d14e6189ca36b7907bb9798b66ecf491f8e37b8f --- /dev/null +++ b/annotations_filtered/n3BgbwW6PXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.34], [10.0, 11.92], [14.0, 14.4], [15.0, 16.85], [17.0, 20.75], [26.0, 26.84], [28.0, 34.13], [46.0, 46.38], [47.0, 47.93], [49.0, 50.18], [52.0, 51.7], [53.0, 57.21], [61.0, 61.67], [62.0, 63.69], [65.0, 66.43], [69.0, 69.03], [81.0, 81.72]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.4, 0.0, 0.0, 0.0, 59.86, 0.0, 62.27, 0.0, 0.0, 0.0, 0.0, 63.53, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 34.47], ["speech", 23.2], ["sidetone", 8.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.34, 1.92, 0.4, 1.85, 3.75, 0.84, 6.13, 0.38, 0.93, 1.18, -0.3, 4.21, 0.67, 1.69, 1.43, 0.03, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/n3K6Fkd5ri8_filtered.json b/annotations_filtered/n3K6Fkd5ri8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd3da08f46acdc0df0c4f291797a25588b8b1373 --- /dev/null +++ b/annotations_filtered/n3K6Fkd5ri8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.9], [18.0, 18.23], [19.0, 19.36], [20.0, 20.19], [23.0, 23.72], [26.0, 26.25], [30.0, 30.0], [32.0, 32.58], [33.0, 33.64], [35.0, 35.02], [37.0, 37.03], [39.0, 40.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.1, 0.23, 0.36, 0.19, 0.72, 0.25, 0.0, 0.58, 0.64, 0.02, 0.03, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/n3L8UVTe6Ak_filtered.json b/annotations_filtered/n3L8UVTe6Ak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5621d200c92049a4dba6afcbffb2db8551ace9b --- /dev/null +++ b/annotations_filtered/n3L8UVTe6Ak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.29], [7.0, 8.5], [12.0, 13.09], [17.0, 17.86], [22.0, 22.98], [26.0, 26.16], [34.0, 36.02], [39.0, 39.88], [40.0, 40.41], [43.0, 45.22], [47.0, 49.65], [51.0, 52.41], [54.0, 54.95], [57.0, 59.17], [69.0, 69.25], [71.0, 71.47], [73.0, 73.99], [77.0, 77.62], [79.0, 80.22], [82.0, 83.07], [85.0, 88.74], [91.0, 147.46], [148.0, 149.37], [153.0, 154.31], [166.0, 167.04], [170.0, 170.65], [175.0, 179.25], [181.0, 196.23], [197.0, 198.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.86, 0.0, 0.0, 64.75, 86.09, 0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.39, 0.0, 0.0, 0.0, 0.0, 0.0, 49.87, 31.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.15], ["music", 14.2], ["croak", 7.45]], null, null, null, null, null, [["music", 31.26], ["hum", 10.83], ["speech", 7.24]], [["music", 46.67], ["speech", 16.5], ["hum", 8.78]], null], "duration": [0.29, 1.5, 1.09, 0.86, 0.98, 0.16, 2.02, 0.88, 0.41, 2.22, 2.65, 1.41, 0.95, 2.17, 0.25, 0.47, 0.99, 0.62, 1.22, 1.07, 3.74, 56.46, 1.37, 1.31, 1.04, 0.65, 4.25, 15.23, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/n3PGfjyctSQ_filtered.json b/annotations_filtered/n3PGfjyctSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..534af96ff99c50d3f0ec279709b4a1d55cb4444e --- /dev/null +++ b/annotations_filtered/n3PGfjyctSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.01], [9.0, 9.63], [12.0, 13.05], [14.0, 15.7], [17.0, 17.34], [20.0, 22.49], [30.0, 31.24], [38.0, 39.36], [39.0, 39.46], [44.0, 44.69], [46.0, 46.65], [48.0, 48.59], [50.0, 50.85], [53.0, 53.22], [57.0, 57.35], [60.0, 60.78], [75.0, 75.9], [77.0, 79.49], [82.0, 83.73], [85.0, 88.48], [90.0, 90.69], [93.0, 94.19], [95.0, 98.56], [102.0, 104.04], [106.0, 106.79], [108.0, 107.94], [112.0, 114.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.26, 0.0, 81.71, 0.0, 0.0, 31.15, 30.82, 0.0, 0.0, 34.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 31.26], ["music", 25.38], ["chirp tone", 9.17]], null, null, null, null, [["music", 44.97], ["speech", 15.59], ["trombone", 8.78]], [["music", 19.32], ["boat, water vehicle", 9.54], ["vehicle", 6.13]], null, null, [["beatboxing", 37.81], ["boing", 26.27], ["fart", 15.53]]], "duration": [0.01, 0.63, 1.05, 1.7, 0.34, 2.49, 1.24, 1.36, 0.46, 0.69, 0.65, 0.59, 0.85, 0.22, 0.35, 0.78, 0.9, 2.49, 1.73, 3.48, 0.69, 1.19, 3.56, 2.04, 0.79, -0.06, 2.86]} \ No newline at end of file diff --git a/annotations_filtered/n3SrAOdy-tE_filtered.json b/annotations_filtered/n3SrAOdy-tE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4dbc2b579881443b97d7eb4dadbd3fd705f029d --- /dev/null +++ b/annotations_filtered/n3SrAOdy-tE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.72], [8.0, 9.66], [10.0, 12.01], [13.0, 15.04], [19.0, 19.2], [22.0, 23.33], [26.0, 27.43], [28.0, 29.47], [30.0, 33.13], [34.0, 37.72], [39.0, 40.32], [41.0, 48.2]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 43.98, 88.1, 0.0, 0.0, 0.0, 0.0, 51.88, 51.88, 0.0, 48.39], "audiomae_on_audioset": [null, null, [["speech", 48.87], ["sidetone", 8.73], ["chirp tone", 6.58]], null, null, null, null, null, null, null, null, [["speech", 23.47], ["cough", 15.93], ["music", 12.16]]], "duration": [1.72, 1.66, 2.01, 2.04, 0.2, 1.33, 1.43, 1.47, 3.13, 3.72, 1.32, 7.2]} \ No newline at end of file diff --git a/annotations_filtered/n3Y6B_UKam0_filtered.json b/annotations_filtered/n3Y6B_UKam0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57bde0d21e7466c7a6aec95c59cfa353b060d38d --- /dev/null +++ b/annotations_filtered/n3Y6B_UKam0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.21], [16.0, 16.56], [21.0, 22.42], [25.0, 26.91], [28.0, 29.02], [36.0, 44.31], [49.0, 49.01], [50.0, 50.67], [55.0, 60.32], [63.0, 63.31], [64.0, 64.47], [73.0, 73.13], [75.0, 75.81], [79.0, 83.69], [84.0, 86.81], [88.0, 87.67], [89.0, 89.28], [95.0, 99.18], [99.0, 100.14], [104.0, 104.3], [106.0, 106.57], [109.0, 108.85], [112.0, 127.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 0.0, 61.87, 58.72, 0.0, 0.0, 68.8, 0.0, 0.0, 0.0, 0.0, 31.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.17], ["music", 6.99], ["buzz", 5.0]]], "duration": [1.21, 0.56, 1.42, 1.91, 1.02, 8.31, 0.01, 0.67, 5.32, 0.31, 0.47, 0.13, 0.81, 4.69, 2.81, -0.33, 0.28, 4.18, 1.14, 0.3, 0.57, -0.15, 15.03]} \ No newline at end of file diff --git a/annotations_filtered/n3tXVrGw3kY_filtered.json b/annotations_filtered/n3tXVrGw3kY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..480d74950ed52d84939c7357cc92b80a7e870508 --- /dev/null +++ b/annotations_filtered/n3tXVrGw3kY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.59], [9.0, 9.95], [12.0, 12.56], [21.0, 21.73], [25.0, 25.56], [30.0, 33.2], [39.0, 40.19], [50.0, 51.95], [54.0, 55.56], [62.0, 63.0], [83.0, 84.89], [87.0, 88.11], [91.0, 92.53], [97.0, 96.92], [101.0, 101.78], [118.0, 118.79], [127.0, 128.61]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.41, 0.0, 0.0, 0.0, 0.0, 33.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 36.88], ["fart", 13.92], ["whip", 12.62]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.59, 0.95, 0.56, 0.73, 0.56, 3.2, 1.19, 1.95, 1.56, 1.0, 1.89, 1.11, 1.53, -0.08, 0.78, 0.79, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/n44APWaJZ58_filtered.json b/annotations_filtered/n44APWaJZ58_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..932b7f7fcf6f11486d822d4d187660bd70bc6516 --- /dev/null +++ b/annotations_filtered/n44APWaJZ58_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.61], [8.0, 7.87], [13.0, 14.66], [20.0, 21.15], [27.0, 28.17], [30.0, 30.4], [34.0, 36.51], [38.0, 38.03], [41.0, 41.17], [47.0, 48.63], [49.0, 49.65], [50.0, 53.06], [58.0, 92.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, -0.13, 1.66, 1.15, 1.17, 0.4, 2.51, 0.03, 0.17, 1.63, 0.65, 3.06, 34.75]} \ No newline at end of file diff --git a/annotations_filtered/n4BJBz8GpzI_filtered.json b/annotations_filtered/n4BJBz8GpzI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3eea9cd28224b1ff86cf65a76894a729cb449078 --- /dev/null +++ b/annotations_filtered/n4BJBz8GpzI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 80.96], [81.0, 115.7], [116.0, 117.07], [117.0, 123.92]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.9], "audiomae_on_audioset": [null, null, null, [["music", 46.79], ["speech", 24.71], ["hum", 6.25]]], "duration": [62.96, 34.7, 1.07, 6.92]} \ No newline at end of file diff --git a/annotations_filtered/n4Mohc3SrHs_filtered.json b/annotations_filtered/n4Mohc3SrHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f04c05ae63ba24615181dd1a448e0958c429a75 --- /dev/null +++ b/annotations_filtered/n4Mohc3SrHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.55], [16.0, 15.84], [16.0, 16.66], [20.0, 20.63], [22.0, 21.74], [25.0, 26.4], [27.0, 28.46], [42.0, 42.63], [44.0, 44.69]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.55, -0.16, 0.66, 0.63, -0.26, 1.4, 1.46, 0.63, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/n4bsNkDyF2s_filtered.json b/annotations_filtered/n4bsNkDyF2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8593977a343a4122e8e7621af53fcb6661e05f49 --- /dev/null +++ b/annotations_filtered/n4bsNkDyF2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.2], [13.0, 20.39], [23.0, 41.74], [45.0, 60.98]], "keep_status": [false, true, false, true], "silence_prob": [0.0, 43.13, 28.4, 28.3], "audiomae_on_audioset": [null, [["hum", 28.06], ["music", 24.89], ["mains hum", 9.15]], [["music", 76.33], ["speech", 3.77], ["throbbing", 1.9]], [["music", 28.71], ["speech", 13.55], ["explosion", 7.93]]], "duration": [0.2, 7.39, 18.74, 15.98]} \ No newline at end of file diff --git a/annotations_filtered/n4pUbyGBD18_filtered.json b/annotations_filtered/n4pUbyGBD18_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..022cbd4a2b7080fd3bcee8ee51d50b1460471b63 --- /dev/null +++ b/annotations_filtered/n4pUbyGBD18_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.99], [2.0, 2.78], [5.0, 6.61], [8.0, 7.96], [10.0, 10.4], [12.0, 12.88], [19.0, 19.45], [28.0, 31.48], [33.0, 33.05], [34.0, 34.82], [42.0, 42.53], [43.0, 43.85], [46.0, 48.81], [51.0, 51.54], [53.0, 53.64], [55.0, 55.36], [56.0, 56.47], [57.0, 58.16], [59.0, 61.47], [64.0, 64.39], [65.0, 74.21], [77.0, 87.39], [88.0, 88.43], [89.0, 136.19], [139.0, 140.37], [142.0, 143.07]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.86, 0.0, 0.0, 0.0, 0.0, 42.79, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0, 30.85, 48.91, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["sidetone", 25.07], ["hum", 11.98], ["mains hum", 9.89]], null, null, null, null, [["fly, housefly", 46.56], ["bee, wasp, etc.", 17.51], ["insect", 13.29]], null, null, null, null, null, [["fly, housefly", 41.02], ["insect", 16.67], ["bee, wasp, etc.", 9.37]], null, [["music", 17.09], ["hum", 15.72], ["mains hum", 6.0]], [["music", 45.62], ["wind instrument, woodwind instrument", 6.03], ["hum", 5.13]], null, null, null, null], "duration": [-0.01, 0.78, 1.61, -0.04, 0.4, 0.88, 0.45, 3.48, 0.05, 0.82, 0.53, 0.85, 2.81, 0.54, 0.64, 0.36, 0.47, 1.16, 2.47, 0.39, 9.21, 10.39, 0.43, 47.19, 1.37, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/n59mG9_X35Q_filtered.json b/annotations_filtered/n59mG9_X35Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db1fd9aa81daa67a9f69850bd6f93c404cfd5f62 --- /dev/null +++ b/annotations_filtered/n59mG9_X35Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.65], [7.0, 8.18], [14.0, 18.4], [20.0, 20.24], [21.0, 21.49], [28.0, 29.49], [35.0, 39.68], [41.0, 48.25], [52.0, 58.35], [58.0, 58.53], [59.0, 60.44], [62.0, 63.64], [73.0, 73.47], [74.0, 80.5], [86.0, 87.27], [89.0, 90.41], [95.0, 99.84]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.7, 0.0, 0.0, 0.0, 29.06, 30.0, 32.37, 0.0, 0.0, 0.0, 0.0, 36.39, 0.0, 0.0, 32.34], "audiomae_on_audioset": [null, null, [["music", 28.91], ["grunt", 18.4], ["speech", 13.9]], null, null, null, [["music", 39.54], ["throbbing", 19.77], ["hum", 14.23]], [["speech", 43.08], ["music", 34.74], ["throbbing", 2.89]], [["music", 53.7], ["theremin", 13.93], ["soundtrack music", 4.33]], null, null, null, null, [["music", 76.5], ["didgeridoo", 8.69], ["musical instrument", 3.55]], null, null, [["music", 48.87], ["grunt", 22.24], ["animal", 13.24]]], "duration": [0.65, 1.18, 4.4, 0.24, 0.49, 1.49, 4.68, 7.25, 6.35, 0.53, 1.44, 1.64, 0.47, 6.5, 1.27, 1.41, 4.84]} \ No newline at end of file diff --git a/annotations_filtered/n5ArS3Got4U_filtered.json b/annotations_filtered/n5ArS3Got4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48f9750d098a57061f93bdf772696262154756d2 --- /dev/null +++ b/annotations_filtered/n5ArS3Got4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.32], [14.0, 33.2], [34.0, 41.08], [55.0, 55.0], [56.0, 56.96], [59.0, 60.07], [65.0, 65.64], [67.0, 67.71], [69.0, 69.6], [82.0, 87.81], [88.0, 88.32], [89.0, 117.54], [118.0, 119.69], [120.0, 122.52], [124.0, 127.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 96.54, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 44.63, 0.0, 97.73, 95.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 81.75], ["didgeridoo", 2.53], ["cello", 1.57]], null, null, null], "duration": [8.32, 19.2, 7.08, 0.0, 0.96, 1.07, 0.64, 0.71, 0.6, 5.81, 0.32, 28.54, 1.69, 2.52, 3.55]} \ No newline at end of file diff --git a/annotations_filtered/n5HtgUGCM30_filtered.json b/annotations_filtered/n5HtgUGCM30_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..835f85feb2609d296753e243b1d2d5e718f2f48a --- /dev/null +++ b/annotations_filtered/n5HtgUGCM30_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.82], [11.0, 72.49], [75.0, 121.02]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.82, 61.49, 46.02]} \ No newline at end of file diff --git a/annotations_filtered/n5PnSNCFBYs_filtered.json b/annotations_filtered/n5PnSNCFBYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3120c14ecb36586095fa54d12c4452f8c8f9201 --- /dev/null +++ b/annotations_filtered/n5PnSNCFBYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.34], [10.0, 16.68], [21.0, 24.02], [26.0, 28.02], [29.0, 30.21], [38.0, 39.28], [56.0, 60.52], [68.0, 69.43]], "keep_status": [false, false, true, false, false, false, true, false], "silence_prob": [0.0, 38.37, 43.38, 81.35, 0.0, 0.0, 44.81, 0.0], "audiomae_on_audioset": [null, [["music", 46.62], ["speech", 19.26], ["throbbing", 8.49]], [["music", 24.81], ["hum", 12.89], ["synthesizer", 5.48]], null, null, null, [["speech", 40.22], ["radio", 17.38], ["frog", 4.3]], null], "duration": [0.34, 6.68, 3.02, 2.02, 1.21, 1.28, 4.52, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/n5tMCxz-9uY_filtered.json b/annotations_filtered/n5tMCxz-9uY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf5d2b25c94eaab4e83e87cedddd55155709376b --- /dev/null +++ b/annotations_filtered/n5tMCxz-9uY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.76], [26.0, 30.79], [44.0, 44.12], [50.0, 50.75], [53.0, 53.15], [55.0, 56.78], [58.0, 61.82], [68.0, 68.49], [78.0, 79.14], [93.0, 92.99], [102.0, 102.05], [104.0, 104.57], [111.0, 111.84], [121.0, 122.5], [125.0, 136.78], [140.0, 151.58], [157.0, 157.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 31.2, 0.0, 0.0, 0.0, 0.0, 30.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.32, 30.57, 0.0], "audiomae_on_audioset": [null, [["music", 78.77], ["quack", 2.23], ["boing", 1.9]], null, null, null, null, [["music", 95.33], ["musical instrument", 0.6], ["guitar", 0.44]], null, null, null, null, null, null, null, [["music", 49.87], ["boing", 15.09], ["speech", 4.89]], [["music", 83.62], ["reggae", 1.58], ["drum and bass", 1.27]], null], "duration": [1.76, 4.79, 0.12, 0.75, 0.15, 1.78, 3.82, 0.49, 1.14, -0.01, 0.05, 0.57, 0.84, 1.5, 11.78, 11.58, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/n6H7zga2Ks0_filtered.json b/annotations_filtered/n6H7zga2Ks0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c71ab910a32c7db3eb18318f483500ce585d1218 --- /dev/null +++ b/annotations_filtered/n6H7zga2Ks0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.03], [12.0, 13.26], [16.0, 17.27], [21.0, 23.21], [24.0, 26.05], [28.0, 29.03], [31.0, 33.94], [34.0, 36.0], [38.0, 40.02], [46.0, 45.99], [48.0, 50.6], [55.0, 56.02], [57.0, 58.41], [59.0, 60.03], [62.0, 63.85], [65.0, 66.02], [67.0, 67.49], [69.0, 69.13], [76.0, 78.07], [84.0, 84.47], [85.0, 87.99], [90.0, 95.99], [96.0, 99.42], [102.0, 103.72], [104.0, 105.43], [107.0, 106.98], [108.0, 109.98], [111.0, 112.75], [114.0, 114.67], [115.0, 116.77], [119.0, 119.52], [123.0, 123.82], [124.0, 126.79], [128.0, 128.55], [130.0, 132.27], [133.0, 136.22], [137.0, 138.3], [139.0, 142.82], [143.0, 144.59], [146.0, 148.19]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 99.48, 86.82, 0.0, 100.0, 48.91, 83.7, 0.0, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 78.38, 99.95, 99.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 54.23], ["sidetone", 10.47], ["hum", 5.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.03, 1.26, 1.27, 2.21, 2.05, 1.03, 2.94, 2.0, 2.02, -0.01, 2.6, 1.02, 1.41, 1.03, 1.85, 1.02, 0.49, 0.13, 2.07, 0.47, 2.99, 5.99, 3.42, 1.72, 1.43, -0.02, 1.98, 1.75, 0.67, 1.77, 0.52, 0.82, 2.79, 0.55, 2.27, 3.22, 1.3, 3.82, 1.59, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/n75PgMSxAOw_filtered.json b/annotations_filtered/n75PgMSxAOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90d9142e0e19310029f911f1514a8829b2eeb86d --- /dev/null +++ b/annotations_filtered/n75PgMSxAOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 32.48], [34.0, 97.07], [100.0, 118.02], [121.0, 125.79]], "keep_status": [true, false, true, true], "silence_prob": [30.64, 0.0, 29.65, 32.05], "audiomae_on_audioset": [[["speech", 47.71], ["vehicle", 5.51], ["music", 5.09]], null, [["whack, thwack", 36.42], ["music", 16.08], ["thump, thud", 14.98]], [["vehicle", 9.01], ["fly, housefly", 8.22], ["throbbing", 6.91]]], "duration": [21.48, 63.07, 18.02, 4.79]} \ No newline at end of file diff --git a/annotations_filtered/n7KKfjFRw8w_filtered.json b/annotations_filtered/n7KKfjFRw8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f241f9b638570e4c721acbd7323f16985ae476f2 --- /dev/null +++ b/annotations_filtered/n7KKfjFRw8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.77], [20.0, 24.65], [29.0, 32.86], [34.0, 35.04], [40.0, 81.82], [86.0, 86.04], [87.0, 87.12], [90.0, 89.7], [91.0, 91.08], [94.0, 93.6], [95.0, 110.34], [111.0, 111.27], [112.0, 114.52], [115.0, 118.22]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 33.96, 36.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.34, 0.0, 39.33, 51.99], "audiomae_on_audioset": [null, [["speech", 39.09], ["music", 22.37], ["synthesizer", 4.47]], [["music", 20.48], ["speech", 17.55], ["pulse", 7.72]], null, null, null, null, null, null, null, [["speech", 42.04], ["music", 24.03], ["sidetone", 11.79]], null, [["music", 53.32], ["musical instrument", 7.63], ["synthesizer", 7.21]], null], "duration": [0.77, 4.65, 3.86, 1.04, 41.82, 0.04, 0.12, -0.3, 0.08, -0.4, 15.34, 0.27, 2.52, 3.22]} \ No newline at end of file diff --git a/annotations_filtered/n7W0yxKnuvs_filtered.json b/annotations_filtered/n7W0yxKnuvs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7917453b7f10e0a49dc63276b0c472c3f7b9b2d --- /dev/null +++ b/annotations_filtered/n7W0yxKnuvs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.68], [3.0, 4.72], [6.0, 9.71], [12.0, 13.71], [20.0, 20.28], [22.0, 23.19], [25.0, 27.03], [30.0, 31.21], [32.0, 33.44], [37.0, 37.39], [41.0, 45.71], [47.0, 47.82], [49.0, 49.74], [52.0, 52.86], [54.0, 54.85], [57.0, 62.77], [64.0, 66.19], [67.0, 67.61], [69.0, 70.26], [71.0, 71.49], [73.0, 73.35], [74.0, 78.27], [84.0, 85.5], [86.0, 87.42], [90.0, 90.32], [91.0, 92.35], [95.0, 96.42], [98.0, 98.76], [103.0, 102.93], [108.0, 108.45], [114.0, 114.76], [117.0, 117.71], [119.0, 121.96], [123.0, 123.53], [127.0, 129.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.76, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 89.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 1.72, 3.71, 1.71, 0.28, 1.19, 2.03, 1.21, 1.44, 0.39, 4.71, 0.82, 0.74, 0.86, 0.85, 5.77, 2.19, 0.61, 1.26, 0.49, 0.35, 4.27, 1.5, 1.42, 0.32, 1.35, 1.42, 0.76, -0.07, 0.45, 0.76, 0.71, 2.96, 0.53, 2.76]} \ No newline at end of file diff --git a/annotations_filtered/n7cRx_7umjE_filtered.json b/annotations_filtered/n7cRx_7umjE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43f4495b1c3a19b20893bc2de5332a6281307643 --- /dev/null +++ b/annotations_filtered/n7cRx_7umjE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.35], [5.0, 6.59], [11.0, 18.03], [20.0, 33.99], [35.0, 43.95], [52.0, 80.2], [81.0, 96.2]], "keep_status": [true, false, true, false, true, true, true], "silence_prob": [39.75, 0.0, 38.32, 35.15, 32.44, 31.2, 30.22], "audiomae_on_audioset": [[["vehicle", 15.68], ["music", 11.36], ["car", 4.49]], null, [["music", 28.88], ["speech", 24.04], ["throbbing", 11.25]], [["music", 42.59], ["speech", 21.05], ["throbbing", 10.78]], [["hum", 31.52], ["mains hum", 15.9], ["music", 9.08]], [["music", 34.24], ["speech", 9.09], ["hum", 9.0]], [["speech", 37.72], ["music", 26.4], ["fart", 4.95]]], "duration": [2.35, 1.59, 7.03, 13.99, 8.95, 28.2, 15.2]} \ No newline at end of file diff --git a/annotations_filtered/n7l2RLvI7Ss_filtered.json b/annotations_filtered/n7l2RLvI7Ss_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4284c47930b9e567aaf44b2883a21470191e68d0 --- /dev/null +++ b/annotations_filtered/n7l2RLvI7Ss_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.05], [9.0, 9.14], [12.0, 12.7], [18.0, 22.33], [26.0, 26.74], [29.0, 28.78], [30.0, 30.74], [33.0, 33.1], [34.0, 34.97], [35.0, 35.56], [40.0, 40.1], [41.0, 41.07], [49.0, 49.33], [50.0, 50.89], [53.0, 54.21], [56.0, 56.88], [61.0, 61.77], [63.0, 65.94], [66.0, 67.26], [68.0, 68.17], [69.0, 69.18], [69.0, 70.02], [71.0, 71.27], [73.0, 73.8], [76.0, 77.6], [78.0, 78.92], [80.0, 80.0], [81.0, 81.6], [83.0, 82.88], [84.0, 83.91], [84.0, 85.41], [88.0, 88.64], [94.0, 94.09], [96.0, 96.97], [98.0, 98.0], [98.0, 100.14], [102.0, 104.13], [106.0, 107.13], [109.0, 109.41], [110.0, 111.94], [114.0, 114.07], [115.0, 115.45], [116.0, 115.96], [116.0, 117.21], [125.0, 125.02], [130.0, 130.22], [131.0, 130.98], [132.0, 132.22], [134.0, 133.64], [136.0, 136.78], [139.0, 140.17], [141.0, 141.61], [143.0, 143.83], [144.0, 144.88], [146.0, 146.5], [147.0, 147.68], [148.0, 148.46], [151.0, 151.5], [152.0, 152.19], [153.0, 153.39], [156.0, 156.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 97.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.05, 0.14, 0.7, 4.33, 0.74, -0.22, 0.74, 0.1, 0.97, 0.56, 0.1, 0.07, 0.33, 0.89, 1.21, 0.88, 0.77, 2.94, 1.26, 0.17, 0.18, 1.02, 0.27, 0.8, 1.6, 0.92, 0.0, 0.6, -0.12, -0.09, 1.41, 0.64, 0.09, 0.97, 0.0, 2.14, 2.13, 1.13, 0.41, 1.94, 0.07, 0.45, -0.04, 1.21, 0.02, 0.22, -0.02, 0.22, -0.36, 0.78, 1.17, 0.61, 0.83, 0.88, 0.5, 0.68, 0.46, 0.5, 0.19, 0.39, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/n86CV7VKvfE_filtered.json b/annotations_filtered/n86CV7VKvfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b961889b6c0207fb71aaa72500a86ecbcd22e90 --- /dev/null +++ b/annotations_filtered/n86CV7VKvfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.81], [12.0, 13.56], [22.0, 22.23], [32.0, 32.56], [33.0, 33.3], [39.0, 40.0], [41.0, 40.74], [42.0, 42.75], [45.0, 45.45], [51.0, 51.22], [59.0, 59.68], [62.0, 62.11], [64.0, 64.39], [66.0, 66.68], [67.0, 67.56], [68.0, 68.86], [76.0, 76.98], [78.0, 79.71], [84.0, 84.97], [88.0, 88.11], [91.0, 92.03], [96.0, 96.57], [99.0, 99.72], [102.0, 102.44], [104.0, 103.64], [106.0, 106.37], [108.0, 108.77], [111.0, 111.94], [113.0, 113.26], [119.0, 119.89], [124.0, 124.21], [125.0, 126.25], [129.0, 129.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 1.56, 0.23, 0.56, 0.3, 1.0, -0.26, 0.75, 0.45, 0.22, 0.68, 0.11, 0.39, 0.68, 0.56, 0.86, 0.98, 1.71, 0.97, 0.11, 1.03, 0.57, 0.72, 0.44, -0.36, 0.37, 0.77, 0.94, 0.26, 0.89, 0.21, 1.25, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/n8mK-A_0viA_filtered.json b/annotations_filtered/n8mK-A_0viA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13a673169672269fa0d36fc4ee9016159e119959 --- /dev/null +++ b/annotations_filtered/n8mK-A_0viA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.12], [15.0, 19.08], [20.0, 21.37], [27.0, 30.11], [31.0, 33.45], [35.0, 102.39], [105.0, 106.0], [108.0, 109.09], [110.0, 110.51], [112.0, 119.6], [120.0, 130.54], [131.0, 131.28]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 62.27, 0.0, 49.22, 35.74, 0.0, 0.0, 0.0, 0.0, 31.7, 34.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 54.38], ["whale vocalization", 12.25], ["sine wave", 4.97]], [["music", 34.47], ["synthesizer", 9.94], ["didgeridoo", 6.63]], null, null, null, null, [["animal", 21.27], ["groan", 16.72], ["roar", 8.2]], [["speech", 48.26], ["sidetone", 30.47], ["music", 6.32]], null], "duration": [1.12, 4.08, 1.37, 3.11, 2.45, 67.39, 1.0, 1.09, 0.51, 7.6, 10.54, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/n8yUoQP6Rwo_filtered.json b/annotations_filtered/n8yUoQP6Rwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..529e93efc5114dfe22f528f8b78693b67cc17e11 --- /dev/null +++ b/annotations_filtered/n8yUoQP6Rwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.89], [5.0, 5.61], [9.0, 16.66], [22.0, 30.91], [36.0, 41.44], [42.0, 42.62], [44.0, 52.37], [54.0, 56.2], [61.0, 62.14], [64.0, 82.86]], "keep_status": [false, false, false, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 49.59, 30.13, 28.67, 0.0, 29.12, 29.44, 0.0, 29.3], "audiomae_on_audioset": [null, null, [["whale vocalization", 64.52], ["music", 11.4], ["speech", 8.86]], [["whale vocalization", 25.82], ["animal", 11.63], ["buzz", 8.67]], [["animal", 13.18], ["speech", 11.35], ["livestock, farm animals, working animals", 8.82]], null, [["speech", 21.7], ["music", 14.65], ["roar", 8.73]], [["speech", 24.02], ["fly, housefly", 23.68], ["insect", 11.74]], null, [["music", 50.82], ["speech", 12.57], ["groan", 11.49]]], "duration": [0.89, 0.61, 7.66, 8.91, 5.44, 0.62, 8.37, 2.2, 1.14, 18.86]} \ No newline at end of file diff --git a/annotations_filtered/n9-Wk6ulBuA_filtered.json b/annotations_filtered/n9-Wk6ulBuA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08c82bff1cf6fc6b169a7fa2b6ae1c783b0d104a --- /dev/null +++ b/annotations_filtered/n9-Wk6ulBuA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.58], [14.0, 14.08], [15.0, 18.64], [23.0, 28.0], [33.0, 33.89], [34.0, 41.5], [42.0, 47.26], [51.0, 51.34], [52.0, 54.01], [57.0, 65.91], [67.0, 68.76]], "keep_status": [false, false, true, false, false, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 32.28, 34.42, 0.0, 31.89, 32.56, 0.0, 33.0, 32.54, 0.0], "audiomae_on_audioset": [null, null, [["music", 31.24], ["speech", 16.7], ["knock", 10.39]], [["hum", 40.18], ["mains hum", 25.3], ["throbbing", 11.8]], null, [["sidetone", 24.85], ["throbbing", 24.43], ["speech", 14.35]], [["speech", 52.28], ["hum", 6.8], ["music", 6.3]], null, [["speech", 57.78], ["music", 4.16], ["speech synthesizer", 3.57]], [["whack, thwack", 40.9], ["throbbing", 8.13], ["music", 7.33]], null], "duration": [0.58, 0.08, 3.64, 5.0, 0.89, 7.5, 5.26, 0.34, 2.01, 8.91, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/n92XBsqbSF4_filtered.json b/annotations_filtered/n92XBsqbSF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47fff8f139e8521ef3b9224b67323d8313c9c9ca --- /dev/null +++ b/annotations_filtered/n92XBsqbSF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 18.55], [20.0, 178.68]], "keep_status": [false, false], "silence_prob": [43.82, 0.0], "audiomae_on_audioset": [[["speech", 32.41], ["music", 31.03], ["hum", 6.98]], null], "duration": [4.55, 158.68]} \ No newline at end of file diff --git a/annotations_filtered/n94um7eDILg_filtered.json b/annotations_filtered/n94um7eDILg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c5c9f721c7da72b3e967c80d0117b9d5e8045fe --- /dev/null +++ b/annotations_filtered/n94um7eDILg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.47], [13.0, 13.46], [15.0, 14.99], [16.0, 19.23], [21.0, 21.25], [22.0, 22.69], [25.0, 25.24], [26.0, 26.5], [39.0, 39.51], [42.0, 47.55], [59.0, 59.0], [61.0, 62.01], [63.0, 63.26], [69.0, 69.58], [71.0, 71.42], [72.0, 72.76], [79.0, 81.23], [84.0, 85.19], [86.0, 87.44], [88.0, 88.96], [90.0, 111.91], [114.0, 114.62]], "keep_status": [true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [32.77, 0.0, 0.0, 32.45, 0.0, 0.0, 0.0, 0.0, 0.0, 36.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.79, 0.0, 0.0, 0.0, 32.73, 0.0], "audiomae_on_audioset": [[["thump, thud", 17.92], ["rumble", 8.86], ["speech", 7.21]], null, null, [["fly, housefly", 28.36], ["insect", 13.81], ["wail, moan", 7.59]], null, null, null, null, null, [["speech", 29.41], ["groan", 18.11], ["grunt", 4.91]], null, null, null, null, null, null, [["music", 9.36], ["cattle, bovinae", 8.58], ["animal", 7.68]], null, null, null, [["music", 17.52], ["fly, housefly", 13.64], ["groan", 8.42]], null], "duration": [2.47, 0.46, -0.01, 3.23, 0.25, 0.69, 0.24, 0.5, 0.51, 5.55, 0.0, 1.01, 0.26, 0.58, 0.42, 0.76, 2.23, 1.19, 1.44, 0.96, 21.91, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/n9L9jMlulXI_filtered.json b/annotations_filtered/n9L9jMlulXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2aaaa0120a055fc98a043d881b524fb3c21231a1 --- /dev/null +++ b/annotations_filtered/n9L9jMlulXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.92], [22.0, 21.83], [24.0, 24.07], [25.0, 26.38], [27.0, 27.35], [28.0, 28.11], [28.0, 31.92], [32.0, 32.76], [37.0, 38.96], [41.0, 43.93], [46.0, 46.25], [46.0, 46.92], [50.0, 55.98], [58.0, 71.91], [79.0, 80.43], [88.0, 87.91], [89.0, 90.31], [100.0, 99.94], [104.0, 104.7]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.71, 0.0, 0.0, 38.75, 0.0, 0.0, 34.04, 31.04, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["animal", 9.18], ["electric shaver, electric razor", 9.0], ["hum", 8.06]], null, null, [["hum", 43.79], ["throbbing", 24.77], ["mains hum", 9.15]], null, null, [["animal", 11.92], ["speech", 7.3], ["fart", 5.5]], [["speech", 22.51], ["hum", 20.66], ["mains hum", 13.6]], null, null, null, null, null], "duration": [0.92, -0.17, 0.07, 1.38, 0.35, 0.11, 3.92, 0.76, 1.96, 2.93, 0.25, 0.92, 5.98, 13.91, 1.43, -0.09, 1.31, -0.06, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/n9hjsuaj448_filtered.json b/annotations_filtered/n9hjsuaj448_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/n9hjsuaj448_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/n9uVWlO0GAs_filtered.json b/annotations_filtered/n9uVWlO0GAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/n9uVWlO0GAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/nA1lAszNSoI_filtered.json b/annotations_filtered/nA1lAszNSoI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51943b0b231aad71a0802242060e85049886b769 --- /dev/null +++ b/annotations_filtered/nA1lAszNSoI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 41.13], [42.0, 67.95], [71.0, 78.54], [82.0, 92.94], [93.0, 139.78], [143.0, 154.03]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 29.84, 33.02, 30.21, 0.0, 39.83], "audiomae_on_audioset": [null, [["music", 29.07], ["hum", 21.54], ["throbbing", 17.39]], [["music", 57.28], ["hum", 16.1], ["throbbing", 6.34]], [["hum", 28.68], ["throbbing", 22.88], ["mains hum", 20.17]], null, [["music", 72.96], ["whale vocalization", 10.08], ["ambient music", 4.85]]], "duration": [40.13, 25.95, 7.54, 10.94, 46.78, 11.03]} \ No newline at end of file diff --git a/annotations_filtered/nALXcRjbVzs_filtered.json b/annotations_filtered/nALXcRjbVzs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..329dcc0cdb06195c537575765f05248bb7d2f4f1 --- /dev/null +++ b/annotations_filtered/nALXcRjbVzs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.5], [11.0, 16.56], [19.0, 19.13], [20.0, 20.48], [35.0, 37.23], [42.0, 42.57], [45.0, 45.45], [48.0, 48.22], [48.0, 52.24], [61.0, 61.6], [65.0, 81.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 99.44, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 97.0, 0.0, 32.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 22.58], ["animal", 11.06], ["livestock, farm animals, working animals", 10.16]]], "duration": [1.5, 5.56, 0.13, 0.48, 2.23, 0.57, 0.45, 0.22, 4.24, 0.6, 16.45]} \ No newline at end of file diff --git a/annotations_filtered/nAgSecmB9lM_filtered.json b/annotations_filtered/nAgSecmB9lM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dba44f11ca61daf3541f43789732cfaad8b6563c --- /dev/null +++ b/annotations_filtered/nAgSecmB9lM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.61], [21.0, 21.79], [30.0, 30.54], [37.0, 41.25], [43.0, 89.73], [92.0, 97.38]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.53, 0.0, 99.31], "audiomae_on_audioset": [null, null, null, [["roaring cats (lions, tigers)", 19.14], ["roar", 14.79], ["wild animals", 12.88]], null, null], "duration": [0.61, 0.79, 0.54, 4.25, 46.73, 5.38]} \ No newline at end of file diff --git a/annotations_filtered/nAqJV2olXN0_filtered.json b/annotations_filtered/nAqJV2olXN0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b5bd6bb21d3f49e3f46e58828a6c639e0f1c636 --- /dev/null +++ b/annotations_filtered/nAqJV2olXN0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.92], [8.0, 9.22], [20.0, 20.12], [21.0, 37.57], [38.0, 38.89], [40.0, 40.8], [41.0, 42.06], [45.0, 46.6], [47.0, 65.04], [67.0, 74.92], [75.0, 75.91], [76.0, 76.86], [82.0, 84.03], [84.0, 85.97], [91.0, 93.88], [95.0, 100.9]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 43.66, 0.0, 0.0, 0.0, 0.0, 48.56, 50.56, 0.0, 0.0, 52.45, 0.0, 44.99, 67.38], "audiomae_on_audioset": [null, null, null, [["speech", 60.49], ["radio", 4.91], ["sidetone", 4.07]], null, null, null, null, [["music", 42.85], ["musical instrument", 7.27], ["guitar", 5.77]], null, null, null, null, null, [["music", 31.47], ["mains hum", 17.88], ["hum", 9.88]], null], "duration": [1.92, 1.22, 0.12, 16.57, 0.89, 0.8, 1.06, 1.6, 18.04, 7.92, 0.91, 0.86, 2.03, 1.97, 2.88, 5.9]} \ No newline at end of file diff --git a/annotations_filtered/nAuz36A1zG0_filtered.json b/annotations_filtered/nAuz36A1zG0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88cbce43057702c1cf0bebf02b34face076882d2 --- /dev/null +++ b/annotations_filtered/nAuz36A1zG0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.95], [14.0, 82.0], [87.0, 88.11]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [-0.05, 68.0, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/nB95pK8TgYw_filtered.json b/annotations_filtered/nB95pK8TgYw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a981a24e4846e6eb63bf032aa619720fdec44e0b --- /dev/null +++ b/annotations_filtered/nB95pK8TgYw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.23], [9.0, 17.69], [18.0, 21.47], [23.0, 26.92], [28.0, 28.34], [36.0, 36.34], [38.0, 38.64], [42.0, 43.14], [44.0, 45.3], [46.0, 51.66], [54.0, 58.7], [60.0, 60.79], [62.0, 65.25], [66.0, 69.11], [72.0, 72.93], [74.0, 74.85], [76.0, 76.0], [77.0, 77.41], [80.0, 81.45], [82.0, 84.82], [85.0, 88.3], [90.0, 91.32], [93.0, 98.31], [99.0, 99.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.17, 98.8, 99.44, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 41.7, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 86.27, 0.0, 90.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 36.98], ["eruption", 20.33], ["speech", 14.46]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.23, 8.69, 3.47, 3.92, 0.34, 0.34, 0.64, 1.14, 1.3, 5.66, 4.7, 0.79, 3.25, 3.11, 0.93, 0.85, 0.0, 0.41, 1.45, 2.82, 3.3, 1.32, 5.31, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/nB9rg6sxHhU_filtered.json b/annotations_filtered/nB9rg6sxHhU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d8b1566c12ae64abd4bfc0afefd48aaf03bcb00 --- /dev/null +++ b/annotations_filtered/nB9rg6sxHhU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.53], [12.0, 11.77], [25.0, 25.57], [34.0, 34.91], [36.0, 40.2], [41.0, 42.82], [44.0, 50.21], [55.0, 57.08], [60.0, 61.84], [67.0, 68.84], [72.0, 73.53], [86.0, 86.46], [89.0, 91.2], [96.0, 98.27], [101.0, 103.0], [114.0, 115.72], [123.0, 124.46], [132.0, 131.99], [135.0, 135.84], [136.0, 140.68], [147.0, 148.27], [154.0, 170.51], [173.0, 175.02], [180.0, 182.01], [185.0, 186.63], [197.0, 199.03], [205.0, 207.6], [218.0, 218.62], [220.0, 222.4], [228.0, 232.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 91.13, 0.0, 33.67, 49.13, 0.0, 0.0, 0.0, 0.0, 40.06, 39.99, 40.24, 0.0, 0.0, 0.0, 0.0, 30.86, 0.0, 32.72, 39.54, 38.21, 0.0, 39.78, 30.99, 0.0, 31.98, 30.78], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 43.85], ["theremin", 34.95], ["guitar", 2.8]], [["music", 73.19], ["synthesizer", 3.81], ["musical instrument", 2.11]], null, null, null, null, [["music", 64.47], ["synthesizer", 5.85], ["middle eastern music", 1.65]], [["music", 62.48], ["flute", 5.97], ["carnatic music", 5.12]], [["music", 59.43], ["didgeridoo", 7.15], ["synthesizer", 5.07]], null, null, null, null, [["music", 68.82], ["singing", 2.94], ["swing music", 2.28]], null, [["music", 84.87], ["synthesizer", 0.98], ["keyboard (musical)", 0.8]], [["music", 68.34], ["singing", 3.11], ["musical instrument", 2.38]], [["music", 69.74], ["theremin", 5.46], ["middle eastern music", 2.34]], null, [["music", 30.76], ["double bass", 14.95], ["cello", 10.41]], [["music", 74.35], ["soundtrack music", 2.01], ["sampler", 1.7]], null, [["music", 74.53], ["musical instrument", 3.86], ["synthesizer", 3.58]], [["music", 74.73], ["didgeridoo", 2.45], ["electronic music", 2.05]]], "duration": [1.53, -0.23, 0.57, 0.91, 4.2, 1.82, 6.21, 2.08, 1.84, 1.84, 1.53, 0.46, 2.2, 2.27, 2.0, 1.72, 1.46, -0.01, 0.84, 4.68, 1.27, 16.51, 2.02, 2.01, 1.63, 2.03, 2.6, 0.62, 2.4, 4.06]} \ No newline at end of file diff --git a/annotations_filtered/nBQDz9PiMDU_filtered.json b/annotations_filtered/nBQDz9PiMDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ee543511845bdc35df28dedf41d7ae3cd50f4cc --- /dev/null +++ b/annotations_filtered/nBQDz9PiMDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.9], [20.0, 20.61], [22.0, 21.71], [23.0, 24.66], [26.0, 31.35], [33.0, 33.84], [36.0, 37.76], [39.0, 42.43], [44.0, 48.41], [51.0, 53.4], [56.0, 57.35], [59.0, 61.97], [63.0, 65.4], [68.0, 71.85], [77.0, 77.94], [79.0, 83.44], [86.0, 88.13], [91.0, 94.17], [97.0, 99.1], [102.0, 103.72], [107.0, 109.41], [111.0, 111.0], [113.0, 117.34], [121.0, 126.5], [132.0, 134.43], [138.0, 138.47], [142.0, 142.65], [143.0, 143.38], [149.0, 149.3], [153.0, 153.23], [162.0, 162.19], [166.0, 167.59], [168.0, 169.23]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, true, true, true, true, false, true, false, true, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.87, 0.0, 0.0, 38.02, 32.96, 36.46, 0.0, 36.12, 30.76, 33.45, 0.0, 35.03, 33.31, 34.72, 36.17, 0.0, 34.51, 0.0, 33.78, 33.49, 42.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 70.14], ["music", 5.94], ["echo", 2.48]], null, null, [["sidetone", 74.92], ["speech", 16.42], ["music", 3.21]], [["music", 59.86], ["speech", 6.92], ["effects unit", 5.29]], [["vehicle", 12.4], ["boat, water vehicle", 6.22], ["car", 4.5]], null, [["speech", 34.23], ["radio", 11.42], ["noise", 10.91]], [["speech", 43.59], ["sidetone", 21.72], ["radio", 17.08]], [["buzz", 38.16], ["white noise", 5.3], ["vehicle", 5.03]], null, [["noise", 33.22], ["music", 13.68], ["speech", 6.89]], [["sine wave", 22.37], ["chirp tone", 16.07], ["music", 13.56]], [["music", 29.9], ["musical instrument", 9.99], ["hum", 8.09]], [["music", 37.61], ["synthesizer", 9.63], ["hum", 8.32]], null, [["speech", 16.45], ["music", 15.12], ["sidetone", 11.68]], null, [["speech", 39.03], ["hum", 11.14], ["music", 7.75]], [["music", 42.01], ["synthesizer", 7.94], ["sine wave", 5.32]], [["music", 35.49], ["brass instrument", 16.92], ["french horn", 12.87]], null, null, null, null, null, null, null, null], "duration": [1.9, 0.61, -0.29, 1.66, 5.35, 0.84, 1.76, 3.43, 4.41, 2.4, 1.35, 2.97, 2.4, 3.85, 0.94, 4.44, 2.13, 3.17, 2.1, 1.72, 2.41, 0.0, 4.34, 5.5, 2.43, 0.47, 0.65, 0.38, 0.3, 0.23, 0.19, 1.59, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/nBRPKaHMFn4_filtered.json b/annotations_filtered/nBRPKaHMFn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13995e3977a74a33206b188fb58ef0df7b53277c --- /dev/null +++ b/annotations_filtered/nBRPKaHMFn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 1.83], [2.0, 5.41], [8.0, 10.74], [14.0, 18.01], [18.0, 24.14], [25.0, 31.28], [33.0, 33.27], [34.0, 34.82], [35.0, 36.17], [42.0, 42.72], [44.0, 44.44], [46.0, 46.67], [50.0, 51.71], [54.0, 57.21], [58.0, 58.77], [60.0, 60.98], [69.0, 72.0], [76.0, 77.16], [86.0, 85.94], [88.0, 92.37], [96.0, 100.67], [102.0, 104.06], [105.0, 107.27], [113.0, 113.71], [118.0, 119.72], [123.0, 123.33], [123.0, 123.52], [124.0, 123.72], [124.0, 123.79], [124.0, 123.82], [125.0, 126.39], [128.0, 131.28], [132.0, 133.56], [135.0, 136.27], [140.0, 140.02], [142.0, 143.11], [144.0, 148.78], [150.0, 156.64], [159.0, 160.83], [162.0, 162.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 51.6, 51.28, 69.74, 99.97, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.83, 3.41, 2.74, 4.01, 6.14, 6.28, 0.27, 0.82, 1.17, 0.72, 0.44, 0.67, 1.71, 3.21, 0.77, 0.98, 3.0, 1.16, -0.06, 4.37, 4.67, 2.06, 2.27, 0.71, 1.72, 0.33, 0.52, -0.28, -0.21, -0.18, 1.39, 3.28, 1.56, 1.27, 0.02, 1.11, 4.78, 6.64, 1.83, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/nBRTe09eseE_filtered.json b/annotations_filtered/nBRTe09eseE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3da6f6f184dd8af248731c4255f42c7047b9d6db --- /dev/null +++ b/annotations_filtered/nBRTe09eseE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.15], [7.0, 7.38], [7.0, 7.42], [7.0, 7.45], [7.0, 8.85], [14.0, 14.81], [16.0, 16.5], [26.0, 31.8], [33.0, 33.2], [38.0, 137.3], [138.0, 140.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.47, 0.0, 0.0, 31.41], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 38.16], ["music", 26.52], ["mains hum", 9.48]], null, null, [["hum", 40.91], ["mains hum", 34.33], ["music", 5.41]]], "duration": [0.15, 0.38, 0.42, 0.45, 1.85, 0.81, 0.5, 5.8, 0.2, 99.3, 2.49]} \ No newline at end of file diff --git a/annotations_filtered/nBZ39gX_FlU_filtered.json b/annotations_filtered/nBZ39gX_FlU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72e28de9204556d8c374c56503c6ace77417876f --- /dev/null +++ b/annotations_filtered/nBZ39gX_FlU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 22.86], [25.0, 32.27], [33.0, 57.7], [61.0, 91.02], [92.0, 93.61], [95.0, 95.35], [96.0, 96.79], [98.0, 99.64], [103.0, 104.85], [109.0, 116.94], [120.0, 122.77], [134.0, 137.27], [138.0, 142.13], [143.0, 143.82]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [33.14, 30.67, 32.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.5, 32.06, 31.89, 31.75, 0.0], "audiomae_on_audioset": [[["throbbing", 34.52], ["music", 30.14], ["hum", 17.66]], [["hum", 30.56], ["mains hum", 27.63], ["music", 11.88]], [["music", 47.31], ["throbbing", 27.52], ["hum", 10.62]], null, null, null, null, null, null, [["fly, housefly", 34.26], ["mosquito", 9.05], ["insect", 8.53]], [["gong", 20.96], ["music", 19.61], ["sonar", 8.44]], [["moo", 21.9], ["cattle, bovinae", 12.62], ["livestock, farm animals, working animals", 12.05]], [["speech", 34.0], ["hum", 23.24], ["music", 14.7]], null], "duration": [15.86, 7.27, 24.7, 30.02, 1.61, 0.35, 0.79, 1.64, 1.85, 7.94, 2.77, 3.27, 4.13, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/nBmNcy4zZNU_filtered.json b/annotations_filtered/nBmNcy4zZNU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac3f092d60bce16326d5f14a6ff98bbe22ae6a87 --- /dev/null +++ b/annotations_filtered/nBmNcy4zZNU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 19.45], [21.0, 26.77], [28.0, 29.05], [30.0, 31.78], [44.0, 44.54], [50.0, 53.27], [54.0, 55.26], [56.0, 57.59], [65.0, 66.36], [67.0, 68.08], [72.0, 77.19], [82.0, 82.9], [85.0, 84.94], [86.0, 92.77], [99.0, 99.74], [100.0, 101.95], [103.0, 103.57], [110.0, 117.51], [120.0, 125.91], [130.0, 131.08]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, false], "silence_prob": [32.56, 66.76, 0.0, 0.0, 0.0, 56.03, 0.0, 0.0, 0.0, 0.0, 31.93, 0.0, 0.0, 34.41, 0.0, 0.0, 0.0, 34.2, 51.71, 0.0], "audiomae_on_audioset": [[["clang", 21.88], ["fly, housefly", 14.11], ["ding", 11.08]], null, null, null, null, null, null, null, null, null, [["speech", 29.24], ["whale vocalization", 18.62], ["animal", 17.06]], null, null, [["speech", 30.13], ["noise", 12.63], ["screaming", 7.76]], null, null, null, [["grunt", 54.6], ["groan", 8.62], ["hum", 5.04]], null, null], "duration": [8.45, 5.77, 1.05, 1.78, 0.54, 3.27, 1.26, 1.59, 1.36, 1.08, 5.19, 0.9, -0.06, 6.77, 0.74, 1.95, 0.57, 7.51, 5.91, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/nBsxbjTIJxs_filtered.json b/annotations_filtered/nBsxbjTIJxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a20138b5dface444a734105c196a610d78016f8 --- /dev/null +++ b/annotations_filtered/nBsxbjTIJxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.23], [6.0, 6.03], [9.0, 9.14], [20.0, 20.49], [21.0, 23.45], [26.0, 26.69], [29.0, 29.19], [34.0, 35.8], [46.0, 46.97], [48.0, 48.49], [52.0, 52.79], [54.0, 54.21], [56.0, 56.69], [69.0, 69.96], [87.0, 89.63], [90.0, 90.9], [91.0, 92.33], [95.0, 95.05], [101.0, 101.21], [102.0, 102.81], [105.0, 105.76], [113.0, 113.58], [118.0, 118.59], [127.0, 127.36], [133.0, 133.61], [147.0, 148.07], [149.0, 149.54], [153.0, 152.88], [155.0, 155.95], [158.0, 158.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 0.03, 0.14, 0.49, 2.45, 0.69, 0.19, 1.8, 0.97, 0.49, 0.79, 0.21, 0.69, 0.96, 2.63, 0.9, 1.33, 0.05, 0.21, 0.81, 0.76, 0.58, 0.59, 0.36, 0.61, 1.07, 0.54, -0.12, 0.95, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/nC-it_V8df0_filtered.json b/annotations_filtered/nC-it_V8df0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48e95d21c260d3c5226c99437130550f2b6f7731 --- /dev/null +++ b/annotations_filtered/nC-it_V8df0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 46.16], [47.0, 47.04], [47.0, 48.07], [48.0, 49.76], [51.0, 51.14], [54.0, 54.95], [60.0, 60.03], [61.0, 62.77], [65.0, 67.58], [68.0, 88.16], [95.0, 95.72], [97.0, 96.7], [97.0, 98.59], [99.0, 100.28], [105.0, 105.04], [116.0, 123.15], [128.0, 131.97], [134.0, 135.38]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [60.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.57, 34.99, 0.0, 0.0, 0.0, 0.0, 0.0, 36.31, 36.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 49.92], ["speech", 12.17], ["fly, housefly", 7.0]], [["boing", 58.31], ["music", 35.25], ["speech", 1.04]], null, null, null, null, null, [["music", 61.19], ["boing", 5.84], ["didgeridoo", 4.56]], [["speech", 21.78], ["boing", 19.65], ["fart", 12.42]], null], "duration": [21.16, 0.04, 1.07, 1.76, 0.14, 0.95, 0.03, 1.77, 2.58, 20.16, 0.72, -0.3, 1.59, 1.28, 0.04, 7.15, 3.97, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/nCK7A5Zp9I4_filtered.json b/annotations_filtered/nCK7A5Zp9I4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d211e8e6f8c31df1d10212c4437cd303896679fe --- /dev/null +++ b/annotations_filtered/nCK7A5Zp9I4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.93], [11.0, 10.81], [12.0, 12.5], [14.0, 14.62], [16.0, 19.04], [20.0, 28.86], [31.0, 31.62], [33.0, 35.14], [36.0, 37.37], [38.0, 40.61], [42.0, 43.51], [44.0, 44.14], [44.0, 47.34], [49.0, 49.08], [50.0, 53.08], [55.0, 54.68], [56.0, 58.48], [59.0, 59.95], [60.0, 61.67], [68.0, 70.77], [72.0, 72.55], [76.0, 76.65], [79.0, 79.15], [80.0, 84.13], [86.0, 88.15], [90.0, 92.52], [94.0, 98.59]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 0.0, 0.0, 0.0, 99.36, 47.46, 0.0, 92.48, 0.0, 100.0, 0.0, 0.0, 91.81, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 18.11], ["hum", 13.71], ["noise", 8.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.93, -0.19, 0.5, 0.62, 3.04, 8.86, 0.62, 2.14, 1.37, 2.61, 1.51, 0.14, 3.34, 0.08, 3.08, -0.32, 2.48, 0.95, 1.67, 2.77, 0.55, 0.65, 0.15, 4.13, 2.15, 2.52, 4.59]} \ No newline at end of file diff --git a/annotations_filtered/nCWBxPh4dGo_filtered.json b/annotations_filtered/nCWBxPh4dGo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95b447f18cacead1d4f83505d7b7932c3f733aac --- /dev/null +++ b/annotations_filtered/nCWBxPh4dGo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.01], [12.0, 25.47], [28.0, 70.87], [73.0, 73.25], [76.0, 80.84], [83.0, 83.66], [85.0, 86.51], [87.0, 104.75], [108.0, 115.67], [119.0, 154.55], [156.0, 158.89], [161.0, 161.13], [165.0, 166.72]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.55, 29.24, 0.0, 0.0, 30.88, 0.0, 0.0, 31.53, 28.92, 0.0, 29.74, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.89], ["speech", 28.0], ["electronic music", 1.83]], [["music", 30.02], ["speech", 5.95], ["groan", 5.49]], null, null, [["music", 36.22], ["speech", 33.74], ["boing", 10.64]], null, null, [["music", 45.68], ["synthesizer", 22.72], ["keyboard (musical)", 3.54]], [["music", 87.88], ["musical instrument", 1.43], ["rock and roll", 0.75]], null, [["music", 73.54], ["boing", 2.7], ["electronic music", 1.66]], null, null], "duration": [3.01, 13.47, 42.87, 0.25, 4.84, 0.66, 1.51, 17.75, 7.67, 35.55, 2.89, 0.13, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/nCgg5XIxxjY_filtered.json b/annotations_filtered/nCgg5XIxxjY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d19e9c9a3671f509751ffd8adce6e8530f207be --- /dev/null +++ b/annotations_filtered/nCgg5XIxxjY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 24.38], [26.0, 50.67], [51.0, 52.49], [53.0, 75.44], [79.0, 79.73], [80.0, 82.26], [83.0, 84.75], [86.0, 86.51], [87.0, 88.86], [89.0, 95.23], [97.0, 97.82], [100.0, 100.35], [101.0, 101.6], [105.0, 105.93], [112.0, 119.89], [120.0, 121.1], [123.0, 123.06]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [32.4, 31.76, 0.0, 32.27, 0.0, 33.03, 0.0, 0.0, 0.0, 33.7, 0.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 57.0], ["synthesizer", 15.18], ["musical instrument", 7.82]], [["music", 75.99], ["didgeridoo", 13.74], ["musical instrument", 2.73]], null, [["music", 71.29], ["didgeridoo", 5.08], ["wind instrument, woodwind instrument", 2.54]], null, [["music", 82.87], ["didgeridoo", 7.23], ["musical instrument", 3.62]], null, null, null, [["fart", 35.28], ["whack, thwack", 23.05], ["creak", 8.19]], null, null, null, null, [["speech", 37.73], ["horse", 6.97], ["fart", 6.54]], null, null], "duration": [21.38, 24.67, 1.49, 22.44, 0.73, 2.26, 1.75, 0.51, 1.86, 6.23, 0.82, 0.35, 0.6, 0.93, 7.89, 1.1, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/nCuYBELZjpY_filtered.json b/annotations_filtered/nCuYBELZjpY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0d86781d78f0e7d390494bacb8256c780c38dee --- /dev/null +++ b/annotations_filtered/nCuYBELZjpY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 53.13], [56.0, 74.71], [76.0, 90.22]], "keep_status": [true, false, false], "silence_prob": [31.85, 36.83, 44.32], "audiomae_on_audioset": [[["music", 36.84], ["noise", 17.89], ["explosion", 5.78]], [["music", 46.66], ["theremin", 23.41], ["whale vocalization", 14.06]], [["music", 55.53], ["theremin", 12.62], ["whale vocalization", 6.17]]], "duration": [7.13, 18.71, 14.22]} \ No newline at end of file diff --git a/annotations_filtered/nD6DMtXc3mY_filtered.json b/annotations_filtered/nD6DMtXc3mY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91825cc40c66c563bd230d6d2a66b1639e10434b --- /dev/null +++ b/annotations_filtered/nD6DMtXc3mY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.39], [9.0, 10.52], [16.0, 16.71], [20.0, 21.59], [22.0, 113.95], [120.0, 120.28], [122.0, 122.93], [123.0, 125.2], [132.0, 133.84], [137.0, 147.51], [149.0, 150.11], [151.0, 158.89], [160.0, 171.64]], "keep_status": [true, false, false, false, false, false, false, true, false, true, false, true, true], "silence_prob": [36.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.22, 0.0, 38.22, 0.0, 30.7, 30.85], "audiomae_on_audioset": [[["music", 33.75], ["hum", 15.33], ["speech", 14.24]], null, null, null, null, null, null, [["music", 53.78], ["didgeridoo", 10.98], ["hum", 4.89]], null, [["music", 31.47], ["didgeridoo", 15.42], ["hum", 14.05]], null, [["whale vocalization", 20.43], ["mains hum", 11.02], ["hum", 9.77]], [["music", 44.13], ["hum", 13.2], ["electronic music", 7.58]]], "duration": [2.39, 1.52, 0.71, 1.59, 91.95, 0.28, 0.93, 2.2, 1.84, 10.51, 1.11, 7.89, 11.64]} \ No newline at end of file diff --git a/annotations_filtered/nDBs6ywP9ZE_filtered.json b/annotations_filtered/nDBs6ywP9ZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96ed12a91ee878e1df13513db783d830e977b326 --- /dev/null +++ b/annotations_filtered/nDBs6ywP9ZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.37], [8.0, 9.83], [12.0, 14.69], [23.0, 24.76], [27.0, 30.03], [31.0, 72.84], [75.0, 77.18], [80.0, 81.85], [83.0, 112.58], [116.0, 117.93], [123.0, 123.57], [126.0, 131.7], [133.0, 134.94], [135.0, 142.28]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 43.74, 0.0, 32.46, 0.0, 31.81, 0.0, 36.77, 0.0, 0.0, 31.08, 0.0, 31.28], "audiomae_on_audioset": [null, null, [["music", 37.93], ["speech", 9.97], ["hum", 6.94]], null, [["hum", 56.42], ["throbbing", 26.55], ["mains hum", 3.93]], null, [["throbbing", 35.39], ["hum", 19.14], ["music", 15.4]], null, [["hum", 44.3], ["mains hum", 22.51], ["throbbing", 20.03]], null, null, [["throbbing", 29.2], ["hum", 24.55], ["music", 13.9]], null, [["music", 70.16], ["hum", 9.33], ["throbbing", 5.78]]], "duration": [1.37, 1.83, 2.69, 1.76, 3.03, 41.84, 2.18, 1.85, 29.58, 1.93, 0.57, 5.7, 1.94, 7.28]} \ No newline at end of file diff --git a/annotations_filtered/nDGZMXNYfF4_filtered.json b/annotations_filtered/nDGZMXNYfF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c74dff3f00658e39015baa5952d2eb97b12a8c40 --- /dev/null +++ b/annotations_filtered/nDGZMXNYfF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 47.14], [50.0, 60.12], [63.0, 68.82], [70.0, 70.7], [73.0, 73.33], [74.0, 83.93], [85.0, 115.75], [118.0, 118.52], [120.0, 131.89]], "keep_status": [false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 30.7, 30.81, 0.0, 0.0, 30.19, 0.0, 0.0, 30.67], "audiomae_on_audioset": [null, [["music", 66.28], ["didgeridoo", 19.62], ["musical instrument", 9.03]], [["music", 48.49], ["trombone", 14.71], ["grunt", 5.91]], null, null, [["music", 49.32], ["didgeridoo", 10.67], ["frog", 6.36]], null, null, [["music", 59.66], ["musical instrument", 10.0], ["synthesizer", 5.2]]], "duration": [34.14, 10.12, 5.82, 0.7, 0.33, 9.93, 30.75, 0.52, 11.89]} \ No newline at end of file diff --git a/annotations_filtered/nDKhoXEpIq8_filtered.json b/annotations_filtered/nDKhoXEpIq8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5be5179c2fad86123e6a4310b5d712bb2eed7ec7 --- /dev/null +++ b/annotations_filtered/nDKhoXEpIq8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [4.0, 5.04], [5.0, 5.71], [6.0, 8.51], [12.0, 12.5], [16.0, 16.83], [19.0, 19.87], [21.0, 22.22], [28.0, 28.7], [29.0, 30.08], [35.0, 35.67], [37.0, 37.08], [38.0, 38.43], [42.0, 42.15], [43.0, 43.58], [47.0, 47.46], [49.0, 49.98], [51.0, 52.22], [54.0, 56.29], [59.0, 59.9], [63.0, 63.04], [65.0, 65.6], [73.0, 74.16], [78.0, 78.48], [89.0, 90.07], [93.0, 94.49], [98.0, 100.06], [101.0, 101.14], [103.0, 103.94], [106.0, 106.17], [112.0, 112.62], [114.0, 115.06], [119.0, 122.18], [128.0, 130.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 70.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.38, 1.04, 0.71, 2.51, 0.5, 0.83, 0.87, 1.22, 0.7, 1.08, 0.67, 0.08, 0.43, 0.15, 0.58, 0.46, 0.98, 1.22, 2.29, 0.9, 0.04, 0.6, 1.16, 0.48, 1.07, 1.49, 2.06, 0.14, 0.94, 0.17, 0.62, 1.06, 3.18, 2.28]} \ No newline at end of file diff --git a/annotations_filtered/nDlEcFRZUYI_filtered.json b/annotations_filtered/nDlEcFRZUYI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b912e792c4c9795485c7bba6d3f315400104e05 --- /dev/null +++ b/annotations_filtered/nDlEcFRZUYI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.63], [4.0, 3.6], [5.0, 4.85], [7.0, 8.87], [11.0, 14.54], [16.0, 17.41], [19.0, 19.5], [21.0, 21.46], [22.0, 30.0], [31.0, 30.86], [32.0, 32.09], [33.0, 33.62], [34.0, 34.42], [35.0, 36.1], [37.0, 37.98], [39.0, 40.12], [41.0, 40.93], [43.0, 44.31], [48.0, 48.14], [49.0, 49.3], [50.0, 50.16], [51.0, 51.31], [52.0, 52.34], [56.0, 59.64], [61.0, 61.21], [63.0, 63.1], [65.0, 65.58], [66.0, 67.47], [68.0, 70.09], [71.0, 84.82], [88.0, 88.1], [92.0, 92.13], [94.0, 94.66], [95.0, 96.79], [103.0, 104.3], [107.0, 107.43], [111.0, 111.84], [114.0, 114.44], [115.0, 124.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 45.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 0.0, 99.96, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 41.03], ["sidetone", 26.51], ["telephone", 8.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.63, -0.4, -0.15, 1.87, 3.54, 1.41, 0.5, 0.46, 8.0, -0.14, 0.09, 0.62, 0.42, 1.1, 0.98, 1.12, -0.07, 1.31, 0.14, 0.3, 0.16, 0.31, 0.34, 3.64, 0.21, 0.1, 0.58, 1.47, 2.09, 13.82, 0.1, 0.13, 0.66, 1.79, 1.3, 0.43, 0.84, 0.44, 9.82]} \ No newline at end of file diff --git a/annotations_filtered/nDw_DOEdai8_filtered.json b/annotations_filtered/nDw_DOEdai8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9cdcec21a347ecb8fa6e9aa6f9296d8d30ca737d --- /dev/null +++ b/annotations_filtered/nDw_DOEdai8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.06], [5.0, 6.39], [9.0, 10.25], [12.0, 13.8], [15.0, 15.23], [17.0, 17.79], [19.0, 20.41], [22.0, 23.06], [23.0, 23.92], [25.0, 25.25], [26.0, 26.2], [27.0, 27.13], [27.0, 38.21], [43.0, 43.85], [47.0, 47.56], [51.0, 50.99], [51.0, 51.63], [56.0, 57.43], [58.0, 59.76], [60.0, 61.08], [64.0, 64.69], [66.0, 66.88], [69.0, 68.93], [74.0, 73.75], [75.0, 76.23], [88.0, 88.77], [97.0, 97.11], [99.0, 99.33], [102.0, 101.95], [103.0, 104.57], [105.0, 105.04], [108.0, 108.89], [116.0, 115.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.42], ["livestock, farm animals, working animals", 17.97], ["cattle, bovinae", 3.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.06, 1.39, 1.25, 1.8, 0.23, 0.79, 1.41, 1.06, 0.92, 0.25, 0.2, 0.13, 11.21, 0.85, 0.56, -0.01, 0.63, 1.43, 1.76, 1.08, 0.69, 0.88, -0.07, -0.25, 1.23, 0.77, 0.11, 0.33, -0.05, 1.57, 0.04, 0.89, -0.23]} \ No newline at end of file diff --git a/annotations_filtered/nEGbOGGiENU_filtered.json b/annotations_filtered/nEGbOGGiENU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..994f76b985006f423ca0ad8555c82037c1209047 --- /dev/null +++ b/annotations_filtered/nEGbOGGiENU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.79], [22.0, 22.25], [23.0, 28.07], [28.0, 29.07], [31.0, 39.61], [40.0, 40.61], [50.0, 51.43], [52.0, 64.76], [65.0, 66.92], [70.0, 84.16], [87.0, 87.12], [95.0, 116.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.6, 0.0, 30.13, 0.0, 0.0, 30.14, 0.0, 29.84, 0.0, 30.14], "audiomae_on_audioset": [null, null, [["music", 41.67], ["speech", 40.76], ["synthesizer", 4.18]], null, [["music", 68.56], ["vehicle", 5.38], ["car", 4.84]], null, null, [["music", 77.14], ["synthesizer", 2.54], ["cacophony", 1.58]], null, [["music", 59.07], ["synthesizer", 7.05], ["throbbing", 4.81]], null, [["music", 49.37], ["car", 13.96], ["vehicle", 8.88]]], "duration": [1.79, 0.25, 5.07, 1.07, 8.61, 0.61, 1.43, 12.76, 1.92, 14.16, 0.12, 21.01]} \ No newline at end of file diff --git a/annotations_filtered/nEJKLKKO0uY_filtered.json b/annotations_filtered/nEJKLKKO0uY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..918d9abe5f61186c36c057aab0ba5d345a5981b2 --- /dev/null +++ b/annotations_filtered/nEJKLKKO0uY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.16], [4.0, 4.68], [5.0, 7.05], [8.0, 8.51], [11.0, 13.51], [15.0, 18.54], [26.0, 32.43], [35.0, 37.1], [38.0, 41.01], [42.0, 46.48], [48.0, 49.11], [50.0, 52.57], [54.0, 54.4], [56.0, 57.28], [60.0, 63.49], [65.0, 66.41], [67.0, 70.26], [73.0, 74.06], [78.0, 89.99], [94.0, 98.78], [100.0, 100.58], [106.0, 109.27], [114.0, 115.82], [121.0, 124.09], [125.0, 126.05]], "keep_status": [false, false, false, false, true, true, false, true, true, true, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false], "silence_prob": [31.08, 0.0, 30.24, 0.0, 32.11, 33.04, 33.91, 42.02, 35.3, 41.32, 0.0, 33.26, 0.0, 0.0, 36.49, 0.0, 34.84, 0.0, 32.49, 36.61, 0.0, 47.94, 0.0, 41.2, 0.0], "audiomae_on_audioset": [[["music", 59.15], ["throbbing", 6.58], ["speech", 5.59]], null, [["music", 47.71], ["speech", 25.03], ["hum", 3.89]], null, [["music", 39.94], ["musical instrument", 10.66], ["speech", 8.65]], [["speech", 32.25], ["music", 18.5], ["foghorn", 6.85]], [["speech", 60.16], ["clip-clop", 13.24], ["horse", 9.86]], [["fly, housefly", 33.14], ["bee, wasp, etc.", 19.69], ["insect", 13.11]], [["fly, housefly", 23.5], ["bee, wasp, etc.", 22.4], ["speech", 17.59]], [["speech", 17.12], ["sidetone", 12.31], ["hum", 11.5]], null, [["speech", 61.21], ["fly, housefly", 5.56], ["bee, wasp, etc.", 3.86]], null, null, [["bee, wasp, etc.", 15.79], ["mains hum", 14.87], ["speech", 14.55]], null, [["fly, housefly", 33.63], ["bee, wasp, etc.", 30.44], ["speech", 9.92]], null, [["speech", 48.1], ["music", 20.55], ["horse", 4.87]], [["music", 56.04], ["didgeridoo", 13.71], ["musical instrument", 5.39]], null, [["music", 51.16], ["theremin", 8.06], ["musical instrument", 5.43]], null, [["speech", 30.81], ["music", 21.7], ["foghorn", 5.89]], null], "duration": [2.16, 0.68, 2.05, 0.51, 2.51, 3.54, 6.43, 2.1, 3.01, 4.48, 1.11, 2.57, 0.4, 1.28, 3.49, 1.41, 3.26, 1.06, 11.99, 4.78, 0.58, 3.27, 1.82, 3.09, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/nET7V9DsWgo_filtered.json b/annotations_filtered/nET7V9DsWgo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a01dd909b70391c0b4b0bb97dcc802d3ca93a683 --- /dev/null +++ b/annotations_filtered/nET7V9DsWgo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 20.22], [28.0, 29.08], [37.0, 43.48], [46.0, 46.2], [62.0, 67.0]], "keep_status": [false, false, false, false, true], "silence_prob": [30.72, 0.0, 30.03, 0.0, 30.55], "audiomae_on_audioset": [[["music", 61.48], ["musical instrument", 5.32], ["didgeridoo", 3.97]], null, [["music", 74.77], ["electronic music", 2.07], ["musical instrument", 1.8]], null, [["music", 62.93], ["sampler", 3.49], ["singing", 2.69]]], "duration": [10.22, 1.08, 6.48, 0.2, 5.0]} \ No newline at end of file diff --git a/annotations_filtered/nEf2ML7wkBE_filtered.json b/annotations_filtered/nEf2ML7wkBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90023259a86b7f3f6acd514c091d6a1df3441860 --- /dev/null +++ b/annotations_filtered/nEf2ML7wkBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.39], [15.0, 15.92], [33.0, 33.76], [37.0, 37.72], [50.0, 51.02], [94.0, 94.81], [116.0, 115.75]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.39, 0.92, 0.76, 0.72, 1.02, 0.81, -0.25]} \ No newline at end of file diff --git a/annotations_filtered/nF2xGs2J6Gk_filtered.json b/annotations_filtered/nF2xGs2J6Gk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36a278c54d8621a7707ef6365ac19f41bf01c9c1 --- /dev/null +++ b/annotations_filtered/nF2xGs2J6Gk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.06], [5.0, 5.95], [7.0, 7.08], [8.0, 9.07], [10.0, 11.94], [15.0, 15.53], [19.0, 20.12], [21.0, 22.11], [24.0, 24.66], [25.0, 26.42], [30.0, 30.28], [35.0, 35.24], [38.0, 39.16], [43.0, 43.24], [45.0, 45.3], [47.0, 47.98], [49.0, 50.03], [51.0, 52.39], [54.0, 55.88], [57.0, 58.65], [68.0, 68.64], [69.0, 69.69], [71.0, 72.79], [75.0, 76.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.06, 0.95, 0.08, 1.07, 1.94, 0.53, 1.12, 1.11, 0.66, 1.42, 0.28, 0.24, 1.16, 0.24, 0.3, 0.98, 1.03, 1.39, 1.88, 1.65, 0.64, 0.69, 1.79, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/nF74obZFKp8_filtered.json b/annotations_filtered/nF74obZFKp8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72cc6c82e83e8c3bcbb1835816962a657d594866 --- /dev/null +++ b/annotations_filtered/nF74obZFKp8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 22.92], [29.0, 35.31], [42.0, 96.85], [100.0, 109.63], [115.0, 140.78], [143.0, 149.82], [151.0, 161.5], [162.0, 165.11], [167.0, 167.49], [170.0, 171.17]], "keep_status": [false, false, false, false, true, false, false, true, false, false], "silence_prob": [28.83, 28.33, 0.0, 28.4, 28.35, 28.56, 28.63, 29.14, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.32], ["throbbing", 31.41], ["hum", 11.14]], [["music", 70.86], ["speech", 13.16], ["throbbing", 3.86]], null, [["music", 61.88], ["throbbing", 12.33], ["hum", 9.42]], [["music", 24.31], ["speech", 14.61], ["vehicle", 5.77]], [["music", 32.93], ["speech", 32.39], ["hum", 6.63]], [["music", 34.5], ["hum", 30.07], ["mains hum", 18.57]], [["music", 48.48], ["hum", 9.69], ["mains hum", 6.01]], null, null], "duration": [16.92, 6.31, 54.85, 9.63, 25.78, 6.82, 10.5, 3.11, 0.49, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/nFJvGENqc20_filtered.json b/annotations_filtered/nFJvGENqc20_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7593686623cd45e63b17b1185121024fb9286eb --- /dev/null +++ b/annotations_filtered/nFJvGENqc20_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [7.0, 7.4], [9.0, 9.32], [28.0, 27.58], [30.0, 31.23], [38.0, 38.62], [65.0, 65.69], [68.0, 67.95], [73.0, 73.3], [83.0, 83.66], [86.0, 86.1], [91.0, 91.96], [102.0, 103.03], [106.0, 106.15], [109.0, 109.41], [118.0, 117.93], [120.0, 119.8], [122.0, 122.59], [126.0, 126.89], [130.0, 132.73], [134.0, 134.57], [136.0, 136.29], [138.0, 138.13], [140.0, 140.48], [142.0, 143.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 0.4, 0.32, -0.42, 1.23, 0.62, 0.69, -0.05, 0.3, 0.66, 0.1, 0.96, 1.03, 0.15, 0.41, -0.07, -0.2, 0.59, 0.89, 2.73, 0.57, 0.29, 0.13, 0.48, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/nFRuYV4QrnE_filtered.json b/annotations_filtered/nFRuYV4QrnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24c9a6f62902a06473258d89d8a2853084f91bee --- /dev/null +++ b/annotations_filtered/nFRuYV4QrnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 18.69], [20.0, 20.71], [28.0, 28.71], [31.0, 31.24], [34.0, 35.97], [37.0, 37.88], [45.0, 46.25], [48.0, 49.37], [50.0, 51.7], [54.0, 63.78]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [39.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.24], "audiomae_on_audioset": [[["hum", 33.16], ["speech", 24.98], ["music", 15.71]], null, null, null, null, null, null, null, null, [["speech", 32.77], ["music", 16.04], ["breaking", 7.93]]], "duration": [10.69, 0.71, 0.71, 0.24, 1.97, 0.88, 1.25, 1.37, 1.7, 9.78]} \ No newline at end of file diff --git a/annotations_filtered/nF_6OfgbF7c_filtered.json b/annotations_filtered/nF_6OfgbF7c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69c009e14b150d5da66a4bfb20501078646c752c --- /dev/null +++ b/annotations_filtered/nF_6OfgbF7c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.65], [2.0, 4.56], [5.0, 7.96], [8.0, 10.32], [13.0, 12.75], [17.0, 17.02], [20.0, 20.78], [21.0, 22.49], [25.0, 25.66], [27.0, 26.86], [28.0, 30.25], [37.0, 37.88], [40.0, 39.93], [42.0, 43.19], [44.0, 44.63], [53.0, 53.76], [57.0, 57.33], [61.0, 61.33], [63.0, 63.58], [67.0, 67.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 77.87, 99.8, 48.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["sidetone", 44.34], ["speech", 23.12], ["telephone", 7.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 2.56, 2.96, 2.32, -0.25, 0.02, 0.78, 1.49, 0.66, -0.14, 2.25, 0.88, -0.07, 1.19, 0.63, 0.76, 0.33, 0.33, 0.58, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/nGWtzmsCHgc_filtered.json b/annotations_filtered/nGWtzmsCHgc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1de0610502ebe72e2f607a65943439770d8f54ea --- /dev/null +++ b/annotations_filtered/nGWtzmsCHgc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.18], [8.0, 8.99], [13.0, 13.69], [15.0, 15.79], [20.0, 20.07], [33.0, 33.29], [36.0, 37.29], [43.0, 43.11], [45.0, 45.25], [55.0, 55.51], [60.0, 60.02], [69.0, 77.7], [78.0, 81.72], [83.0, 84.0], [85.0, 86.66], [90.0, 90.61], [92.0, 91.79], [97.0, 97.46], [103.0, 103.3], [108.0, 109.39], [111.0, 113.53], [120.0, 125.54], [126.0, 126.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.47, 43.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.87, 54.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.51], ["guitar", 10.93], ["speech", 10.34]], null, null, null, null, null, null, null, [["music", 59.41], ["musical instrument", 4.67], ["guitar", 4.55]], null, null], "duration": [0.18, 0.99, 0.69, 0.79, 0.07, 0.29, 1.29, 0.11, 0.25, 0.51, 0.02, 8.7, 3.72, 1.0, 1.66, 0.61, -0.21, 0.46, 0.3, 1.39, 2.53, 5.54, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/nGx3WY944DU_filtered.json b/annotations_filtered/nGx3WY944DU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..beb4144a7279cc9f9965cb26f402e980eb01edd9 --- /dev/null +++ b/annotations_filtered/nGx3WY944DU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.0], [8.0, 7.84], [12.0, 11.79], [15.0, 18.64], [19.0, 21.02], [22.0, 24.36], [26.0, 40.53], [42.0, 44.66], [50.0, 50.57], [53.0, 54.5], [58.0, 65.35], [67.0, 68.89], [73.0, 80.49], [87.0, 88.72], [90.0, 101.75], [107.0, 108.63], [110.0, 110.69], [112.0, 112.72], [117.0, 117.19], [118.0, 120.48], [122.0, 122.22], [127.0, 127.3], [130.0, 131.04], [132.0, 131.65], [135.0, 135.41], [136.0, 136.76], [140.0, 149.67], [152.0, 152.05], [157.0, 160.91], [162.0, 162.35]], "keep_status": [false, false, false, false, true, false, true, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [56.1, 0.0, 0.0, 37.97, 49.92, 55.89, 38.15, 30.41, 0.0, 0.0, 35.06, 0.0, 35.72, 0.0, 32.3, 0.0, 0.0, 0.0, 0.0, 31.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.97, 0.0, 38.95, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 66.64], ["gong", 16.85], ["electronic music", 3.41]], [["speech", 42.63], ["music", 9.99], ["singing bowl", 6.59]], null, [["music", 51.55], ["hum", 9.59], ["electronic music", 7.21]], [["music", 16.3], ["mosquito", 11.33], ["fly, housefly", 5.44]], null, null, [["speech", 70.37], ["hum", 6.22], ["music", 6.12]], null, [["sheep", 20.03], ["bleat", 12.71], ["speech", 11.84]], null, [["speech", 37.46], ["music", 17.41], ["throbbing", 8.07]], null, null, null, null, [["moo", 40.3], ["cattle, bovinae", 26.82], ["speech", 6.41]], null, null, null, null, null, null, [["crying, sobbing", 26.34], ["whimper", 23.33], ["speech", 14.21]], null, [["moo", 29.32], ["cattle, bovinae", 28.49], ["whale vocalization", 21.38]], null], "duration": [2.0, -0.16, -0.21, 3.64, 2.02, 2.36, 14.53, 2.66, 0.57, 1.5, 7.35, 1.89, 7.49, 1.72, 11.75, 1.63, 0.69, 0.72, 0.19, 2.48, 0.22, 0.3, 1.04, -0.35, 0.41, 0.76, 9.67, 0.05, 3.91, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/nH40NtYdL-U_filtered.json b/annotations_filtered/nH40NtYdL-U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5703217a80c4e5431a45de8b671f8aab4a24dd21 --- /dev/null +++ b/annotations_filtered/nH40NtYdL-U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[95.0, 95.89]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.89]} \ No newline at end of file diff --git a/annotations_filtered/nHByIEUb37Y_filtered.json b/annotations_filtered/nHByIEUb37Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c6dda56a52cc5416510f43555cd704da88674a0 --- /dev/null +++ b/annotations_filtered/nHByIEUb37Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.64], [9.0, 11.67], [14.0, 16.88], [20.0, 22.94], [26.0, 29.89], [31.0, 37.45], [38.0, 40.56], [41.0, 43.98], [45.0, 46.5], [49.0, 50.89], [53.0, 54.68], [60.0, 62.46], [65.0, 66.39]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [32.15, 37.55, 54.63, 75.07, 84.62, 84.25, 60.51, 49.4, 0.0, 0.0, 0.0, 37.19, 0.0], "audiomae_on_audioset": [[["cello", 35.49], ["double bass", 25.62], ["music", 17.81]], [["music", 59.69], ["musical instrument", 7.64], ["synthesizer", 7.63]], null, null, null, null, null, [["hum", 27.97], ["music", 26.82], ["mains hum", 13.99]], null, null, null, [["music", 28.34], ["quack", 13.05], ["duck", 7.51]], null], "duration": [2.64, 2.67, 2.88, 2.94, 3.89, 6.45, 2.56, 2.98, 1.5, 1.89, 1.68, 2.46, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/nHCEOK9n5z8_filtered.json b/annotations_filtered/nHCEOK9n5z8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/nHCEOK9n5z8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/nHKJaG3sXMY_filtered.json b/annotations_filtered/nHKJaG3sXMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7066c2e36a331b21bdeb4e93b8dff972267e9052 --- /dev/null +++ b/annotations_filtered/nHKJaG3sXMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.48], [5.0, 6.57], [9.0, 11.13], [16.0, 21.42], [23.0, 23.46], [24.0, 24.09], [28.0, 27.82], [29.0, 30.18]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [48.23, 0.0, 41.44, 69.61, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 43.52], ["hum", 27.23], ["whale vocalization", 16.04]], null, [["tuning fork", 26.81], ["sidetone", 16.73], ["white noise", 9.57]], null, null, null, null, null], "duration": [2.48, 1.57, 2.13, 5.42, 0.46, 0.09, -0.18, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/nHcRQhadzhY_filtered.json b/annotations_filtered/nHcRQhadzhY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0dcaa5d93c4970be2a5fd99857e7a94536886de --- /dev/null +++ b/annotations_filtered/nHcRQhadzhY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.23], [19.0, 19.68], [21.0, 29.64], [39.0, 40.37], [44.0, 46.5], [59.0, 64.03], [69.0, 78.31], [82.0, 94.37], [95.0, 98.63], [104.0, 125.69], [134.0, 136.95], [147.0, 154.01], [157.0, 157.32], [159.0, 159.83], [162.0, 161.91], [163.0, 163.34], [164.0, 166.68], [169.0, 169.21], [176.0, 192.77], [199.0, 199.15], [201.0, 205.58], [211.0, 211.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [32.12, 0.0, 30.36, 0.0, 31.38, 30.34, 31.35, 31.1, 30.76, 30.48, 29.62, 31.49, 0.0, 0.0, 0.0, 0.0, 38.0, 0.0, 30.02, 0.0, 29.32, 0.0], "audiomae_on_audioset": [[["music", 74.65], ["musical instrument", 4.0], ["guitar", 3.21]], null, [["music", 49.51], ["speech", 27.44], ["rattle (instrument)", 2.32]], null, [["music", 64.87], ["speech", 7.49], ["techno", 3.73]], [["music", 75.23], ["speech", 6.0], ["boing", 2.44]], [["music", 54.45], ["speech", 29.32], ["didgeridoo", 1.77]], [["music", 84.51], ["musical instrument", 2.54], ["speech", 0.88]], [["music", 70.02], ["speech", 11.75], ["electronic music", 2.33]], [["music", 63.23], ["speech", 8.57], ["boing", 2.75]], [["music", 77.45], ["speech", 3.53], ["musical instrument", 1.74]], [["music", 71.45], ["speech", 3.64], ["boing", 3.15]], null, null, null, null, [["speech", 38.35], ["music", 12.04], ["fly, housefly", 10.37]], null, [["music", 65.63], ["throbbing", 5.79], ["cacophony", 3.86]], null, [["music", 29.32], ["hum", 21.97], ["throbbing", 19.42]], null], "duration": [3.23, 0.68, 8.64, 1.37, 2.5, 5.03, 9.31, 12.37, 3.63, 21.69, 2.95, 7.01, 0.32, 0.83, -0.09, 0.34, 2.68, 0.21, 16.77, 0.15, 4.58, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/nHyK6uFdDWY_filtered.json b/annotations_filtered/nHyK6uFdDWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b088a5ab84f8832124e7741e31a0df69ebfd00b8 --- /dev/null +++ b/annotations_filtered/nHyK6uFdDWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.41], [14.0, 15.43], [56.0, 93.51], [98.0, 103.1], [108.0, 109.11], [110.0, 130.49]], "keep_status": [false, false, false, false, false, false], "silence_prob": [32.78, 0.0, 0.0, 37.2, 0.0, 34.17], "audiomae_on_audioset": [[["music", 53.97], ["speech", 15.34], ["didgeridoo", 3.49]], null, null, [["speech", 36.23], ["music", 21.52], ["hum", 12.48]], null, [["music", 30.39], ["speech", 29.88], ["quack", 12.37]]], "duration": [5.41, 1.43, 37.51, 5.1, 1.11, 20.49]} \ No newline at end of file diff --git a/annotations_filtered/nI6agjxMa2s_filtered.json b/annotations_filtered/nI6agjxMa2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b23b4336f92de1fee35dfc95d11c0a27d0cc9e7 --- /dev/null +++ b/annotations_filtered/nI6agjxMa2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 18.45], [19.0, 25.59], [30.0, 34.3], [35.0, 56.2], [56.0, 77.21], [78.0, 90.05]], "keep_status": [true, true, true, true, false, false], "silence_prob": [30.95, 30.92, 30.49, 29.63, 29.61, 29.16], "audiomae_on_audioset": [[["speech", 29.48], ["music", 20.67], ["hum", 13.76]], [["music", 44.4], ["trombone", 10.13], ["brass instrument", 9.9]], [["mains hum", 22.71], ["music", 22.65], ["hum", 20.08]], [["music", 24.63], ["speech", 23.34], ["buzz", 10.45]], [["buzz", 56.22], ["music", 16.27], ["fly, housefly", 2.12]], [["speech", 55.78], ["vehicle", 13.83], ["music", 3.38]]], "duration": [5.45, 6.59, 4.3, 21.2, 21.21, 12.05]} \ No newline at end of file diff --git a/annotations_filtered/nID1enI2xW8_filtered.json b/annotations_filtered/nID1enI2xW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a74057e8d39baea86bdbedf2aa90d3fe5b0278c --- /dev/null +++ b/annotations_filtered/nID1enI2xW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 27.57], [30.0, 30.15], [34.0, 34.64], [41.0, 41.57], [43.0, 42.92], [53.0, 53.4], [54.0, 55.27], [60.0, 60.44], [62.0, 65.87], [70.0, 79.62], [80.0, 111.67], [112.0, 122.28], [126.0, 138.5], [139.0, 144.73], [147.0, 157.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [53.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 57.01, 0.0, 67.63, 80.29, 100.0, 32.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["throbbing", 51.07], ["hum", 32.09], ["mains hum", 3.26]], null, null, null, null, null, [["speech", 36.83], ["music", 15.49], ["hum", 7.55]]], "duration": [17.57, 0.15, 0.64, 0.57, -0.08, 0.4, 1.27, 0.44, 3.87, 9.62, 31.67, 10.28, 12.5, 5.73, 10.96]} \ No newline at end of file diff --git a/annotations_filtered/nII3ya0MuM0_filtered.json b/annotations_filtered/nII3ya0MuM0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06cb5cbe6b01789b65b9ca467201ef95cf6402d7 --- /dev/null +++ b/annotations_filtered/nII3ya0MuM0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.99], [4.0, 19.52], [25.0, 24.65], [26.0, 26.22], [28.0, 28.83], [29.0, 29.83], [34.0, 34.94], [37.0, 74.58], [76.0, 78.19], [87.0, 87.25], [89.0, 89.45], [91.0, 90.95], [95.0, 95.25], [99.0, 104.94], [106.0, 106.74], [108.0, 111.67], [114.0, 116.07], [118.0, 118.69], [120.0, 122.62], [125.0, 125.76], [145.0, 147.58], [148.0, 150.01], [152.0, 152.15], [161.0, 163.95], [165.0, 165.64]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.3, 0.0, 0.0, 0.0, 0.0, 43.35, 0.0, 39.3, 82.97, 0.0, 87.74, 0.0, 62.47, 81.35, 0.0, 31.87, 0.0], "audiomae_on_audioset": [null, [["speech", 63.45], ["radio", 10.96], ["hum", 7.93]], null, null, null, null, null, null, [["grunt", 40.8], ["speech", 9.3], ["snicker", 5.82]], null, null, null, null, [["livestock, farm animals, working animals", 43.14], ["cattle, bovinae", 38.94], ["moo", 15.03]], null, [["speech", 47.54], ["radio", 8.96], ["whale vocalization", 8.52]], null, null, null, null, null, null, null, [["speech", 79.44], ["whimper", 3.55], ["sine wave", 3.28]], null], "duration": [0.99, 15.52, -0.35, 0.22, 0.83, 0.83, 0.94, 37.58, 2.19, 0.25, 0.45, -0.05, 0.25, 5.94, 0.74, 3.67, 2.07, 0.69, 2.62, 0.76, 2.58, 2.01, 0.15, 2.95, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/nIJQOFSGKks_filtered.json b/annotations_filtered/nIJQOFSGKks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61ae32563850fd3582a05708f0eaf0d00dd73546 --- /dev/null +++ b/annotations_filtered/nIJQOFSGKks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 35.38], [36.0, 38.2], [40.0, 42.2], [44.0, 49.59], [51.0, 53.84], [55.0, 57.18], [57.0, 57.21], [57.0, 62.09], [63.0, 87.64], [92.0, 91.77], [92.0, 92.52], [93.0, 93.33]], "keep_status": [false, false, false, true, true, true, false, false, false, false, false, false], "silence_prob": [36.0, 43.45, 46.9, 34.77, 35.35, 35.36, 0.0, 38.76, 37.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["synthesizer", 39.98], ["music", 38.69], ["musical instrument", 2.46]], [["music", 77.58], ["musical instrument", 3.68], ["cacophony", 2.17]], [["music", 59.65], ["fart", 6.19], ["throbbing", 4.59]], [["music", 49.74], ["speech", 10.99], ["fart", 5.22]], [["music", 57.88], ["speech", 10.04], ["animal", 1.78]], [["music", 37.81], ["fly, housefly", 13.1], ["mosquito", 11.7]], null, [["music", 73.54], ["speech", 2.07], ["smash, crash", 1.91]], [["music", 47.21], ["noise", 14.48], ["synthesizer", 12.03]], null, null, null], "duration": [8.38, 2.2, 2.2, 5.59, 2.84, 2.18, 0.21, 5.09, 24.64, -0.23, 0.52, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/nIW73heJdg4_filtered.json b/annotations_filtered/nIW73heJdg4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8051f577be77b9fd3da4f61214bee348f4d98c93 --- /dev/null +++ b/annotations_filtered/nIW73heJdg4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.52], [11.0, 12.85], [14.0, 14.34], [48.0, 48.71], [52.0, 53.03], [56.0, 56.17], [65.0, 83.35], [87.0, 131.65]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.39, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["whack, thwack", 31.46], ["whip", 30.2], ["speech", 10.11]], null], "duration": [0.52, 1.85, 0.34, 0.71, 1.03, 0.17, 18.35, 44.65]} \ No newline at end of file diff --git a/annotations_filtered/nIhrGSxslzQ_filtered.json b/annotations_filtered/nIhrGSxslzQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6965c375fa93d63c171388f0dce35f3bdf22641 --- /dev/null +++ b/annotations_filtered/nIhrGSxslzQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 42.47], [44.0, 43.95], [44.0, 44.29], [44.0, 74.16], [75.0, 80.64], [81.0, 81.87]], "keep_status": [false, false, false, false, false, false], "silence_prob": [43.08, 0.0, 0.0, 0.0, 40.38, 0.0], "audiomae_on_audioset": [[["music", 57.44], ["musical instrument", 13.11], ["trombone", 7.67]], null, null, null, [["music", 61.2], ["musical instrument", 7.37], ["synthesizer", 5.6]], null], "duration": [21.47, -0.05, 0.29, 30.16, 5.64, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/nImG5bpVpVI_filtered.json b/annotations_filtered/nImG5bpVpVI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..967a832276ab51497f16b5fa088b1432719d7c6e --- /dev/null +++ b/annotations_filtered/nImG5bpVpVI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.19], [27.0, 28.65], [31.0, 32.0]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.19, 1.65, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/nIuuhtJM_Dw_filtered.json b/annotations_filtered/nIuuhtJM_Dw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ccda9c0c0463d44eebde90a9c342647ae6c0c4e1 --- /dev/null +++ b/annotations_filtered/nIuuhtJM_Dw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [8.0, 8.01], [12.0, 12.51], [17.0, 19.31], [22.0, 22.91], [30.0, 36.54], [43.0, 51.19], [52.0, 52.57], [53.0, 53.11], [58.0, 58.45], [63.0, 66.93], [67.0, 67.42], [88.0, 92.75], [96.0, 108.01], [111.0, 110.93], [113.0, 119.25], [121.0, 121.2], [123.0, 123.15], [126.0, 134.43], [137.0, 138.23], [140.0, 141.34]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.33, 0.0, 79.41, 59.24, 0.0, 0.0, 0.0, 47.78, 0.0, 87.55, 89.72, 0.0, 68.02, 0.0, 0.0, 61.08, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 32.81], ["music", 23.46], ["didgeridoo", 8.09]], null, null, null, null, null, null, [["speech", 61.86], ["radio", 5.67], ["livestock, farm animals, working animals", 3.05]], null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 0.01, 0.51, 2.31, 0.91, 6.54, 8.19, 0.57, 0.11, 0.45, 3.93, 0.42, 4.75, 12.01, -0.07, 6.25, 0.2, 0.15, 8.43, 1.23, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/nJ04J0TWD1I_filtered.json b/annotations_filtered/nJ04J0TWD1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78e6d482c3ec55cb2c9ef66724284f1d45929496 --- /dev/null +++ b/annotations_filtered/nJ04J0TWD1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.97], [5.0, 7.15], [8.0, 7.7], [8.0, 9.39], [17.0, 17.85], [21.0, 21.3], [22.0, 24.48], [25.0, 25.37], [30.0, 30.87], [32.0, 32.41], [34.0, 34.35], [35.0, 35.77], [43.0, 43.6], [45.0, 46.06], [50.0, 52.14], [55.0, 55.92], [58.0, 58.29], [60.0, 60.94], [64.0, 66.36], [70.0, 70.8], [81.0, 83.96], [85.0, 86.16], [88.0, 88.42], [101.0, 101.73], [103.0, 103.37], [116.0, 117.71]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.74, 0.0, 0.0, 0.0, 0.0, 36.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.44, 0.0, 0.0, 0.0, 37.47, 0.0, 51.99, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 22.65], ["mains hum", 9.22], ["music", 9.04]], null, null, null, null, [["speech", 41.72], ["mains hum", 10.45], ["hum", 6.53]], null, null, null, null, null, null, null, [["fly, housefly", 36.95], ["insect", 22.44], ["bee, wasp, etc.", 8.66]], null, null, null, [["speech", 26.66], ["hum", 9.78], ["mains hum", 7.79]], null, null, null, null, null, null, null], "duration": [1.97, 2.15, -0.3, 1.39, 0.85, 0.3, 2.48, 0.37, 0.87, 0.41, 0.35, 0.77, 0.6, 1.06, 2.14, 0.92, 0.29, 0.94, 2.36, 0.8, 2.96, 1.16, 0.42, 0.73, 0.37, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/nJ1hrmVHUJg_filtered.json b/annotations_filtered/nJ1hrmVHUJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8227657ec4713ab248e62aecf061e607d2cf4ca --- /dev/null +++ b/annotations_filtered/nJ1hrmVHUJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.75], [15.0, 15.16], [16.0, 16.65], [19.0, 19.16], [24.0, 25.2], [31.0, 36.37], [39.0, 39.06], [40.0, 40.39], [41.0, 47.12], [56.0, 57.81], [65.0, 64.83], [66.0, 66.85], [69.0, 69.87], [75.0, 89.8], [91.0, 91.45], [94.0, 94.68], [98.0, 97.77], [99.0, 109.8], [115.0, 146.92]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.02, 0.0, 0.0, 38.1, 0.0, 0.0, 0.0, 0.0, 30.22, 0.0, 0.0, 0.0, 29.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 26.66], ["speech", 16.86], ["air horn, truck horn", 4.03]], null, null, [["fly, housefly", 24.8], ["speech", 24.72], ["bee, wasp, etc.", 17.51]], null, null, null, null, [["music", 57.49], ["theremin", 11.66], ["didgeridoo", 6.61]], null, null, null, [["speech", 40.51], ["music", 9.96], ["animal", 7.09]], null], "duration": [0.75, 0.16, 0.65, 0.16, 1.2, 5.37, 0.06, 0.39, 6.12, 1.81, -0.17, 0.85, 0.87, 14.8, 0.45, 0.68, -0.23, 10.8, 31.92]} \ No newline at end of file diff --git a/annotations_filtered/nJPju1f6p0E_filtered.json b/annotations_filtered/nJPju1f6p0E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25f2b49296de0d4c22cc35ca14695e9ffedfb256 --- /dev/null +++ b/annotations_filtered/nJPju1f6p0E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.95], [15.0, 15.74], [17.0, 17.59], [30.0, 30.27], [31.0, 37.67], [42.0, 52.34], [56.0, 66.38], [68.0, 136.02], [136.0, 153.33], [155.0, 155.38]], "keep_status": [false, false, false, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.9, 30.59, 32.25, 0.0, 33.2, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 37.84], ["creak", 26.55], ["mechanisms", 7.71]], [["music", 58.37], ["musical instrument", 3.7], ["effects unit", 3.56]], [["fly, housefly", 28.08], ["livestock, farm animals, working animals", 12.75], ["insect", 11.6]], null, [["music", 20.72], ["didgeridoo", 12.97], ["theremin", 12.72]], null], "duration": [0.95, 0.74, 0.59, 0.27, 6.67, 10.34, 10.38, 68.02, 17.33, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/nJwGWiuonws_filtered.json b/annotations_filtered/nJwGWiuonws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52c6e5c37c2963e867232f67312569bfe8b43627 --- /dev/null +++ b/annotations_filtered/nJwGWiuonws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.97], [3.0, 5.7], [14.0, 15.15], [16.0, 19.35], [20.0, 20.49], [23.0, 23.48], [28.0, 30.4], [31.0, 31.8], [36.0, 36.19], [39.0, 39.18], [41.0, 42.26], [44.0, 46.06], [47.0, 47.56], [48.0, 48.51], [50.0, 51.26], [54.0, 55.32], [58.0, 58.67], [67.0, 67.37], [83.0, 84.2], [88.0, 88.53], [89.0, 90.85], [92.0, 91.77], [93.0, 93.77], [99.0, 99.39], [101.0, 101.38], [104.0, 104.38], [106.0, 107.2], [116.0, 116.21], [119.0, 119.38], [121.0, 122.35], [123.0, 123.5], [130.0, 132.65], [142.0, 142.47], [144.0, 144.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 67.13, 0.0, 96.77, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.03, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.03, 2.7, 1.15, 3.35, 0.49, 0.48, 2.4, 0.8, 0.19, 0.18, 1.26, 2.06, 0.56, 0.51, 1.26, 1.32, 0.67, 0.37, 1.2, 0.53, 1.85, -0.23, 0.77, 0.39, 0.38, 0.38, 1.2, 0.21, 0.38, 1.35, 0.5, 2.65, 0.47, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/nKB-Ij0vyB4_filtered.json b/annotations_filtered/nKB-Ij0vyB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..394a0af0d5f0d5a05cc0fb186b83dc6e41f1c8f3 --- /dev/null +++ b/annotations_filtered/nKB-Ij0vyB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.0], [7.0, 8.45], [9.0, 9.83], [11.0, 13.71], [16.0, 16.63], [19.0, 20.78], [22.0, 26.74], [27.0, 29.24], [31.0, 35.18], [39.0, 42.57], [52.0, 53.7], [55.0, 55.75], [58.0, 60.83], [61.0, 62.02], [63.0, 63.59], [72.0, 73.28], [76.0, 76.59], [83.0, 84.32], [85.0, 85.62], [95.0, 94.93], [99.0, 99.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [92.31, 0.0, 0.0, 77.2, 0.0, 0.0, 58.05, 53.78, 56.1, 57.89, 0.0, 0.0, 47.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 30.38], ["speech", 11.33], ["singing bowl", 9.67]], null, null, null, null, null, null, null, null], "duration": [2.0, 1.45, 0.83, 2.71, 0.63, 1.78, 4.74, 2.24, 4.18, 3.57, 1.7, 0.75, 2.83, 1.02, 0.59, 1.28, 0.59, 1.32, 0.62, -0.07, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/nKDUDF3cgRA_filtered.json b/annotations_filtered/nKDUDF3cgRA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40da527b4a3b15d44762547a6a567995c137a3ac --- /dev/null +++ b/annotations_filtered/nKDUDF3cgRA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.51], [6.0, 8.9], [11.0, 10.93], [12.0, 28.27], [29.0, 30.4], [31.0, 59.75], [61.0, 83.34], [85.0, 90.95], [92.0, 92.42], [93.0, 94.0], [95.0, 122.08], [123.0, 128.7]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 36.78, 0.0, 43.05, 0.0, 43.33, 41.05, 33.55, 0.0, 0.0, 38.72, 58.22], "audiomae_on_audioset": [null, [["speech", 85.2], ["animal", 1.42], ["electric shaver, electric razor", 1.34]], null, [["speech", 76.55], ["electric shaver, electric razor", 4.85], ["telephone", 3.68]], null, [["music", 37.97], ["speech", 10.21], ["fly, housefly", 4.01]], [["music", 48.04], ["speech", 17.33], ["musical instrument", 6.8]], [["music", 42.46], ["musical instrument", 11.78], ["speech", 8.9]], null, null, [["speech", 82.97], ["beatboxing", 5.88], ["music", 2.71]], null], "duration": [1.51, 2.9, -0.07, 16.27, 1.4, 28.75, 22.34, 5.95, 0.42, 1.0, 27.08, 5.7]} \ No newline at end of file diff --git a/annotations_filtered/nKISdYhQcvw_filtered.json b/annotations_filtered/nKISdYhQcvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77960fe55feb524b12114c1f014fbb4b3bc11e30 --- /dev/null +++ b/annotations_filtered/nKISdYhQcvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 23.57], [30.0, 30.59], [31.0, 30.89], [32.0, 32.61], [35.0, 35.82], [36.0, 35.94], [36.0, 53.49], [58.0, 67.98], [69.0, 69.65], [70.0, 136.39], [138.0, 143.82]], "keep_status": [false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [30.49, 0.0, 0.0, 0.0, 0.0, 0.0, 30.64, 32.3, 0.0, 0.0, 34.71], "audiomae_on_audioset": [[["cattle, bovinae", 49.56], ["moo", 28.12], ["livestock, farm animals, working animals", 11.24]], null, null, null, null, null, [["speech", 21.57], ["whack, thwack", 16.05], ["groan", 7.85]], [["whack, thwack", 8.07], ["fart", 6.94], ["speech", 6.83]], null, null, [["grunt", 26.36], ["music", 13.89], ["groan", 9.57]]], "duration": [15.57, 0.59, -0.11, 0.61, 0.82, -0.06, 17.49, 9.98, 0.65, 66.39, 5.82]} \ No newline at end of file diff --git a/annotations_filtered/nKdSvhCg3VY_filtered.json b/annotations_filtered/nKdSvhCg3VY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8f60f0a6549cc8cb13d144110897d0e5e408653 --- /dev/null +++ b/annotations_filtered/nKdSvhCg3VY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.56], [18.0, 18.87], [22.0, 22.91], [24.0, 26.35], [27.0, 27.41], [28.0, 29.42], [30.0, 29.74], [31.0, 32.71], [36.0, 37.4], [40.0, 41.62], [44.0, 46.52], [52.0, 52.47], [58.0, 59.37], [66.0, 66.31], [67.0, 67.46], [70.0, 72.03], [74.0, 75.68], [80.0, 84.38], [87.0, 90.56], [91.0, 94.68], [96.0, 98.78], [102.0, 103.79], [107.0, 107.94], [109.0, 140.04], [141.0, 142.55], [144.0, 153.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 68.41, 58.05, 52.56, 46.4, 0.0, 0.0, 0.0, 0.0, 86.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.26], ["speech", 16.03], ["synthesizer", 8.26]], null, null, null, null, null], "duration": [1.56, 0.87, 0.91, 2.35, 0.41, 1.42, -0.26, 1.71, 1.4, 1.62, 2.52, 0.47, 1.37, 0.31, 0.46, 2.03, 1.68, 4.38, 3.56, 3.68, 2.78, 1.79, 0.94, 31.04, 1.55, 9.64]} \ No newline at end of file diff --git a/annotations_filtered/nKuJ6UvlGek_filtered.json b/annotations_filtered/nKuJ6UvlGek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f8408ae01f7e2627fda8779225e3dd7e9a051cd --- /dev/null +++ b/annotations_filtered/nKuJ6UvlGek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.42], [32.0, 32.17], [33.0, 33.86], [40.0, 47.61], [48.0, 51.68], [53.0, 52.96], [56.0, 56.25], [57.0, 58.16], [59.0, 59.53], [61.0, 61.26], [62.0, 64.29], [66.0, 66.72], [68.0, 68.47], [70.0, 70.88], [73.0, 74.49], [76.0, 79.96], [84.0, 86.02], [89.0, 90.53], [93.0, 95.77], [97.0, 97.87], [103.0, 103.76], [116.0, 117.0]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.4, 0.0, 0.0, 32.97, 34.53, 0.0, 0.0, 0.0, 0.0, 0.0, 45.46, 0.0, 0.0, 0.0, 0.0, 34.55, 33.45, 0.0, 33.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 71.88], ["didgeridoo", 6.04], ["musical instrument", 4.85]], null, null, [["noise", 32.15], ["hum", 22.87], ["speech", 11.72]], [["whale vocalization", 40.69], ["sidetone", 17.7], ["speech", 12.51]], null, null, null, null, null, [["mains hum", 40.2], ["hum", 18.66], ["music", 9.16]], null, null, null, null, [["mains hum", 43.94], ["hum", 18.32], ["music", 10.14]], [["theremin", 44.81], ["music", 24.2], ["didgeridoo", 5.63]], null, [["music", 52.24], ["gong", 12.24], ["vehicle", 8.46]], null, null, null], "duration": [3.42, 0.17, 0.86, 7.61, 3.68, -0.04, 0.25, 1.16, 0.53, 0.26, 2.29, 0.72, 0.47, 0.88, 1.49, 3.96, 2.02, 1.53, 2.77, 0.87, 0.76, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/nL3o4MGY9NQ_filtered.json b/annotations_filtered/nL3o4MGY9NQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83b3d4efdb9740c3606e2ba40f5b5eb8ebf4db57 --- /dev/null +++ b/annotations_filtered/nL3o4MGY9NQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 31.23], [32.0, 36.96], [37.0, 37.08], [37.0, 42.28], [43.0, 58.35], [60.0, 125.52], [127.0, 130.11], [131.0, 146.16], [147.0, 153.44], [154.0, 163.46], [164.0, 165.21], [166.0, 166.9]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [72.01, 79.41, 0.0, 79.24, 89.19, 0.0, 99.71, 93.6, 82.79, 42.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 22.14], ["whale vocalization", 18.67], ["theremin", 8.72]], null, null], "duration": [4.23, 4.96, 0.08, 5.28, 15.35, 65.52, 3.11, 15.16, 6.44, 9.46, 1.21, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/nLDgcHxJ4Sc_filtered.json b/annotations_filtered/nLDgcHxJ4Sc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bddb039b035b5c63ca6d7098d7e8540ab911f48c --- /dev/null +++ b/annotations_filtered/nLDgcHxJ4Sc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.34], [7.0, 7.7], [9.0, 9.05], [13.0, 13.8], [15.0, 15.13], [15.0, 16.26], [17.0, 18.71], [20.0, 20.61], [23.0, 25.68], [27.0, 31.29], [33.0, 34.11], [35.0, 37.35], [39.0, 39.99], [41.0, 44.59], [49.0, 57.16], [60.0, 61.25], [63.0, 63.49], [66.0, 66.7], [69.0, 69.96], [80.0, 81.24], [84.0, 90.88], [91.0, 90.91], [93.0, 92.92], [95.0, 97.95], [99.0, 99.93], [101.0, 101.66], [105.0, 105.73], [107.0, 107.7], [109.0, 110.32], [113.0, 113.88], [116.0, 118.74], [126.0, 131.82], [133.0, 141.45], [145.0, 146.03], [149.0, 150.89], [152.0, 151.97], [152.0, 154.04], [155.0, 165.45], [167.0, 167.75], [169.0, 169.69], [172.0, 174.61], [176.0, 177.67], [179.0, 182.38], [183.0, 186.65], [187.0, 194.12], [195.0, 196.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.16, 96.42, 0.0, 97.73, 0.0, 98.86, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 61.57, 0.0, 0.0, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.13, 83.88, 99.92, 0.0, 0.0, 0.0, 49.54, 47.54, 0.0, 0.0, 95.78, 0.0, 47.62, 99.91, 99.62, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.76], ["fly, housefly", 15.43], ["insect", 8.5]], [["speech", 34.32], ["grunt", 23.84], ["cattle, bovinae", 6.2]], null, null, null, null, [["speech", 76.11], ["sidetone", 9.98], ["dial tone", 2.7]], null, null, null], "duration": [0.34, 0.7, 0.05, 0.8, 0.13, 1.26, 1.71, 0.61, 2.68, 4.29, 1.11, 2.35, 0.99, 3.59, 8.16, 1.25, 0.49, 0.7, 0.96, 1.24, 6.88, -0.09, -0.08, 2.95, 0.93, 0.66, 0.73, 0.7, 1.32, 0.88, 2.74, 5.82, 8.45, 1.03, 1.89, -0.03, 2.04, 10.45, 0.75, 0.69, 2.61, 1.67, 3.38, 3.65, 7.12, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/nLKymV5rwAU_filtered.json b/annotations_filtered/nLKymV5rwAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17f961004b2dd4c11d994f31877e6c2484af611c --- /dev/null +++ b/annotations_filtered/nLKymV5rwAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.69], [5.0, 12.43], [12.0, 15.53], [16.0, 16.31], [17.0, 19.53], [24.0, 25.02], [27.0, 30.6], [33.0, 83.08], [84.0, 85.43], [87.0, 90.36], [93.0, 97.17], [98.0, 99.55], [105.0, 105.61], [115.0, 115.25], [119.0, 121.64], [126.0, 127.09], [129.0, 130.17], [131.0, 131.7], [134.0, 133.74], [134.0, 137.57], [143.0, 145.74], [147.0, 147.63], [150.0, 151.16], [156.0, 155.82], [160.0, 160.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 77.36, 74.76, 0.0, 99.99, 0.0, 99.85, 0.0, 0.0, 100.0, 99.99, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0, 0.0, 0.0, 76.7, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 7.43, 3.53, 0.31, 2.53, 1.02, 3.6, 50.08, 1.43, 3.36, 4.17, 1.55, 0.61, 0.25, 2.64, 1.09, 1.17, 0.7, -0.26, 3.57, 2.74, 0.63, 1.16, -0.18, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/nLMkSN2F2xs_filtered.json b/annotations_filtered/nLMkSN2F2xs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fa0528ff6e4ea573c25ccf3110c630e961e0311 --- /dev/null +++ b/annotations_filtered/nLMkSN2F2xs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.58], [33.0, 93.21], [94.0, 106.47], [108.0, 108.09], [109.0, 118.93], [124.0, 133.74], [140.0, 142.26]], "keep_status": [false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 28.88, 0.0, 28.96, 28.05, 40.41], "audiomae_on_audioset": [null, null, [["speech", 52.67], ["music", 9.98], ["buzz", 9.19]], null, [["speech", 57.09], ["music", 12.49], ["knock", 3.86]], [["speech", 45.12], ["music", 10.07], ["electric shaver, electric razor", 9.26]], [["frog", 26.57], ["croak", 12.88], ["hiccup", 9.24]]], "duration": [1.58, 60.21, 12.47, 0.09, 9.93, 9.74, 2.26]} \ No newline at end of file diff --git a/annotations_filtered/nLTcdOr66lA_filtered.json b/annotations_filtered/nLTcdOr66lA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f41c16574449afb2b8ea35b197c1eee5873c225e --- /dev/null +++ b/annotations_filtered/nLTcdOr66lA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 28.0], [33.0, 95.45], [96.0, 100.75]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 29.92], "audiomae_on_audioset": [null, null, [["speech", 60.08], ["music", 14.84], ["vehicle", 1.76]]], "duration": [1.0, 62.45, 4.75]} \ No newline at end of file diff --git a/annotations_filtered/nLXoZ69ce-I_filtered.json b/annotations_filtered/nLXoZ69ce-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cb9117c948419e9754edf5b249a75e47d8fef14 --- /dev/null +++ b/annotations_filtered/nLXoZ69ce-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.49], [4.0, 9.24], [10.0, 11.6], [13.0, 14.3], [15.0, 15.75], [16.0, 16.66], [18.0, 18.37], [20.0, 20.68], [23.0, 28.21], [29.0, 30.5], [31.0, 32.0], [32.0, 32.66], [33.0, 33.71], [35.0, 35.63], [38.0, 39.21], [40.0, 41.25], [42.0, 43.16], [44.0, 44.56], [45.0, 47.14], [48.0, 48.74], [51.0, 51.73], [53.0, 52.91], [54.0, 54.04], [56.0, 58.48], [60.0, 65.03], [66.0, 66.85], [68.0, 70.07], [71.0, 75.64], [77.0, 77.43], [78.0, 79.08], [83.0, 83.74], [84.0, 85.08], [91.0, 96.26], [98.0, 98.74], [100.0, 100.6], [101.0, 102.34], [104.0, 105.14], [106.0, 106.19], [107.0, 107.5], [109.0, 109.73], [111.0, 111.99], [113.0, 113.21], [116.0, 116.55], [118.0, 118.99], [120.0, 121.83], [125.0, 125.74], [126.0, 128.31], [129.0, 130.72], [131.0, 130.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 0.0, 0.0, 99.44, 99.92, 0.0, 99.96, 66.27, 0.0, 0.0, 0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.49, 5.24, 1.6, 1.3, 0.75, 0.66, 0.37, 0.68, 5.21, 1.5, 1.0, 0.66, 0.71, 0.63, 1.21, 1.25, 1.16, 0.56, 2.14, 0.74, 0.73, -0.09, 0.04, 2.48, 5.03, 0.85, 2.07, 4.64, 0.43, 1.08, 0.74, 1.08, 5.26, 0.74, 0.6, 1.34, 1.14, 0.19, 0.5, 0.73, 0.99, 0.21, 0.55, 0.99, 1.83, 0.74, 2.31, 1.72, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/nLcCOlgev3k_filtered.json b/annotations_filtered/nLcCOlgev3k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b27cafbd14dcea35d00b776d90d9f6b3ddaa1c4 --- /dev/null +++ b/annotations_filtered/nLcCOlgev3k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.02], [25.0, 28.16], [30.0, 30.67], [32.0, 34.2], [42.0, 44.05], [45.0, 51.49], [56.0, 56.25], [59.0, 60.86], [63.0, 65.43], [66.0, 67.88], [74.0, 75.61], [80.0, 79.86], [83.0, 84.03], [100.0, 99.96], [101.0, 101.68], [104.0, 105.38], [107.0, 107.23], [113.0, 113.56], [115.0, 116.11], [120.0, 120.66], [123.0, 124.26], [125.0, 125.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 69.2, 0.0, 53.91, 79.76, 70.02, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 3.16, 0.67, 2.2, 2.05, 6.49, 0.25, 1.86, 2.43, 1.88, 1.61, -0.14, 1.03, -0.04, 0.68, 1.38, 0.23, 0.56, 1.11, 0.66, 1.26, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/nLeZGuvX7D8_filtered.json b/annotations_filtered/nLeZGuvX7D8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40b8bc5ed985455f52ad5a3631b4313dc0f76e80 --- /dev/null +++ b/annotations_filtered/nLeZGuvX7D8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.36], [11.0, 11.99], [15.0, 18.76], [21.0, 22.0], [24.0, 25.15], [27.0, 29.0], [31.0, 31.26], [33.0, 34.03], [35.0, 36.75], [38.0, 38.64], [40.0, 41.32], [43.0, 43.48], [45.0, 45.77], [52.0, 52.84], [54.0, 55.9], [58.0, 59.1], [61.0, 61.96], [63.0, 63.64], [65.0, 67.93], [70.0, 70.87], [71.0, 72.17], [77.0, 77.06], [78.0, 79.29], [90.0, 90.71], [92.0, 91.74], [95.0, 95.96], [101.0, 102.66], [105.0, 104.72], [106.0, 107.05], [109.0, 111.97], [113.0, 113.43], [115.0, 121.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.05, 0.0, 99.21, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.82, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.36, 0.99, 3.76, 1.0, 1.15, 2.0, 0.26, 1.03, 1.75, 0.64, 1.32, 0.48, 0.77, 0.84, 1.9, 1.1, 0.96, 0.64, 2.93, 0.87, 1.17, 0.06, 1.29, 0.71, -0.26, 0.96, 1.66, -0.28, 1.05, 2.97, 0.43, 6.76]} \ No newline at end of file diff --git a/annotations_filtered/nLkmfL6IVQs_filtered.json b/annotations_filtered/nLkmfL6IVQs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0795a601f02be2e5b450cf6a3a74b4464df71a93 --- /dev/null +++ b/annotations_filtered/nLkmfL6IVQs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.67], [5.0, 11.15], [16.0, 18.42], [20.0, 22.67], [23.0, 24.31], [26.0, 29.15], [33.0, 35.36], [38.0, 38.87], [41.0, 41.5], [48.0, 48.3], [48.0, 49.4], [53.0, 57.18], [77.0, 79.62], [80.0, 84.25], [91.0, 93.39], [100.0, 101.02], [108.0, 109.32], [116.0, 117.85], [130.0, 130.18], [134.0, 136.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 56.03, 66.27, 74.92, 0.0, 83.7, 56.7, 0.0, 0.0, 0.0, 0.0, 30.34, 29.31, 28.89, 30.01, 0.0, 0.0, 0.0, 0.0, 30.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 35.35], ["cattle, bovinae", 11.49], ["moo", 7.83]], [["music", 33.44], ["skateboard", 21.31], ["cattle, bovinae", 7.79]], [["cattle, bovinae", 38.75], ["moo", 37.55], ["livestock, farm animals, working animals", 8.78]], [["music", 57.31], ["moo", 3.23], ["cattle, bovinae", 3.11]], null, null, null, null, [["music", 63.91], ["hum", 6.5], ["throbbing", 3.24]]], "duration": [1.67, 6.15, 2.42, 2.67, 1.31, 3.15, 2.36, 0.87, 0.5, 0.3, 1.4, 4.18, 2.62, 4.25, 2.39, 1.02, 1.32, 1.85, 0.18, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/nM-RPO10aPY_filtered.json b/annotations_filtered/nM-RPO10aPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52c5d14a6a79638129ec98e45351a8bbf5f4c0bb --- /dev/null +++ b/annotations_filtered/nM-RPO10aPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.28], [9.0, 9.96], [11.0, 17.22], [19.0, 23.48], [25.0, 25.88], [28.0, 27.82], [33.0, 39.18], [43.0, 47.07], [49.0, 94.85], [97.0, 97.5], [98.0, 101.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 91.13, 65.67, 0.0, 0.0, 71.0, 60.7, 0.0, 0.0, 72.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 0.96, 6.22, 4.48, 0.88, -0.18, 6.18, 4.07, 45.85, 0.5, 3.33]} \ No newline at end of file diff --git a/annotations_filtered/nM0h6QXTpHQ_filtered.json b/annotations_filtered/nM0h6QXTpHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b54726c66239eaea329096588b096c3a44139922 --- /dev/null +++ b/annotations_filtered/nM0h6QXTpHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [9.0, 9.54], [10.0, 11.4], [12.0, 12.46], [16.0, 16.63], [20.0, 20.68], [21.0, 21.57], [23.0, 24.24], [25.0, 35.24], [35.0, 36.66], [38.0, 38.74], [40.0, 46.31], [47.0, 47.8], [50.0, 51.39], [52.0, 52.02], [52.0, 53.43], [54.0, 54.53], [55.0, 56.32], [63.0, 63.37], [64.0, 70.17], [70.0, 71.07], [72.0, 72.55], [73.0, 76.72], [77.0, 77.6], [81.0, 81.36], [86.0, 86.12], [87.0, 88.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.54, 1.4, 0.46, 0.63, 0.68, 0.57, 1.24, 10.24, 1.66, 0.74, 6.31, 0.8, 1.39, 0.02, 1.43, 0.53, 1.32, 0.37, 6.17, 1.07, 0.55, 3.72, 0.6, 0.36, 0.12, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/nM0u8GRt_hU_filtered.json b/annotations_filtered/nM0u8GRt_hU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fda5d8afcd809ba8962a1cb681b051146e5134e --- /dev/null +++ b/annotations_filtered/nM0u8GRt_hU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.19], [9.0, 9.54], [11.0, 11.37], [11.0, 14.99], [15.0, 15.97], [18.0, 18.54], [20.0, 20.11], [22.0, 21.91], [24.0, 24.92], [27.0, 28.68], [29.0, 40.2], [41.0, 42.06], [43.0, 43.6], [45.0, 45.25], [45.0, 45.81], [46.0, 57.54], [59.0, 61.26], [62.0, 63.56], [64.0, 65.84], [66.0, 65.96], [66.0, 72.67], [73.0, 73.87], [75.0, 75.22], [79.0, 80.43], [81.0, 87.98], [89.0, 89.16], [90.0, 90.49], [106.0, 108.03], [108.0, 109.97], [111.0, 110.74], [113.0, 113.22], [114.0, 115.38], [116.0, 117.21], [118.0, 119.33], [122.0, 122.22], [123.0, 125.86], [126.0, 127.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 0.54, 0.37, 3.99, 0.97, 0.54, 0.11, -0.09, 0.92, 1.68, 11.2, 1.06, 0.6, 0.25, 0.81, 11.54, 2.26, 1.56, 1.84, -0.04, 6.67, 0.87, 0.22, 1.43, 6.98, 0.16, 0.49, 2.03, 1.97, -0.26, 0.22, 1.38, 1.21, 1.33, 0.22, 2.86, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/nMW1Rfbl0tE_filtered.json b/annotations_filtered/nMW1Rfbl0tE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..970cad73d636b1aeaf07b992ed21cd2081a61648 --- /dev/null +++ b/annotations_filtered/nMW1Rfbl0tE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.13], [25.0, 26.22], [27.0, 27.35], [31.0, 32.76], [34.0, 34.48], [35.0, 35.07], [35.0, 36.27], [38.0, 39.48], [41.0, 41.45], [43.0, 44.09], [44.0, 44.85], [46.0, 46.92], [48.0, 48.78], [51.0, 51.16], [52.0, 54.77], [56.0, 69.25], [72.0, 87.62], [92.0, 92.74], [93.0, 98.29], [98.0, 99.59], [100.0, 101.29], [104.0, 120.36], [123.0, 124.38], [125.0, 127.14], [128.0, 128.26], [131.0, 134.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0, 33.68, 32.42, 0.0, 33.42, 0.0, 0.0, 31.27, 0.0, 37.47, 0.0, 40.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.59], ["musical instrument", 7.62], ["foghorn", 7.0]], [["music", 32.96], ["speech", 19.68], ["whale vocalization", 6.51]], [["music", 67.47], ["speech", 12.49], ["electronic music", 2.42]], null, [["speech", 42.78], ["music", 19.74], ["brass instrument", 5.31]], null, null, [["music", 52.62], ["speech", 7.22], ["livestock, farm animals, working animals", 4.89]], null, [["music", 22.22], ["hum", 6.41], ["musical instrument", 4.3]], null, [["music", 45.97], ["speech", 16.13], ["hum", 4.55]]], "duration": [1.13, 1.22, 0.35, 1.76, 0.48, 0.07, 1.27, 1.48, 0.45, 1.09, 0.85, 0.92, 0.78, 0.16, 2.77, 13.25, 15.62, 0.74, 5.29, 1.59, 1.29, 16.36, 1.38, 2.14, 0.26, 3.32]} \ No newline at end of file diff --git a/annotations_filtered/nMlDPsRwZE4_filtered.json b/annotations_filtered/nMlDPsRwZE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5717b27d0842c24faec280ece39880207e03c760 --- /dev/null +++ b/annotations_filtered/nMlDPsRwZE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 26.2], [27.0, 45.69]], "keep_status": [false, true], "silence_prob": [29.76, 29.63], "audiomae_on_audioset": [[["music", 62.08], ["wind noise (microphone)", 4.17], ["theremin", 3.94]], [["music", 54.06], ["flute", 6.94], ["theremin", 5.56]]], "duration": [21.2, 18.69]} \ No newline at end of file diff --git a/annotations_filtered/nMtW7uy5RrQ_filtered.json b/annotations_filtered/nMtW7uy5RrQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b83894e126ac65cf129e4dcc13723ce111ca0eb7 --- /dev/null +++ b/annotations_filtered/nMtW7uy5RrQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.96], [16.0, 16.7]], "keep_status": [false, false], "silence_prob": [30.22, 0.0], "audiomae_on_audioset": [[["music", 48.38], ["cacophony", 11.76], ["hum", 10.37]], null], "duration": [5.96, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/nNGz1GspkbM_filtered.json b/annotations_filtered/nNGz1GspkbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7792c84b06795d4caf50f95aed3fbc50baa335fd --- /dev/null +++ b/annotations_filtered/nNGz1GspkbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[65.0, 75.74], [77.0, 77.65], [81.0, 83.02], [85.0, 85.23], [87.0, 87.67], [89.0, 138.27], [138.0, 143.51], [150.0, 215.86]], "keep_status": [true, false, true, false, false, false, true, false], "silence_prob": [28.42, 0.0, 29.49, 0.0, 0.0, 0.0, 29.05, 0.0], "audiomae_on_audioset": [[["hum", 40.58], ["mains hum", 16.53], ["throbbing", 7.97]], null, [["music", 42.59], ["hum", 10.6], ["electronic music", 8.88]], null, null, null, [["speech", 22.14], ["whale vocalization", 15.89], ["hum", 12.13]], null], "duration": [10.74, 0.65, 2.02, 0.23, 0.67, 49.27, 5.51, 65.86]} \ No newline at end of file diff --git a/annotations_filtered/nNKsj8rQGHc_filtered.json b/annotations_filtered/nNKsj8rQGHc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6211351a38df991ab42b03637af61e7f1d6d2ef --- /dev/null +++ b/annotations_filtered/nNKsj8rQGHc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.4], [9.0, 13.8], [15.0, 16.39], [19.0, 22.05], [23.0, 25.78], [29.0, 30.43], [37.0, 36.69], [38.0, 38.26], [40.0, 40.54], [42.0, 43.66], [44.0, 47.7], [54.0, 56.34], [60.0, 61.32], [64.0, 64.69], [74.0, 73.63], [74.0, 75.49], [80.0, 83.76], [87.0, 87.98], [88.0, 89.51], [91.0, 95.79], [97.0, 104.46], [105.0, 106.07], [110.0, 111.3], [112.0, 115.38], [116.0, 119.35], [121.0, 121.68], [124.0, 123.84], [133.0, 135.03], [137.0, 142.65], [144.0, 145.91], [147.0, 147.09], [149.0, 153.42], [161.0, 178.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 0.0, 99.36, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 99.62, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.84, 99.87, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 99.99, 0.0, 0.0, 99.05, 99.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 4.8, 1.39, 3.05, 2.78, 1.43, -0.31, 0.26, 0.54, 1.66, 3.7, 2.34, 1.32, 0.69, -0.37, 1.49, 3.76, 0.98, 1.51, 4.79, 7.46, 1.07, 1.3, 3.38, 3.35, 0.68, -0.16, 2.03, 5.65, 1.91, 0.09, 4.42, 17.77]} \ No newline at end of file diff --git a/annotations_filtered/nNLk8GMdFd8_filtered.json b/annotations_filtered/nNLk8GMdFd8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4efe3728d8550f08a89272fff888f5b1c3d6dc7 --- /dev/null +++ b/annotations_filtered/nNLk8GMdFd8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 41.01], [42.0, 51.88], [53.0, 69.97], [73.0, 92.31], [94.0, 101.73], [104.0, 104.58], [106.0, 110.34], [111.0, 112.21], [113.0, 113.49]], "keep_status": [true, false, false, true, false, false, false, false, false], "silence_prob": [32.05, 32.49, 32.41, 35.37, 99.48, 0.0, 99.44, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.49], ["musical instrument", 8.68], ["didgeridoo", 6.75]], [["music", 58.07], ["percussion", 10.59], ["drum", 6.75]], [["music", 60.37], ["crow", 10.51], ["caw", 4.19]], [["music", 41.5], ["cacophony", 16.24], ["didgeridoo", 10.45]], null, null, null, null, null], "duration": [5.01, 9.88, 16.97, 19.31, 7.73, 0.58, 4.34, 1.21, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/nNXIh6RrvNw_filtered.json b/annotations_filtered/nNXIh6RrvNw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac3fef94c3075142d767be7365ee25af8f45c525 --- /dev/null +++ b/annotations_filtered/nNXIh6RrvNw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.72], [16.0, 17.95], [20.0, 20.16], [30.0, 30.42], [34.0, 33.94], [43.0, 44.07], [46.0, 46.55], [49.0, 49.27], [50.0, 49.98], [53.0, 57.48], [62.0, 62.13], [65.0, 65.62], [70.0, 74.46], [100.0, 100.82], [103.0, 103.08], [106.0, 107.33], [107.0, 107.47], [107.0, 107.5], [114.0, 115.13], [116.0, 117.04], [118.0, 119.03], [127.0, 126.86], [129.0, 128.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.72, 1.95, 0.16, 0.42, -0.06, 1.07, 0.55, 0.27, -0.02, 4.48, 0.13, 0.62, 4.46, 0.82, 0.08, 1.33, 0.47, 0.5, 1.13, 1.04, 1.03, -0.14, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/nNkIWyfowzA_filtered.json b/annotations_filtered/nNkIWyfowzA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3b958a29ea04fb339f9f89ab4ad00abf33dd7e5 --- /dev/null +++ b/annotations_filtered/nNkIWyfowzA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.67], [15.0, 14.76]], "keep_status": [true, false], "silence_prob": [29.79, 0.0], "audiomae_on_audioset": [[["buzz", 31.64], ["music", 17.79], ["breaking", 12.62]], null], "duration": [6.67, -0.24]} \ No newline at end of file diff --git a/annotations_filtered/nO7qxQsQK44_filtered.json b/annotations_filtered/nO7qxQsQK44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5b67b79a44d34333f8bfb40ec225651c3fdf443 --- /dev/null +++ b/annotations_filtered/nO7qxQsQK44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.55], [6.0, 7.47], [8.0, 14.59], [15.0, 16.14], [17.0, 20.87], [21.0, 21.95], [22.0, 24.75], [28.0, 28.39], [46.0, 48.37], [49.0, 55.76], [56.0, 57.89], [59.0, 59.14], [60.0, 60.12], [61.0, 61.43], [61.0, 61.52], [62.0, 62.53], [63.0, 63.22], [65.0, 75.2], [76.0, 77.62], [83.0, 83.64], [85.0, 87.02], [89.0, 89.19], [90.0, 93.18], [94.0, 94.15], [98.0, 104.19], [104.0, 104.85], [107.0, 107.28], [108.0, 109.49], [116.0, 115.97], [119.0, 127.89], [130.0, 133.46], [134.0, 137.91], [140.0, 140.07], [144.0, 144.21], [145.0, 145.83], [149.0, 149.59], [154.0, 153.91], [155.0, 156.03], [160.0, 161.67], [162.0, 162.95]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.78, 0.0, 72.75, 0.0, 50.61, 0.0, 98.59, 55.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.86, 0.0, 0.0, 97.33, 0.0, 35.54, 0.0, 41.78, 0.0, 0.0, 0.0, 0.0, 88.1, 98.73, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 17.1], ["stomach rumble", 14.57], ["hum", 13.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 61.35], ["hum", 9.88], ["mains hum", 3.79]], null, null, null, null, [["speech", 29.38], ["beatboxing", 8.74], ["radio", 6.32]], null, [["speech", 89.14], ["radio", 6.24], ["inside, small room", 0.65]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.55, 1.47, 6.59, 1.14, 3.87, 0.95, 2.75, 0.39, 2.37, 6.76, 1.89, 0.14, 0.12, 0.43, 0.52, 0.53, 0.22, 10.2, 1.62, 0.64, 2.02, 0.19, 3.18, 0.15, 6.19, 0.85, 0.28, 1.49, -0.03, 8.89, 3.46, 3.91, 0.07, 0.21, 0.83, 0.59, -0.09, 1.03, 1.67, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/nODBN75vrH0_filtered.json b/annotations_filtered/nODBN75vrH0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ddd2cffcce7553443834264a85baab610bd473f --- /dev/null +++ b/annotations_filtered/nODBN75vrH0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 24.53], [26.0, 34.72], [47.0, 94.42], [95.0, 97.16], [98.0, 114.62], [119.0, 120.53]], "keep_status": [false, true, false, true, false, false], "silence_prob": [31.89, 33.33, 0.0, 37.25, 31.28, 0.0], "audiomae_on_audioset": [[["speech", 69.66], ["vehicle", 4.78], ["music", 3.43]], [["music", 28.26], ["buzz", 18.45], ["vehicle", 7.82]], null, [["speech", 34.24], ["buzz", 20.13], ["vehicle", 8.64]], [["music", 60.94], ["cacophony", 6.96], ["sidetone", 5.12]], null], "duration": [7.53, 8.72, 47.42, 2.16, 16.62, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/nOFfrd6bOh0_filtered.json b/annotations_filtered/nOFfrd6bOh0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c30905c09096c1332f8aaa8d1283d99ff5ee2fcc --- /dev/null +++ b/annotations_filtered/nOFfrd6bOh0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.57], [42.0, 45.55], [46.0, 48.56], [52.0, 52.73], [53.0, 55.76], [56.0, 56.0], [61.0, 64.84], [65.0, 64.91], [65.0, 64.94], [65.0, 65.01], [65.0, 65.5], [68.0, 70.73], [75.0, 78.33], [85.0, 85.48], [92.0, 91.91], [97.0, 97.66], [108.0, 108.7]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.76, 92.97, 0.0, 66.63, 0.0, 37.89, 0.0, 0.0, 0.0, 0.0, 65.2, 40.41, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 33.4], ["speech", 12.68], ["mosquito", 11.57]], null, null, null, null, [["speech", 22.37], ["thunk", 13.81], ["boing", 12.19]], null, null, null, null, null, [["speech", 56.89], ["fart", 21.8], ["boing", 2.45]], null, null, null, null], "duration": [1.57, 3.55, 2.56, 0.73, 2.76, 0.0, 3.84, -0.09, -0.06, 0.01, 0.5, 2.73, 3.33, 0.48, -0.09, 0.66, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/nOQCz7STLIY_filtered.json b/annotations_filtered/nOQCz7STLIY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c41c72a7e87bb5c40599a973f533bb27928e4abd --- /dev/null +++ b/annotations_filtered/nOQCz7STLIY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.53], [11.0, 11.99], [14.0, 14.71], [20.0, 20.56], [28.0, 28.7], [30.0, 30.67], [31.0, 31.38], [33.0, 33.81], [36.0, 36.71], [47.0, 47.56], [48.0, 48.29], [51.0, 53.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 0.99, 0.71, 0.56, 0.7, 0.67, 0.38, 0.81, 0.71, 0.56, 0.29, 2.55]} \ No newline at end of file diff --git a/annotations_filtered/nOkJXxd0cNg_filtered.json b/annotations_filtered/nOkJXxd0cNg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e749e5a9c0d2ed78798b51f37cb3ccf86f483ce --- /dev/null +++ b/annotations_filtered/nOkJXxd0cNg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.22], [14.0, 14.72], [18.0, 18.23], [21.0, 20.65], [24.0, 26.27], [27.0, 27.63], [29.0, 30.89], [34.0, 34.65], [36.0, 37.89], [38.0, 39.65], [41.0, 42.47], [42.0, 43.41], [45.0, 45.2], [46.0, 45.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [72.46, 0.0, 0.0, 0.0, 80.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.22, 0.72, 0.23, -0.35, 2.27, 0.63, 1.89, 0.65, 1.89, 1.65, 1.47, 1.41, 0.2, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/nOpwufXdkIk_filtered.json b/annotations_filtered/nOpwufXdkIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..362e6687da249f56d99494189e508cdc8a5b90f0 --- /dev/null +++ b/annotations_filtered/nOpwufXdkIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 27.41], [31.0, 33.18], [36.0, 37.32], [45.0, 46.89], [50.0, 50.14], [54.0, 55.02], [56.0, 57.35], [60.0, 60.05], [62.0, 62.63], [66.0, 66.95], [69.0, 70.51], [71.0, 72.57], [78.0, 78.38], [81.0, 82.39], [87.0, 87.25], [88.0, 89.36], [91.0, 91.52], [100.0, 100.89], [108.0, 108.75], [110.0, 111.01], [117.0, 118.03], [122.0, 122.54], [123.0, 123.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.92, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [20.41, 2.18, 1.32, 1.89, 0.14, 1.02, 1.35, 0.05, 0.63, 0.95, 1.51, 1.57, 0.38, 1.39, 0.25, 1.36, 0.52, 0.89, 0.75, 1.01, 1.03, 0.54, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/nOu9n4ulmRk_filtered.json b/annotations_filtered/nOu9n4ulmRk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a6c3e75d320a392946abbab65dfa2de6db644e5f --- /dev/null +++ b/annotations_filtered/nOu9n4ulmRk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [11.0, 12.31], [15.0, 16.12], [18.0, 18.5], [31.0, 30.84], [31.0, 31.53], [33.0, 37.66], [56.0, 57.16], [65.0, 65.21], [88.0, 93.24], [94.0, 95.84]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.94, 0.0, 0.0, 29.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 54.22], ["crowd", 2.6], ["applause", 2.43]], null, null, [["buzz", 26.34], ["fly, housefly", 11.23], ["music", 9.76]], null], "duration": [0.33, 1.31, 1.12, 0.5, -0.16, 0.53, 4.66, 1.16, 0.21, 5.24, 1.84]} \ No newline at end of file diff --git a/annotations_filtered/nP-P4IYLJWY_filtered.json b/annotations_filtered/nP-P4IYLJWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e91933dbd275829bca7bad32bbf134b2772f49e --- /dev/null +++ b/annotations_filtered/nP-P4IYLJWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.17], [23.0, 40.69], [42.0, 47.73], [49.0, 55.32], [56.0, 73.48], [78.0, 91.64], [94.0, 109.85], [112.0, 125.17], [129.0, 137.88], [140.0, 142.15], [143.0, 143.67], [145.0, 163.43], [166.0, 166.43]], "keep_status": [true, false, false, true, false, false, true, false, true, true, false, true, false], "silence_prob": [29.19, 28.46, 29.07, 28.63, 28.57, 28.91, 28.82, 28.51, 28.63, 30.78, 0.0, 28.64, 0.0], "audiomae_on_audioset": [[["music", 48.64], ["throbbing", 9.59], ["hum", 6.68]], [["music", 74.37], ["cacophony", 3.02], ["throbbing", 2.58]], [["music", 37.57], ["throbbing", 25.76], ["hum", 12.45]], [["sound effect", 17.76], ["music", 17.22], ["hum", 9.93]], [["speech", 62.1], ["music", 19.87], ["hum", 3.02]], [["music", 63.99], ["electronic music", 6.1], ["didgeridoo", 3.54]], [["buzz", 29.13], ["music", 19.13], ["hum", 9.53]], [["speech", 48.91], ["music", 21.64], ["mains hum", 12.35]], [["music", 28.27], ["hum", 20.08], ["throbbing", 17.23]], [["music", 48.57], ["cacophony", 16.12], ["mains hum", 4.47]], null, [["music", 29.41], ["hum", 17.53], ["speech", 16.94]], null], "duration": [5.17, 17.69, 5.73, 6.32, 17.48, 13.64, 15.85, 13.17, 8.88, 2.15, 0.67, 18.43, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/nP7OKtlMO2w_filtered.json b/annotations_filtered/nP7OKtlMO2w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1485b409f024a6f2f197db06052c20b93817b554 --- /dev/null +++ b/annotations_filtered/nP7OKtlMO2w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.47], [19.0, 18.62], [20.0, 21.98], [23.0, 36.98], [38.0, 41.42], [43.0, 49.86], [53.0, 53.89], [61.0, 61.16], [65.0, 65.53], [67.0, 68.0], [70.0, 82.71], [85.0, 94.73], [106.0, 106.2], [116.0, 117.09], [127.0, 128.09], [133.0, 133.49], [150.0, 150.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.41, 31.81, 35.69, 0.0, 0.0, 0.0, 0.0, 37.38, 31.55, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 68.53], ["music", 5.79], ["hum", 4.39]], [["chopping (food)", 35.63], ["knock", 25.42], ["speech", 12.77]], [["hum", 52.26], ["throbbing", 34.01], ["heart sounds, heartbeat", 7.23]], null, null, null, null, [["music", 53.2], ["musical instrument", 8.85], ["synthesizer", 5.62]], [["music", 75.04], ["theremin", 10.34], ["humming", 1.73]], null, null, null, null, null], "duration": [0.47, -0.38, 1.98, 13.98, 3.42, 6.86, 0.89, 0.16, 0.53, 1.0, 12.71, 9.73, 0.2, 1.09, 1.09, 0.49, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/nPGxSotEa-c_filtered.json b/annotations_filtered/nPGxSotEa-c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56b3567b300815d63c9c5a44152043622e103a85 --- /dev/null +++ b/annotations_filtered/nPGxSotEa-c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 32.43], [38.0, 66.31], [67.0, 73.92], [76.0, 95.96], [98.0, 110.24], [111.0, 111.5], [112.0, 112.24], [115.0, 119.35], [124.0, 130.52]], "keep_status": [false, false, true, true, true, false, false, true, false], "silence_prob": [34.53, 29.8, 29.55, 30.59, 31.71, 0.0, 0.0, 31.14, 30.7], "audiomae_on_audioset": [[["music", 39.65], ["speech", 30.5], ["throbbing", 3.94]], [["speech", 36.76], ["music", 29.79], ["boing", 9.1]], [["electric shaver, electric razor", 26.51], ["music", 17.44], ["buzz", 6.1]], [["music", 38.0], ["vehicle", 14.68], ["outside, rural or natural", 5.81]], [["music", 47.52], ["whack, thwack", 7.62], ["fart", 6.01]], null, null, [["mosquito", 28.62], ["fly, housefly", 22.07], ["insect", 10.44]], [["cattle, bovinae", 38.66], ["moo", 36.5], ["livestock, farm animals, working animals", 20.67]]], "duration": [15.43, 28.31, 6.92, 19.96, 12.24, 0.5, 0.24, 4.35, 6.52]} \ No newline at end of file diff --git a/annotations_filtered/nPJFSx8RTzo_filtered.json b/annotations_filtered/nPJFSx8RTzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..470d7927e721a6a2b3843ec1a81d167094aad054 --- /dev/null +++ b/annotations_filtered/nPJFSx8RTzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.99], [6.0, 6.24], [14.0, 14.27], [19.0, 20.41], [22.0, 22.23], [24.0, 26.22], [30.0, 31.38], [32.0, 32.83], [35.0, 35.97], [40.0, 39.85], [41.0, 41.27], [48.0, 53.16], [54.0, 59.75], [62.0, 67.47], [71.0, 71.71], [76.0, 76.11], [77.0, 77.73], [78.0, 80.87], [83.0, 83.32], [85.0, 86.54], [87.0, 86.88]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.47, 0.0, 0.0, 0.0, 0.0, 0.0, 43.35, 34.28, 36.9, 0.0, 0.0, 0.0, 39.78, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 20.5], ["hum", 19.3], ["mains hum", 17.86]], null, null, null, null, null, [["bee, wasp, etc.", 34.77], ["fly, housefly", 25.56], ["insect", 24.43]], [["mains hum", 39.48], ["hum", 37.46], ["bee, wasp, etc.", 4.14]], [["hum", 44.11], ["mains hum", 20.52], ["speech", 5.72]], null, null, null, [["hum", 21.09], ["speech", 19.68], ["throbbing", 8.24]], null, null, null], "duration": [-0.01, 0.24, 0.27, 1.41, 0.23, 2.22, 1.38, 0.83, 0.97, -0.15, 0.27, 5.16, 5.75, 5.47, 0.71, 0.11, 0.73, 2.87, 0.32, 1.54, -0.12]} \ No newline at end of file diff --git a/annotations_filtered/nPXMny-9Ntk_filtered.json b/annotations_filtered/nPXMny-9Ntk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9300c729328b7459af95c170a86eea935b8d02a9 --- /dev/null +++ b/annotations_filtered/nPXMny-9Ntk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 17.76], [18.0, 27.89], [32.0, 32.95], [33.0, 33.98], [35.0, 41.39], [42.0, 52.69], [53.0, 78.07], [80.0, 95.23], [95.0, 96.92], [99.0, 99.5], [100.0, 99.87], [100.0, 100.41], [100.0, 101.02], [102.0, 125.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.87, 97.92, 0.0, 0.0, 59.59, 89.01, 93.91, 84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 69.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.76, 9.89, 0.95, 0.98, 6.39, 10.69, 25.07, 15.23, 1.92, 0.5, -0.13, 0.41, 1.02, 23.36]} \ No newline at end of file diff --git a/annotations_filtered/nPeH0w6ZXZM_filtered.json b/annotations_filtered/nPeH0w6ZXZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e95bd08c3a5e9402171cce92ed33fe2d3b747dfc --- /dev/null +++ b/annotations_filtered/nPeH0w6ZXZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 26.27], [29.0, 29.3], [31.0, 38.11], [39.0, 41.0], [42.0, 69.79], [73.0, 76.44], [78.0, 81.09], [83.0, 83.17], [86.0, 85.56], [86.0, 87.22], [88.0, 90.24], [92.0, 93.18], [95.0, 96.58], [98.0, 98.9], [99.0, 99.81], [102.0, 103.44], [104.0, 105.93]], "keep_status": [false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.11, 0.0, 37.2, 46.86, 31.55, 36.51, 47.58, 0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 65.14], ["musical instrument", 11.8], ["brass instrument", 6.1]], null, [["music", 65.04], ["theremin", 8.44], ["musical instrument", 5.31]], [["music", 56.36], ["musical instrument", 6.9], ["clarinet", 6.24]], [["music", 61.76], ["musical instrument", 9.97], ["brass instrument", 6.32]], [["music", 42.62], ["musical instrument", 9.58], ["didgeridoo", 7.87]], [["music", 41.38], ["didgeridoo", 11.01], ["musical instrument", 7.84]], null, null, null, null, null, null, null, null, null, null], "duration": [19.27, 0.3, 7.11, 2.0, 27.79, 3.44, 3.09, 0.17, -0.44, 1.22, 2.24, 1.18, 1.58, 0.9, 0.81, 1.44, 1.93]} \ No newline at end of file diff --git a/annotations_filtered/nPjlPgeaD_M_filtered.json b/annotations_filtered/nPjlPgeaD_M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c45c057e76ddbb053b3d2f3ed55032db0badd898 --- /dev/null +++ b/annotations_filtered/nPjlPgeaD_M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.91], [8.0, 10.29], [12.0, 12.77], [14.0, 14.52], [24.0, 27.58], [30.0, 33.76], [35.0, 35.16], [39.0, 40.9], [44.0, 48.42], [49.0, 51.88], [53.0, 55.66]], "keep_status": [false, true, false, false, true, true, false, false, true, true, true], "silence_prob": [0.0, 35.51, 0.0, 0.0, 35.35, 42.15, 0.0, 0.0, 42.33, 41.34, 31.29], "audiomae_on_audioset": [null, [["frog", 30.42], ["croak", 8.39], ["music", 5.93]], null, null, [["music", 34.31], ["fly, housefly", 9.04], ["croak", 7.18]], [["hum", 22.81], ["mains hum", 16.61], ["sidetone", 13.39]], null, null, [["throbbing", 20.38], ["music", 13.24], ["busy signal", 8.32]], [["music", 34.65], ["ping", 5.83], ["synthesizer", 5.39]], [["music", 53.48], ["synthesizer", 9.54], ["musical instrument", 5.34]]], "duration": [0.91, 2.29, 0.77, 0.52, 3.58, 3.76, 0.16, 1.9, 4.42, 2.88, 2.66]} \ No newline at end of file diff --git a/annotations_filtered/nQ2Y1gm0fRU_filtered.json b/annotations_filtered/nQ2Y1gm0fRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09f5162a6dbfa77fda94c627748cb0c10d5f58c1 --- /dev/null +++ b/annotations_filtered/nQ2Y1gm0fRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.14], [53.0, 53.52], [56.0, 56.49], [62.0, 62.4], [67.0, 68.47], [78.0, 78.93], [97.0, 97.83], [99.0, 102.91], [105.0, 106.71], [116.0, 131.41], [135.0, 151.06], [153.0, 153.44], [154.0, 153.67], [154.0, 153.74], [154.0, 155.19]], "keep_status": [false, false, false, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.07, 0.0, 32.0, 31.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 39.1], ["speech", 10.82], ["didgeridoo", 8.44]], null, [["speech", 22.05], ["music", 21.16], ["throbbing", 9.67]], [["music", 36.17], ["throbbing", 10.95], ["speech", 7.56]], null, null, null, null], "duration": [0.14, 0.52, 0.49, 0.4, 1.47, 0.93, 0.83, 3.91, 1.71, 15.41, 16.06, 0.44, -0.33, -0.26, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/nQBrfPjwAfQ_filtered.json b/annotations_filtered/nQBrfPjwAfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbb0b1a712485eb44b9cbce197a9d2cc3fb9aac7 --- /dev/null +++ b/annotations_filtered/nQBrfPjwAfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [4.0, 4.11], [5.0, 5.02], [6.0, 6.54], [7.0, 15.89], [19.0, 25.05], [26.0, 26.5], [27.0, 27.5], [28.0, 33.35], [34.0, 36.02], [37.0, 37.83], [41.0, 42.74], [46.0, 48.3], [50.0, 50.58], [51.0, 51.34], [52.0, 53.11], [54.0, 54.43], [56.0, 56.32], [59.0, 60.96], [62.0, 62.87], [64.0, 65.26], [66.0, 67.04], [68.0, 68.72], [70.0, 76.98], [79.0, 79.44], [81.0, 81.55], [85.0, 85.31], [86.0, 87.12], [92.0, 92.48], [93.0, 94.31], [96.0, 96.58], [99.0, 99.13], [100.0, 101.53], [102.0, 103.0], [104.0, 104.75], [108.0, 109.83], [112.0, 113.14], [114.0, 115.03], [117.0, 116.8], [118.0, 118.88], [120.0, 120.18], [121.0, 121.53], [122.0, 123.33], [125.0, 126.44], [128.0, 128.95], [130.0, 131.16], [133.0, 133.73], [134.0, 139.68], [141.0, 143.73], [146.0, 147.01], [149.0, 149.74], [152.0, 153.69], [155.0, 155.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.83, 99.93, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 98.1, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 0.11, 0.02, 0.54, 8.89, 6.05, 0.5, 0.5, 5.35, 2.02, 0.83, 1.74, 2.3, 0.58, 0.34, 1.11, 0.43, 0.32, 1.96, 0.87, 1.26, 1.04, 0.72, 6.98, 0.44, 0.55, 0.31, 1.12, 0.48, 1.31, 0.58, 0.13, 1.53, 1.0, 0.75, 1.83, 1.14, 1.03, -0.2, 0.88, 0.18, 0.53, 1.33, 1.44, 0.95, 1.16, 0.73, 5.68, 2.73, 1.01, 0.74, 1.69, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/nQIfRCUlfz4_filtered.json b/annotations_filtered/nQIfRCUlfz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9cb67d0398ce0ab725f194671cdce40956960f64 --- /dev/null +++ b/annotations_filtered/nQIfRCUlfz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 19.35], [20.0, 21.41], [22.0, 88.21], [89.0, 92.89], [93.0, 93.7], [94.0, 103.3], [104.0, 105.24], [106.0, 108.01], [110.0, 110.62], [112.0, 112.56], [114.0, 114.45]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [53.22, 0.0, 0.0, 47.16, 0.0, 40.82, 0.0, 35.34, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["mains hum", 35.96], ["hum", 29.55], ["music", 11.48]], null, [["hum", 28.57], ["throbbing", 23.44], ["music", 17.91]], null, [["speech", 31.52], ["radio", 11.83], ["sidetone", 9.89]], null, null, null], "duration": [11.35, 1.41, 66.21, 3.89, 0.7, 9.3, 1.24, 2.01, 0.62, 0.56, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/nQLSbuSZzE8_filtered.json b/annotations_filtered/nQLSbuSZzE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77bdbccf3d8c1fbed1a018121d6d4ff064d365c6 --- /dev/null +++ b/annotations_filtered/nQLSbuSZzE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.16], [12.0, 13.98], [14.0, 28.17], [30.0, 31.51], [32.0, 33.66], [35.0, 35.63], [38.0, 39.29], [40.0, 40.32], [41.0, 41.5], [43.0, 45.72], [48.0, 48.34], [53.0, 52.95], [60.0, 63.88], [65.0, 65.11], [68.0, 68.54], [71.0, 81.82], [83.0, 89.21], [91.0, 97.39], [99.0, 99.4], [100.0, 102.9], [108.0, 110.32], [112.0, 112.21], [113.0, 115.52], [116.0, 124.26], [125.0, 126.62], [130.0, 131.21], [132.0, 135.5], [138.0, 138.5], [140.0, 140.32], [141.0, 140.59], [141.0, 141.2], [141.0, 144.22], [146.0, 155.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [41.98, 0.0, 52.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 69.88, 0.0, 0.0, 75.72, 75.55, 98.99, 0.0, 94.52, 43.53, 0.0, 60.89, 73.67, 0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 54.5, 46.19], "audiomae_on_audioset": [[["music", 39.21], ["speech", 26.7], ["thunk", 20.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.36], ["electronic music", 6.7], ["speech", 6.65]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 22.81], ["throbbing", 20.57], ["music", 16.11]]], "duration": [3.16, 1.98, 14.17, 1.51, 1.66, 0.63, 1.29, 0.32, 0.5, 2.72, 0.34, -0.05, 3.88, 0.11, 0.54, 10.82, 6.21, 6.39, 0.4, 2.9, 2.32, 0.21, 2.52, 8.26, 1.62, 1.21, 3.5, 0.5, 0.32, -0.41, 0.2, 3.22, 9.92]} \ No newline at end of file diff --git a/annotations_filtered/nQYsHLwXnMc_filtered.json b/annotations_filtered/nQYsHLwXnMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..449255c896174a39b226bace0db70953401f45e2 --- /dev/null +++ b/annotations_filtered/nQYsHLwXnMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 40.17], [41.0, 41.77], [43.0, 47.61], [49.0, 54.95], [58.0, 58.72], [61.0, 69.35], [70.0, 85.9], [88.0, 115.21]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [99.52, 0.0, 87.0, 61.57, 0.0, 36.76, 30.37, 54.36], "audiomae_on_audioset": [null, null, null, null, null, [["sidetone", 74.28], ["hum", 6.04], ["speech", 5.96]], [["speech", 32.99], ["hum", 17.69], ["mains hum", 16.68]], null], "duration": [2.17, 0.77, 4.61, 5.95, 0.72, 8.35, 15.9, 27.21]} \ No newline at end of file diff --git a/annotations_filtered/nQZd4bNOSAI_filtered.json b/annotations_filtered/nQZd4bNOSAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d34ad3f304b2b31211a6d9b2c7f82b1feb64ac11 --- /dev/null +++ b/annotations_filtered/nQZd4bNOSAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.3], [24.0, 24.27], [25.0, 25.41], [26.0, 28.71], [30.0, 32.09], [34.0, 34.96], [39.0, 41.18], [47.0, 59.27], [63.0, 64.77], [67.0, 69.18], [70.0, 73.03], [74.0, 75.66], [77.0, 77.6]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 60.05, 69.74, 0.0, 79.07, 49.73, 0.0, 66.39, 62.07, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 35.89], ["hum", 8.5], ["animal", 6.3]], null, null, null, null, null], "duration": [1.3, 0.27, 0.41, 2.71, 2.09, 0.96, 2.18, 12.27, 1.77, 2.18, 3.03, 1.66, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/nQeov6j0bsQ_filtered.json b/annotations_filtered/nQeov6j0bsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e034be0ca862b06c224856e3b819ea2d0f811e2 --- /dev/null +++ b/annotations_filtered/nQeov6j0bsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[68.0, 98.05], [100.0, 107.16], [110.0, 112.7], [116.0, 123.25], [125.0, 130.52]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 33.19, 35.52, 33.6, 34.67], "audiomae_on_audioset": [null, [["music", 27.28], ["hum", 27.19], ["speech", 16.8]], [["music", 58.04], ["sidetone", 11.35], ["throbbing", 5.3]], [["music", 61.46], ["speech", 12.81], ["electronic music", 5.78]], [["music", 46.75], ["speech", 8.9], ["whale vocalization", 5.4]]], "duration": [30.05, 7.16, 2.7, 7.25, 5.52]} \ No newline at end of file diff --git a/annotations_filtered/nRLP98lG1YA_filtered.json b/annotations_filtered/nRLP98lG1YA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19f9c73cf7e1015701a49405203f831ef813c93c --- /dev/null +++ b/annotations_filtered/nRLP98lG1YA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.32], [4.0, 7.64], [8.0, 10.18], [13.0, 16.61], [18.0, 17.95], [19.0, 19.57], [20.0, 20.66], [21.0, 22.17], [23.0, 24.54], [26.0, 28.12], [32.0, 32.71], [39.0, 39.19], [40.0, 40.51], [41.0, 44.19], [44.0, 45.77], [47.0, 52.51], [53.0, 54.24], [55.0, 58.85], [60.0, 60.96], [62.0, 62.16], [65.0, 65.11], [70.0, 74.55], [75.0, 76.08], [78.0, 92.57], [93.0, 94.15], [95.0, 105.04], [106.0, 109.63], [114.0, 114.29], [115.0, 117.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 90.25, 100.0, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 86.27, 0.0, 69.07, 0.0, 99.9, 0.0, 0.0, 0.0, 32.05, 0.0, 33.3, 0.0, 32.91, 37.89, 0.0, 38.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.22], ["cattle, bovinae", 11.75], ["moo", 11.0]], null, [["didgeridoo", 57.63], ["music", 36.78], ["musical instrument", 3.64]], null, [["music", 22.29], ["electric shaver, electric razor", 9.0], ["mains hum", 8.47]], [["music", 54.8], ["grunt", 11.38], ["animal", 3.21]], null, [["music", 45.16], ["noise", 15.59], ["fart", 13.27]]], "duration": [1.32, 3.64, 2.18, 3.61, -0.05, 0.57, 0.66, 1.17, 1.54, 2.12, 0.71, 0.19, 0.51, 3.19, 1.77, 5.51, 1.24, 3.85, 0.96, 0.16, 0.11, 4.55, 1.08, 14.57, 1.15, 10.04, 3.63, 0.29, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/nRTjNEP6v2U_filtered.json b/annotations_filtered/nRTjNEP6v2U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1263ac01ff830751934495ca6d448c079633dfb9 --- /dev/null +++ b/annotations_filtered/nRTjNEP6v2U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.55], [16.0, 17.69], [29.0, 32.39], [38.0, 39.16], [43.0, 43.75], [45.0, 48.14], [50.0, 50.38], [52.0, 52.62], [58.0, 58.82], [61.0, 62.72], [65.0, 65.42], [66.0, 71.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.52, 0.0, 99.62, 0.0, 0.0, 89.54, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.55, 1.69, 3.39, 1.16, 0.75, 3.14, 0.38, 0.62, 0.82, 1.72, 0.42, 5.69]} \ No newline at end of file diff --git a/annotations_filtered/nRq905BT8HM_filtered.json b/annotations_filtered/nRq905BT8HM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6836c9c7cc913bba9540f7e35c3f0dfe0e14ce2c --- /dev/null +++ b/annotations_filtered/nRq905BT8HM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 39.33], [41.0, 49.45], [51.0, 63.37], [67.0, 69.2], [71.0, 72.6], [75.0, 84.28], [84.0, 88.65], [89.0, 93.28], [94.0, 95.18]], "keep_status": [false, false, false, true, false, false, false, false, false], "silence_prob": [100.0, 100.0, 99.97, 36.91, 0.0, 44.43, 74.44, 44.87, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 26.38], ["hum", 20.47], ["throbbing", 10.54]], null, [["tuning fork", 35.71], ["hum", 29.39], ["mains hum", 11.37]], null, [["hum", 42.14], ["mains hum", 41.6], ["speech", 9.26]], null], "duration": [2.33, 8.45, 12.37, 2.2, 1.6, 9.28, 4.65, 4.28, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/nS-0lfCTcrk_filtered.json b/annotations_filtered/nS-0lfCTcrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eec002fd61f07498aba0ea2d9c9c2362bda98750 --- /dev/null +++ b/annotations_filtered/nS-0lfCTcrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 18.33], [20.0, 23.23], [24.0, 30.35], [31.0, 53.81], [58.0, 64.88], [75.0, 82.14], [82.0, 114.62], [116.0, 116.23], [116.0, 116.67], [117.0, 120.38], [122.0, 129.83], [131.0, 135.94], [137.0, 139.8], [140.0, 141.45], [142.0, 142.82], [144.0, 148.39]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.44, 34.82, 36.61, 30.64, 31.7, 30.74, 0.0, 0.0, 0.0, 95.37, 100.0, 86.09, 51.18, 0.0, 0.0, 43.25], "audiomae_on_audioset": [[["music", 66.86], ["brass instrument", 5.69], ["musical instrument", 4.23]], [["music", 54.69], ["saxophone", 9.92], ["wind instrument, woodwind instrument", 5.57]], [["music", 50.8], ["musical instrument", 10.96], ["synthesizer", 8.09]], [["music", 55.86], ["musical instrument", 17.3], ["brass instrument", 7.68]], [["saxophone", 39.94], ["music", 18.56], ["brass instrument", 16.93]], [["music", 38.72], ["saxophone", 26.48], ["brass instrument", 10.05]], null, null, null, null, null, null, null, null, null, [["speech", 87.6], ["telephone", 4.49], ["inside, small room", 1.0]]], "duration": [9.33, 3.23, 6.35, 22.81, 6.88, 7.14, 32.62, 0.23, 0.67, 3.38, 7.83, 4.94, 2.8, 1.45, 0.82, 4.39]} \ No newline at end of file diff --git a/annotations_filtered/nS0fxM7sCHs_filtered.json b/annotations_filtered/nS0fxM7sCHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38a89a2df4b2c4ea9e4a9c07eece80d28bceeecd --- /dev/null +++ b/annotations_filtered/nS0fxM7sCHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.59], [15.0, 16.01], [23.0, 37.05], [38.0, 37.94], [38.0, 48.52], [61.0, 72.98], [77.0, 79.17], [80.0, 81.6], [84.0, 84.2], [87.0, 87.51], [97.0, 100.55], [104.0, 109.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [86.64, 0.0, 75.88, 0.0, 70.58, 50.71, 37.65, 0.0, 0.0, 0.0, 32.96, 30.37], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 54.83], ["theremin", 20.67], ["musical instrument", 5.2]], null, null, null, [["music", 37.75], ["gong", 15.94], ["ambient music", 15.47]], [["theremin", 80.79], ["music", 14.17], ["ambient music", 0.94]]], "duration": [4.59, 1.01, 14.05, -0.06, 10.52, 11.98, 2.17, 1.6, 0.2, 0.51, 3.55, 5.41]} \ No newline at end of file diff --git a/annotations_filtered/nS1ePEA5XeQ_filtered.json b/annotations_filtered/nS1ePEA5XeQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2ba946e08262c1019ad2823d65e6f9663d70332 --- /dev/null +++ b/annotations_filtered/nS1ePEA5XeQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.48], [8.0, 8.63], [12.0, 14.77], [34.0, 34.45], [38.0, 38.18], [43.0, 43.44], [47.0, 48.24], [50.0, 57.5], [58.0, 61.15], [63.0, 63.0], [63.0, 63.04], [64.0, 64.3], [64.0, 64.34], [64.0, 72.45], [75.0, 79.03], [79.0, 79.3], [79.0, 99.44], [101.0, 105.39], [109.0, 117.85]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, false, true, true, true], "silence_prob": [0.0, 0.0, 96.04, 0.0, 0.0, 0.0, 0.0, 34.72, 34.89, 0.0, 0.0, 0.0, 0.0, 37.27, 36.97, 0.0, 34.77, 35.55, 33.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 55.88], ["theremin", 5.71], ["speech", 3.22]], [["music", 22.83], ["speech", 22.18], ["hum", 10.75]], null, null, null, null, [["music", 66.58], ["cello", 3.93], ["clarinet", 2.63]], [["music", 44.71], ["trombone", 6.24], ["brass instrument", 6.19]], null, [["music", 39.27], ["speech", 21.22], ["animal", 7.03]], [["music", 34.98], ["speech", 6.04], ["animal", 4.76]], [["speech", 42.7], ["music", 24.13], ["hum", 2.81]]], "duration": [0.48, 0.63, 2.77, 0.45, 0.18, 0.44, 1.24, 7.5, 3.15, 0.0, 0.04, 0.3, 0.34, 8.45, 4.03, 0.3, 20.44, 4.39, 8.85]} \ No newline at end of file diff --git a/annotations_filtered/nS4Zfx9BSX0_filtered.json b/annotations_filtered/nS4Zfx9BSX0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bce913d62069fcd71a9407b7df354d460793fd9 --- /dev/null +++ b/annotations_filtered/nS4Zfx9BSX0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.75], [35.0, 41.93], [50.0, 73.09], [75.0, 83.84], [84.0, 84.48], [96.0, 96.55], [98.0, 98.07], [101.0, 101.17], [115.0, 115.8], [118.0, 117.93], [118.0, 122.98]], "keep_status": [true, true, true, true, false, false, false, false, false, false, false], "silence_prob": [34.3, 35.73, 33.82, 38.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.27], "audiomae_on_audioset": [[["music", 56.45], ["theremin", 6.81], ["throbbing", 4.91]], [["music", 54.08], ["didgeridoo", 5.54], ["effects unit", 4.89]], [["music", 54.27], ["guitar", 6.91], ["fart", 6.27]], [["music", 52.24], ["theremin", 12.05], ["musical instrument", 5.04]], null, null, null, null, null, null, [["music", 58.17], ["speech", 18.75], ["vibraphone", 2.32]]], "duration": [3.75, 6.93, 23.09, 8.84, 0.48, 0.55, 0.07, 0.17, 0.8, -0.07, 4.98]} \ No newline at end of file diff --git a/annotations_filtered/nS8tqsjySaI_filtered.json b/annotations_filtered/nS8tqsjySaI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ec27cc0c4990c87363a2c92e29250ec1a06ba5c --- /dev/null +++ b/annotations_filtered/nS8tqsjySaI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.63], [10.0, 12.12], [12.0, 12.99], [14.0, 15.99], [20.0, 20.61], [23.0, 24.41], [26.0, 25.78], [32.0, 32.61], [43.0, 43.78], [45.0, 45.37], [57.0, 58.75], [70.0, 71.79], [75.0, 75.57], [81.0, 81.77], [92.0, 93.7], [100.0, 103.13], [106.0, 107.59], [109.0, 110.73], [112.0, 111.99], [113.0, 122.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.63, 2.12, 0.99, 1.99, 0.61, 1.41, -0.22, 0.61, 0.78, 0.37, 1.75, 1.79, 0.57, 0.77, 1.7, 3.13, 1.59, 1.73, -0.01, 9.59]} \ No newline at end of file diff --git a/annotations_filtered/nSEGOd89xWw_filtered.json b/annotations_filtered/nSEGOd89xWw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e792d9c4b2dfec1b495b79c5364fd38f8e1f274d --- /dev/null +++ b/annotations_filtered/nSEGOd89xWw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [3.0, 3.82], [5.0, 6.24], [12.0, 12.97], [17.0, 16.92], [18.0, 18.72], [23.0, 24.07], [34.0, 48.66], [51.0, 51.26], [58.0, 81.11], [82.0, 83.2], [84.0, 85.65], [92.0, 92.85], [95.0, 96.31], [102.0, 102.84], [104.0, 105.21], [106.0, 106.59], [108.0, 108.31], [109.0, 110.54], [111.0, 111.11], [117.0, 117.66], [119.0, 119.04], [120.0, 120.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.09, 0.0, 31.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 87.29], ["speech", 3.08], ["musical instrument", 2.3]], null, [["music", 74.11], ["drum machine", 7.79], ["synthesizer", 6.63]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.82, 1.24, 0.97, -0.08, 0.72, 1.07, 14.66, 0.26, 23.11, 1.2, 1.65, 0.85, 1.31, 0.84, 1.21, 0.59, 0.31, 1.54, 0.11, 0.66, 0.04, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/nSH_S3LDUYI_filtered.json b/annotations_filtered/nSH_S3LDUYI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..668f10b570be9fda8550c7062974024493a5a915 --- /dev/null +++ b/annotations_filtered/nSH_S3LDUYI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.9], [14.0, 14.89], [20.0, 20.75], [26.0, 26.4], [32.0, 38.74], [41.0, 43.82], [50.0, 51.41], [54.0, 53.77], [57.0, 57.25], [69.0, 69.16], [71.0, 91.4], [95.0, 97.24], [103.0, 104.31], [105.0, 106.59], [107.0, 108.43], [109.0, 110.71], [112.0, 113.22], [115.0, 117.8], [123.0, 130.37], [135.0, 135.97], [137.0, 138.27], [140.0, 142.72], [145.0, 145.3], [147.0, 148.49], [151.0, 152.85], [162.0, 163.75]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.85, 29.45, 0.0, 0.0, 0.0, 0.0, 33.26, 88.83, 0.0, 0.0, 0.0, 0.0, 0.0, 89.36, 33.43, 0.0, 0.0, 32.43, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 78.97], ["static", 1.73], ["reggae", 1.25]], [["music", 49.01], ["carnatic music", 5.36], ["drum machine", 4.01]], null, null, null, null, [["music", 84.02], ["throbbing", 3.05], ["drum and bass", 2.95]], null, null, null, null, null, null, null, [["speech", 35.35], ["music", 25.45], ["throbbing", 13.01]], null, null, [["music", 52.12], ["drum and bass", 13.42], ["throbbing", 6.16]], null, null, null, null], "duration": [-0.1, 0.89, 0.75, 0.4, 6.74, 2.82, 1.41, -0.23, 0.25, 0.16, 20.4, 2.24, 1.31, 1.59, 1.43, 1.71, 1.22, 2.8, 7.37, 0.97, 1.27, 2.72, 0.3, 1.49, 1.85, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/nSJxx_KUEes_filtered.json b/annotations_filtered/nSJxx_KUEes_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75898ac2dbe2a3bbeaf65e52e03e122ba0fc7eff --- /dev/null +++ b/annotations_filtered/nSJxx_KUEes_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.0], [6.0, 6.02], [7.0, 8.72], [10.0, 10.62], [11.0, 11.96], [19.0, 20.24], [21.0, 21.83], [23.0, 23.7], [24.0, 25.96], [27.0, 28.41], [30.0, 31.04], [32.0, 32.51], [33.0, 33.32], [34.0, 35.31], [36.0, 37.49], [40.0, 42.21], [48.0, 48.17], [51.0, 51.76], [54.0, 54.63], [57.0, 56.88], [63.0, 63.21], [71.0, 71.61], [78.0, 78.83], [82.0, 82.65], [87.0, 87.93], [89.0, 90.09], [92.0, 92.89], [94.0, 94.17], [96.0, 96.99], [108.0, 108.65], [110.0, 109.93], [111.0, 116.26], [118.0, 119.87], [121.0, 124.28], [126.0, 127.63], [129.0, 129.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 0.02, 1.72, 0.62, 0.96, 1.24, 0.83, 0.7, 1.96, 1.41, 1.04, 0.51, 0.32, 1.31, 1.49, 2.21, 0.17, 0.76, 0.63, -0.12, 0.21, 0.61, 0.83, 0.65, 0.93, 1.09, 0.89, 0.17, 0.99, 0.65, -0.07, 5.26, 1.87, 3.28, 1.63, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/nSO22k4XGUo_filtered.json b/annotations_filtered/nSO22k4XGUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1a910b5f01b4778ca7794dbd73761f4dc77855f --- /dev/null +++ b/annotations_filtered/nSO22k4XGUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.67], [6.0, 8.01], [9.0, 9.71], [16.0, 17.24], [18.0, 17.9], [20.0, 23.06], [24.0, 26.23], [27.0, 28.11], [32.0, 38.21], [40.0, 40.76], [42.0, 48.84], [50.0, 50.01], [58.0, 58.14], [59.0, 60.29], [69.0, 69.62], [78.0, 82.41], [85.0, 85.08], [90.0, 90.54], [91.0, 91.3], [92.0, 92.23], [95.0, 95.3], [110.0, 111.08], [116.0, 116.85], [117.0, 117.49], [120.0, 120.48]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.41, 0.0, 0.0, 0.0, 32.5, 97.22, 0.0, 53.04, 0.0, 34.34, 0.0, 0.0, 0.0, 0.0, 30.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 41.19], ["didgeridoo", 33.38], ["musical instrument", 2.47]], null, null, null, [["music", 41.5], ["didgeridoo", 11.15], ["synthesizer", 7.77]], null, null, null, null, [["speech", 55.33], ["music", 18.94], ["breaking", 8.92]], null, null, null, null, [["speech", 68.68], ["burst, pop", 4.93], ["radio", 3.15]], null, null, null, null, null, null, null, null, null], "duration": [0.67, 2.01, 0.71, 1.24, -0.1, 3.06, 2.23, 1.11, 6.21, 0.76, 6.84, 0.01, 0.14, 1.29, 0.62, 4.41, 0.08, 0.54, 0.3, 0.23, 0.3, 1.08, 0.85, 0.49, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/nTAYbwY6oeU_filtered.json b/annotations_filtered/nTAYbwY6oeU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..042282de44d3e4b9c9bcb29772c6086eb4892669 --- /dev/null +++ b/annotations_filtered/nTAYbwY6oeU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.22], [15.0, 20.8], [21.0, 45.03], [46.0, 56.44], [58.0, 58.65]], "keep_status": [false, true, true, true, false], "silence_prob": [29.76, 30.49, 29.72, 29.63, 0.0], "audiomae_on_audioset": [[["throbbing", 32.9], ["hum", 31.31], ["music", 21.15]], [["music", 48.76], ["throbbing", 10.09], ["electronic music", 7.57]], [["music", 57.57], ["cacophony", 4.76], ["throbbing", 3.45]], [["music", 42.91], ["throbbing", 12.52], ["hum", 9.32]], null], "duration": [4.22, 5.8, 24.03, 10.44, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/nTOUiTegqrA_filtered.json b/annotations_filtered/nTOUiTegqrA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48c9357ca8195bc6f809197995065fd83d486f02 --- /dev/null +++ b/annotations_filtered/nTOUiTegqrA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.86], [6.0, 11.28], [13.0, 12.97], [14.0, 25.27], [29.0, 29.51], [32.0, 33.32], [36.0, 37.45], [42.0, 42.13], [44.0, 44.12], [46.0, 46.01], [48.0, 48.24], [62.0, 63.32], [79.0, 80.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.36, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.86, 5.28, -0.03, 11.27, 0.51, 1.32, 1.45, 0.13, 0.12, 0.01, 0.24, 1.32, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/nTh9qpzhunE_filtered.json b/annotations_filtered/nTh9qpzhunE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..674a0d83a1656e95de9d914774b21bc70861f83b --- /dev/null +++ b/annotations_filtered/nTh9qpzhunE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.92], [8.0, 9.05], [10.0, 11.23], [12.0, 12.34], [14.0, 15.3], [17.0, 17.14], [22.0, 22.08], [25.0, 25.41], [28.0, 29.13], [44.0, 44.09], [45.0, 45.62], [47.0, 47.39], [49.0, 49.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 1.05, 1.23, 0.34, 1.3, 0.14, 0.08, 0.41, 1.13, 0.09, 0.62, 0.39, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/nToATRUkpMI_filtered.json b/annotations_filtered/nToATRUkpMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a0338e5fb01426e764809dcc23204bdde4e45b6 --- /dev/null +++ b/annotations_filtered/nToATRUkpMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [4.0, 4.48], [6.0, 6.34], [9.0, 9.64], [11.0, 11.48], [12.0, 13.61], [16.0, 16.95], [25.0, 25.95], [35.0, 36.31], [37.0, 38.1], [39.0, 39.75], [41.0, 42.01], [44.0, 46.74], [52.0, 53.06], [57.0, 56.69], [58.0, 58.89], [60.0, 61.1], [68.0, 68.45], [69.0, 70.07], [72.0, 73.65], [75.0, 75.34], [81.0, 81.68], [103.0, 103.57], [108.0, 108.26], [119.0, 119.77], [124.0, 124.98], [127.0, 128.36], [129.0, 131.03], [132.0, 132.04], [133.0, 134.96], [136.0, 136.78], [138.0, 139.72], [140.0, 141.72], [146.0, 146.33], [154.0, 154.89], [155.0, 155.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 13.07], ["radio", 6.38], ["busy signal", 6.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 79.18], ["speech synthesizer", 2.94], ["inside, small room", 1.93]], null, null, null, null, null, null, null, null], "duration": [0.04, 0.48, 0.34, 0.64, 0.48, 1.61, 0.95, 0.95, 1.31, 1.1, 0.75, 1.01, 2.74, 1.06, -0.31, 0.89, 1.1, 0.45, 1.07, 1.65, 0.34, 0.68, 0.57, 0.26, 0.77, 0.98, 1.36, 2.03, 0.04, 1.96, 0.78, 1.72, 1.72, 0.33, 0.89, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/nTz_lWcgDhA_filtered.json b/annotations_filtered/nTz_lWcgDhA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eba204f84bd5ab3f130383ee5936f88add7f4e23 --- /dev/null +++ b/annotations_filtered/nTz_lWcgDhA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.13], [13.0, 18.13], [19.0, 19.52], [28.0, 30.72], [31.0, 32.46], [35.0, 36.14], [43.0, 43.28], [46.0, 46.53], [50.0, 51.46], [54.0, 55.09], [59.0, 59.51], [62.0, 62.11], [81.0, 81.62], [82.0, 82.09], [83.0, 87.93], [88.0, 90.22], [91.0, 91.91], [92.0, 93.09], [94.0, 95.28], [96.0, 97.02], [98.0, 99.42], [102.0, 109.86], [111.0, 112.04], [115.0, 115.18], [116.0, 117.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 0.0, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 66.15, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.13, 5.13, 0.52, 2.72, 1.46, 1.14, 0.28, 0.53, 1.46, 1.09, 0.51, 0.11, 0.62, 0.09, 4.93, 2.22, 0.91, 1.09, 1.28, 1.02, 1.42, 7.86, 1.04, 0.18, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/nUpmxMzBCjk_filtered.json b/annotations_filtered/nUpmxMzBCjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..438888fa1eba5672cd405800bcd5ef878aabd425 --- /dev/null +++ b/annotations_filtered/nUpmxMzBCjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.7], [8.0, 12.36], [14.0, 17.9], [25.0, 25.68], [27.0, 27.55], [30.0, 34.67], [35.0, 36.71], [37.0, 38.64], [40.0, 40.91], [42.0, 45.55], [48.0, 48.69], [54.0, 54.09], [56.0, 56.96], [59.0, 63.51], [64.0, 64.37], [84.0, 90.59], [93.0, 93.88], [108.0, 123.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [36.75, 60.14, 68.8, 0.0, 0.0, 47.82, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 36.31, 0.0, 29.6, 0.0, 29.01], "audiomae_on_audioset": [[["music", 42.59], ["trombone", 25.79], ["brass instrument", 9.07]], null, null, null, null, [["speech", 51.64], ["sidetone", 28.04], ["radio", 3.36]], null, null, null, null, null, null, null, [["sidetone", 33.99], ["noise", 8.94], ["music", 8.49]], null, [["speech", 44.57], ["vehicle", 23.4], ["car", 6.47]], null, [["music", 67.61], ["musical instrument", 9.62], ["didgeridoo", 5.21]]], "duration": [3.7, 4.36, 3.9, 0.68, 0.55, 4.67, 1.71, 1.64, 0.91, 3.55, 0.69, 0.09, 0.96, 4.51, 0.37, 6.59, 0.88, 15.82]} \ No newline at end of file diff --git a/annotations_filtered/nUxHF4O3GYU_filtered.json b/annotations_filtered/nUxHF4O3GYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41370e49a15feb60be0535fbfc1a65a7252cc267 --- /dev/null +++ b/annotations_filtered/nUxHF4O3GYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.41], [6.0, 6.96], [12.0, 15.85], [19.0, 19.23], [21.0, 20.75], [22.0, 22.15], [23.0, 24.85], [27.0, 27.43], [34.0, 35.13], [38.0, 39.21], [42.0, 42.67], [44.0, 46.31], [49.0, 51.22], [51.0, 56.76], [58.0, 58.09], [60.0, 62.7], [68.0, 70.16], [72.0, 73.87], [75.0, 75.69], [77.0, 78.51], [80.0, 80.97], [82.0, 86.48], [88.0, 89.65], [93.0, 96.28], [97.0, 99.2], [101.0, 101.26], [104.0, 105.06], [107.0, 108.94], [110.0, 118.56], [119.0, 126.0], [126.0, 129.86], [131.0, 141.62], [143.0, 144.36], [145.0, 146.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 76.04, 32.68, 0.0, 44.57, 76.37, 0.0, 0.0, 0.0, 0.0, 83.34, 0.0, 40.93, 68.15, 0.0, 0.0, 0.0, 65.79, 53.84, 29.99, 57.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 19.8], ["speech", 19.65], ["mechanisms", 11.37]], null, [["music", 27.76], ["hum", 25.22], ["throbbing", 20.22]], null, null, null, null, null, null, null, [["music", 34.71], ["theremin", 28.19], ["speech", 4.35]], null, null, null, null, null, null, [["speech", 44.56], ["thunk", 24.09], ["breaking", 5.06]], null, null, null], "duration": [0.41, 0.96, 3.85, 0.23, -0.25, 0.15, 1.85, 0.43, 1.13, 1.21, 0.67, 2.31, 2.22, 5.76, 0.09, 2.7, 2.16, 1.87, 0.69, 1.51, 0.97, 4.48, 1.65, 3.28, 2.2, 0.26, 1.06, 1.94, 8.56, 7.0, 3.86, 10.62, 1.36, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/nV9U23YXgiY_filtered.json b/annotations_filtered/nV9U23YXgiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7835435a5b4f981c5151c94b81d494af99905c62 --- /dev/null +++ b/annotations_filtered/nV9U23YXgiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.07], [12.0, 12.23], [13.0, 14.28], [16.0, 16.06], [19.0, 19.8], [20.0, 23.48], [24.0, 27.41], [29.0, 33.24], [35.0, 36.54], [41.0, 43.41], [45.0, 45.71], [50.0, 50.63], [53.0, 55.92], [57.0, 57.55], [60.0, 61.05], [65.0, 69.01], [74.0, 74.46], [79.0, 79.39], [81.0, 85.23], [86.0, 86.21], [91.0, 91.3], [93.0, 107.27], [111.0, 111.3], [116.0, 116.9], [122.0, 123.55], [125.0, 126.05], [127.0, 128.07], [129.0, 129.93], [130.0, 130.52]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 44.4, 39.72, 37.69, 0.0, 43.43, 0.0, 0.0, 36.34, 0.0, 0.0, 40.71, 0.0, 0.0, 44.07, 0.0, 0.0, 44.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 22.51], ["hum", 21.8], ["speech", 9.1]], [["foghorn", 49.75], ["speech", 21.53], ["music", 4.76]], [["music", 67.27], ["theremin", 5.25], ["synthesizer", 3.94]], null, [["music", 53.59], ["ambient music", 8.7], ["hum", 6.98]], null, null, [["music", 41.29], ["speech", 31.23], ["vehicle", 1.54]], null, null, [["music", 43.82], ["fly, housefly", 13.12], ["insect", 5.31]], null, null, [["music", 47.88], ["hum", 15.91], ["throbbing", 6.93]], null, null, [["music", 73.81], ["synthesizer", 4.86], ["musical instrument", 2.8]], null, null, null, null, null, null, null], "duration": [0.07, 0.23, 1.28, 0.06, 0.8, 3.48, 3.41, 4.24, 1.54, 2.41, 0.71, 0.63, 2.92, 0.55, 1.05, 4.01, 0.46, 0.39, 4.23, 0.21, 0.3, 14.27, 0.3, 0.9, 1.55, 1.05, 1.07, 0.93, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/nVKSBDddFxM_filtered.json b/annotations_filtered/nVKSBDddFxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc37fe79219626b7da30884959b4757ac5ea15d --- /dev/null +++ b/annotations_filtered/nVKSBDddFxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.07], [6.0, 7.42], [8.0, 10.84], [13.0, 17.47], [20.0, 24.97], [26.0, 29.74], [31.0, 31.82], [33.0, 42.67], [45.0, 46.2], [52.0, 54.72], [57.0, 57.3], [61.0, 66.58], [69.0, 70.39], [72.0, 73.62], [75.0, 77.06], [79.0, 83.3], [84.0, 87.57], [89.0, 104.94], [108.0, 115.57], [116.0, 118.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 70.72, 73.82, 82.07, 85.72, 0.0, 78.21, 0.0, 71.72, 0.0, 78.72, 0.0, 0.0, 68.15, 63.64, 76.2, 45.69, 38.43, 38.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 62.37], ["hum", 10.27], ["ambient music", 6.48]], [["music", 57.09], ["ambient music", 24.34], ["synthesizer", 2.85]], [["music", 47.44], ["ambient music", 23.03], ["electronic music", 7.55]]], "duration": [1.07, 1.42, 2.84, 4.47, 4.97, 3.74, 0.82, 9.67, 1.2, 2.72, 0.3, 5.58, 1.39, 1.62, 2.06, 4.3, 3.57, 15.94, 7.57, 2.66]} \ No newline at end of file diff --git a/annotations_filtered/nVhrWyZtYFk_filtered.json b/annotations_filtered/nVhrWyZtYFk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4473530abe4828f44ee0c0448b1dc4d082abf93 --- /dev/null +++ b/annotations_filtered/nVhrWyZtYFk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.71], [3.0, 5.64], [10.0, 13.61], [15.0, 18.37], [20.0, 20.87], [24.0, 29.07], [30.0, 32.78], [36.0, 37.76], [39.0, 40.04], [41.0, 43.93], [45.0, 45.93], [50.0, 53.03], [54.0, 62.06], [63.0, 66.7], [67.0, 71.58], [72.0, 75.86], [77.0, 79.56], [83.0, 86.95], [88.0, 90.21]], "keep_status": [true, false, true, true, false, true, true, false, false, false, false, true, false, false, true, true, true, false, true], "silence_prob": [29.8, 35.57, 37.59, 39.67, 0.0, 39.58, 42.86, 0.0, 0.0, 45.75, 0.0, 40.43, 52.51, 52.86, 44.93, 44.81, 37.38, 37.33, 41.09], "audiomae_on_audioset": [[["speech", 34.61], ["civil defense siren", 15.25], ["vehicle", 5.3]], [["speech", 59.2], ["mains hum", 7.87], ["hum", 5.08]], [["hum", 20.93], ["mains hum", 16.24], ["music", 12.73]], [["mains hum", 46.23], ["hum", 14.3], ["music", 9.32]], null, [["hum", 23.22], ["mains hum", 20.44], ["speech", 12.74]], [["noise", 34.76], ["hum", 17.72], ["mains hum", 9.99]], null, null, [["hum", 58.9], ["mains hum", 19.11], ["throbbing", 11.75]], null, [["speech", 25.89], ["mains hum", 16.73], ["hum", 8.26]], null, null, [["music", 18.8], ["gong", 18.35], ["hum", 10.58]], [["music", 42.83], ["synthesizer", 8.82], ["hum", 7.46]], [["music", 42.09], ["speech", 9.25], ["synthesizer", 8.5]], [["music", 55.87], ["synthesizer", 8.25], ["ambient music", 7.45]], [["music", 34.07], ["ambient music", 13.33], ["hum", 9.9]]], "duration": [2.71, 2.64, 3.61, 3.37, 0.87, 5.07, 2.78, 1.76, 1.04, 2.93, 0.93, 3.03, 8.06, 3.7, 4.58, 3.86, 2.56, 3.95, 2.21]} \ No newline at end of file diff --git a/annotations_filtered/nVpfljH55TQ_filtered.json b/annotations_filtered/nVpfljH55TQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f46eb5b738144958ba5444d9b6f6c74be4c36939 --- /dev/null +++ b/annotations_filtered/nVpfljH55TQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.76], [10.0, 10.23], [14.0, 14.82], [19.0, 19.68], [23.0, 24.17], [28.0, 28.41], [30.0, 30.0], [30.0, 31.01], [34.0, 34.33], [35.0, 35.99], [38.0, 39.75], [40.0, 41.61], [51.0, 51.22], [52.0, 55.81], [58.0, 58.43], [59.0, 61.62], [73.0, 74.26], [75.0, 75.61], [76.0, 76.55], [78.0, 79.44], [82.0, 82.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 41.64, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["beatboxing", 54.26], ["speech", 15.6], ["boing", 8.95]], null, null, null, null, null], "duration": [0.76, 0.23, 0.82, 0.68, 1.17, 0.41, 0.0, 1.01, 0.33, 0.99, 1.75, 1.61, 0.22, 3.81, 0.43, 2.62, 1.26, 0.61, 0.55, 1.44, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/nVrzbfxxcZ8_filtered.json b/annotations_filtered/nVrzbfxxcZ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..587256a099a87bcfcf2315715b760b571c7a6357 --- /dev/null +++ b/annotations_filtered/nVrzbfxxcZ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.23], [9.0, 9.37], [10.0, 19.97], [23.0, 23.01], [27.0, 27.57], [30.0, 30.0], [31.0, 90.44], [91.0, 93.19], [95.0, 103.27], [105.0, 106.73], [108.0, 109.0]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [29.0, 0.0, 27.96, 0.0, 0.0, 0.0, 0.0, 29.09, 28.63, 0.0, 0.0], "audiomae_on_audioset": [[["music", 58.63], ["throbbing", 17.8], ["hum", 7.6]], null, [["music", 65.18], ["throbbing", 6.12], ["hum", 3.28]], null, null, null, null, [["music", 56.43], ["throbbing", 12.37], ["hum", 7.12]], [["music", 38.11], ["throbbing", 15.76], ["hum", 14.19]], null, null], "duration": [5.23, 0.37, 9.97, 0.01, 0.57, 0.0, 59.44, 2.19, 8.27, 1.73, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/nVvMBs0TFWA_filtered.json b/annotations_filtered/nVvMBs0TFWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46c33f6d8227fd594927a2885e2e4b29fc018cea --- /dev/null +++ b/annotations_filtered/nVvMBs0TFWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.06], [7.0, 8.02], [11.0, 11.89], [13.0, 15.09], [15.0, 17.93], [20.0, 22.01], [24.0, 41.25], [43.0, 50.9], [53.0, 68.57], [70.0, 70.09], [74.0, 91.07], [92.0, 99.76], [100.0, 100.53], [102.0, 105.54], [106.0, 108.53], [110.0, 117.02], [118.0, 165.87], [168.0, 172.32]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [98.51, 0.0, 0.0, 81.53, 51.28, 99.99, 44.34, 51.6, 45.33, 0.0, 65.67, 82.97, 0.0, 86.64, 79.07, 61.47, 0.0, 36.72], "audiomae_on_audioset": [null, null, null, null, null, null, [["mains hum", 53.77], ["hum", 40.08], ["music", 1.6]], null, [["music", 29.41], ["speech", 10.42], ["didgeridoo", 4.08]], null, null, null, null, null, null, null, null, [["throbbing", 52.39], ["hum", 20.39], ["music", 15.29]]], "duration": [2.06, 1.02, 0.89, 2.09, 2.93, 2.01, 17.25, 7.9, 15.57, 0.09, 17.07, 7.76, 0.53, 3.54, 2.53, 7.02, 47.87, 4.32]} \ No newline at end of file diff --git a/annotations_filtered/nW-NiGp1gys_filtered.json b/annotations_filtered/nW-NiGp1gys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8218e207c14e89f93dc44a4bdceb9786d42028c3 --- /dev/null +++ b/annotations_filtered/nW-NiGp1gys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.3], [11.0, 14.17], [14.0, 14.3], [14.0, 15.47], [20.0, 20.44], [26.0, 26.25], [27.0, 28.07], [31.0, 31.99], [38.0, 38.28], [41.0, 41.42], [53.0, 54.75], [67.0, 70.65], [77.0, 77.43], [79.0, 107.62], [113.0, 113.29], [114.0, 114.05], [116.0, 119.62], [121.0, 121.61], [126.0, 126.33], [127.0, 129.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 38.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.02, 0.0, 31.07, 0.0, 0.0, 31.43, 0.0, 0.0, 99.99], "audiomae_on_audioset": [null, [["music", 57.73], ["speech", 11.55], ["musical instrument", 7.57]], null, null, null, null, null, null, null, null, null, [["mosquito", 19.44], ["frog", 15.79], ["music", 14.01]], null, [["music", 50.35], ["noise", 10.51], ["theremin", 4.77]], null, null, [["crowd", 21.03], ["speech", 18.33], ["cheering", 7.43]], null, null, null], "duration": [0.3, 3.17, 0.3, 1.47, 0.44, 0.25, 1.07, 0.99, 0.28, 0.42, 1.75, 3.65, 0.43, 28.62, 0.29, 0.05, 3.62, 0.61, 0.33, 2.93]} \ No newline at end of file diff --git a/annotations_filtered/nW-iQzgmyeI_filtered.json b/annotations_filtered/nW-iQzgmyeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c56585e6d367420af17a49565977e692c3ce8cc --- /dev/null +++ b/annotations_filtered/nW-iQzgmyeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.83], [11.0, 12.48], [15.0, 15.42], [17.0, 18.67], [22.0, 25.2], [26.0, 26.6], [34.0, 34.62], [36.0, 36.96], [40.0, 40.22], [42.0, 42.97], [47.0, 47.41], [61.0, 62.23], [65.0, 66.02], [71.0, 71.93], [73.0, 74.31], [76.0, 77.72], [81.0, 81.35], [83.0, 84.18], [85.0, 85.82], [87.0, 88.13], [93.0, 93.5], [94.0, 95.89], [98.0, 99.3], [101.0, 116.63], [118.0, 119.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.31, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["stomach rumble", 34.44], ["hum", 7.89], ["inside, small room", 5.63]], null], "duration": [1.83, 1.48, 0.42, 1.67, 3.2, 0.6, 0.62, 0.96, 0.22, 0.97, 0.41, 1.23, 1.02, 0.93, 1.31, 1.72, 0.35, 1.18, 0.82, 1.13, 0.5, 1.89, 1.3, 15.63, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/nW92suQFQ5c_filtered.json b/annotations_filtered/nW92suQFQ5c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24f64d3d1b473ba97cb49292c8405521233a41f4 --- /dev/null +++ b/annotations_filtered/nW92suQFQ5c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 42.58], [45.0, 46.14], [48.0, 49.67], [52.0, 52.35], [55.0, 55.76], [61.0, 61.57], [63.0, 67.1], [69.0, 81.8]], "keep_status": [false, false, false, false, false, false, true, true], "silence_prob": [57.64, 0.0, 0.0, 0.0, 0.0, 0.0, 40.09, 44.55], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 35.12], ["rumble", 25.09], ["throbbing", 8.95]], [["music", 23.64], ["sine wave", 16.04], ["breaking", 9.09]]], "duration": [3.58, 1.14, 1.67, 0.35, 0.76, 0.57, 4.1, 12.8]} \ No newline at end of file diff --git a/annotations_filtered/nWAV_KcSkNw_filtered.json b/annotations_filtered/nWAV_KcSkNw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7ff2bd844641935496ce42588fb6c909e797329 --- /dev/null +++ b/annotations_filtered/nWAV_KcSkNw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.0], [11.0, 14.93], [16.0, 16.31], [20.0, 20.09], [22.0, 23.25], [24.0, 28.97], [32.0, 45.32], [48.0, 49.42], [55.0, 56.44], [61.0, 61.2], [67.0, 68.2], [69.0, 91.05], [93.0, 93.43], [98.0, 98.68], [99.0, 99.18], [99.0, 99.22], [99.0, 99.25], [99.0, 99.28], [100.0, 103.22], [109.0, 115.47]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 85.35, 0.0, 0.0, 0.0, 30.23, 31.93, 0.0, 0.0, 0.0, 0.0, 31.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.18, 31.13], "audiomae_on_audioset": [null, null, null, null, null, [["cattle, bovinae", 39.25], ["moo", 26.52], ["livestock, farm animals, working animals", 19.39]], [["crowd", 22.22], ["speech", 13.32], ["clip-clop", 11.79]], null, null, null, null, [["cattle, bovinae", 45.28], ["moo", 25.19], ["livestock, farm animals, working animals", 23.1]], null, null, null, null, null, null, [["livestock, farm animals, working animals", 46.05], ["cattle, bovinae", 30.31], ["moo", 23.38]], [["cattle, bovinae", 58.52], ["moo", 24.06], ["livestock, farm animals, working animals", 17.19]]], "duration": [0.0, 3.93, 0.31, 0.09, 1.25, 4.97, 13.32, 1.42, 1.44, 0.2, 1.2, 22.05, 0.43, 0.68, 0.18, 0.22, 0.25, 0.28, 3.22, 6.47]} \ No newline at end of file diff --git a/annotations_filtered/nWRelGmpmxQ_filtered.json b/annotations_filtered/nWRelGmpmxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/nWRelGmpmxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/nWRxPDhd3d0_filtered.json b/annotations_filtered/nWRxPDhd3d0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85481780bf35fc1dd6961feb23bfd75d3bc3b89f --- /dev/null +++ b/annotations_filtered/nWRxPDhd3d0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.68], [11.0, 11.42], [12.0, 17.96], [20.0, 20.29], [21.0, 21.46], [27.0, 27.06], [30.0, 33.42], [35.0, 38.87], [40.0, 40.8], [47.0, 48.32], [56.0, 57.42], [60.0, 60.52], [79.0, 79.25], [85.0, 86.16], [92.0, 92.15], [94.0, 95.27], [97.0, 98.07]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.97, 0.0, 0.0, 0.0, 56.25, 37.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 54.55], ["fart", 5.09], ["didgeridoo", 3.04]], null, null, null, null, [["speech", 51.13], ["sidetone", 21.74], ["mains hum", 5.27]], null, null, null, null, null, null, null, null, null], "duration": [1.68, 0.42, 5.96, 0.29, 0.46, 0.06, 3.42, 3.87, 0.8, 1.32, 1.42, 0.52, 0.25, 1.16, 0.15, 1.27, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/nWWSMiBag1k_filtered.json b/annotations_filtered/nWWSMiBag1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d37c198d87ae690ff614ebffa697815c8d3122a --- /dev/null +++ b/annotations_filtered/nWWSMiBag1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.46], [8.0, 8.65], [11.0, 13.12], [29.0, 29.61], [36.0, 36.83], [38.0, 37.88], [40.0, 42.2], [44.0, 45.77], [48.0, 56.34], [58.0, 57.89], [66.0, 66.68], [70.0, 71.47], [72.0, 76.94], [86.0, 88.65], [91.0, 91.67], [94.0, 102.51], [105.0, 116.29], [118.0, 120.06], [122.0, 124.24], [125.0, 127.01], [128.0, 134.42]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, true, true, false, true, false], "silence_prob": [0.0, 0.0, 31.05, 0.0, 0.0, 0.0, 44.93, 0.0, 37.13, 0.0, 0.0, 0.0, 41.93, 44.04, 0.0, 34.22, 38.3, 47.08, 41.09, 40.09, 55.46], "audiomae_on_audioset": [null, null, [["domestic animals, pets", 22.93], ["animal", 20.15], ["music", 18.82]], null, null, null, [["music", 57.75], ["speech", 8.18], ["musical instrument", 4.6]], null, [["music", 32.0], ["speech", 20.27], ["crushing", 6.08]], null, null, null, [["music", 65.3], ["speech", 14.24], ["musical instrument", 2.05]], [["music", 63.77], ["musical instrument", 3.52], ["foghorn", 2.83]], null, [["music", 46.93], ["speech", 5.41], ["musical instrument", 3.61]], [["music", 46.69], ["speech", 15.43], ["musical instrument", 5.12]], [["speech", 32.1], ["music", 29.55], ["musical instrument", 2.71]], [["music", 60.14], ["hum", 5.13], ["musical instrument", 4.79]], [["music", 46.44], ["mains hum", 11.8], ["hum", 8.81]], null], "duration": [0.46, 0.65, 2.12, 0.61, 0.83, -0.12, 2.2, 1.77, 8.34, -0.11, 0.68, 1.47, 4.94, 2.65, 0.67, 8.51, 11.29, 2.06, 2.24, 2.01, 6.42]} \ No newline at end of file diff --git a/annotations_filtered/nWd-gLPa5fs_filtered.json b/annotations_filtered/nWd-gLPa5fs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e18433c51d52494490357f95b008736542f935de --- /dev/null +++ b/annotations_filtered/nWd-gLPa5fs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.68], [7.0, 8.04], [11.0, 13.22], [16.0, 16.61], [17.0, 18.49], [21.0, 21.88], [25.0, 25.03], [26.0, 28.44], [30.0, 31.38], [32.0, 32.05], [34.0, 34.62], [42.0, 42.99], [45.0, 46.4], [48.0, 51.73], [53.0, 53.81], [57.0, 57.77], [60.0, 59.88], [62.0, 62.38], [63.0, 66.53], [67.0, 68.69], [70.0, 74.39], [76.0, 80.64], [82.0, 86.86], [90.0, 94.51], [96.0, 97.43], [100.0, 101.16], [104.0, 109.49], [110.0, 115.62], [118.0, 121.39], [123.0, 123.57], [130.0, 130.23], [133.0, 133.47], [137.0, 137.2], [139.0, 139.19], [141.0, 141.52], [143.0, 144.58], [154.0, 154.89], [158.0, 159.34], [162.0, 163.11], [166.0, 166.5], [169.0, 169.32], [170.0, 170.85], [174.0, 177.25]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 87.92, 0.0, 0.0, 0.0, 0.0, 44.07, 0.0, 0.0, 0.0, 0.0, 0.0, 35.55, 0.0, 0.0, 0.0, 0.0, 39.19, 0.0, 34.18, 59.24, 90.25, 71.57, 0.0, 0.0, 56.25, 54.36, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["whale vocalization", 28.76], ["music", 18.71], ["hum", 6.22]], null, null, null, null, null, [["speech", 63.96], ["music", 6.75], ["didgeridoo", 6.63]], null, null, null, null, [["speech", 33.12], ["music", 30.17], ["theremin", 6.1]], null, [["speech", 50.63], ["music", 21.74], ["musical instrument", 3.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 1.04, 2.22, 0.61, 1.49, 0.88, 0.03, 2.44, 1.38, 0.05, 0.62, 0.99, 1.4, 3.73, 0.81, 0.77, -0.12, 0.38, 3.53, 1.69, 4.39, 4.64, 4.86, 4.51, 1.43, 1.16, 5.49, 5.62, 3.39, 0.57, 0.23, 0.47, 0.2, 0.19, 0.52, 1.58, 0.89, 1.34, 1.11, 0.5, 0.32, 0.85, 3.25]} \ No newline at end of file diff --git a/annotations_filtered/nWwlcubR7s0_filtered.json b/annotations_filtered/nWwlcubR7s0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..586f7913c661adca0051e7a34b36fb99f7f219e4 --- /dev/null +++ b/annotations_filtered/nWwlcubR7s0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.39], [12.0, 13.09], [21.0, 22.27], [24.0, 24.61], [29.0, 30.94], [43.0, 45.64], [47.0, 47.88], [51.0, 53.33], [57.0, 57.99], [66.0, 66.46], [69.0, 71.63], [77.0, 77.4], [80.0, 81.41], [83.0, 83.17], [102.0, 101.71], [113.0, 113.22], [122.0, 121.93], [131.0, 132.9], [144.0, 147.18], [151.0, 151.29], [154.0, 164.25], [165.0, 165.72], [166.0, 166.82]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [35.44, 0.0, 0.0, 0.0, 0.0, 29.54, 0.0, 30.52, 0.0, 0.0, 60.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.04, 0.0, 33.97, 0.0, 0.0], "audiomae_on_audioset": [[["beatboxing", 32.52], ["music", 12.26], ["cough", 11.26]], null, null, null, null, [["music", 60.67], ["speech", 10.53], ["boing", 4.39]], null, [["music", 47.42], ["throbbing", 4.92], ["mains hum", 2.54]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.47], ["speech", 24.17], ["sonar", 5.89]], null, null], "duration": [2.39, 1.09, 1.27, 0.61, 1.94, 2.64, 0.88, 2.33, 0.99, 0.46, 2.63, 0.4, 1.41, 0.17, -0.29, 0.22, -0.07, 1.9, 3.18, 0.29, 10.25, 0.72, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/nXIu-RlvPJM_filtered.json b/annotations_filtered/nXIu-RlvPJM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80d74cd0075aa64f03ddf51e4c3b0c8bf479e7f3 --- /dev/null +++ b/annotations_filtered/nXIu-RlvPJM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.13], [5.0, 5.64], [6.0, 9.76], [11.0, 11.15], [13.0, 18.49], [19.0, 20.49], [22.0, 34.96], [39.0, 41.12], [46.0, 46.75], [48.0, 51.98], [53.0, 54.63], [58.0, 58.14], [62.0, 64.17], [68.0, 69.57], [70.0, 73.85], [76.0, 76.54], [78.0, 86.64], [88.0, 89.36], [92.0, 97.78], [100.0, 103.35], [103.0, 105.36], [109.0, 113.02], [115.0, 119.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.29, 0.0, 99.98, 0.0, 99.87, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 0.0, 99.99, 100.0, 99.1, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.13, 0.64, 3.76, 0.15, 5.49, 1.49, 12.96, 2.12, 0.75, 3.98, 1.63, 0.14, 2.17, 1.57, 3.85, 0.54, 8.64, 1.36, 5.78, 3.35, 2.36, 4.02, 4.35]} \ No newline at end of file diff --git a/annotations_filtered/nXJxxahiC3A_filtered.json b/annotations_filtered/nXJxxahiC3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b580cd1a1e61fbe8aa6a3a5cd2193606c8201f30 --- /dev/null +++ b/annotations_filtered/nXJxxahiC3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.34], [42.0, 42.85], [45.0, 45.99], [47.0, 47.63], [50.0, 53.01], [54.0, 55.73], [60.0, 63.51], [64.0, 66.12], [68.0, 69.08], [70.0, 71.12], [72.0, 74.11], [75.0, 74.93], [75.0, 76.28], [78.0, 78.19], [87.0, 90.56], [93.0, 94.24], [96.0, 97.75], [100.0, 101.51], [108.0, 109.44], [113.0, 113.76], [115.0, 115.96], [119.0, 120.41], [121.0, 121.17], [123.0, 123.69], [129.0, 129.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 63.74, 0.0, 68.28, 74.29, 0.0, 0.0, 75.72, 0.0, 0.0, 0.0, 46.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 23.62], ["mosquito", 13.37], ["speech", 10.7]], null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 0.85, 0.99, 0.63, 3.01, 1.73, 3.51, 2.12, 1.08, 1.12, 2.11, -0.07, 1.28, 0.19, 3.56, 1.24, 1.75, 1.51, 1.44, 0.76, 0.96, 1.41, 0.17, 0.69, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/nXSfDMvXAxw_filtered.json b/annotations_filtered/nXSfDMvXAxw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce2377b1e19e8a20dc7ac5392b4b1f6b5258eeaf --- /dev/null +++ b/annotations_filtered/nXSfDMvXAxw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.35], [10.0, 12.72], [20.0, 21.42], [24.0, 24.54], [27.0, 27.65], [33.0, 34.35], [35.0, 36.58], [51.0, 57.06], [57.0, 58.31], [59.0, 64.25], [66.0, 69.45], [71.0, 71.59], [73.0, 73.82], [75.0, 75.02], [76.0, 76.52]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.16, 0.0, 0.0, 0.0, 0.0, 0.0, 48.1, 0.0, 67.13, 58.22, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["fart", 25.51], ["noise", 5.91], ["frog", 4.62]], null, null, null, null, null, [["fly, housefly", 28.26], ["mosquito", 23.77], ["whale vocalization", 5.42]], null, null, null, null, null, null, null], "duration": [1.35, 2.72, 1.42, 0.54, 0.65, 1.35, 1.58, 6.06, 1.31, 5.25, 3.45, 0.59, 0.82, 0.02, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/nXV8YHeJfOs_filtered.json b/annotations_filtered/nXV8YHeJfOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21abc3cde6070ac332715f8d548be3826513ddb8 --- /dev/null +++ b/annotations_filtered/nXV8YHeJfOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 28.85], [30.0, 30.72], [31.0, 33.67], [37.0, 45.44], [46.0, 87.83], [89.0, 89.56], [91.0, 92.87], [95.0, 96.01], [97.0, 99.33], [100.0, 107.55], [109.0, 109.8], [111.0, 111.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.49, 0.0, 30.71, 30.34, 0.0, 0.0, 0.0, 0.0, 35.63, 30.55, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 39.71], ["music", 17.7], ["cacophony", 17.17]], null, [["music", 68.75], ["speech", 9.92], ["smash, crash", 2.78]], [["music", 58.05], ["speech", 15.7], ["hum", 4.65]], null, null, null, null, [["music", 47.67], ["throbbing", 22.68], ["hum", 6.85]], [["throbbing", 48.01], ["music", 18.0], ["hum", 16.28]], null, null], "duration": [19.85, 0.72, 2.67, 8.44, 41.83, 0.56, 1.87, 1.01, 2.33, 7.55, 0.8, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/nXait2wHOQc_filtered.json b/annotations_filtered/nXait2wHOQc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2d9dbc3d14be197bb501cf73ebae2566a95fe22 --- /dev/null +++ b/annotations_filtered/nXait2wHOQc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.96], [18.0, 19.13], [26.0, 27.38], [32.0, 32.58], [33.0, 33.74], [34.0, 38.13], [39.0, 39.93], [43.0, 43.14], [47.0, 50.35], [53.0, 54.73], [55.0, 56.67], [58.0, 62.04], [67.0, 67.63], [72.0, 72.44], [75.0, 76.05], [78.0, 79.03], [83.0, 85.02], [86.0, 86.97], [93.0, 93.24], [94.0, 98.15], [107.0, 108.06], [110.0, 112.8], [113.0, 117.29], [117.0, 118.15], [120.0, 125.85], [127.0, 130.3], [132.0, 138.64], [141.0, 149.74], [154.0, 155.9], [158.0, 159.16], [163.0, 163.81], [165.0, 165.6], [167.0, 169.05], [171.0, 171.32], [176.0, 176.47], [180.0, 181.92], [182.0, 182.04], [182.0, 182.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.44, 0.0, 0.0, 0.0, 0.0, 71.87, 0.0, 0.0, 85.35, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 0.0, 49.09, 0.0, 0.0, 91.98, 0.0, 73.82, 89.19, 0.0, 43.66, 44.9, 49.68, 44.4, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.97], ["music", 35.01], ["boing", 3.12]], null, null, null, null, null, null, null, [["speech", 37.17], ["music", 31.95], ["boing", 5.89]], [["speech", 33.06], ["music", 16.09], ["livestock, farm animals, working animals", 7.69]], [["music", 50.53], ["livestock, farm animals, working animals", 7.0], ["boing", 4.87]], [["music", 58.2], ["speech", 11.16], ["boing", 10.57]], null, null, null, null, null, null, null, null, null, null], "duration": [3.96, 1.13, 1.38, 0.58, 0.74, 4.13, 0.93, 0.14, 3.35, 1.73, 1.67, 4.04, 0.63, 0.44, 1.05, 1.03, 2.02, 0.97, 0.24, 4.15, 1.06, 2.8, 4.29, 1.15, 5.85, 3.3, 6.64, 8.74, 1.9, 1.16, 0.81, 0.6, 2.05, 0.32, 0.47, 1.92, 0.04, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/nXjnagPujjE_filtered.json b/annotations_filtered/nXjnagPujjE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..668b19f4449a0340279c85652c56946163df7bfa --- /dev/null +++ b/annotations_filtered/nXjnagPujjE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.07], [7.0, 10.98], [11.0, 11.84], [15.0, 17.29], [19.0, 25.27], [31.0, 36.86], [38.0, 38.87], [46.0, 49.17], [54.0, 63.09], [65.0, 65.11], [66.0, 79.0], [83.0, 95.17], [95.0, 95.61], [97.0, 107.84], [109.0, 110.0]], "keep_status": [false, true, false, false, false, true, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 33.15, 0.0, 52.33, 34.95, 40.07, 0.0, 63.96, 32.51, 0.0, 32.62, 31.78, 0.0, 32.52, 0.0], "audiomae_on_audioset": [null, [["echo", 20.89], ["animal", 12.2], ["roar", 10.3]], null, null, [["livestock, farm animals, working animals", 44.11], ["moo", 28.11], ["cattle, bovinae", 25.52]], [["music", 47.69], ["musical instrument", 6.43], ["guitar", 4.64]], null, null, [["music", 57.57], ["speech", 6.11], ["musical instrument", 4.54]], null, [["cattle, bovinae", 17.96], ["music", 15.21], ["speech", 14.54]], [["fly, housefly", 12.42], ["livestock, farm animals, working animals", 10.66], ["animal", 10.23]], null, [["livestock, farm animals, working animals", 37.77], ["cattle, bovinae", 34.62], ["moo", 26.4]], null], "duration": [0.07, 3.98, 0.84, 2.29, 6.27, 5.86, 0.87, 3.17, 9.09, 0.11, 13.0, 12.17, 0.61, 10.84, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/nXmtkGrPEuU_filtered.json b/annotations_filtered/nXmtkGrPEuU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a979dff181bf9d54b9ae67391a8f421fdcb2dda --- /dev/null +++ b/annotations_filtered/nXmtkGrPEuU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 13.96], [15.0, 16.06], [18.0, 17.78], [21.0, 22.17], [25.0, 25.47], [44.0, 44.61], [48.0, 48.78], [53.0, 53.25], [58.0, 57.67], [73.0, 73.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [10.96, 1.06, -0.22, 1.17, 0.47, 0.61, 0.78, 0.25, -0.33, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/nXoPEmh39ls_filtered.json b/annotations_filtered/nXoPEmh39ls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..638375adbd512fc81fbfd6d0bc1701a929566f28 --- /dev/null +++ b/annotations_filtered/nXoPEmh39ls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.06], [16.0, 18.15], [20.0, 23.36], [25.0, 26.76], [28.0, 29.25], [30.0, 38.31], [39.0, 40.05], [41.0, 45.45], [46.0, 47.56], [50.0, 49.94], [53.0, 55.86], [57.0, 60.57], [61.0, 62.95], [66.0, 69.28], [70.0, 71.9], [73.0, 74.01], [74.0, 81.06], [82.0, 101.68], [103.0, 124.9], [126.0, 126.82], [130.0, 147.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.54, 95.78, 0.0, 0.0, 94.52, 0.0, 100.0, 0.0, 0.0, 99.31, 99.91, 0.0, 99.59, 0.0, 0.0, 97.92, 81.89, 37.0, 0.0, 97.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 62.54], ["sidetone", 15.35], ["theremin", 3.61]], null, null], "duration": [1.06, 2.15, 3.36, 1.76, 1.25, 8.31, 1.05, 4.45, 1.56, -0.06, 2.86, 3.57, 1.95, 3.28, 1.9, 1.01, 7.06, 19.68, 21.9, 0.82, 17.24]} \ No newline at end of file diff --git a/annotations_filtered/nXrsB2RMo2w_filtered.json b/annotations_filtered/nXrsB2RMo2w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e70bcbcaaae8dc635ecbd79e80a8597e78d7eff --- /dev/null +++ b/annotations_filtered/nXrsB2RMo2w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 55.49], [57.0, 57.82], [59.0, 60.3], [61.0, 62.26], [63.0, 108.87], [110.0, 110.24], [111.0, 113.48], [116.0, 116.09], [116.0, 116.46], [117.0, 118.29], [121.0, 121.88], [123.0, 127.11], [128.0, 129.68], [130.0, 132.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 0.0, 51.02, 0.0, 40.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 55.97], ["speech", 30.32], ["dial tone", 5.23]]], "duration": [38.49, 0.82, 1.3, 1.26, 45.87, 0.24, 2.48, 0.09, 0.46, 1.29, 0.88, 4.11, 1.68, 2.41]} \ No newline at end of file diff --git a/annotations_filtered/nYb42fv8pMU_filtered.json b/annotations_filtered/nYb42fv8pMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02364a250ee3e30e86625dac6c2a24a8d82bb416 --- /dev/null +++ b/annotations_filtered/nYb42fv8pMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.46], [5.0, 5.36], [9.0, 13.66], [19.0, 19.33], [21.0, 22.77], [23.0, 24.54], [29.0, 30.27], [33.0, 33.12], [34.0, 33.91], [38.0, 41.94], [43.0, 48.37], [49.0, 51.43], [53.0, 55.81], [57.0, 57.23], [58.0, 60.71], [64.0, 65.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 98.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.32, 50.86, 69.07, 67.0, 0.0, 32.77, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 52.14], ["noise", 10.44], ["whale vocalization", 6.86]], null], "duration": [1.46, 0.36, 4.66, 0.33, 1.77, 1.54, 1.27, 0.12, -0.09, 3.94, 5.37, 2.43, 2.81, 0.23, 2.71, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/nYhuIXk_CPk_filtered.json b/annotations_filtered/nYhuIXk_CPk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a892f73e05b0a0d19aa915e73664afc24e5e9a72 --- /dev/null +++ b/annotations_filtered/nYhuIXk_CPk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.66], [13.0, 16.19], [18.0, 18.99], [22.0, 21.84], [23.0, 23.45], [25.0, 25.84], [26.0, 26.0], [32.0, 39.95], [42.0, 50.19], [53.0, 53.0], [53.0, 54.57], [56.0, 56.44], [56.0, 65.75], [67.0, 79.93], [81.0, 80.84], [85.0, 88.03], [91.0, 110.02], [113.0, 113.07], [114.0, 117.41]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, true, false, true, true, false, true], "silence_prob": [36.24, 35.09, 0.0, 0.0, 0.0, 0.0, 0.0, 37.37, 36.98, 0.0, 0.0, 0.0, 30.6, 31.01, 0.0, 30.09, 30.36, 0.0, 30.66], "audiomae_on_audioset": [[["hum", 41.99], ["mains hum", 30.23], ["throbbing", 22.76]], [["music", 24.89], ["hum", 16.15], ["throbbing", 13.22]], null, null, null, null, null, [["music", 37.84], ["speech", 36.51], ["sidetone", 7.65]], [["music", 24.94], ["speech", 16.23], ["hum", 7.8]], null, null, null, [["music", 66.56], ["speech", 4.97], ["animal", 2.83]], [["speech", 41.45], ["fire", 9.94], ["outside, rural or natural", 5.01]], null, [["music", 19.0], ["speech", 14.2], ["vehicle", 5.44]], [["livestock, farm animals, working animals", 23.64], ["cattle, bovinae", 14.97], ["music", 12.11]], null, [["music", 24.64], ["noise", 22.52], ["speech", 6.45]]], "duration": [5.66, 3.19, 0.99, -0.16, 0.45, 0.84, 0.0, 7.95, 8.19, 0.0, 1.57, 0.44, 9.75, 12.93, -0.16, 3.03, 19.02, 0.07, 3.41]} \ No newline at end of file diff --git a/annotations_filtered/nYkD6bPe9Ho_filtered.json b/annotations_filtered/nYkD6bPe9Ho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7562d006f460b15d2d3cb9553acf08ba54599a2 --- /dev/null +++ b/annotations_filtered/nYkD6bPe9Ho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.78], [9.0, 98.58], [106.0, 130.44]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 29.5], "audiomae_on_audioset": [null, null, [["music", 29.78], ["hum", 27.97], ["throbbing", 18.55]]], "duration": [1.78, 89.58, 24.44]} \ No newline at end of file diff --git a/annotations_filtered/nYvvM0FXKWQ_filtered.json b/annotations_filtered/nYvvM0FXKWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa677631e4f81621c1812a428b064f0bbac5bad5 --- /dev/null +++ b/annotations_filtered/nYvvM0FXKWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.13], [10.0, 11.8], [13.0, 16.44], [22.0, 25.12], [28.0, 30.3], [31.0, 33.27], [39.0, 40.51], [42.0, 42.48], [45.0, 49.01], [53.0, 73.31], [85.0, 85.31], [86.0, 86.26], [88.0, 89.78], [94.0, 95.23], [97.0, 97.63], [101.0, 101.49], [102.0, 138.82], [139.0, 139.23], [140.0, 142.08], [148.0, 149.86], [154.0, 154.21], [156.0, 160.1]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 92.8, 89.19, 66.63, 56.55, 0.0, 0.0, 29.99, 49.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 0.0, 32.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 51.3], ["hum", 7.95], ["explosion", 5.34]], [["music", 73.48], ["theremin", 6.99], ["soundtrack music", 3.45]], null, null, null, null, null, null, null, null, null, null, null, [["music", 43.05], ["throbbing", 11.28], ["hum", 4.79]]], "duration": [1.13, 1.8, 3.44, 3.12, 2.3, 2.27, 1.51, 0.48, 4.01, 20.31, 0.31, 0.26, 1.78, 1.23, 0.63, 0.49, 36.82, 0.23, 2.08, 1.86, 0.21, 4.1]} \ No newline at end of file diff --git a/annotations_filtered/nZE2tGoC0H4_filtered.json b/annotations_filtered/nZE2tGoC0H4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30e4f1faa5afb1a4f5ce21caac017ba94345bafd --- /dev/null +++ b/annotations_filtered/nZE2tGoC0H4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 37.44], [39.0, 52.73], [55.0, 56.79], [58.0, 62.83], [68.0, 71.27], [73.0, 76.27], [77.0, 78.95], [80.0, 84.57]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [71.43, 49.97, 0.0, 54.04, 82.97, 83.88, 0.0, 95.64], "audiomae_on_audioset": [null, [["music", 69.04], ["speech", 5.64], ["throbbing", 3.29]], null, null, null, null, null, null], "duration": [12.44, 13.73, 1.79, 4.83, 3.27, 3.27, 1.95, 4.57]} \ No newline at end of file diff --git a/annotations_filtered/nZWo6dP2zVw_filtered.json b/annotations_filtered/nZWo6dP2zVw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5585c047509e197da0d30bdd0668f27704a45d --- /dev/null +++ b/annotations_filtered/nZWo6dP2zVw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.76], [16.0, 18.94], [19.0, 25.05], [27.0, 35.73], [38.0, 39.34], [40.0, 41.89], [47.0, 47.82], [50.0, 52.81], [53.0, 53.54], [54.0, 55.92], [57.0, 62.82], [64.0, 72.39], [73.0, 77.09], [82.0, 88.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [99.92, 99.97, 97.22, 99.56, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 68.8, 70.72, 84.25, 37.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 27.56], ["speech", 25.67], ["hum", 9.73]]], "duration": [5.76, 2.94, 6.05, 8.73, 1.34, 1.89, 0.82, 2.81, 0.54, 1.92, 5.82, 8.39, 4.09, 6.65]} \ No newline at end of file diff --git a/annotations_filtered/nZq8AiBXhiI_filtered.json b/annotations_filtered/nZq8AiBXhiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7cc37c5c37defabfe0a145f7976a4f9efd0cbc0 --- /dev/null +++ b/annotations_filtered/nZq8AiBXhiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.47], [6.0, 6.91], [11.0, 15.09], [16.0, 25.68], [26.0, 26.76], [27.0, 28.16], [29.0, 31.14], [31.0, 37.39], [40.0, 41.88], [43.0, 45.64], [48.0, 50.95], [53.0, 55.11], [56.0, 57.59], [60.0, 63.14], [64.0, 66.56], [68.0, 69.57], [71.0, 73.36], [74.0, 74.92], [76.0, 75.98], [77.0, 78.7], [80.0, 82.63], [83.0, 84.94], [85.0, 87.71], [89.0, 90.9], [92.0, 95.42], [97.0, 101.43], [104.0, 105.33], [108.0, 110.12], [111.0, 114.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 99.82, 0.0, 0.0, 99.31, 98.73, 0.0, 100.0, 100.0, 100.0, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 94.07, 0.0, 84.43, 0.0, 100.0, 98.93, 0.0, 66.03, 57.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.91, 4.09, 9.68, 0.76, 1.16, 2.14, 6.39, 1.88, 2.64, 2.95, 2.11, 1.59, 3.14, 2.56, 1.57, 2.36, 0.92, -0.02, 1.7, 2.63, 1.94, 2.71, 1.9, 3.42, 4.43, 1.33, 2.12, 3.57]} \ No newline at end of file diff --git a/annotations_filtered/nZy7fW9IO0s_filtered.json b/annotations_filtered/nZy7fW9IO0s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f28e6aa6e8aea02a72ad04a86b90b90617185110 --- /dev/null +++ b/annotations_filtered/nZy7fW9IO0s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.9], [30.0, 31.43], [33.0, 40.73], [43.0, 45.08], [48.0, 51.43], [53.0, 55.36], [57.0, 68.62], [75.0, 102.15]], "keep_status": [false, false, true, false, true, true, true, true], "silence_prob": [0.0, 0.0, 45.65, 55.81, 32.24, 45.11, 29.45, 29.64], "audiomae_on_audioset": [null, null, [["throbbing", 23.16], ["music", 21.75], ["hum", 19.78]], null, [["music", 32.83], ["throbbing", 14.15], ["hum", 9.25]], [["hum", 22.47], ["throbbing", 12.17], ["rumble", 5.38]], [["smash, crash", 36.39], ["breaking", 13.28], ["music", 11.1]], [["music", 37.28], ["speech", 16.45], ["explosion", 5.41]]], "duration": [0.9, 1.43, 7.73, 2.08, 3.43, 2.36, 11.62, 27.15]} \ No newline at end of file diff --git a/annotations_filtered/n_3Fsg5qGfk_filtered.json b/annotations_filtered/n_3Fsg5qGfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa7a32dbbd46625a6978fd6e7972e0ed1eed426f --- /dev/null +++ b/annotations_filtered/n_3Fsg5qGfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.42], [14.0, 14.44], [15.0, 17.09], [18.0, 32.68], [35.0, 35.55], [39.0, 45.5], [46.0, 45.59], [46.0, 45.64], [46.0, 45.69], [46.0, 45.77], [46.0, 60.0], [63.0, 62.82], [65.0, 66.38], [67.0, 67.64], [68.0, 70.02], [70.0, 73.58], [75.0, 78.21], [82.0, 85.14], [86.0, 87.18], [89.0, 92.13], [93.0, 94.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 96.04, 70.44, 0.0, 31.89, 0.0, 0.0, 0.0, 0.0, 58.64, 0.0, 0.0, 0.0, 33.12, 76.7, 94.81, 91.13, 0.0, 77.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 59.98], ["music", 16.83], ["explosion", 5.29]], null, null, null, null, null, null, null, null, [["speech", 41.19], ["music", 9.35], ["boing", 6.62]], null, null, null, null, null, null], "duration": [0.42, 0.44, 2.09, 14.68, 0.55, 6.5, -0.41, -0.36, -0.31, -0.23, 14.0, -0.18, 1.38, 0.64, 2.02, 3.58, 3.21, 3.14, 1.18, 3.13, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/n_c7JtDNNUo_filtered.json b/annotations_filtered/n_c7JtDNNUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04ca06ba3f4e2d633306f6447f422a0a948967d4 --- /dev/null +++ b/annotations_filtered/n_c7JtDNNUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 22.08], [24.0, 24.19], [31.0, 31.85], [32.0, 33.45]], "keep_status": [true, false, false, false], "silence_prob": [29.66, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 18.46], ["eruption", 13.89], ["mains hum", 11.93]], null, null, null], "duration": [14.08, 0.19, 0.85, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/n_ci8BbMilc_filtered.json b/annotations_filtered/n_ci8BbMilc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6cb22331a35606ad74e741daedf08bebb2c5f1e --- /dev/null +++ b/annotations_filtered/n_ci8BbMilc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.29], [3.0, 3.35], [4.0, 23.28], [49.0, 59.73], [67.0, 68.28], [92.0, 92.84], [100.0, 101.02], [105.0, 105.85], [107.0, 117.58], [119.0, 127.25], [129.0, 128.95], [130.0, 130.96], [131.0, 132.19]], "keep_status": [false, false, true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 41.12, 63.64, 0.0, 0.0, 0.0, 0.0, 30.18, 30.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 50.34], ["musical instrument", 8.34], ["synthesizer", 3.85]], null, null, null, null, null, [["speech", 29.08], ["music", 16.03], ["groan", 5.4]], [["fart", 37.45], ["crying, sobbing", 12.66], ["speech", 11.7]], null, null, null], "duration": [0.29, 0.35, 19.28, 10.73, 1.28, 0.84, 1.02, 0.85, 10.58, 8.25, -0.05, 0.96, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/n_z0TcZkPzg_filtered.json b/annotations_filtered/n_z0TcZkPzg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6862282df47460fe370019e8dffc799f88be0a3 --- /dev/null +++ b/annotations_filtered/n_z0TcZkPzg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.02], [12.0, 12.31], [12.0, 17.09], [25.0, 25.35], [26.0, 26.49], [40.0, 41.15], [42.0, 44.95], [46.0, 46.97], [51.0, 51.73], [54.0, 55.07], [58.0, 69.01], [71.0, 70.95], [71.0, 71.12], [72.0, 84.72], [85.0, 87.99], [90.0, 91.08], [92.0, 93.45], [95.0, 96.85], [99.0, 99.33], [102.0, 102.96], [105.0, 106.22], [113.0, 118.99], [120.0, 120.36], [124.0, 124.92]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [46.19, 0.0, 42.67, 0.0, 0.0, 0.0, 69.07, 0.0, 0.0, 0.0, 54.56, 0.0, 0.0, 97.0, 92.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.0, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 43.44], ["music", 14.62], ["speech", 6.65]], null, [["music", 23.87], ["foghorn", 22.99], ["speech", 12.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["busy signal", 16.71], ["speech", 12.05], ["dial tone", 8.23]], null, null], "duration": [4.02, 0.31, 5.09, 0.35, 0.49, 1.15, 2.95, 0.97, 0.73, 1.07, 11.01, -0.05, 0.12, 12.72, 2.99, 1.08, 1.45, 1.85, 0.33, 0.96, 1.22, 5.99, 0.36, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/naKm_rLxRCs_filtered.json b/annotations_filtered/naKm_rLxRCs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac35f7ee78e07b0fafd605063f9380de5800793a --- /dev/null +++ b/annotations_filtered/naKm_rLxRCs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [6.0, 6.37], [9.0, 10.67], [13.0, 19.33], [24.0, 25.71], [27.0, 30.35], [31.0, 37.67], [44.0, 78.56], [88.0, 92.74], [93.0, 92.89], [93.0, 93.9], [95.0, 97.71], [99.0, 126.64], [127.0, 134.32], [137.0, 138.16], [139.0, 144.91], [145.0, 150.47]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 79.24, 0.0, 98.99, 33.06, 0.0, 35.47, 0.0, 0.0, 45.33, 64.63, 53.34, 0.0, 43.1, 29.5], "audiomae_on_audioset": [null, null, null, null, null, null, [["organ", 25.32], ["keyboard (musical)", 21.72], ["music", 15.29]], null, [["music", 27.32], ["hum", 22.69], ["mains hum", 15.84]], null, null, [["music", 38.68], ["hum", 8.71], ["squish", 5.58]], null, null, null, [["music", 32.6], ["whale vocalization", 30.49], ["theremin", 8.57]], [["music", 64.25], ["speech", 6.66], ["musical instrument", 4.92]]], "duration": [0.62, 0.37, 1.67, 6.33, 1.71, 3.35, 6.67, 34.56, 4.74, -0.11, 0.9, 2.71, 27.64, 7.32, 1.16, 5.91, 5.47]} \ No newline at end of file diff --git a/annotations_filtered/naTncfYgYtU_filtered.json b/annotations_filtered/naTncfYgYtU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b14e8f243e801ba08ae0b2e9712a9961600dc120 --- /dev/null +++ b/annotations_filtered/naTncfYgYtU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 29.83], [34.0, 44.47], [46.0, 50.03], [51.0, 52.89], [57.0, 58.13], [60.0, 60.32], [61.0, 62.38], [69.0, 69.55], [70.0, 73.26], [75.0, 74.88], [75.0, 76.37], [77.0, 100.57], [106.0, 107.32]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.02, 93.29, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 37.78, 0.0], "audiomae_on_audioset": [null, [["whack, thwack", 18.15], ["sound effect", 6.54], ["speech", 4.25]], null, null, null, null, null, null, null, null, null, [["music", 62.43], ["hum", 4.65], ["musical instrument", 4.12]], null], "duration": [1.83, 10.47, 4.03, 1.89, 1.13, 0.32, 1.38, 0.55, 3.26, -0.12, 1.37, 23.57, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/nauLgZISozs_filtered.json b/annotations_filtered/nauLgZISozs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e8e9bc3700a0b21ddf75823682f5faa8772e2db --- /dev/null +++ b/annotations_filtered/nauLgZISozs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [5.0, 5.95], [12.0, 12.88], [13.0, 13.47], [19.0, 20.98], [27.0, 27.68], [40.0, 40.22], [43.0, 43.9], [47.0, 47.17], [48.0, 48.69], [50.0, 51.06], [57.0, 58.5], [65.0, 67.95], [75.0, 76.13], [83.0, 84.03], [85.0, 87.05], [90.0, 90.46], [91.0, 92.45], [95.0, 96.67], [98.0, 98.12], [104.0, 104.77], [106.0, 106.79], [107.0, 108.58], [110.0, 110.54], [112.0, 111.99], [115.0, 116.09], [117.0, 118.25], [121.0, 120.88], [124.0, 125.0], [126.0, 127.38], [129.0, 129.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.45, 0.0, 0.0, 37.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 19.14], ["boing", 11.99], ["reverberation", 8.69]], null, null, [["insect", 30.24], ["fly, housefly", 29.54], ["speech", 11.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.95, 0.88, 0.47, 1.98, 0.68, 0.22, 0.9, 0.17, 0.69, 1.06, 1.5, 2.95, 1.13, 1.03, 2.05, 0.46, 1.45, 1.67, 0.12, 0.77, 0.79, 1.58, 0.54, -0.01, 1.09, 1.25, -0.12, 1.0, 1.38, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/nbssDN3Y75Q_filtered.json b/annotations_filtered/nbssDN3Y75Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d82f2459f87bb11582d3d77fb383e8ed01e94b27 --- /dev/null +++ b/annotations_filtered/nbssDN3Y75Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.67], [15.0, 16.34], [18.0, 19.7], [21.0, 22.08], [22.0, 23.57], [24.0, 25.08], [25.0, 25.19], [26.0, 26.77], [29.0, 31.21], [36.0, 38.4], [40.0, 42.5], [45.0, 50.38], [51.0, 56.13], [58.0, 64.77], [66.0, 69.5], [71.0, 73.5], [74.0, 75.27], [76.0, 83.69], [84.0, 96.8], [98.0, 99.94], [101.0, 101.9], [104.0, 105.24], [106.0, 118.45], [131.0, 130.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, true, false], "silence_prob": [71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.42, 65.44, 80.46, 36.65, 37.59, 62.89, 58.64, 31.29, 0.0, 34.13, 45.24, 0.0, 0.0, 0.0, 32.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.79], ["music", 22.71], ["hum", 10.37]], [["whale vocalization", 42.36], ["music", 14.83], ["hum", 13.64]], null, null, [["hum", 28.61], ["music", 18.83], ["mains hum", 17.77]], null, [["music", 31.29], ["noise", 13.97], ["hum", 10.21]], [["music", 53.28], ["hum", 7.08], ["didgeridoo", 5.69]], null, null, null, [["music", 43.38], ["didgeridoo", 12.58], ["hum", 8.96]], null], "duration": [5.67, 1.34, 1.7, 1.08, 1.57, 1.08, 0.19, 0.77, 2.21, 2.4, 2.5, 5.38, 5.13, 6.77, 3.5, 2.5, 1.27, 7.69, 12.8, 1.94, 0.9, 1.24, 12.45, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/nby0t43dlIs_filtered.json b/annotations_filtered/nby0t43dlIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4609e47b8c2f27731809528c2bb5593a0ded57f --- /dev/null +++ b/annotations_filtered/nby0t43dlIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.33], [24.0, 25.68], [27.0, 34.62], [35.0, 36.66], [40.0, 40.8], [42.0, 43.73], [48.0, 49.52], [52.0, 51.97], [54.0, 55.63], [57.0, 58.45], [59.0, 60.57], [61.0, 63.02]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.61], "audiomae_on_audioset": [null, null, [["music", 33.27], ["mains hum", 22.2], ["hum", 11.02]], null, null, null, null, null, null, null, null, [["speech", 40.3], ["dial tone", 21.03], ["telephone", 9.44]]], "duration": [0.33, 1.68, 7.62, 1.66, 0.8, 1.73, 1.52, -0.03, 1.63, 1.45, 1.57, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/nc0LwkqYGpM_filtered.json b/annotations_filtered/nc0LwkqYGpM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58ccf12e74f6c42ae743ff77cf94f1eadcdb08f5 --- /dev/null +++ b/annotations_filtered/nc0LwkqYGpM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.17], [39.0, 39.46], [43.0, 42.82], [47.0, 46.84], [61.0, 61.42], [95.0, 97.48]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.57], "audiomae_on_audioset": [null, null, null, null, null, [["noise", 28.83], ["fart", 11.67], ["music", 11.18]]], "duration": [1.17, 0.46, -0.18, -0.16, 0.42, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/ncOY7vtsY8I_filtered.json b/annotations_filtered/ncOY7vtsY8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a30b2bbd67fa391f2865e510e8f1209889b447a0 --- /dev/null +++ b/annotations_filtered/ncOY7vtsY8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [4.0, 10.89], [14.0, 15.63], [16.0, 21.78], [23.0, 25.42], [26.0, 33.76], [35.0, 39.01], [41.0, 42.69], [44.0, 51.92], [53.0, 54.45], [56.0, 57.28], [59.0, 60.74], [66.0, 68.82], [70.0, 71.02], [71.0, 73.14], [74.0, 75.69], [76.0, 79.34], [80.0, 87.03], [90.0, 91.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 100.0, 99.44, 100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.99, 0.0, 90.08, 0.0, 99.96, 99.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 6.89, 1.63, 5.78, 2.42, 7.76, 4.01, 1.69, 7.92, 1.45, 1.28, 1.74, 2.82, 1.02, 2.14, 1.69, 3.34, 7.03, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/ncnq2pu4PlE_filtered.json b/annotations_filtered/ncnq2pu4PlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e9fbcff31b8372ff287ac489f6357db93c65069 --- /dev/null +++ b/annotations_filtered/ncnq2pu4PlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.04], [11.0, 20.61], [21.0, 26.32], [28.0, 36.14], [37.0, 38.25], [39.0, 40.51], [47.0, 50.58], [55.0, 56.37], [65.0, 68.0], [74.0, 76.69], [77.0, 87.83], [89.0, 91.84], [93.0, 97.01], [98.0, 99.74], [101.0, 101.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.73, 95.37, 99.48, 0.0, 0.0, 99.68, 0.0, 66.76, 81.35, 77.36, 83.16, 92.48, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.04, 9.61, 5.32, 8.14, 1.25, 1.51, 3.58, 1.37, 3.0, 2.69, 10.83, 2.84, 4.01, 1.74, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/nd3MVcbnfAc_filtered.json b/annotations_filtered/nd3MVcbnfAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..664e411742b35af820184683219fb5e95e3e2c6d --- /dev/null +++ b/annotations_filtered/nd3MVcbnfAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.05], [15.0, 37.29], [42.0, 44.73]], "keep_status": [false, true, false], "silence_prob": [69.2, 30.41, 33.28], "audiomae_on_audioset": [null, [["music", 42.93], ["speech", 8.22], ["hum", 7.77]], [["music", 52.07], ["hum", 10.49], ["throbbing", 10.03]]], "duration": [7.05, 22.29, 2.73]} \ No newline at end of file diff --git a/annotations_filtered/ndItN7hhtII_filtered.json b/annotations_filtered/ndItN7hhtII_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0269a8291c0d367f3c96047bbb315e85bf2f4f67 --- /dev/null +++ b/annotations_filtered/ndItN7hhtII_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.98], [9.0, 10.25], [11.0, 11.91], [13.0, 14.0], [15.0, 15.9], [18.0, 18.0], [20.0, 20.44], [21.0, 21.81], [23.0, 23.57], [26.0, 28.17], [30.0, 30.59], [32.0, 32.81], [36.0, 36.32], [37.0, 39.77], [42.0, 45.17], [47.0, 48.66], [49.0, 55.92], [57.0, 59.29], [60.0, 62.53], [69.0, 75.19], [83.0, 84.15], [85.0, 85.33], [86.0, 85.68], [88.0, 88.91], [100.0, 102.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0, 0.0, 0.0, 61.57, 84.25, 0.0, 37.98, 79.76, 69.61, 47.62, 0.0, 0.0, 0.0, 0.0, 30.24], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["doorbell", 43.06], ["music", 6.12], ["speech", 4.54]], null, null, [["insect", 24.31], ["fly, housefly", 19.51], ["music", 9.24]], null, null, null, null, [["speech", 29.18], ["doorbell", 11.12], ["moo", 6.68]]], "duration": [-0.02, 1.25, 0.91, 1.0, 0.9, 0.0, 0.44, 0.81, 0.57, 2.17, 0.59, 0.81, 0.32, 2.77, 3.17, 1.66, 6.92, 2.29, 2.53, 6.19, 1.15, 0.33, -0.32, 0.91, 2.63]} \ No newline at end of file diff --git a/annotations_filtered/ndfLW-xm9Xk_filtered.json b/annotations_filtered/ndfLW-xm9Xk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bae59279a64cecb79e5dea6155ac09240c2f6a0a --- /dev/null +++ b/annotations_filtered/ndfLW-xm9Xk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.51], [6.0, 7.23], [8.0, 8.48], [11.0, 12.02], [14.0, 14.4], [15.0, 15.13], [29.0, 49.1]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.49], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 46.14], ["music", 37.62], ["didgeridoo", 3.13]]], "duration": [1.51, 1.23, 0.48, 1.02, 0.4, 0.13, 20.1]} \ No newline at end of file diff --git a/annotations_filtered/ndpVsMLr424_filtered.json b/annotations_filtered/ndpVsMLr424_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d59e35b9db381b19db8fc58772ad46d3e30c59f --- /dev/null +++ b/annotations_filtered/ndpVsMLr424_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.73], [30.0, 30.27], [31.0, 58.09]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 29.99], "audiomae_on_audioset": [null, null, [["music", 60.76], ["throbbing", 14.31], ["hum", 5.13]]], "duration": [0.73, 0.27, 27.09]} \ No newline at end of file diff --git a/annotations_filtered/ndrLDbtM-CY_filtered.json b/annotations_filtered/ndrLDbtM-CY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e4b5206390d9c44fd8c3153d9fcee29ff5dc6e2 --- /dev/null +++ b/annotations_filtered/ndrLDbtM-CY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.81], [17.0, 16.83], [21.0, 21.78], [23.0, 23.48]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.81, -0.17, 0.78, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/ndrr3vif10w_filtered.json b/annotations_filtered/ndrr3vif10w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c4afc034dfeb964a71ab29a9a5d140ab1718602 --- /dev/null +++ b/annotations_filtered/ndrr3vif10w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.14], [8.0, 8.63], [11.0, 19.89], [23.0, 24.16], [26.0, 26.81], [27.0, 27.75], [29.0, 30.94], [37.0, 37.66], [39.0, 40.88], [46.0, 46.35], [48.0, 47.93], [50.0, 51.78], [55.0, 55.8], [70.0, 70.43], [76.0, 76.5], [79.0, 79.56], [80.0, 81.62], [86.0, 86.27], [89.0, 90.48], [91.0, 104.99], [106.0, 109.65], [110.0, 113.34], [115.0, 117.64]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.5, 0.0, 91.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 80.29, 51.71, 81.17], "audiomae_on_audioset": [[["busy signal", 8.0], ["dial tone", 6.16], ["speech", 6.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.14, 0.63, 8.89, 1.16, 0.81, 0.75, 1.94, 0.66, 1.88, 0.35, -0.07, 1.78, 0.8, 0.43, 0.5, 0.56, 1.62, 0.27, 1.48, 13.99, 3.65, 3.34, 2.64]} \ No newline at end of file diff --git a/annotations_filtered/neFpFiuvYsQ_filtered.json b/annotations_filtered/neFpFiuvYsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc3cfe6bd12dc8994398cb493f0dbf6c6b0f7513 --- /dev/null +++ b/annotations_filtered/neFpFiuvYsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.81], [2.0, 4.89], [7.0, 7.2], [8.0, 9.36], [12.0, 12.63], [15.0, 15.9], [22.0, 23.01], [38.0, 41.2], [45.0, 46.21], [51.0, 52.03], [54.0, 54.62], [56.0, 56.3], [60.0, 60.99], [65.0, 65.91], [73.0, 73.82], [74.0, 75.91], [79.0, 80.18], [94.0, 95.1], [116.0, 116.5], [118.0, 118.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 2.89, 0.2, 1.36, 0.63, 0.9, 1.01, 3.2, 1.21, 1.03, 0.62, 0.3, 0.99, 0.91, 0.82, 1.91, 1.18, 1.1, 0.5, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/neVOaWPM_Mk_filtered.json b/annotations_filtered/neVOaWPM_Mk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9278b57aab1e37a4241d8eb9cd576a543be71fd --- /dev/null +++ b/annotations_filtered/neVOaWPM_Mk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.24], [11.0, 14.69], [18.0, 23.4], [25.0, 30.97], [33.0, 41.01], [43.0, 43.11], [46.0, 45.87], [48.0, 61.03], [62.0, 63.66]], "keep_status": [false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 40.64, 32.9, 34.47, 35.2, 0.0, 0.0, 38.58, 0.0], "audiomae_on_audioset": [null, [["speech", 39.93], ["tuning fork", 21.56], ["busy signal", 13.56]], [["speech", 50.64], ["thunk", 30.04], ["music", 11.61]], [["music", 33.5], ["speech", 16.83], ["musical instrument", 9.38]], [["music", 47.65], ["speech", 34.79], ["thunk", 4.43]], null, null, [["speech", 63.2], ["boiling", 2.65], ["liquid", 2.33]], null], "duration": [1.24, 3.69, 5.4, 5.97, 8.01, 0.11, -0.13, 13.03, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/nejXDl9BPbY_filtered.json b/annotations_filtered/nejXDl9BPbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6c98d78b4c1a6285f126151e3a66c426f3a4a45 --- /dev/null +++ b/annotations_filtered/nejXDl9BPbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.07], [8.0, 8.77], [14.0, 14.37], [23.0, 23.08], [31.0, 39.39], [40.0, 46.35], [47.0, 46.92], [47.0, 47.17], [47.0, 47.22], [47.0, 54.92], [58.0, 60.99], [63.0, 63.71], [67.0, 66.97], [68.0, 69.15], [72.0, 72.5], [77.0, 79.59], [81.0, 82.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 60.6, 90.25, 0.0, 0.0, 0.0, 99.96, 100.0, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.07, 0.77, 0.37, 0.08, 8.39, 6.35, -0.08, 0.17, 0.22, 7.92, 2.99, 0.71, -0.03, 1.15, 0.5, 2.59, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/nekzfohNwuY_filtered.json b/annotations_filtered/nekzfohNwuY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcc3cea1d0e9470f1d3a47ef1467a189d0610fee --- /dev/null +++ b/annotations_filtered/nekzfohNwuY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.05], [7.0, 8.02], [9.0, 10.12], [11.0, 12.14], [13.0, 15.23], [18.0, 19.74], [21.0, 21.95], [26.0, 26.7], [28.0, 28.8], [31.0, 31.82], [32.0, 32.97], [34.0, 34.45], [35.0, 36.36], [57.0, 56.62], [57.0, 57.1], [57.0, 57.18], [58.0, 58.28], [61.0, 61.96], [65.0, 65.74], [69.0, 69.92], [72.0, 72.5], [73.0, 73.4], [74.0, 74.34], [77.0, 78.43], [79.0, 82.05], [84.0, 84.64], [90.0, 90.93], [100.0, 100.14], [105.0, 109.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 50.21], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 1.02, 1.12, 1.14, 2.23, 1.74, 0.95, 0.7, 0.8, 0.82, 0.97, 0.45, 1.36, -0.38, 0.1, 0.18, 0.28, 0.96, 0.74, 0.92, 0.5, 0.4, 0.34, 1.43, 3.05, 0.64, 0.93, 0.14, 4.02]} \ No newline at end of file diff --git a/annotations_filtered/nepc-GLWtfc_filtered.json b/annotations_filtered/nepc-GLWtfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd323da0e7167d2d0e3d4ee078716e606e3471f7 --- /dev/null +++ b/annotations_filtered/nepc-GLWtfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.21], [7.0, 7.7], [9.0, 9.26], [10.0, 11.62], [12.0, 15.04], [16.0, 16.23], [18.0, 19.11], [21.0, 22.05], [24.0, 26.91], [28.0, 31.5], [34.0, 35.82], [37.0, 37.44], [39.0, 42.45], [48.0, 48.09], [51.0, 52.81], [57.0, 57.01], [59.0, 61.64], [63.0, 75.79], [76.0, 77.55], [78.0, 78.54], [79.0, 80.1], [81.0, 81.51]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.7, 0.0, 0.0, 0.0, 33.52, 42.69, 0.0, 0.0, 96.42, 0.0, 0.0, 0.0, 100.0, 98.86, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 41.77], ["cattle, bovinae", 29.85], ["moo", 28.25]], [["hum", 10.67], ["explosion", 7.76], ["speech", 7.31]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 0.7, 0.26, 1.62, 3.04, 0.23, 1.11, 1.05, 2.91, 3.5, 1.82, 0.44, 3.45, 0.09, 1.81, 0.01, 2.64, 12.79, 1.55, 0.54, 1.1, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/nfC8sEnM_5A_filtered.json b/annotations_filtered/nfC8sEnM_5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..066e423d0f7dac35a896e6fc7e43326f87917464 --- /dev/null +++ b/annotations_filtered/nfC8sEnM_5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.62], [16.0, 18.32], [20.0, 24.26], [29.0, 39.36], [44.0, 45.06], [49.0, 49.76], [50.0, 52.35], [59.0, 58.87], [69.0, 71.25], [72.0, 72.72], [77.0, 76.86], [77.0, 80.33], [90.0, 172.45], [175.0, 190.95], [191.0, 194.53]], "keep_status": [false, true, true, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [45.52, 39.94, 44.32, 36.3, 0.0, 0.0, 34.55, 0.0, 33.59, 0.0, 0.0, 32.56, 0.0, 31.77, 34.41], "audiomae_on_audioset": [[["music", 58.98], ["didgeridoo", 14.65], ["bass guitar", 3.04]], [["music", 15.39], ["boing", 12.13], ["fart", 7.86]], [["music", 54.35], ["bass guitar", 7.29], ["guitar", 5.1]], [["music", 71.83], ["synthetic singing", 3.47], ["echo", 2.21]], null, null, [["music", 29.43], ["foghorn", 19.53], ["speech", 12.91]], null, [["music", 57.38], ["guitar", 4.2], ["musical instrument", 3.24]], null, null, [["music", 62.05], ["boing", 12.39], ["singing", 2.76]], null, [["music", 59.69], ["rattle (instrument)", 19.84], ["musical instrument", 2.26]], [["music", 80.75], ["musical instrument", 0.96], ["effects unit", 0.74]]], "duration": [4.62, 2.32, 4.26, 10.36, 1.06, 0.76, 2.35, -0.13, 2.25, 0.72, -0.14, 3.33, 82.45, 15.95, 3.53]} \ No newline at end of file diff --git a/annotations_filtered/nfFsHF8guzM_filtered.json b/annotations_filtered/nfFsHF8guzM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1eb952860edc0e0818efd3a1af7089c3d1da472d --- /dev/null +++ b/annotations_filtered/nfFsHF8guzM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.3], [10.0, 10.08], [11.0, 24.75], [29.0, 30.5], [31.0, 31.46], [34.0, 36.21], [42.0, 41.94], [43.0, 43.92], [47.0, 47.04], [49.0, 49.11], [54.0, 55.27], [56.0, 56.03], [58.0, 59.02], [61.0, 61.32], [63.0, 63.05], [66.0, 65.65], [67.0, 67.22], [70.0, 70.39], [72.0, 73.26], [74.0, 74.61], [75.0, 75.09], [80.0, 81.62], [84.0, 85.43], [87.0, 89.09], [90.0, 90.96], [98.0, 99.17], [101.0, 101.95], [108.0, 110.96]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 34.11, 0.0, 0.0, 33.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.23, 0.0, 0.0, 0.0, 47.2], "audiomae_on_audioset": [null, null, [["music", 28.34], ["speech", 16.3], ["vehicle", 4.43]], null, null, [["livestock, farm animals, working animals", 38.11], ["cattle, bovinae", 37.86], ["moo", 23.65]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.94], ["speech", 10.34], ["didgeridoo", 4.7]], null, null, null, [["livestock, farm animals, working animals", 37.19], ["cattle, bovinae", 27.62], ["moo", 11.78]]], "duration": [0.3, 0.08, 13.75, 1.5, 0.46, 2.21, -0.06, 0.92, 0.04, 0.11, 1.27, 0.03, 1.02, 0.32, 0.05, -0.35, 0.22, 0.39, 1.26, 0.61, 0.09, 1.62, 1.43, 2.09, 0.96, 1.17, 0.95, 2.96]} \ No newline at end of file diff --git a/annotations_filtered/nfGKHa_mn20_filtered.json b/annotations_filtered/nfGKHa_mn20_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c23a3a245398197924ccd9b7969614f8725fd315 --- /dev/null +++ b/annotations_filtered/nfGKHa_mn20_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.32], [14.0, 14.35], [25.0, 25.0], [35.0, 34.84], [38.0, 37.86], [52.0, 52.44], [94.0, 94.73], [102.0, 103.37], [108.0, 110.47], [112.0, 113.91], [114.0, 119.92], [120.0, 123.57], [125.0, 126.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.3, 0.0, 36.44, 48.31, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 32.21], ["throbbing", 23.26], ["speech", 23.2]], [["hum", 44.41], ["mains hum", 27.92], ["electric shaver, electric razor", 10.94]], null], "duration": [0.32, 0.35, 0.0, -0.16, -0.14, 0.44, 0.73, 1.37, 2.47, 1.91, 5.92, 3.57, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/nfQr0dDL8jg_filtered.json b/annotations_filtered/nfQr0dDL8jg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90c0bb5a8665cd07dc4a2435fb134ae7e54e15bd --- /dev/null +++ b/annotations_filtered/nfQr0dDL8jg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.64], [18.0, 59.64], [61.0, 64.89], [65.0, 97.85]], "keep_status": [false, false, false, false], "silence_prob": [55.18, 0.0, 43.61, 0.0], "audiomae_on_audioset": [null, null, [["music", 64.14], ["didgeridoo", 20.37], ["theremin", 4.04]], null], "duration": [2.64, 41.64, 3.89, 32.85]} \ No newline at end of file diff --git a/annotations_filtered/nfV87TgYH78_filtered.json b/annotations_filtered/nfV87TgYH78_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00f287aa6dc45aa31e51ad27c21288798e275c4e --- /dev/null +++ b/annotations_filtered/nfV87TgYH78_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.99], [23.0, 24.65], [25.0, 24.87], [25.0, 30.67], [33.0, 69.42], [70.0, 75.79], [80.0, 85.21], [87.0, 98.31], [102.0, 107.64], [108.0, 138.2], [140.0, 143.31], [146.0, 161.94]], "keep_status": [false, false, false, true, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.68, 0.0, 35.92, 30.57, 31.49, 38.37, 0.0, 44.9, 31.51], "audiomae_on_audioset": [null, null, null, [["speech", 39.91], ["vehicle", 15.52], ["car", 10.4]], null, [["music", 36.62], ["hum", 24.12], ["mains hum", 8.21]], [["music", 42.57], ["hum", 24.72], ["throbbing", 14.53]], [["buzz", 25.97], ["vehicle", 18.64], ["car", 12.46]], [["music", 71.71], ["electronic music", 6.78], ["ambient music", 2.37]], null, [["throbbing", 28.92], ["hum", 26.04], ["eruption", 17.78]], [["mains hum", 35.38], ["hum", 26.86], ["buzz", 10.17]]], "duration": [0.99, 1.65, -0.13, 5.67, 36.42, 5.79, 5.21, 11.31, 5.64, 30.2, 3.31, 15.94]} \ No newline at end of file diff --git a/annotations_filtered/nfk-kn7YP04_filtered.json b/annotations_filtered/nfk-kn7YP04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ab06d9bdce708164158963dc7d1d1bf35a13ca4 --- /dev/null +++ b/annotations_filtered/nfk-kn7YP04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.33], [9.0, 10.47], [13.0, 14.05], [15.0, 15.72], [18.0, 19.08], [20.0, 22.32], [23.0, 24.71], [26.0, 26.42], [33.0, 34.08], [43.0, 66.66], [69.0, 74.36], [76.0, 76.6], [77.0, 79.76], [85.0, 90.63], [127.0, 130.35], [135.0, 143.36], [145.0, 152.04], [154.0, 154.52], [156.0, 156.63], [158.0, 159.07], [160.0, 163.93], [166.0, 166.92], [169.0, 169.82], [171.0, 173.53], [174.0, 173.77]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 30.78, 29.66, 0.0, 67.63, 36.98, 42.72, 31.16, 34.7, 0.0, 0.0, 0.0, 34.41, 0.0, 0.0, 31.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["grunt", 43.4], ["speech", 7.19], ["fart", 5.43]], [["speech", 58.33], ["explosion", 16.15], ["burst, pop", 9.08]], null, null, [["speech", 63.23], ["boing", 16.52], ["fart", 2.44]], [["boing", 44.43], ["music", 22.2], ["speech", 3.51]], [["speech", 67.95], ["fart", 17.55], ["music", 1.89]], [["speech", 29.96], ["insect", 12.06], ["fly, housefly", 8.99]], null, null, null, [["speech", 24.21], ["cattle, bovinae", 21.46], ["moo", 13.91]], null, null, [["speech", 62.14], ["cattle, bovinae", 6.31], ["moo", 4.02]], null], "duration": [0.33, 1.47, 1.05, 0.72, 1.08, 2.32, 1.71, 0.42, 1.08, 23.66, 5.36, 0.6, 2.76, 5.63, 3.35, 8.36, 7.04, 0.52, 0.63, 1.07, 3.93, 0.92, 0.82, 2.53, -0.23]} \ No newline at end of file diff --git a/annotations_filtered/nfoIqJWYqX4_filtered.json b/annotations_filtered/nfoIqJWYqX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d16d572f91c6788217c618f58fd08e584413e96 --- /dev/null +++ b/annotations_filtered/nfoIqJWYqX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.98], [5.0, 5.26], [8.0, 15.53], [18.0, 21.44], [22.0, 25.32], [27.0, 27.82], [29.0, 28.61], [33.0, 34.18], [37.0, 56.54], [59.0, 66.6], [70.0, 71.76], [76.0, 76.92], [77.0, 78.97], [79.0, 82.61], [85.0, 87.69], [88.0, 89.82], [90.0, 92.18], [94.0, 95.89], [98.0, 115.91], [117.0, 120.65], [122.0, 122.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 89.01, 98.8, 95.78, 0.0, 0.0, 0.0, 99.62, 98.44, 0.0, 0.0, 0.0, 99.99, 99.98, 0.0, 100.0, 0.0, 99.93, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.98, 0.26, 7.53, 3.44, 3.32, 0.82, -0.39, 1.18, 19.54, 7.6, 1.76, 0.92, 1.97, 3.61, 2.69, 1.82, 2.18, 1.89, 17.91, 3.65, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/nfzJCrxKVMU_filtered.json b/annotations_filtered/nfzJCrxKVMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57b21fe7cd3d62f454a133cfd72f1e2fde57669c --- /dev/null +++ b/annotations_filtered/nfzJCrxKVMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.11], [11.0, 11.48], [18.0, 20.43], [26.0, 25.78], [55.0, 55.86], [57.0, 59.34], [62.0, 62.77], [67.0, 67.02], [68.0, 68.79], [70.0, 71.98], [73.0, 74.82], [76.0, 76.01], [80.0, 80.05], [84.0, 84.72], [85.0, 86.41], [87.0, 86.58], [92.0, 96.21], [115.0, 115.26], [118.0, 118.4], [120.0, 124.06], [131.0, 132.92], [138.0, 140.21], [143.0, 147.43], [148.0, 162.82], [168.0, 169.8], [174.0, 174.06], [180.0, 179.73], [182.0, 184.72]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 66.51, 0.0, 0.0, 32.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.92, 0.0, 0.0, 31.89, 0.0, 33.98, 30.57, 31.82, 0.0, 0.0, 0.0, 75.23], "audiomae_on_audioset": [null, null, null, null, null, [["music", 50.83], ["trombone", 7.87], ["musical instrument", 6.3]], null, null, null, null, null, null, null, null, null, null, [["music", 62.1], ["brass instrument", 3.94], ["saxophone", 3.72]], null, null, [["music", 63.46], ["carnatic music", 26.3], ["classical music", 1.65]], null, [["music", 28.64], ["trombone", 23.42], ["brass instrument", 22.15]], [["music", 62.0], ["classical music", 6.15], ["musical instrument", 5.0]], [["music", 54.84], ["speech", 18.74], ["theremin", 2.86]], null, null, null, null], "duration": [0.11, 0.48, 2.43, -0.22, 0.86, 2.34, 0.77, 0.02, 0.79, 1.98, 1.82, 0.01, 0.05, 0.72, 1.41, -0.42, 4.21, 0.26, 0.4, 4.06, 1.92, 2.21, 4.43, 14.82, 1.8, 0.06, -0.27, 2.72]} \ No newline at end of file diff --git a/annotations_filtered/ng95gpwSjZU_filtered.json b/annotations_filtered/ng95gpwSjZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ed5a72e18bee9f7742a221da760d5fba5cd4575 --- /dev/null +++ b/annotations_filtered/ng95gpwSjZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [5.0, 7.1], [9.0, 10.59], [14.0, 15.7], [19.0, 19.11], [22.0, 26.45], [27.0, 29.89], [30.0, 32.09], [38.0, 40.22], [41.0, 42.09], [46.0, 46.18], [46.0, 46.41], [48.0, 48.96], [50.0, 52.83], [61.0, 61.74], [84.0, 84.64], [86.0, 87.12], [88.0, 88.11], [88.0, 89.14], [91.0, 92.89], [98.0, 99.93], [110.0, 110.61], [119.0, 120.83], [129.0, 129.61], [131.0, 132.27], [135.0, 136.41], [141.0, 142.37], [144.0, 145.35], [147.0, 146.82], [148.0, 147.82], [149.0, 149.67], [153.0, 153.3], [159.0, 162.4], [167.0, 167.8], [169.0, 170.33], [174.0, 174.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.21, 0.0, 0.0, 0.0, 58.89, 51.71, 55.11, 76.04, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["gong", 40.58], ["music", 28.15], ["singing bowl", 9.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.51], ["theremin", 7.06], ["didgeridoo", 2.84]], null, null, null], "duration": [0.22, 2.1, 1.59, 1.7, 0.11, 4.45, 2.89, 2.09, 2.22, 1.09, 0.18, 0.41, 0.96, 2.83, 0.74, 0.64, 1.12, 0.11, 1.14, 1.89, 1.93, 0.61, 1.83, 0.61, 1.27, 1.41, 1.37, 1.35, -0.18, -0.18, 0.67, 0.3, 3.4, 0.8, 1.33, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/ng9LMtcmqNs_filtered.json b/annotations_filtered/ng9LMtcmqNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11057908b07d38c3e5de9cbff9a83a0747fb17d4 --- /dev/null +++ b/annotations_filtered/ng9LMtcmqNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 25.19], [26.0, 30.4], [33.0, 32.73], [35.0, 34.89], [35.0, 37.44], [38.0, 38.25], [39.0, 40.46], [44.0, 44.64], [46.0, 46.45], [48.0, 48.3], [55.0, 55.02], [59.0, 61.28], [70.0, 72.76], [74.0, 75.32], [76.0, 76.33], [82.0, 104.16], [106.0, 113.41], [118.0, 118.08], [118.0, 120.48], [121.0, 124.43]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.98, 43.85, 0.0, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 72.6, 0.0, 0.0, 33.85, 32.97, 0.0, 51.88, 99.98], "audiomae_on_audioset": [null, [["speech", 29.74], ["music", 24.25], ["thunk", 13.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 65.06], ["music", 25.07], ["explosion", 3.2]], [["speech", 35.97], ["boing", 33.91], ["music", 16.52]], null, null, null], "duration": [4.19, 4.4, -0.27, -0.11, 2.44, 0.25, 1.46, 0.64, 0.45, 0.3, 0.02, 2.28, 2.76, 1.32, 0.33, 22.16, 7.41, 0.08, 2.48, 3.43]} \ No newline at end of file diff --git a/annotations_filtered/ngLX1uDh-eg_filtered.json b/annotations_filtered/ngLX1uDh-eg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9bae35ea95a4572fae153321520bc698ec5fc86 --- /dev/null +++ b/annotations_filtered/ngLX1uDh-eg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.45], [12.0, 13.85], [16.0, 17.27], [18.0, 19.21], [21.0, 50.53], [55.0, 56.02], [65.0, 66.66], [68.0, 69.84], [73.0, 73.67], [80.0, 81.8], [83.0, 83.13], [85.0, 84.87], [93.0, 94.05], [98.0, 99.59], [101.0, 108.99], [110.0, 111.01], [116.0, 116.46], [119.0, 120.18], [120.0, 120.23], [120.0, 122.45], [125.0, 125.68], [131.0, 131.52], [135.0, 135.11], [140.0, 139.75], [154.0, 169.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.97, 0.0, 0.0, 0.0, 0.0, 37.82, 0.0, 0.0, 0.0, 0.0, 36.78], "audiomae_on_audioset": [null, null, null, null, [["music", 71.93], ["electronic music", 3.43], ["drum and bass", 3.4]], null, null, null, null, null, null, null, null, null, [["music", 47.98], ["synthesizer", 22.54], ["keyboard (musical)", 4.39]], null, null, null, null, [["music", 53.58], ["musical instrument", 4.95], ["synthesizer", 4.0]], null, null, null, null, [["music", 55.79], ["didgeridoo", 7.98], ["singing", 3.91]]], "duration": [0.45, 1.85, 1.27, 1.21, 29.53, 1.02, 1.66, 1.84, 0.67, 1.8, 0.13, -0.13, 1.05, 1.59, 7.99, 1.01, 0.46, 1.18, 0.23, 2.45, 0.68, 0.52, 0.11, -0.25, 15.3]} \ No newline at end of file diff --git a/annotations_filtered/ngRthItc3Yc_filtered.json b/annotations_filtered/ngRthItc3Yc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bdecbca0080fc7088946684bd6d5d4c45cc4ecf --- /dev/null +++ b/annotations_filtered/ngRthItc3Yc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 131.67], [141.0, 143.99], [145.0, 146.11], [146.0, 153.15], [155.0, 155.68], [157.0, 157.74]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 31.52, 0.0, 30.82, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 21.8], ["music", 18.99], ["throbbing", 11.68]], null, [["hum", 41.79], ["throbbing", 24.0], ["music", 12.97]], null, null], "duration": [128.67, 2.99, 1.11, 7.15, 0.68, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/ngSM_wxh0lE_filtered.json b/annotations_filtered/ngSM_wxh0lE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..063d1350ff13e74f08aa7c41e8ef59cc6cb7d20a --- /dev/null +++ b/annotations_filtered/ngSM_wxh0lE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 57.55], [79.0, 79.57], [82.0, 83.13], [94.0, 94.68]], "keep_status": [true, false, false, false], "silence_prob": [31.71, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 56.83], ["crowd", 10.08], ["speech", 2.24]], null, null, null], "duration": [16.55, 0.57, 1.13, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/ngThTIjgCMw_filtered.json b/annotations_filtered/ngThTIjgCMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10d09f0826ab5b3b519bf8bdb635b6bcee5672da --- /dev/null +++ b/annotations_filtered/ngThTIjgCMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 37.23]], "keep_status": [false], "silence_prob": [30.04], "audiomae_on_audioset": [[["music", 40.85], ["throbbing", 26.09], ["hum", 23.53]]], "duration": [24.23]} \ No newline at end of file diff --git a/annotations_filtered/ngdsRt31sIc_filtered.json b/annotations_filtered/ngdsRt31sIc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88a973ddf842aff8aa106d0eb401607144c37245 --- /dev/null +++ b/annotations_filtered/ngdsRt31sIc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.16], [13.0, 31.04], [31.0, 31.14], [31.0, 31.63], [33.0, 35.16], [37.0, 46.33], [48.0, 73.62], [77.0, 77.13], [78.0, 80.35], [82.0, 109.44], [113.0, 113.49], [114.0, 114.94], [116.0, 116.85]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [31.87, 33.54, 0.0, 0.0, 34.27, 30.48, 30.46, 0.0, 75.88, 31.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 47.82], ["music", 8.68], ["explosion", 6.18]], [["speech", 62.58], ["music", 5.48], ["electric shaver, electric razor", 4.81]], null, null, [["speech", 12.83], ["whip", 6.84], ["music", 6.58]], [["music", 47.62], ["speech", 19.76], ["didgeridoo", 15.13]], [["music", 55.79], ["hum", 5.45], ["throbbing", 4.28]], null, null, [["grunt", 68.52], ["music", 7.24], ["groan", 3.86]], null, null, null], "duration": [4.16, 18.04, 0.14, 0.63, 2.16, 9.33, 25.62, 0.13, 2.35, 27.44, 0.49, 0.94, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/ngeORuhnajc_filtered.json b/annotations_filtered/ngeORuhnajc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ee8cbca36b3103fadf7801afb2219eebe87770f --- /dev/null +++ b/annotations_filtered/ngeORuhnajc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.17], [19.0, 33.39], [34.0, 36.37], [40.0, 59.51], [61.0, 63.86], [67.0, 67.96], [70.0, 70.78], [74.0, 75.96], [79.0, 86.76], [88.0, 103.79], [107.0, 107.91], [109.0, 121.36]], "keep_status": [false, true, false, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 37.89, 100.0, 45.3, 78.38, 0.0, 0.0, 0.0, 32.55, 32.02, 0.0, 32.12], "audiomae_on_audioset": [null, [["speech", 45.59], ["cattle, bovinae", 6.79], ["livestock, farm animals, working animals", 6.1]], null, [["speech", 71.32], ["music", 3.03], ["sidetone", 2.78]], null, null, null, null, [["cattle, bovinae", 23.54], ["livestock, farm animals, working animals", 21.54], ["speech", 19.5]], [["speech", 21.98], ["cattle, bovinae", 7.48], ["boat, water vehicle", 7.13]], null, [["speech", 23.02], ["fly, housefly", 17.23], ["insect", 11.09]]], "duration": [1.17, 14.39, 2.37, 19.51, 2.86, 0.96, 0.78, 1.96, 7.76, 15.79, 0.91, 12.36]} \ No newline at end of file diff --git a/annotations_filtered/nggWTNLFifA_filtered.json b/annotations_filtered/nggWTNLFifA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d77bb0238c47060ac077363e29eb1e1f971bdfa5 --- /dev/null +++ b/annotations_filtered/nggWTNLFifA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.84], [9.0, 50.97], [52.0, 52.46], [53.0, 60.0]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 57.25], "audiomae_on_audioset": [null, null, null, null], "duration": [1.84, 41.97, 0.46, 7.0]} \ No newline at end of file diff --git a/annotations_filtered/nh8mjiSlAws_filtered.json b/annotations_filtered/nh8mjiSlAws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..227a9a3198f0eaa18ddf09daae4856fb6e1cf961 --- /dev/null +++ b/annotations_filtered/nh8mjiSlAws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.3], [8.0, 8.6], [9.0, 9.96], [10.0, 11.28], [11.0, 12.77], [13.0, 14.4], [18.0, 22.42], [25.0, 25.89], [30.0, 30.77], [31.0, 31.23], [35.0, 35.26], [36.0, 36.09], [36.0, 39.92], [40.0, 54.14], [74.0, 75.63], [79.0, 79.08], [80.0, 80.91], [88.0, 89.61], [90.0, 90.8], [91.0, 92.89], [100.0, 104.5], [109.0, 109.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [71.14, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 51.6, 42.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 33.58], ["music", 14.59], ["mains hum", 14.48]], null, null, null, null, null, null, null, null], "duration": [3.3, 0.6, 0.96, 1.28, 1.77, 1.4, 4.42, 0.89, 0.77, 0.23, 0.26, 0.09, 3.92, 14.14, 1.63, 0.08, 0.91, 1.61, 0.8, 1.89, 4.5, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/nhKgGtFIqXY_filtered.json b/annotations_filtered/nhKgGtFIqXY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9d1a5facd0a7ca385faeea199b458152265d2dd --- /dev/null +++ b/annotations_filtered/nhKgGtFIqXY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.62], [6.0, 7.4], [11.0, 11.35], [12.0, 16.66], [19.0, 19.2], [20.0, 20.8], [24.0, 24.83], [26.0, 26.33], [27.0, 49.15], [51.0, 58.41], [60.0, 66.41], [69.0, 69.75], [71.0, 71.68], [74.0, 75.03], [75.0, 76.74], [78.0, 79.51], [80.0, 81.8], [82.0, 82.83], [84.0, 84.23], [87.0, 90.32], [91.0, 98.24], [101.0, 102.02], [103.0, 108.85], [110.0, 111.3], [112.0, 115.8], [119.0, 118.94], [120.0, 121.47], [122.0, 122.88], [125.0, 124.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 99.98, 99.87, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 95.78, 0.0, 99.84, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 1.4, 0.35, 4.66, 0.2, 0.8, 0.83, 0.33, 22.15, 7.41, 6.41, 0.75, 0.68, 1.03, 1.74, 1.51, 1.8, 0.83, 0.23, 3.32, 7.24, 1.02, 5.85, 1.3, 3.8, -0.06, 1.47, 0.88, -0.29]} \ No newline at end of file diff --git a/annotations_filtered/nhP_9bFQvjg_filtered.json b/annotations_filtered/nhP_9bFQvjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4f7a6ee2134eb5d31892777387f9baecb231eb8 --- /dev/null +++ b/annotations_filtered/nhP_9bFQvjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[116.0, 120.39]], "keep_status": [true], "silence_prob": [33.3], "audiomae_on_audioset": [[["music", 45.68], ["organ", 14.38], ["theremin", 7.31]]], "duration": [4.39]} \ No newline at end of file diff --git a/annotations_filtered/nhm5xXXqzqE_filtered.json b/annotations_filtered/nhm5xXXqzqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca329bd7f654bf548ffdb7d100619be210e46c6c --- /dev/null +++ b/annotations_filtered/nhm5xXXqzqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 88.45]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [41.45]} \ No newline at end of file diff --git a/annotations_filtered/nhomGXOMYmc_filtered.json b/annotations_filtered/nhomGXOMYmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..baa9f44339233eba7dcb2685176127fe7118860b --- /dev/null +++ b/annotations_filtered/nhomGXOMYmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.0], [7.0, 7.86], [9.0, 9.81], [11.0, 12.11], [13.0, 17.2], [23.0, 23.97], [26.0, 25.98], [27.0, 31.23], [32.0, 32.63], [34.0, 34.57], [44.0, 44.39], [45.0, 45.55], [46.0, 48.68], [49.0, 51.43], [55.0, 55.11], [64.0, 66.93], [70.0, 71.14], [73.0, 72.59], [76.0, 76.17], [77.0, 79.54], [84.0, 86.93], [88.0, 90.46], [91.0, 91.86], [104.0, 104.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 52.62, 0.0, 0.0, 34.9, 0.0, 0.0, 0.0, 0.0, 47.43, 74.13, 0.0, 41.56, 0.0, 0.0, 0.0, 46.33, 42.19, 37.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 63.0], ["sidetone", 21.09], ["speech synthesizer", 3.21]], null, null, null, null, [["speech", 48.84], ["music", 13.46], ["wind instrument, woodwind instrument", 7.27]], null, null, [["music", 23.24], ["didgeridoo", 9.77], ["thunk", 6.92]], null, null, null, [["music", 51.36], ["musical instrument", 8.82], ["didgeridoo", 3.35]], [["music", 37.31], ["speech", 21.26], ["musical instrument", 5.65]], [["music", 48.47], ["clang", 14.19], ["coin (dropping)", 10.4]], null, null], "duration": [1.0, 0.86, 0.81, 1.11, 4.2, 0.97, -0.02, 4.23, 0.63, 0.57, 0.39, 0.55, 2.68, 2.43, 0.11, 2.93, 1.14, -0.41, 0.17, 2.54, 2.93, 2.46, 0.86, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/nhvRzLcCk40_filtered.json b/annotations_filtered/nhvRzLcCk40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..215d3e27547d75c8d888bd29c2ba2611d3d8814f --- /dev/null +++ b/annotations_filtered/nhvRzLcCk40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.95], [20.0, 24.63], [27.0, 60.67], [63.0, 78.53], [80.0, 112.83], [114.0, 116.43], [119.0, 126.52], [131.0, 175.09], [176.0, 176.1]], "keep_status": [false, false, false, true, false, true, true, false, false], "silence_prob": [57.17, 70.02, 0.0, 30.81, 0.0, 29.62, 33.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 19.88], ["cacophony", 9.74], ["explosion", 8.21]], null, [["music", 33.79], ["hum", 6.3], ["mains hum", 5.33]], [["music", 29.67], ["synthesizer", 18.96], ["hum", 8.56]], null, null], "duration": [4.95, 4.63, 33.67, 15.53, 32.83, 2.43, 7.52, 44.09, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/nhwtMOjWerg_filtered.json b/annotations_filtered/nhwtMOjWerg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24855acdb704fe145b773824a03cefd2c2a0a58e --- /dev/null +++ b/annotations_filtered/nhwtMOjWerg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.1], [20.0, 22.13], [23.0, 23.92], [25.0, 25.81], [27.0, 27.53], [32.0, 36.48], [37.0, 37.81], [40.0, 41.1], [44.0, 45.22], [47.0, 48.3], [49.0, 50.43], [53.0, 53.32], [55.0, 55.56], [78.0, 80.33], [85.0, 86.81], [91.0, 91.59], [94.0, 94.24], [96.0, 97.48], [99.0, 100.52], [101.0, 110.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [99.88, 100.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.54, 0.0, 0.0, 0.0, 0.0, 0.0, 45.08], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.68], ["fart", 3.31], ["field recording", 2.89]], null, null, null, null, null, [["music", 44.38], ["throbbing", 9.24], ["hum", 8.09]]], "duration": [2.1, 2.13, 0.92, 0.81, 0.53, 4.48, 0.81, 1.1, 1.22, 1.3, 1.43, 0.32, 0.56, 2.33, 1.81, 0.59, 0.24, 1.48, 1.52, 9.05]} \ No newline at end of file diff --git a/annotations_filtered/niZKrt4XAZE_filtered.json b/annotations_filtered/niZKrt4XAZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d9f949efba071f59ebf6440e0138d30613582c1 --- /dev/null +++ b/annotations_filtered/niZKrt4XAZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [10.0, 12.33], [25.0, 25.51], [31.0, 31.58], [35.0, 36.88], [39.0, 39.68], [44.0, 43.95], [57.0, 58.6], [59.0, 65.57], [66.0, 65.94], [67.0, 67.12], [68.0, 68.77], [71.0, 71.51], [75.0, 75.17], [76.0, 80.37], [82.0, 84.86], [86.0, 87.56], [94.0, 98.59], [99.0, 123.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 82.79, 33.76], "audiomae_on_audioset": [null, [["speech", 60.07], ["music", 9.57], ["thunk", 7.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 68.08], ["fly, housefly", 2.55], ["stomach rumble", 2.51]]], "duration": [0.89, 2.33, 0.51, 0.58, 1.88, 0.68, -0.05, 1.6, 6.57, -0.06, 0.12, 0.77, 0.51, 0.17, 4.37, 2.86, 1.56, 4.59, 24.15]} \ No newline at end of file diff --git a/annotations_filtered/nic5WxX4BCo_filtered.json b/annotations_filtered/nic5WxX4BCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ab3a7d2e451049c8e8a81d4151168e35074a2ff --- /dev/null +++ b/annotations_filtered/nic5WxX4BCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 50.99], [54.0, 55.39], [58.0, 59.19], [59.0, 59.43], [59.0, 83.96], [88.0, 93.48], [93.0, 93.55], [95.0, 101.12]], "keep_status": [true, false, false, false, false, true, false, false], "silence_prob": [38.03, 0.0, 0.0, 0.0, 35.81, 29.88, 0.0, 30.83], "audiomae_on_audioset": [[["music", 43.01], ["hum", 11.49], ["mains hum", 5.16]], null, null, null, [["didgeridoo", 46.53], ["music", 33.0], ["speech", 2.99]], [["music", 36.22], ["synthesizer", 9.22], ["noise", 9.07]], null, [["music", 62.01], ["hum", 8.1], ["mains hum", 5.39]]], "duration": [11.99, 1.39, 1.19, 0.43, 24.96, 5.48, 0.55, 6.12]} \ No newline at end of file diff --git a/annotations_filtered/nifcKdVjpbw_filtered.json b/annotations_filtered/nifcKdVjpbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c8334439369637dc68fdea13c4ce49efdef3236 --- /dev/null +++ b/annotations_filtered/nifcKdVjpbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.18], [10.0, 10.57], [23.0, 25.59], [27.0, 27.45], [29.0, 29.05], [36.0, 35.83], [44.0, 46.55], [50.0, 50.62], [52.0, 52.57], [53.0, 53.15], [57.0, 57.64], [59.0, 58.95], [61.0, 61.69], [63.0, 108.24], [115.0, 116.11], [116.0, 119.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.74], ["speech", 34.1], ["hum", 8.1]]], "duration": [0.18, 0.57, 2.59, 0.45, 0.05, -0.17, 2.55, 0.62, 0.57, 0.15, 0.64, -0.05, 0.69, 45.24, 1.11, 3.65]} \ No newline at end of file diff --git a/annotations_filtered/nimkNFEKUkY_filtered.json b/annotations_filtered/nimkNFEKUkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d04b56570e7c7a8bdb81f17613fce44d182dfd7b --- /dev/null +++ b/annotations_filtered/nimkNFEKUkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.89], [8.0, 9.73], [10.0, 12.65], [13.0, 14.91], [16.0, 16.11], [17.0, 17.27], [18.0, 18.71], [19.0, 20.12], [21.0, 32.44], [33.0, 45.67], [48.0, 52.0], [54.0, 54.45], [59.0, 82.38], [83.0, 83.1], [84.0, 97.16]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 60.42, 0.0, 0.0, 0.0, 0.0, 0.0, 45.18, 40.22, 37.67, 0.0, 31.06, 0.0, 77.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 74.64], ["synthesizer", 8.2], ["musical instrument", 1.93]], [["music", 58.12], ["harmonic", 4.51], ["synthesizer", 4.23]], [["music", 57.07], ["bow-wow", 3.88], ["fowl", 3.45]], null, [["music", 89.51], ["independent music", 1.04], ["country", 0.89]], null, null], "duration": [1.89, 1.73, 2.65, 1.91, 0.11, 0.27, 0.71, 1.12, 11.44, 12.67, 4.0, 0.45, 23.38, 0.1, 13.16]} \ No newline at end of file diff --git a/annotations_filtered/nip7ztfMngk_filtered.json b/annotations_filtered/nip7ztfMngk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6fb6c49a64a1e7e1241341fac3c921e485af5b5 --- /dev/null +++ b/annotations_filtered/nip7ztfMngk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.81], [7.0, 8.51], [12.0, 15.28], [16.0, 17.46], [19.0, 18.86], [20.0, 24.53], [25.0, 29.57], [31.0, 37.35], [39.0, 42.04]], "keep_status": [false, false, true, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 42.3, 0.0, 0.0, 43.74, 36.28, 43.4, 48.48], "audiomae_on_audioset": [null, null, [["water", 15.15], ["gush", 7.35], ["hum", 6.64]], null, null, [["mains hum", 18.34], ["hum", 16.16], ["water", 13.69]], [["drip", 20.14], ["music", 6.75], ["whale vocalization", 5.59]], [["fly, housefly", 34.89], ["mosquito", 24.3], ["insect", 17.9]], [["speech", 69.41], ["inside, small room", 6.07], ["water", 4.18]]], "duration": [0.81, 1.51, 3.28, 1.46, -0.14, 4.53, 4.57, 6.35, 3.04]} \ No newline at end of file diff --git a/annotations_filtered/niul8Hy-3wk_filtered.json b/annotations_filtered/niul8Hy-3wk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7cd74075b14f829b68a1502c8a862bb83b11db19 --- /dev/null +++ b/annotations_filtered/niul8Hy-3wk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.45], [6.0, 7.65], [9.0, 9.32], [12.0, 13.86], [15.0, 16.12], [17.0, 18.76], [20.0, 21.1], [22.0, 23.04], [24.0, 25.93], [27.0, 27.85], [29.0, 30.38], [32.0, 32.56], [35.0, 36.22], [37.0, 38.89], [41.0, 45.22], [49.0, 49.42], [60.0, 60.59], [63.0, 66.88], [69.0, 70.9], [72.0, 74.09], [75.0, 76.49], [78.0, 79.62], [82.0, 83.1], [85.0, 86.91], [88.0, 89.8], [91.0, 92.58], [94.0, 95.57], [97.0, 98.46], [100.0, 103.62], [108.0, 109.48], [113.0, 114.03], [124.0, 123.89], [128.0, 132.17], [134.0, 139.01], [143.0, 155.14], [156.0, 163.49], [164.0, 165.3], [169.0, 169.79], [172.0, 173.11], [176.0, 187.42], [188.0, 188.89], [189.0, 189.9], [191.0, 191.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 99.99, 42.76, 82.43, 89.19, 0.0, 0.0, 0.0, 45.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 47.94], ["moo", 35.56], ["livestock, farm animals, working animals", 15.84]], null, null, null, null, null, [["music", 62.37], ["didgeridoo", 2.26], ["musical instrument", 2.14]], null, null, null], "duration": [0.45, 1.65, 0.32, 1.86, 1.12, 1.76, 1.1, 1.04, 1.93, 0.85, 1.38, 0.56, 1.22, 1.89, 4.22, 0.42, 0.59, 3.88, 1.9, 2.09, 1.49, 1.62, 1.1, 1.91, 1.8, 1.58, 1.57, 1.46, 3.62, 1.48, 1.03, -0.11, 4.17, 5.01, 12.14, 7.49, 1.3, 0.79, 1.11, 11.42, 0.89, 0.9, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/nixHRzTvCUE_filtered.json b/annotations_filtered/nixHRzTvCUE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7226b3fcfa28aa54a4f018561350c1f11dd82643 --- /dev/null +++ b/annotations_filtered/nixHRzTvCUE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 22.82], [24.0, 24.49], [27.0, 29.25], [33.0, 33.13], [35.0, 36.71], [38.0, 40.76], [42.0, 44.04], [44.0, 44.22], [44.0, 44.31], [44.0, 45.62], [46.0, 48.29], [49.0, 50.89], [52.0, 52.83], [54.0, 53.91], [58.0, 59.39], [60.0, 129.47], [129.0, 129.56], [130.0, 145.77], [149.0, 153.01], [156.0, 175.24]], "keep_status": [true, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true], "silence_prob": [31.9, 0.0, 35.02, 0.0, 0.0, 86.27, 46.68, 0.0, 0.0, 0.0, 33.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.02, 28.68, 30.7], "audiomae_on_audioset": [[["hum", 28.05], ["music", 9.44], ["mains hum", 6.24]], null, [["beatboxing", 10.27], ["gasp", 8.03], ["grunt", 7.83]], null, null, null, [["speech", 60.01], ["music", 16.93], ["radio", 3.36]], null, null, null, [["sound effect", 8.41], ["fly, housefly", 8.32], ["music", 7.12]], null, null, null, null, null, null, [["throbbing", 38.53], ["hum", 30.08], ["music", 12.56]], [["mains hum", 37.35], ["hum", 25.8], ["rumble", 4.92]], [["music", 45.38], ["hum", 10.13], ["mains hum", 5.85]]], "duration": [18.82, 0.49, 2.25, 0.13, 1.71, 2.76, 2.04, 0.22, 0.31, 1.62, 2.29, 1.89, 0.83, -0.09, 1.39, 69.47, 0.56, 15.77, 4.01, 19.24]} \ No newline at end of file diff --git a/annotations_filtered/njFOIvoN9pc_filtered.json b/annotations_filtered/njFOIvoN9pc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..696230d14a071dad7f538d1db8664e281287493a --- /dev/null +++ b/annotations_filtered/njFOIvoN9pc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 27.19], [29.0, 29.54], [32.0, 33.76], [35.0, 36.76], [38.0, 37.67], [47.0, 47.85], [57.0, 57.81], [58.0, 63.19], [64.0, 64.4], [70.0, 76.74], [78.0, 77.8], [78.0, 82.24], [83.0, 83.76], [89.0, 89.36], [90.0, 95.2], [97.0, 101.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.25, 0.0, 99.9, 0.0, 99.52, 0.0, 0.0, 99.95, 99.71], "audiomae_on_audioset": [[["music", 67.37], ["hum", 4.27], ["theremin", 3.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.19, 0.54, 1.76, 1.76, -0.33, 0.85, 0.81, 5.19, 0.4, 6.74, -0.2, 4.24, 0.76, 0.36, 5.2, 4.61]} \ No newline at end of file diff --git a/annotations_filtered/njHGa4f1LwY_filtered.json b/annotations_filtered/njHGa4f1LwY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b1e42a304ea1a15f53d0d5af80b1ccf77fa6c66 --- /dev/null +++ b/annotations_filtered/njHGa4f1LwY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.19], [2.0, 3.7], [5.0, 7.69], [11.0, 12.21], [15.0, 15.65], [16.0, 16.73], [17.0, 18.91], [21.0, 21.46], [22.0, 22.6], [24.0, 25.64], [27.0, 27.28], [29.0, 31.35], [32.0, 32.9], [33.0, 45.3], [48.0, 51.43], [53.0, 54.4], [55.0, 58.83], [60.0, 62.09], [67.0, 69.43], [71.0, 72.84], [75.0, 78.58], [81.0, 85.13], [86.0, 98.49], [100.0, 104.06], [107.0, 108.21], [109.0, 120.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 99.96, 100.0, 0.0, 100.0, 100.0, 99.99, 0.0, 99.95, 99.97, 99.59, 98.59, 0.0, 92.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 1.7, 2.69, 1.21, 0.65, 0.73, 1.91, 0.46, 0.6, 1.64, 0.28, 2.35, 0.9, 12.3, 3.43, 1.4, 3.83, 2.09, 2.43, 1.84, 3.58, 4.13, 12.49, 4.06, 1.21, 11.51]} \ No newline at end of file diff --git a/annotations_filtered/njfu6wuNC_w_filtered.json b/annotations_filtered/njfu6wuNC_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5969abc120c5d1d3a705dc65dabeeba877e48851 --- /dev/null +++ b/annotations_filtered/njfu6wuNC_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.23], [5.0, 6.51], [8.0, 8.6], [11.0, 11.48], [12.0, 13.04], [14.0, 15.08], [19.0, 23.95], [25.0, 28.66], [29.0, 33.0], [34.0, 41.91], [44.0, 43.61], [44.0, 44.95], [47.0, 51.65], [54.0, 58.65], [61.0, 61.62], [63.0, 66.16], [67.0, 69.92], [71.0, 75.78], [78.0, 80.1], [82.0, 82.14], [83.0, 85.14], [88.0, 89.94], [92.0, 103.6], [104.0, 106.42], [107.0, 108.8], [110.0, 112.73], [113.0, 113.46], [116.0, 116.38], [128.0, 128.46], [133.0, 133.73], [137.0, 137.29]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.01, 0.0, 0.0, 0.0, 0.0, 0.0, 42.02, 42.39, 36.73, 37.47, 0.0, 0.0, 35.85, 41.3, 0.0, 37.44, 47.82, 47.78, 62.37, 0.0, 51.02, 0.0, 43.4, 35.12, 0.0, 39.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 25.1], ["speech", 20.89], ["mains hum", 14.68]], [["hum", 45.03], ["mains hum", 37.99], ["music", 4.4]], [["speech", 32.54], ["mains hum", 32.26], ["hum", 19.34]], [["hum", 43.62], ["mains hum", 27.24], ["throbbing", 3.85]], null, null, [["speech", 45.23], ["hum", 26.02], ["mains hum", 8.98]], [["hum", 21.51], ["mains hum", 7.66], ["vehicle", 5.4]], null, [["mains hum", 34.78], ["hum", 32.13], ["music", 8.71]], [["hum", 16.39], ["mains hum", 7.97], ["vehicle", 5.81]], [["hum", 13.36], ["vehicle", 8.85], ["mains hum", 6.33]], null, null, null, null, [["hum", 44.26], ["mains hum", 32.43], ["whale vocalization", 8.76]], [["hum", 45.87], ["mains hum", 39.09], ["throbbing", 3.83]], null, [["mains hum", 49.74], ["hum", 37.84], ["throbbing", 1.54]], null, null, null, null, null], "duration": [2.23, 1.51, 0.6, 0.48, 1.04, 1.08, 4.95, 3.66, 4.0, 7.91, -0.39, 0.95, 4.65, 4.65, 0.62, 3.16, 2.92, 4.78, 2.1, 0.14, 2.14, 1.94, 11.6, 2.42, 1.8, 2.73, 0.46, 0.38, 0.46, 0.73, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/njlI82MV0gk_filtered.json b/annotations_filtered/njlI82MV0gk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98dab9af8a5d6e18315c5b534e243b83a525fc0d --- /dev/null +++ b/annotations_filtered/njlI82MV0gk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[90.0, 91.57], [92.0, 94.66], [96.0, 97.17], [116.0, 117.56], [125.0, 126.42], [128.0, 127.99]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 48.69, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 40.31], ["music", 33.81], ["gong", 3.79]], null, null, null, null], "duration": [1.57, 2.66, 1.17, 1.56, 1.42, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/njnCT6sD1Bk_filtered.json b/annotations_filtered/njnCT6sD1Bk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..680ad3efff3b1dc2daa19cd5ed62956d2f2e3256 --- /dev/null +++ b/annotations_filtered/njnCT6sD1Bk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.72], [7.0, 10.99], [12.0, 12.78], [17.0, 17.9], [18.0, 19.2], [21.0, 21.59], [25.0, 25.95], [30.0, 37.07], [39.0, 39.43], [41.0, 41.67], [43.0, 45.0], [49.0, 51.66], [53.0, 56.24], [58.0, 58.46]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, true, false], "silence_prob": [39.74, 39.63, 0.0, 0.0, 0.0, 0.0, 0.0, 36.34, 0.0, 0.0, 52.56, 30.8, 31.58, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 41.87], ["moo", 35.17], ["livestock, farm animals, working animals", 18.32]], [["speech", 54.84], ["music", 19.07], ["hum", 3.76]], null, null, null, null, null, [["speech", 16.48], ["music", 14.54], ["fly, housefly", 6.57]], null, null, null, [["whale vocalization", 48.8], ["music", 7.26], ["vehicle", 3.92]], [["speech", 29.28], ["music", 12.38], ["vehicle", 4.83]], null], "duration": [2.72, 3.99, 0.78, 0.9, 1.2, 0.59, 0.95, 7.07, 0.43, 0.67, 2.0, 2.66, 3.24, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/njq3H2iy2X0_filtered.json b/annotations_filtered/njq3H2iy2X0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9323f50b976120dc3e6c3e2550a7cecab38884d --- /dev/null +++ b/annotations_filtered/njq3H2iy2X0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.48], [6.0, 7.32], [8.0, 8.21], [16.0, 17.32], [31.0, 31.29], [40.0, 45.22], [47.0, 48.57], [49.0, 50.62], [58.0, 61.48], [81.0, 81.57], [83.0, 83.59], [85.0, 85.75], [87.0, 87.24], [100.0, 101.46], [104.0, 105.73], [110.0, 110.35], [117.0, 118.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 59.42, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 1.32, 0.21, 1.32, 0.29, 5.22, 1.57, 1.62, 3.48, 0.57, 0.59, 0.75, 0.24, 1.46, 1.73, 0.35, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/njz1p35e_EU_filtered.json b/annotations_filtered/njz1p35e_EU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a13359b0f51e5d7226559bd999fe2871677dcea8 --- /dev/null +++ b/annotations_filtered/njz1p35e_EU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.67], [11.0, 11.42], [24.0, 30.0], [33.0, 32.91], [36.0, 43.14], [43.0, 43.92], [44.0, 57.52], [70.0, 71.78], [75.0, 97.24], [99.0, 108.87], [111.0, 132.39], [132.0, 132.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.24, 0.0, 31.69, 0.0, 31.28, 0.0, 29.94, 29.79, 50.16, 0.0], "audiomae_on_audioset": [null, null, [["music", 76.17], ["theremin", 6.39], ["musical instrument", 4.25]], null, [["speech", 43.97], ["music", 17.29], ["sidetone", 14.87]], null, [["music", 45.4], ["speech", 26.66], ["musical instrument", 2.66]], null, [["music", 41.32], ["gong", 24.64], ["theremin", 9.74]], [["music", 54.32], ["theremin", 27.69], ["musical instrument", 7.08]], null, null], "duration": [1.67, 0.42, 6.0, -0.09, 7.14, 0.92, 13.52, 1.78, 22.24, 9.87, 21.39, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/nkQAhpLBok8_filtered.json b/annotations_filtered/nkQAhpLBok8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5e02c12dd65432b41633db446df8ff2c34bf257 --- /dev/null +++ b/annotations_filtered/nkQAhpLBok8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.47], [9.0, 10.15], [12.0, 13.58], [14.0, 16.44], [18.0, 23.53], [25.0, 24.75], [27.0, 47.66], [56.0, 56.96], [58.0, 65.01], [67.0, 68.5], [70.0, 76.54], [79.0, 86.49], [87.0, 93.63], [95.0, 106.03], [108.0, 108.24], [109.0, 109.59], [113.0, 114.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 56.86, 100.0, 0.0, 90.08, 0.0, 69.47, 0.0, 84.8, 76.37, 67.25, 56.63, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.47, 1.15, 1.58, 2.44, 5.53, -0.25, 20.66, 0.96, 7.01, 1.5, 6.54, 7.49, 6.63, 11.03, 0.24, 0.59, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/nkUx3zstpbU_filtered.json b/annotations_filtered/nkUx3zstpbU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d15cad41a08569af2fbd05c3f93353e4016330bb --- /dev/null +++ b/annotations_filtered/nkUx3zstpbU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.31], [10.0, 10.4], [12.0, 16.39], [17.0, 34.74], [37.0, 42.45], [45.0, 64.2], [65.0, 74.01], [76.0, 77.13], [78.0, 89.33], [90.0, 93.21], [94.0, 96.85], [100.0, 104.67], [106.0, 112.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 72.9, 75.23, 100.0, 30.44, 0.0, 53.84, 35.92, 28.99, 38.93, 29.81], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 73.79], ["explosion", 4.39], ["sidetone", 2.46]], null, null, [["cattle, bovinae", 48.79], ["livestock, farm animals, working animals", 23.73], ["moo", 18.28]], [["explosion", 41.34], ["speech", 26.65], ["eruption", 11.47]], [["sidetone", 73.43], ["boing", 5.27], ["speech", 4.8]], [["steam whistle", 61.26], ["music", 5.29], ["train", 3.81]]], "duration": [1.31, 0.4, 4.39, 17.74, 5.45, 19.2, 9.01, 1.13, 11.33, 3.21, 2.85, 4.67, 6.77]} \ No newline at end of file diff --git a/annotations_filtered/nkVK4JHRQfk_filtered.json b/annotations_filtered/nkVK4JHRQfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/nkVK4JHRQfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/nkelgV49oGQ_filtered.json b/annotations_filtered/nkelgV49oGQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2fc6fd2f40d8c63ec16270152997aa2fe47b092 --- /dev/null +++ b/annotations_filtered/nkelgV49oGQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.52], [13.0, 13.32], [17.0, 17.63], [20.0, 22.37], [23.0, 23.7], [24.0, 29.79], [34.0, 34.52], [36.0, 36.21], [39.0, 39.65], [40.0, 47.43], [48.0, 51.34], [58.0, 60.83], [64.0, 64.93], [68.0, 68.77], [70.0, 70.73], [74.0, 73.92], [75.0, 76.37], [78.0, 79.57], [84.0, 88.32], [90.0, 90.69], [92.0, 92.8], [94.0, 112.77], [114.0, 114.54], [116.0, 116.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.99, 0.0, 99.52, 0.0, 0.0, 0.0, 86.82, 81.53, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07, 0.0, 0.0, 66.03, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.32, 0.63, 2.37, 0.7, 5.79, 0.52, 0.21, 0.65, 7.43, 3.34, 2.83, 0.93, 0.77, 0.73, -0.08, 1.37, 1.57, 4.32, 0.69, 0.8, 18.77, 0.54, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/nkuKrymtuCg_filtered.json b/annotations_filtered/nkuKrymtuCg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..863ef5108e83d2184491896c57e988b26a9f633a --- /dev/null +++ b/annotations_filtered/nkuKrymtuCg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.28], [12.0, 33.4], [34.0, 35.09], [37.0, 37.76], [40.0, 48.24], [49.0, 52.42], [54.0, 54.87], [55.0, 59.17], [60.0, 94.44], [96.0, 100.11], [102.0, 103.17]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [75.23, 33.91, 0.0, 0.0, 99.8, 99.31, 0.0, 78.04, 0.0, 29.48, 0.0], "audiomae_on_audioset": [null, [["breaking", 38.56], ["glass", 6.61], ["boing", 4.54]], null, null, null, null, null, null, null, [["music", 41.88], ["carnatic music", 15.81], ["musical instrument", 7.35]], null], "duration": [9.28, 21.4, 1.09, 0.76, 8.24, 3.42, 0.87, 4.17, 34.44, 4.11, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/nkwyt0ytVJI_filtered.json b/annotations_filtered/nkwyt0ytVJI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9243cff7b9e61855ae8acaf06bfe2dc283317594 --- /dev/null +++ b/annotations_filtered/nkwyt0ytVJI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 54.51], [56.0, 56.22], [57.0, 60.57], [65.0, 79.14], [90.0, 90.37], [91.0, 100.52], [104.0, 105.39], [108.0, 119.82]], "keep_status": [false, false, false, false, false, true, false, true], "silence_prob": [72.01, 0.0, 51.44, 41.32, 0.0, 42.28, 0.0, 32.82], "audiomae_on_audioset": [null, null, null, [["speech", 59.07], ["hum", 11.48], ["mains hum", 6.06]], null, [["speech", 21.56], ["livestock, farm animals, working animals", 16.93], ["cattle, bovinae", 13.16]], null, [["explosion", 14.82], ["speech", 12.0], ["burst, pop", 9.75]]], "duration": [24.51, 0.22, 3.57, 14.14, 0.37, 9.52, 1.39, 11.82]} \ No newline at end of file diff --git a/annotations_filtered/nl8PQAfhi28_filtered.json b/annotations_filtered/nl8PQAfhi28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f1dd26bbd580fe25a67755c6fddc4c281ea469f --- /dev/null +++ b/annotations_filtered/nl8PQAfhi28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.98], [6.0, 6.18], [7.0, 10.2], [12.0, 12.75], [16.0, 16.46], [18.0, 21.1], [23.0, 23.68], [31.0, 33.69], [36.0, 38.16], [39.0, 39.09], [41.0, 41.25], [42.0, 43.83], [46.0, 46.45], [49.0, 49.08], [51.0, 52.25], [55.0, 56.05], [67.0, 69.43]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 37.27, 0.0, 0.0, 55.74, 0.0, 53.91, 46.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.98], "audiomae_on_audioset": [null, null, [["speech", 31.1], ["sidetone", 11.05], ["hum", 7.82]], null, null, null, null, null, [["whale vocalization", 14.43], ["insect", 11.73], ["mains hum", 9.88]], null, null, null, null, null, null, null, [["whale vocalization", 18.67], ["music", 12.36], ["didgeridoo", 10.33]]], "duration": [0.98, 0.18, 3.2, 0.75, 0.46, 3.1, 0.68, 2.69, 2.16, 0.09, 0.25, 1.83, 0.45, 0.08, 1.25, 1.05, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/nlH_5ejw7Gs_filtered.json b/annotations_filtered/nlH_5ejw7Gs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14fa0c0c4f35bb86936192a199fbd908b795bf79 --- /dev/null +++ b/annotations_filtered/nlH_5ejw7Gs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 35.82], [36.0, 43.31], [44.0, 45.01], [45.0, 45.12], [45.0, 84.23], [85.0, 84.96], [87.0, 87.96], [89.0, 93.61], [96.0, 98.37], [99.0, 106.44], [107.0, 115.65], [116.0, 116.01], [116.0, 116.8], [117.0, 117.73], [119.0, 122.22], [126.0, 129.64], [133.0, 146.04], [148.0, 162.73]], "keep_status": [true, false, false, false, false, false, false, true, true, true, false, false, false, false, true, false, false, true], "silence_prob": [42.96, 57.01, 0.0, 0.0, 0.0, 0.0, 0.0, 31.14, 32.28, 35.84, 34.6, 0.0, 0.0, 0.0, 33.78, 33.23, 31.09, 33.46], "audiomae_on_audioset": [[["speech", 33.51], ["cattle, bovinae", 8.66], ["horse", 6.51]], null, null, null, null, null, null, [["insect", 18.24], ["livestock, farm animals, working animals", 17.4], ["fly, housefly", 9.07]], [["civil defense siren", 26.07], ["crowd", 8.24], ["cheering", 6.05]], [["music", 28.3], ["animal", 12.75], ["speech", 7.25]], [["bagpipes", 52.09], ["music", 16.28], ["vehicle", 4.01]], null, null, null, [["music", 25.68], ["speech", 16.54], ["skateboard", 4.5]], [["music", 57.43], ["speech", 12.38], ["bagpipes", 2.7]], [["cattle, bovinae", 31.03], ["moo", 28.48], ["livestock, farm animals, working animals", 18.23]], [["whale vocalization", 52.84], ["animal", 7.53], ["fly, housefly", 3.21]]], "duration": [14.82, 7.31, 1.01, 0.12, 39.23, -0.04, 0.96, 4.61, 2.37, 7.44, 8.65, 0.01, 0.8, 0.73, 3.22, 3.64, 13.04, 14.73]} \ No newline at end of file diff --git a/annotations_filtered/nlJqcYb65o0_filtered.json b/annotations_filtered/nlJqcYb65o0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d119775aae6df2c60025fdecd3ba032a0e5b2a9 --- /dev/null +++ b/annotations_filtered/nlJqcYb65o0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[102.0, 136.32], [139.0, 146.65]], "keep_status": [false, true], "silence_prob": [0.0, 32.0], "audiomae_on_audioset": [null, [["music", 48.25], ["speech", 5.68], ["vehicle", 5.0]]], "duration": [34.32, 7.65]} \ No newline at end of file diff --git a/annotations_filtered/nlOF6YhAoJQ_filtered.json b/annotations_filtered/nlOF6YhAoJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78d8f67b1e252409cd23c455c74734a2c1f42893 --- /dev/null +++ b/annotations_filtered/nlOF6YhAoJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.34], [14.0, 16.04], [17.0, 21.95], [22.0, 30.48], [33.0, 34.25], [44.0, 44.32], [51.0, 51.12], [52.0, 56.25], [57.0, 60.49], [62.0, 65.99], [67.0, 66.6], [67.0, 66.7], [67.0, 70.11], [72.0, 72.57], [73.0, 72.99], [75.0, 78.46], [80.0, 80.74], [81.0, 101.04], [102.0, 103.69], [104.0, 110.83], [111.0, 112.7], [114.0, 130.44], [131.0, 133.52], [134.0, 135.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 100.0, 96.04, 0.0, 0.0, 0.0, 99.82, 99.88, 99.9, 0.0, 0.0, 100.0, 0.0, 0.0, 99.82, 0.0, 99.91, 0.0, 99.99, 0.0, 99.99, 82.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 2.04, 4.95, 8.48, 1.25, 0.32, 0.12, 4.25, 3.49, 3.99, -0.4, -0.3, 3.11, 0.57, -0.01, 3.46, 0.74, 20.04, 1.69, 6.83, 1.7, 16.44, 2.52, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/nm86_ZWeUzk_filtered.json b/annotations_filtered/nm86_ZWeUzk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea59904c509fd5005a1c7376a6fc9f1eaa1716c2 --- /dev/null +++ b/annotations_filtered/nm86_ZWeUzk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.65], [6.0, 13.02], [13.0, 13.63], [18.0, 22.49], [30.0, 40.14], [45.0, 49.18], [54.0, 60.76], [61.0, 76.32], [85.0, 87.34], [91.0, 96.01], [102.0, 103.25], [107.0, 107.5], [108.0, 108.73], [110.0, 110.29], [122.0, 130.94], [135.0, 135.67], [139.0, 139.4], [139.0, 144.63]], "keep_status": [false, false, false, true, true, true, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 29.12, 0.0, 28.63, 28.66, 34.38, 28.65, 31.97, 36.04, 29.69, 0.0, 0.0, 0.0, 0.0, 28.54, 0.0, 0.0, 28.17], "audiomae_on_audioset": [null, [["mains hum", 36.13], ["hum", 25.19], ["speech", 11.62]], null, [["breaking", 28.92], ["music", 17.03], ["speech", 10.81]], [["music", 48.29], ["cowbell", 5.21], ["thump, thud", 3.55]], [["music", 32.01], ["throbbing", 19.13], ["speech", 14.06]], [["sidetone", 45.08], ["music", 18.7], ["throbbing", 8.59]], [["speech", 37.4], ["music", 37.09], ["didgeridoo", 11.96]], [["speech", 43.2], ["music", 23.02], ["throbbing", 4.25]], [["music", 31.12], ["throbbing", 18.08], ["hum", 11.19]], null, null, null, null, [["explosion", 33.7], ["burst, pop", 8.03], ["smash, crash", 7.51]], null, null, [["speech", 79.61], ["music", 6.24], ["vehicle", 1.75]]], "duration": [0.65, 7.02, 0.63, 4.49, 10.14, 4.18, 6.76, 15.32, 2.34, 5.01, 1.25, 0.5, 0.73, 0.29, 8.94, 0.67, 0.4, 5.63]} \ No newline at end of file diff --git a/annotations_filtered/nma6daFY6b0_filtered.json b/annotations_filtered/nma6daFY6b0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..258775f7466f58bfb43a834ce84838160f3ef987 --- /dev/null +++ b/annotations_filtered/nma6daFY6b0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.79], [5.0, 6.52], [9.0, 9.19], [12.0, 12.29], [13.0, 13.68], [15.0, 16.56], [18.0, 18.5], [20.0, 22.99], [24.0, 29.54], [30.0, 31.06], [36.0, 36.14], [38.0, 38.67], [40.0, 41.05], [43.0, 44.27], [46.0, 47.66], [52.0, 52.54], [55.0, 62.02], [65.0, 66.45], [75.0, 75.78], [77.0, 77.21], [78.0, 87.54], [88.0, 130.35]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.79, 48.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.4, 0.0, 0.0, 0.0, 34.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["throbbing", 32.75], ["hum", 20.64], ["music", 7.06]], [["music", 37.17], ["hum", 12.33], ["electronic music", 9.28]], null, null, null, null, null, null, null, [["throbbing", 52.22], ["hum", 25.49], ["music", 9.36]], null, null, null, [["breaking", 37.95], ["hum", 19.2], ["music", 8.72]], null], "duration": [0.79, 1.52, 0.19, 0.29, 0.68, 1.56, 0.5, 2.99, 5.54, 1.06, 0.14, 0.67, 1.05, 1.27, 1.66, 0.54, 7.02, 1.45, 0.78, 0.21, 9.54, 42.35]} \ No newline at end of file diff --git a/annotations_filtered/nmaCobIvt2w_filtered.json b/annotations_filtered/nmaCobIvt2w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ede4a7d56b578ca903b7fa3488dfb55a9f66bf3 --- /dev/null +++ b/annotations_filtered/nmaCobIvt2w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.94], [10.0, 11.6], [14.0, 15.94], [28.0, 38.31], [44.0, 45.25], [48.0, 48.12], [51.0, 55.43], [58.0, 58.14], [68.0, 68.23], [71.0, 70.7], [73.0, 73.57], [77.0, 81.04], [82.0, 91.83], [103.0, 106.1], [111.0, 135.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 32.48, 0.0, 0.0, 31.85, 0.0, 0.0, 0.0, 0.0, 35.33, 33.7, 38.56, 31.15], "audiomae_on_audioset": [null, null, null, [["music", 64.98], ["electronic music", 8.24], ["trance music", 7.38]], null, null, [["music", 47.78], ["throbbing", 15.77], ["trance music", 10.38]], null, null, null, null, [["music", 61.55], ["speech", 22.48], ["electronic music", 3.2]], [["music", 72.72], ["throbbing", 8.98], ["hum", 6.23]], [["music", 43.1], ["sidetone", 6.52], ["throbbing", 6.19]], [["music", 53.46], ["speech", 4.81], ["throbbing", 4.36]]], "duration": [-0.06, 1.6, 1.94, 10.31, 1.25, 0.12, 4.43, 0.14, 0.23, -0.3, 0.57, 4.04, 9.83, 3.1, 24.57]} \ No newline at end of file diff --git a/annotations_filtered/nn-nEk5kpz0_filtered.json b/annotations_filtered/nn-nEk5kpz0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d7ffed67685f2d3aa0d3a0e5d174dff7cf1655d --- /dev/null +++ b/annotations_filtered/nn-nEk5kpz0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 11.4], [13.0, 14.2], [19.0, 19.18], [22.0, 22.03], [25.0, 25.2], [32.0, 32.64], [35.0, 35.56], [37.0, 37.02], [38.0, 39.04], [46.0, 46.8], [53.0, 57.0], [57.0, 58.01], [59.0, 62.34], [67.0, 67.96], [71.0, 77.75], [88.0, 88.21], [90.0, 90.49], [92.0, 96.45], [98.0, 99.06], [100.0, 100.25], [102.0, 106.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true], "silence_prob": [36.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.9, 0.0, 35.17, 0.0, 33.52, 0.0, 0.0, 31.2, 0.0, 0.0, 35.33], "audiomae_on_audioset": [[["speech", 39.13], ["sidetone", 30.89], ["hum", 5.43]], null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 15.78], ["hum", 14.87], ["music", 10.08]], null, [["music", 21.95], ["hum", 14.76], ["mains hum", 13.19]], null, null, [["didgeridoo", 51.29], ["music", 37.99], ["musical instrument", 4.79]], null, null, [["hum", 27.44], ["mains hum", 22.43], ["noise", 8.59]]], "duration": [10.4, 1.2, 0.18, 0.03, 0.2, 0.64, 0.56, 0.02, 1.04, 0.8, 4.0, 1.01, 3.34, 0.96, 6.75, 0.21, 0.49, 4.45, 1.06, 0.25, 4.19]} \ No newline at end of file diff --git a/annotations_filtered/nn1qvGiHvLc_filtered.json b/annotations_filtered/nn1qvGiHvLc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..025426a4a8b2594554d567d0cfabcacd0040309b --- /dev/null +++ b/annotations_filtered/nn1qvGiHvLc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 104.26], [107.0, 109.58], [114.0, 117.81], [120.0, 120.19]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 28.47, 29.73, 0.0], "audiomae_on_audioset": [null, [["music", 24.14], ["speech", 20.05], ["fart", 17.76]], [["music", 65.58], ["sidetone", 11.68], ["throbbing", 6.17]], null], "duration": [73.26, 2.58, 3.81, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/nn3I6-DBLJM_filtered.json b/annotations_filtered/nn3I6-DBLJM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1db1e791bd4987bda81b4b093821fb0c861e6854 --- /dev/null +++ b/annotations_filtered/nn3I6-DBLJM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.1], [12.0, 12.14], [15.0, 15.63], [58.0, 59.49], [61.0, 61.65], [72.0, 71.86], [96.0, 96.36], [110.0, 117.44], [130.0, 131.16], [142.0, 142.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.34, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.1, 0.14, 0.63, 1.49, 0.65, -0.14, 0.36, 7.44, 1.16, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/nnESedN4vSI_filtered.json b/annotations_filtered/nnESedN4vSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05df66e0c4d2833866c266d640257d4b352073a2 --- /dev/null +++ b/annotations_filtered/nnESedN4vSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.69], [14.0, 15.21], [19.0, 19.2], [26.0, 26.72], [36.0, 38.45], [40.0, 47.14], [51.0, 54.43], [73.0, 73.52], [79.0, 79.19], [81.0, 80.6], [81.0, 81.8], [86.0, 85.75], [99.0, 100.65], [102.0, 102.2], [104.0, 104.84], [106.0, 106.83], [108.0, 110.59], [113.0, 113.07], [114.0, 117.09], [119.0, 119.45], [120.0, 121.27], [122.0, 121.81], [122.0, 123.89], [125.0, 130.33]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.89, 60.7, 38.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.06, 0.0, 42.33, 0.0, 0.0, 0.0, 0.0, 28.59], "audiomae_on_audioset": [null, null, null, null, [["music", 47.95], ["throbbing", 13.68], ["synthesizer", 9.12]], null, [["sine wave", 39.99], ["chirp tone", 7.13], ["noise", 6.35]], null, null, null, null, null, null, null, null, null, [["fly, housefly", 28.31], ["insect", 13.96], ["hum", 8.38]], null, [["fly, housefly", 17.43], ["music", 17.34], ["speech", 11.06]], null, null, null, null, [["music", 65.35], ["synthesizer", 3.43], ["throbbing", 3.15]]], "duration": [0.69, 1.21, 0.2, 0.72, 2.45, 7.14, 3.43, 0.52, 0.19, -0.4, 0.8, -0.25, 1.65, 0.2, 0.84, 0.83, 2.59, 0.07, 3.09, 0.45, 1.27, -0.19, 1.89, 5.33]} \ No newline at end of file diff --git a/annotations_filtered/nna-IuI5SDk_filtered.json b/annotations_filtered/nna-IuI5SDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7a16e249f6de6fbd65823e101f395ff507e40a9 --- /dev/null +++ b/annotations_filtered/nna-IuI5SDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 11.28], [13.0, 19.6], [20.0, 24.93], [45.0, 62.06], [65.0, 68.55], [75.0, 81.6], [82.0, 82.86], [84.0, 88.5], [92.0, 109.78], [112.0, 114.25], [116.0, 120.63], [122.0, 131.23]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [45.36, 49.27, 49.5, 39.17, 44.96, 48.1, 0.0, 46.9, 41.52, 47.98, 42.3, 45.11], "audiomae_on_audioset": [[["music", 68.37], ["didgeridoo", 7.72], ["swing music", 3.72]], [["music", 58.82], ["didgeridoo", 11.58], ["musical instrument", 3.44]], [["music", 68.34], ["didgeridoo", 3.82], ["singing", 2.04]], [["music", 63.39], ["didgeridoo", 6.9], ["electronic music", 2.24]], [["music", 63.89], ["didgeridoo", 12.09], ["musical instrument", 2.27]], [["music", 87.5], ["musical instrument", 1.39], ["didgeridoo", 1.19]], null, [["music", 70.42], ["throbbing", 3.45], ["singing", 1.83]], [["music", 53.95], ["didgeridoo", 10.44], ["singing", 4.47]], [["music", 55.38], ["speech", 15.74], ["musical instrument", 2.13]], [["music", 67.16], ["didgeridoo", 4.84], ["sitar", 1.87]], [["music", 69.26], ["didgeridoo", 12.75], ["synthesizer", 1.83]]], "duration": [11.28, 6.6, 4.93, 17.06, 3.55, 6.6, 0.86, 4.5, 17.78, 2.25, 4.63, 9.23]} \ No newline at end of file diff --git a/annotations_filtered/no5XxM0OY4o_filtered.json b/annotations_filtered/no5XxM0OY4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf2bde1928ff43e32441d03ddfe8d086e5edb3d9 --- /dev/null +++ b/annotations_filtered/no5XxM0OY4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.13], [28.0, 31.45], [39.0, 40.96], [44.0, 55.17], [66.0, 77.21], [99.0, 99.77], [101.0, 101.34]], "keep_status": [false, true, false, true, true, false, false], "silence_prob": [94.07, 28.26, 0.0, 38.15, 30.55, 0.0, 0.0], "audiomae_on_audioset": [null, [["whack, thwack", 54.69], ["thunk", 9.68], ["speech", 2.29]], null, [["music", 22.58], ["hum", 7.78], ["groan", 5.85]], [["fly, housefly", 21.23], ["speech", 19.25], ["insect", 19.03]], null, null], "duration": [2.13, 3.45, 1.96, 11.17, 11.21, 0.77, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/no7XR7s8Z7o_filtered.json b/annotations_filtered/no7XR7s8Z7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1c2d989e634b0be67a60303a65b416e7f25238e --- /dev/null +++ b/annotations_filtered/no7XR7s8Z7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.26], [13.0, 53.91]], "keep_status": [false, false], "silence_prob": [30.56, 0.0], "audiomae_on_audioset": [[["music", 77.92], ["skidding", 3.4], ["synthesizer", 3.19]], null], "duration": [11.26, 40.91]} \ No newline at end of file diff --git a/annotations_filtered/noLAdkr7WzY_filtered.json b/annotations_filtered/noLAdkr7WzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ced8dcc9fd17be692864bb18063eacdd4401ad2e --- /dev/null +++ b/annotations_filtered/noLAdkr7WzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 32.07], [32.0, 34.01], [36.0, 39.04], [40.0, 41.07], [42.0, 42.75], [44.0, 45.62], [48.0, 50.09], [54.0, 54.33], [56.0, 56.05], [58.0, 60.56], [62.0, 62.85], [65.0, 65.26], [68.0, 69.3], [69.0, 72.1], [74.0, 74.49], [76.0, 76.76], [78.0, 78.51], [80.0, 82.29], [85.0, 85.09], [87.0, 87.64], [90.0, 90.76], [92.0, 93.87], [95.0, 98.56], [100.0, 102.0]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.91, 90.25, 0.0, 0.0, 0.0, 47.9, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 82.25, 0.0, 0.0, 0.0, 0.0, 82.61, 87.19], "audiomae_on_audioset": [null, [["sine wave", 18.68], ["speech", 16.08], ["dial tone", 10.11]], null, null, null, null, [["frog", 46.51], ["speech", 15.55], ["telephone", 5.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [30.07, 2.01, 3.04, 1.07, 0.75, 1.62, 2.09, 0.33, 0.05, 2.56, 0.85, 0.26, 1.3, 3.1, 0.49, 0.76, 0.51, 2.29, 0.09, 0.64, 0.76, 1.87, 3.56, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/noT3bA3Ibyk_filtered.json b/annotations_filtered/noT3bA3Ibyk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09cb4f5903d05f9283ea5adafb9462dd2b840e03 --- /dev/null +++ b/annotations_filtered/noT3bA3Ibyk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 12.93], [14.0, 20.63], [26.0, 27.72], [29.0, 33.93], [36.0, 69.57], [71.0, 71.59], [76.0, 77.18], [78.0, 81.19], [84.0, 85.65], [89.0, 98.34], [101.0, 101.76], [104.0, 106.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [72.6, 57.09, 0.0, 46.4, 0.0, 0.0, 0.0, 63.96, 0.0, 93.91, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, [["fart", 70.38], ["speech", 6.96], ["livestock, farm animals, working animals", 3.87]], null, null, null, null, null, null, null, null], "duration": [7.93, 6.63, 1.72, 4.93, 33.57, 0.59, 1.18, 3.19, 1.65, 9.34, 0.76, 2.25]} \ No newline at end of file diff --git a/annotations_filtered/noq0Lb6lVEI_filtered.json b/annotations_filtered/noq0Lb6lVEI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31abcc3339641f2e64155f70277743ff44233bdb --- /dev/null +++ b/annotations_filtered/noq0Lb6lVEI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.52], [11.0, 10.56], [15.0, 19.33], [23.0, 46.85], [48.0, 61.4], [63.0, 64.3], [66.0, 71.07], [84.0, 93.48], [94.0, 95.27], [114.0, 114.32], [120.0, 120.14], [127.0, 130.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.61, 0.0, 40.81, 37.36, 35.59, 0.0, 30.71, 30.68, 0.0, 0.0, 0.0, 36.8], "audiomae_on_audioset": [[["speech", 35.8], ["music", 33.75], ["fart", 2.41]], null, [["music", 73.65], ["synthesizer", 8.88], ["sidetone", 3.7]], [["music", 63.48], ["speech", 14.69], ["coin (dropping)", 9.16]], [["quack", 40.98], ["music", 32.12], ["duck", 6.63]], null, [["speech", 75.88], ["music", 8.84], ["boing", 2.71]], [["speech", 43.9], ["music", 36.41], ["electric shaver, electric razor", 6.48]], null, null, null, [["music", 62.32], ["speech", 9.96], ["didgeridoo", 8.34]]], "duration": [6.52, -0.44, 4.33, 23.85, 13.4, 1.3, 5.07, 9.48, 1.27, 0.32, 0.14, 3.0]} \ No newline at end of file diff --git a/annotations_filtered/notFMAwEQeM_filtered.json b/annotations_filtered/notFMAwEQeM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21fcf38e4f69d20056801644a7ace57128b7abff --- /dev/null +++ b/annotations_filtered/notFMAwEQeM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.54], [10.0, 11.4], [13.0, 17.51], [41.0, 42.35], [49.0, 62.29], [72.0, 71.95], [75.0, 79.37], [89.0, 90.05], [93.0, 93.28], [95.0, 95.67], [100.0, 102.68], [105.0, 107.86], [110.0, 123.69], [128.0, 161.81], [165.0, 165.32], [167.0, 167.22], [169.0, 193.08], [195.0, 195.18], [199.0, 200.01], [201.0, 229.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.8, 0.0, 31.53, 0.0, 37.4, 0.0, 0.0, 0.0, 32.3, 29.43, 29.13, 0.0, 0.0, 0.0, 28.51, 0.0, 0.0, 30.45], "audiomae_on_audioset": [null, null, [["music", 67.02], ["throbbing", 14.08], ["hum", 5.89]], null, [["music", 76.75], ["carnatic music", 4.33], ["musical instrument", 2.88]], null, [["music", 50.9], ["throbbing", 14.82], ["hum", 5.06]], null, null, null, [["hum", 20.94], ["mains hum", 18.94], ["rumble", 11.5]], [["speech", 23.88], ["buzz", 10.25], ["vehicle", 7.13]], [["buzz", 43.65], ["music", 18.1], ["electric shaver, electric razor", 7.11]], null, null, null, [["music", 58.46], ["throbbing", 10.34], ["buzz", 7.36]], null, null, [["music", 67.12], ["scary music", 22.92], ["speech", 3.68]]], "duration": [0.54, 1.4, 4.51, 1.35, 13.29, -0.05, 4.37, 1.05, 0.28, 0.67, 2.68, 2.86, 13.69, 33.81, 0.32, 0.22, 24.08, 0.18, 1.01, 28.78]} \ No newline at end of file diff --git a/annotations_filtered/nouLQZCXW4A_filtered.json b/annotations_filtered/nouLQZCXW4A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7591e446f93ae222c1914cf0cf942d454377e7b5 --- /dev/null +++ b/annotations_filtered/nouLQZCXW4A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.83], [9.0, 16.93], [20.0, 20.55], [22.0, 22.01], [30.0, 29.93], [38.0, 38.91], [42.0, 50.94], [64.0, 64.39]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 63.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.83, 7.93, 0.55, 0.01, -0.07, 0.91, 8.94, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/np-ndDy9YJ0_filtered.json b/annotations_filtered/np-ndDy9YJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ee4740151dafa85a2ea8919c9b84164019ca9e7 --- /dev/null +++ b/annotations_filtered/np-ndDy9YJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.21], [10.0, 10.44], [11.0, 11.91], [31.0, 31.9], [33.0, 33.3], [35.0, 36.75], [53.0, 53.7], [65.0, 66.5], [73.0, 73.03], [86.0, 86.59], [94.0, 96.21], [107.0, 108.01], [109.0, 109.29], [110.0, 109.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.93, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 41.05], ["guitar", 4.87], ["cough", 4.0]], null, null, null], "duration": [0.21, 0.44, 0.91, 0.9, 0.3, 1.75, 0.7, 1.5, 0.03, 0.59, 2.21, 1.01, 0.29, -0.1]} \ No newline at end of file diff --git a/annotations_filtered/npSYPN8LXas_filtered.json b/annotations_filtered/npSYPN8LXas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12d09db5fe03e49074c22e34051e01e16c837011 --- /dev/null +++ b/annotations_filtered/npSYPN8LXas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.14], [9.0, 10.13], [13.0, 13.49], [15.0, 14.96], [39.0, 39.8], [49.0, 50.08], [51.0, 51.44], [53.0, 53.05], [54.0, 55.19], [59.0, 60.32], [61.0, 61.64], [65.0, 65.58], [68.0, 68.61], [75.0, 76.15], [77.0, 77.79], [78.0, 78.39], [82.0, 82.71], [88.0, 88.77], [105.0, 106.42], [108.0, 108.65], [109.0, 110.02], [111.0, 111.54], [114.0, 115.53], [118.0, 118.03], [122.0, 122.66], [162.0, 162.73], [164.0, 164.86], [167.0, 168.12]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 34.37], ["insect", 15.49], ["mosquito", 7.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.14, 1.13, 0.49, -0.04, 0.8, 1.08, 0.44, 0.05, 1.19, 1.32, 0.64, 0.58, 0.61, 1.15, 0.79, 0.39, 0.71, 0.77, 1.42, 0.65, 1.02, 0.54, 1.53, 0.03, 0.66, 0.73, 0.86, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/npaJix_AarM_filtered.json b/annotations_filtered/npaJix_AarM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca6336695ba253a835eb367a45893c482015e16e --- /dev/null +++ b/annotations_filtered/npaJix_AarM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.88], [12.0, 12.46], [13.0, 13.78], [16.0, 16.24], [17.0, 20.61], [22.0, 21.95], [22.0, 51.17], [52.0, 53.79], [66.0, 66.14], [72.0, 75.59], [78.0, 78.49], [81.0, 81.33], [84.0, 84.16], [85.0, 86.29], [87.0, 87.0], [88.0, 98.29], [100.0, 100.3], [101.0, 104.73], [107.0, 108.92], [110.0, 115.26], [116.0, 117.51], [118.0, 125.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true], "silence_prob": [76.37, 0.0, 0.0, 0.0, 66.15, 0.0, 57.72, 0.0, 0.0, 40.7, 0.0, 0.0, 0.0, 0.0, 0.0, 41.68, 0.0, 29.48, 0.0, 33.63, 0.0, 37.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 58.89], ["didgeridoo", 12.54], ["speech", 4.84]], null, null, null, null, null, [["music", 41.79], ["speech", 22.87], ["hum", 7.19]], null, [["music", 41.06], ["hum", 15.51], ["mains hum", 11.2]], null, [["music", 31.02], ["hum", 17.88], ["mains hum", 10.66]], null, [["music", 20.72], ["hum", 11.64], ["whack, thwack", 11.44]]], "duration": [2.88, 0.46, 0.78, 0.24, 3.61, -0.05, 29.17, 1.79, 0.14, 3.59, 0.49, 0.33, 0.16, 1.29, 0.0, 10.29, 0.3, 3.73, 1.92, 5.26, 1.51, 7.22]} \ No newline at end of file diff --git a/annotations_filtered/npaLKZ0Egus_filtered.json b/annotations_filtered/npaLKZ0Egus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..575f5e133d6ad7d838a2b65c146a3b725a48524f --- /dev/null +++ b/annotations_filtered/npaLKZ0Egus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 31.31], [32.0, 33.08], [36.0, 39.06], [43.0, 51.0], [52.0, 52.91], [54.0, 70.23], [71.0, 100.36], [103.0, 127.04], [129.0, 168.39], [169.0, 178.04], [182.0, 181.79], [182.0, 182.44], [187.0, 188.6]], "keep_status": [true, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [30.03, 0.0, 31.65, 30.57, 0.0, 29.13, 29.04, 29.17, 0.0, 33.59, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.78], ["didgeridoo", 7.73], ["frog", 4.49]], null, [["music", 33.52], ["throbbing", 16.31], ["hum", 6.91]], [["music", 54.08], ["throbbing", 9.42], ["quack", 5.67]], null, [["speech", 38.02], ["music", 36.41], ["animal", 4.71]], [["music", 40.26], ["speech", 29.8], ["throbbing", 8.82]], [["music", 45.85], ["throbbing", 13.4], ["hum", 4.88]], null, [["speech", 56.06], ["music", 19.6], ["theremin", 3.06]], null, null, null], "duration": [6.31, 1.08, 3.06, 8.0, 0.91, 16.23, 29.36, 24.04, 39.39, 9.04, -0.21, 0.44, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/npkzgnKAgXU_filtered.json b/annotations_filtered/npkzgnKAgXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdf5c7d8fe3b7ef925bec66b788993dbaafa3c42 --- /dev/null +++ b/annotations_filtered/npkzgnKAgXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.05], [5.0, 6.99], [8.0, 9.19], [15.0, 24.63], [25.0, 32.95], [36.0, 39.63], [42.0, 61.7], [63.0, 71.31], [72.0, 71.96], [72.0, 78.75], [79.0, 80.23], [81.0, 82.17], [83.0, 87.52], [88.0, 88.64], [89.0, 89.31], [92.0, 95.1], [100.0, 106.91], [110.0, 111.2], [113.0, 113.49], [115.0, 117.53], [119.0, 128.82]], "keep_status": [false, false, false, false, true, true, false, true, false, false, false, false, true, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 29.8, 29.74, 30.48, 29.7, 30.75, 0.0, 30.53, 0.0, 0.0, 30.02, 0.0, 0.0, 29.66, 29.6, 0.0, 0.0, 30.17, 29.65], "audiomae_on_audioset": [null, null, null, [["speech", 43.2], ["music", 29.82], ["sidetone", 3.16]], [["music", 17.82], ["cattle, bovinae", 13.06], ["livestock, farm animals, working animals", 12.22]], [["music", 42.39], ["speech", 17.98], ["hum", 5.74]], [["music", 41.81], ["speech", 27.82], ["throbbing", 7.11]], [["music", 51.58], ["whack, thwack", 8.07], ["throbbing", 6.92]], null, [["music", 42.32], ["speech", 24.48], ["hum", 8.33]], null, null, [["music", 42.9], ["speech", 13.28], ["didgeridoo", 7.23]], null, null, [["music", 19.69], ["speech", 10.32], ["hum", 9.98]], [["music", 28.87], ["throbbing", 21.01], ["hum", 13.83]], null, null, [["music", 35.05], ["electronic music", 17.02], ["hum", 12.34]], [["music", 70.74], ["musical instrument", 3.53], ["smash, crash", 2.08]]], "duration": [1.05, 1.99, 1.19, 9.63, 7.95, 3.63, 19.7, 8.31, -0.04, 6.75, 1.23, 1.17, 4.52, 0.64, 0.31, 3.1, 6.91, 1.2, 0.49, 2.53, 9.82]} \ No newline at end of file diff --git a/annotations_filtered/nprJvYKz3QQ_filtered.json b/annotations_filtered/nprJvYKz3QQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b023c454c149b224e7ee893c5742925b5bc1c347 --- /dev/null +++ b/annotations_filtered/nprJvYKz3QQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.12], [15.0, 15.03], [15.0, 15.06], [15.0, 16.5], [25.0, 25.0], [26.0, 26.13], [28.0, 28.14], [30.0, 30.96], [33.0, 33.67], [35.0, 35.38], [37.0, 37.39], [41.0, 40.93], [42.0, 42.63], [44.0, 44.0], [49.0, 49.4], [52.0, 55.98], [56.0, 56.73], [57.0, 74.58], [76.0, 75.96], [77.0, 78.41], [79.0, 81.28], [82.0, 82.83], [83.0, 83.64], [84.0, 84.74], [86.0, 92.13], [92.0, 99.27], [100.0, 100.45], [101.0, 101.55], [107.0, 108.48], [109.0, 109.53], [110.0, 111.91], [114.0, 115.94], [116.0, 117.56], [118.0, 118.69], [120.0, 123.4], [124.0, 125.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.16, 0.0, 36.45, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 85.72, 87.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 22.96], ["speech", 22.7], ["hum", 16.91]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 0.03, 0.06, 1.5, 0.0, 0.13, 0.14, 0.96, 0.67, 0.38, 0.39, -0.07, 0.63, 0.0, 0.4, 3.98, 0.73, 17.58, -0.04, 1.41, 2.28, 0.83, 0.64, 0.74, 6.13, 7.27, 0.45, 0.55, 1.48, 0.53, 1.91, 1.94, 1.56, 0.69, 3.4, 1.95]} \ No newline at end of file diff --git a/annotations_filtered/npvFfvyT8Pc_filtered.json b/annotations_filtered/npvFfvyT8Pc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c94d6ba65e14939e6324f229cd940e0ec9b24a3 --- /dev/null +++ b/annotations_filtered/npvFfvyT8Pc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.13], [7.0, 7.75], [8.0, 9.02], [10.0, 11.08], [14.0, 15.23], [16.0, 17.61], [22.0, 22.65], [24.0, 27.11], [29.0, 30.01], [32.0, 32.0], [34.0, 34.21], [35.0, 36.61], [37.0, 38.31], [41.0, 41.62], [42.0, 43.21], [47.0, 47.7], [53.0, 53.13], [55.0, 55.12], [58.0, 58.46], [61.0, 61.3], [65.0, 66.02], [68.0, 69.03], [70.0, 71.54], [73.0, 73.8], [75.0, 76.69], [80.0, 79.98], [83.0, 84.25], [85.0, 86.48]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 32.13], ["hum", 15.98], ["mains hum", 14.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.13, 0.75, 1.02, 1.08, 1.23, 1.61, 0.65, 3.11, 1.01, 0.0, 0.21, 1.61, 1.31, 0.62, 1.21, 0.7, 0.13, 0.12, 0.46, 0.3, 1.02, 1.03, 1.54, 0.8, 1.69, -0.02, 1.25, 1.48]} \ No newline at end of file diff --git a/annotations_filtered/nq382fby2yU_filtered.json b/annotations_filtered/nq382fby2yU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/nq382fby2yU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/nqEL7fP4Rvs_filtered.json b/annotations_filtered/nqEL7fP4Rvs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8463c25562e40fcaf738b59032f91c00045ed3b4 --- /dev/null +++ b/annotations_filtered/nqEL7fP4Rvs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 54.75], [57.0, 66.5]], "keep_status": [false, true], "silence_prob": [0.0, 28.35], "audiomae_on_audioset": [null, [["speech", 46.45], ["music", 14.25], ["explosion", 4.45]]], "duration": [44.75, 9.5]} \ No newline at end of file diff --git a/annotations_filtered/nqF0yFLjiXs_filtered.json b/annotations_filtered/nqF0yFLjiXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f4c0cfc3c02a361aac384b248c9d7a9d431b3c1 --- /dev/null +++ b/annotations_filtered/nqF0yFLjiXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.84], [13.0, 14.01], [15.0, 17.32], [17.0, 17.49], [18.0, 17.52], [18.0, 23.79], [24.0, 29.0], [31.0, 30.99], [32.0, 73.31], [75.0, 85.8], [90.0, 92.15], [102.0, 109.65], [112.0, 113.26], [122.0, 133.95], [134.0, 135.62], [137.0, 139.04]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 72.6, 0.0, 0.0, 37.35, 76.04, 0.0, 0.0, 44.09, 35.27, 36.15, 0.0, 30.6, 0.0, 34.64], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 21.42], ["noise", 14.75], ["mains hum", 10.0]], null, null, null, [["speech", 28.47], ["fart", 14.76], ["whale vocalization", 12.78]], [["whale vocalization", 30.31], ["mains hum", 26.95], ["hum", 17.55]], [["hum", 27.35], ["mains hum", 9.81], ["clang", 7.94]], null, [["music", 57.73], ["carnatic music", 9.29], ["musical instrument", 4.33]], null, [["music", 40.81], ["theremin", 4.2], ["musical instrument", 3.45]]], "duration": [-0.16, 1.01, 2.32, 0.49, -0.48, 5.79, 5.0, -0.01, 41.31, 10.8, 2.15, 7.65, 1.26, 11.95, 1.62, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/nqK7Kk3ZKvY_filtered.json b/annotations_filtered/nqK7Kk3ZKvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b23995110dfb14c6972e45637b4fa29ed00257c4 --- /dev/null +++ b/annotations_filtered/nqK7Kk3ZKvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[101.0, 106.54], [107.0, 108.26], [111.0, 115.89]], "keep_status": [false, false, false], "silence_prob": [79.59, 0.0, 67.63], "audiomae_on_audioset": [null, null, null], "duration": [5.54, 1.26, 4.89]} \ No newline at end of file diff --git a/annotations_filtered/nqaJ3f0z3Lw_filtered.json b/annotations_filtered/nqaJ3f0z3Lw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e41de50b02b420dd10a1869b9633d26701d1e8e --- /dev/null +++ b/annotations_filtered/nqaJ3f0z3Lw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 19.74], [25.0, 34.03], [38.0, 46.01], [49.0, 50.97], [60.0, 60.4]], "keep_status": [false, true, false, false, false], "silence_prob": [30.71, 36.29, 72.16, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 67.65], ["buzz", 5.5], ["eruption", 3.52]], [["hum", 35.81], ["speech", 14.0], ["mains hum", 7.94]], null, null, null], "duration": [11.74, 9.03, 8.01, 1.97, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/nqz6wwDRWiE_filtered.json b/annotations_filtered/nqz6wwDRWiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1e610a1b141602854bd356623808521b889062f --- /dev/null +++ b/annotations_filtered/nqz6wwDRWiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.82], [8.0, 10.07], [10.0, 11.62], [13.0, 13.76], [15.0, 15.18], [16.0, 16.73], [17.0, 18.69], [25.0, 24.7], [32.0, 32.36], [39.0, 39.63], [41.0, 41.62], [44.0, 45.25], [46.0, 46.85], [47.0, 48.73], [49.0, 50.25], [52.0, 53.08], [56.0, 55.97], [63.0, 63.31], [67.0, 66.99], [76.0, 76.25], [77.0, 77.84], [78.0, 79.12], [81.0, 81.5], [92.0, 93.24], [95.0, 95.64], [96.0, 97.34], [100.0, 100.11], [100.0, 100.53], [101.0, 101.53], [110.0, 112.23], [115.0, 116.14], [124.0, 124.34], [126.0, 127.47], [133.0, 134.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 52.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.68, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 19.38], ["radio", 9.66], ["fart", 5.19]], null, null, null, null], "duration": [0.82, 2.07, 1.62, 0.76, 0.18, 0.73, 1.69, -0.3, 0.36, 0.63, 0.62, 1.25, 0.85, 1.73, 1.25, 1.08, -0.03, 0.31, -0.01, 0.25, 0.84, 1.12, 0.5, 1.24, 0.64, 1.34, 0.11, 0.53, 0.53, 2.23, 1.14, 0.34, 1.47, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/nqzkyfeS2Oo_filtered.json b/annotations_filtered/nqzkyfeS2Oo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a926665100d94556dae505f8f3d3a683f1fc1183 --- /dev/null +++ b/annotations_filtered/nqzkyfeS2Oo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.92], [24.0, 29.64], [30.0, 30.92], [32.0, 32.93], [36.0, 38.72], [43.0, 44.17], [45.0, 46.84], [49.0, 53.37], [54.0, 54.87], [56.0, 56.78], [58.0, 59.36], [61.0, 61.7], [62.0, 63.49], [64.0, 71.95], [73.0, 85.99], [88.0, 97.34], [99.0, 99.28], [100.0, 100.62], [102.0, 102.42], [104.0, 111.2], [111.0, 127.79], [129.0, 129.39], [131.0, 131.77], [133.0, 151.21], [152.0, 153.6], [156.0, 156.25], [158.0, 158.45], [160.0, 165.5], [169.0, 171.66], [173.0, 173.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, true, true, false], "silence_prob": [52.98, 92.64, 0.0, 0.0, 56.78, 0.0, 0.0, 76.86, 0.0, 0.0, 0.0, 0.0, 0.0, 53.1, 29.67, 30.32, 0.0, 0.0, 0.0, 35.78, 31.32, 0.0, 0.0, 35.26, 0.0, 0.0, 0.0, 35.56, 44.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 26.17], ["music", 15.1], ["mains hum", 14.11]], [["music", 18.12], ["hum", 11.77], ["noise", 10.07]], null, null, null, [["speech", 42.81], ["hum", 25.35], ["mains hum", 9.84]], [["hum", 22.47], ["music", 17.57], ["throbbing", 8.54]], null, null, [["speech", 34.71], ["hum", 24.28], ["music", 17.01]], null, null, null, [["music", 23.12], ["speech", 21.71], ["sidetone", 18.62]], [["music", 33.48], ["hum", 14.59], ["ambient music", 6.9]], null], "duration": [5.92, 5.64, 0.92, 0.93, 2.72, 1.17, 1.84, 4.37, 0.87, 0.78, 1.36, 0.7, 1.49, 7.95, 12.99, 9.34, 0.28, 0.62, 0.42, 7.2, 16.79, 0.39, 0.77, 18.21, 1.6, 0.25, 0.45, 5.5, 2.66, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/nr1sLngjJXQ_filtered.json b/annotations_filtered/nr1sLngjJXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bc923938318c834e924aa7db5082fb3b6260616 --- /dev/null +++ b/annotations_filtered/nr1sLngjJXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.61], [9.0, 23.67], [26.0, 80.45], [83.0, 83.47], [83.0, 83.51], [87.0, 146.57], [147.0, 167.91], [171.0, 175.71], [176.0, 177.28]], "keep_status": [true, false, false, false, false, false, true, true, false], "silence_prob": [31.71, 33.63, 0.0, 0.0, 0.0, 0.0, 30.71, 30.89, 0.0], "audiomae_on_audioset": [[["music", 30.49], ["smash, crash", 21.46], ["throbbing", 6.23]], [["music", 71.92], ["throbbing", 4.22], ["hum", 2.82]], null, null, null, null, [["music", 19.39], ["fart", 17.78], ["speech", 16.6]], [["music", 45.63], ["noise", 17.08], ["hum", 6.56]], null], "duration": [2.61, 14.67, 54.45, 0.47, 0.51, 59.57, 20.91, 4.71, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/nr7ui14-O_Q_filtered.json b/annotations_filtered/nr7ui14-O_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a70ccd5d249615066dfaa47a7f3d4d53ec42b6ba --- /dev/null +++ b/annotations_filtered/nr7ui14-O_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 20.93], [22.0, 23.7], [26.0, 27.23], [28.0, 31.63], [32.0, 33.22], [35.0, 35.78], [36.0, 36.8], [38.0, 42.57], [47.0, 48.34], [50.0, 50.6], [53.0, 66.78], [68.0, 67.91], [71.0, 72.0], [74.0, 75.27], [77.0, 77.35], [79.0, 79.68], [82.0, 83.0], [84.0, 86.12], [92.0, 94.02], [96.0, 96.69], [100.0, 100.9], [102.0, 103.62], [105.0, 105.66], [107.0, 108.45], [111.0, 112.78], [114.0, 115.89], [119.0, 119.75], [121.0, 122.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.68, 0.0, 0.0, 49.36, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 33.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 67.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 42.78], ["theremin", 37.89], ["speech", 5.32]], null, null, [["music", 48.56], ["theremin", 26.71], ["civil defense siren", 4.02]], null, null, null, null, null, null, [["buzz", 28.13], ["hum", 24.82], ["mains hum", 14.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.93, 1.7, 1.23, 3.63, 1.22, 0.78, 0.8, 4.57, 1.34, 0.6, 13.78, -0.09, 1.0, 1.27, 0.35, 0.68, 1.0, 2.12, 2.02, 0.69, 0.9, 1.62, 0.66, 1.45, 1.78, 1.89, 0.75, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/nrizm2gnQBo_filtered.json b/annotations_filtered/nrizm2gnQBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2047532b4bb33b3482a980598d8b9c13c621e84 --- /dev/null +++ b/annotations_filtered/nrizm2gnQBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.55], [10.0, 10.27], [11.0, 12.43], [14.0, 15.11], [17.0, 18.15], [19.0, 19.4], [24.0, 24.46], [26.0, 41.44], [42.0, 43.71], [46.0, 47.16], [48.0, 49.2], [50.0, 52.59], [53.0, 53.87], [55.0, 58.5], [60.0, 60.93], [64.0, 66.72], [68.0, 70.66], [72.0, 76.6], [78.0, 90.14], [93.0, 94.15], [98.0, 98.54], [104.0, 103.77], [107.0, 107.92], [115.0, 115.99], [117.0, 117.51], [120.0, 122.13], [123.0, 123.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 46.97, 0.0, 41.28, 0.0, 77.53, 72.9, 38.79, 38.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.84, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 41.82], ["musical instrument", 13.14], ["french horn", 9.13]], null, [["music", 42.26], ["theremin", 19.82], ["synthesizer", 9.19]], null, null, null, [["music", 54.76], ["theremin", 22.62], ["musical instrument", 4.14]], [["music", 60.58], ["ambient music", 11.28], ["synthesizer", 10.48]], null, null, null, null, null, null, [["music", 51.31], ["theremin", 14.99], ["musical instrument", 3.69]], null], "duration": [0.55, 0.27, 1.43, 1.11, 1.15, 0.4, 0.46, 15.44, 1.71, 1.16, 1.2, 2.59, 0.87, 3.5, 0.93, 2.72, 2.66, 4.6, 12.14, 1.15, 0.54, -0.23, 0.92, 0.99, 0.51, 2.13, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/nrqg6wxuqFo_filtered.json b/annotations_filtered/nrqg6wxuqFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..215629d0077435cf5a224e4f04bca6aaf0234939 --- /dev/null +++ b/annotations_filtered/nrqg6wxuqFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.48], [15.0, 15.21], [16.0, 17.76], [18.0, 24.48], [25.0, 27.04], [28.0, 28.65], [29.0, 29.84], [33.0, 34.8], [40.0, 42.6], [45.0, 45.66], [47.0, 51.27], [52.0, 54.72], [56.0, 57.74], [58.0, 63.27], [64.0, 65.08], [68.0, 69.47], [73.0, 75.37], [79.0, 81.58], [82.0, 85.83], [86.0, 90.42], [91.0, 94.37], [99.0, 102.64], [103.0, 108.03], [109.0, 109.86], [110.0, 121.34], [122.0, 123.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 99.36, 0.0, 100.0, 99.98, 0.0, 99.76, 0.0, 0.0, 100.0, 100.0, 99.99, 99.99, 100.0, 100.0, 100.0, 0.0, 99.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.48, 0.21, 1.76, 6.48, 2.04, 0.65, 0.84, 1.8, 2.6, 0.66, 4.27, 2.72, 1.74, 5.27, 1.08, 1.47, 2.37, 2.58, 3.83, 4.42, 3.37, 3.64, 5.03, 0.86, 11.34, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/nrqxmQr-uto_filtered.json b/annotations_filtered/nrqxmQr-uto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f81a6afc2880d43e31dec962f1c6acca08c4bf8e --- /dev/null +++ b/annotations_filtered/nrqxmQr-uto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.06], [10.0, 10.57], [11.0, 11.67], [26.0, 26.11], [41.0, 41.01], [72.0, 72.15], [78.0, 81.28], [89.0, 90.26], [106.0, 109.27], [112.0, 112.01], [115.0, 115.26], [120.0, 120.68], [122.0, 122.71], [124.0, 123.89]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.63, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 39.58], ["brass instrument", 8.52], ["musical instrument", 5.85]], null, null, null, null, null, null, null], "duration": [1.06, 0.57, 0.67, 0.11, 0.01, 0.15, 3.28, 1.26, 3.27, 0.01, 0.26, 0.68, 0.71, -0.11]} \ No newline at end of file diff --git a/annotations_filtered/ns-qtoxnAS8_filtered.json b/annotations_filtered/ns-qtoxnAS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9728ce14155d0790085fe3576dc518ba83c1d1d --- /dev/null +++ b/annotations_filtered/ns-qtoxnAS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.11], [5.0, 5.34], [10.0, 9.63], [13.0, 16.68], [20.0, 20.88], [26.0, 26.23], [29.0, 29.73], [33.0, 32.95], [36.0, 37.89], [44.0, 48.95], [50.0, 51.07], [53.0, 56.46], [57.0, 64.05], [89.0, 89.21], [112.0, 113.97], [116.0, 115.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.62, 0.0, 0.0, 0.0, 0.0, 0.0, 64.18, 0.0, 67.76, 50.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 44.15], ["throbbing", 26.14], ["mains hum", 8.59]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.11, 0.34, -0.37, 3.68, 0.88, 0.23, 0.73, -0.05, 1.89, 4.95, 1.07, 3.46, 7.05, 0.21, 1.97, -0.2]} \ No newline at end of file diff --git a/annotations_filtered/ns3j2exbdbU_filtered.json b/annotations_filtered/ns3j2exbdbU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fa9ea383513586863baeca79345ef03c60c1d5d --- /dev/null +++ b/annotations_filtered/ns3j2exbdbU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.34], [16.0, 16.33], [19.0, 19.8], [30.0, 32.24], [35.0, 34.86], [73.0, 74.21], [79.0, 80.23], [82.0, 83.98], [89.0, 91.13], [96.0, 121.74], [123.0, 128.93], [131.0, 132.04], [133.0, 133.52], [135.0, 137.27], [145.0, 146.33], [148.0, 149.23], [150.0, 151.5], [152.0, 152.52], [153.0, 153.84], [156.0, 163.38], [164.0, 170.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.95, 0.0, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 100.0, 99.99, 100.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 99.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.34, 0.33, 0.8, 2.24, -0.14, 1.21, 1.23, 1.98, 2.13, 25.74, 5.93, 1.04, 0.52, 2.27, 1.33, 1.23, 1.5, 0.52, 0.84, 7.38, 6.63]} \ No newline at end of file diff --git a/annotations_filtered/ns7B5fzH11c_filtered.json b/annotations_filtered/ns7B5fzH11c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c043b551088d4a409a022120806a210650a5e9a0 --- /dev/null +++ b/annotations_filtered/ns7B5fzH11c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.25], [21.0, 26.1], [31.0, 38.77], [40.0, 39.95], [40.0, 57.48], [59.0, 59.36], [62.0, 62.9], [63.0, 65.1], [67.0, 69.55], [71.0, 80.13]], "keep_status": [false, true, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 38.03, 46.05, 0.0, 38.7, 0.0, 0.0, 55.6, 45.08, 48.69], "audiomae_on_audioset": [null, [["speech", 45.98], ["music", 15.23], ["hum", 5.99]], [["speech", 20.38], ["mains hum", 17.64], ["music", 17.36]], null, [["music", 44.67], ["didgeridoo", 16.22], ["speech", 4.34]], null, null, null, [["didgeridoo", 79.69], ["music", 12.83], ["musical instrument", 1.43]], [["music", 24.37], ["speech", 19.67], ["fart", 18.01]]], "duration": [0.25, 5.1, 7.77, -0.05, 17.48, 0.36, 0.9, 2.1, 2.55, 9.13]} \ No newline at end of file diff --git a/annotations_filtered/ns9WcZlqv_I_filtered.json b/annotations_filtered/ns9WcZlqv_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c96fbf6e4be040c8f9c0494f8e34ea60daf96a0e --- /dev/null +++ b/annotations_filtered/ns9WcZlqv_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 21.0], [22.0, 24.0], [26.0, 31.23], [33.0, 35.23], [35.0, 37.4], [38.0, 40.66], [42.0, 49.01], [49.0, 53.43], [56.0, 56.35], [57.0, 73.16], [74.0, 76.25], [77.0, 78.44], [80.0, 81.46], [85.0, 87.32], [88.0, 90.88], [91.0, 92.21], [92.0, 93.77], [97.0, 103.01], [106.0, 108.13], [112.0, 112.99], [113.0, 119.67], [121.0, 126.4], [127.0, 126.74], [127.0, 129.03], [130.0, 130.94], [131.0, 134.6], [136.0, 138.48], [139.0, 139.09], [140.0, 143.18], [144.0, 146.1], [146.0, 149.28], [151.0, 152.95], [153.0, 153.96], [157.0, 165.11], [167.0, 169.74], [171.0, 175.39], [176.0, 177.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, true, false, true, true, false, true, false, true, false, false, true, false, false, false], "silence_prob": [82.97, 89.72, 88.83, 96.29, 71.43, 90.78, 91.81, 92.31, 0.0, 51.55, 73.82, 0.0, 0.0, 92.8, 49.18, 0.0, 0.0, 98.01, 82.61, 0.0, 40.82, 43.35, 0.0, 36.61, 0.0, 37.56, 38.78, 0.0, 40.68, 49.04, 40.71, 0.0, 0.0, 39.35, 90.25, 94.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 15.91], ["hum", 11.13], ["whale vocalization", 5.47]], null, null, null, null, null, [["singing bowl", 17.6], ["music", 14.12], ["whimper", 12.05]], [["music", 31.22], ["electronic music", 16.19], ["ambient music", 10.44]], null, [["gasp", 19.01], ["gong", 10.96], ["caw", 9.94]], null, [["music", 20.56], ["whale vocalization", 18.67], ["animal", 8.03]], [["caw", 32.29], ["crow", 23.89], ["music", 6.92]], null, [["gong", 19.77], ["music", 16.8], ["speech", 6.66]], [["music", 63.79], ["singing bowl", 10.22], ["gong", 4.19]], [["music", 18.15], ["groan", 13.23], ["whimper", 7.64]], null, null, [["music", 43.25], ["singing bowl", 12.44], ["mains hum", 4.4]], null, null, null], "duration": [15.0, 2.0, 5.23, 2.23, 2.4, 2.66, 7.01, 4.43, 0.35, 16.16, 2.25, 1.44, 1.46, 2.32, 2.88, 1.21, 1.77, 6.01, 2.13, 0.99, 6.67, 5.4, -0.26, 2.03, 0.94, 3.6, 2.48, 0.09, 3.18, 2.1, 3.28, 1.95, 0.96, 8.11, 2.74, 4.39, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/nsQtI33UbGI_filtered.json b/annotations_filtered/nsQtI33UbGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06c1f330ee3f4ddf670699cf9ba91312c84d018f --- /dev/null +++ b/annotations_filtered/nsQtI33UbGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.19], [22.0, 22.87], [31.0, 31.63], [33.0, 35.01]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 50.02], "audiomae_on_audioset": [null, null, null, null], "duration": [1.19, 0.87, 0.63, 2.01]} \ No newline at end of file diff --git a/annotations_filtered/ns_HTpxc-g4_filtered.json b/annotations_filtered/ns_HTpxc-g4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b5527f7d91cc22b2db037fe34dc2505f4363ed0 --- /dev/null +++ b/annotations_filtered/ns_HTpxc-g4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [4.0, 4.9], [6.0, 7.32], [8.0, 8.5], [10.0, 12.06], [14.0, 16.85], [22.0, 23.06], [24.0, 24.17], [27.0, 27.94], [31.0, 31.46], [32.0, 33.71], [38.0, 38.26], [40.0, 41.34], [42.0, 43.44], [45.0, 45.55], [47.0, 48.3], [51.0, 52.14], [54.0, 55.39], [56.0, 57.05], [58.0, 59.37], [60.0, 60.88], [62.0, 62.21], [64.0, 64.61], [66.0, 66.5], [68.0, 69.3], [71.0, 81.58], [83.0, 83.07], [84.0, 85.85], [87.0, 86.95], [90.0, 90.86]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 52.33, 47.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.71, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["sonar", 32.13], ["music", 18.1], ["gong", 11.04]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 0.9, 1.32, 0.5, 2.06, 2.85, 1.06, 0.17, 0.94, 0.46, 1.71, 0.26, 1.34, 1.44, 0.55, 1.3, 1.14, 1.39, 1.05, 1.37, 0.88, 0.21, 0.61, 0.5, 1.3, 10.58, 0.07, 1.85, -0.05, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/nshLAILEN4w_filtered.json b/annotations_filtered/nshLAILEN4w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7b3e9a945aa088990400780b14f10ca558da889 --- /dev/null +++ b/annotations_filtered/nshLAILEN4w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.37], [5.0, 6.34], [13.0, 13.32], [19.0, 26.99], [30.0, 32.8], [33.0, 37.84], [39.0, 53.99], [55.0, 66.83], [68.0, 69.13], [70.0, 71.68], [77.0, 81.11], [82.0, 83.61], [85.0, 87.42]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 58.05, 46.86, 44.29, 38.82, 38.56, 0.0, 0.0, 29.96, 0.0, 47.39], "audiomae_on_audioset": [null, null, null, null, [["music", 50.8], ["didgeridoo", 6.89], ["musical instrument", 6.55]], [["music", 68.23], ["speech", 14.43], ["synthesizer", 2.92]], [["music", 53.38], ["speech", 18.01], ["synthesizer", 8.85]], [["music", 63.71], ["throbbing", 16.24], ["hum", 8.36]], null, null, [["speech", 31.89], ["music", 18.48], ["vehicle", 3.08]], null, [["music", 40.35], ["didgeridoo", 19.62], ["cattle, bovinae", 3.66]]], "duration": [1.37, 1.34, 0.32, 7.99, 2.8, 4.84, 14.99, 11.83, 1.13, 1.68, 4.11, 1.61, 2.42]} \ No newline at end of file diff --git a/annotations_filtered/ntALVSmIUrg_filtered.json b/annotations_filtered/ntALVSmIUrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ca856f9ff6fe78f49a992598f4178d82e660552 --- /dev/null +++ b/annotations_filtered/ntALVSmIUrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [3.0, 3.89], [5.0, 5.14], [7.0, 8.45], [9.0, 95.0]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.64, 0.89, 0.14, 1.45, 86.0]} \ No newline at end of file diff --git a/annotations_filtered/ntC0xJo2bSU_filtered.json b/annotations_filtered/ntC0xJo2bSU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2c4252b88aa66b29225fb38473692c56caa189d --- /dev/null +++ b/annotations_filtered/ntC0xJo2bSU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.03], [8.0, 10.05], [11.0, 17.79], [20.0, 20.58], [22.0, 48.47], [51.0, 63.0], [64.0, 120.58]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [0.0, 96.04, 74.29, 0.0, 49.13, 88.83, 0.0], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 31.31], ["hum", 21.66], ["music", 7.56]], null, null], "duration": [1.03, 2.05, 6.79, 0.58, 26.47, 12.0, 56.58]} \ No newline at end of file diff --git a/annotations_filtered/ntGBzcfpKYg_filtered.json b/annotations_filtered/ntGBzcfpKYg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3b1492a701d6aa987e98722e52b5efddf52190b --- /dev/null +++ b/annotations_filtered/ntGBzcfpKYg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.02], [6.0, 13.02], [16.0, 21.2], [23.0, 22.81], [27.0, 27.53], [33.0, 33.05], [33.0, 34.52], [39.0, 41.05], [43.0, 46.4], [47.0, 50.67], [52.0, 53.03], [55.0, 56.13], [59.0, 60.81], [63.0, 64.03], [75.0, 75.51], [78.0, 79.37], [82.0, 82.27], [83.0, 84.79], [85.0, 85.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [77.03, 68.54, 52.98, 0.0, 0.0, 0.0, 0.0, 89.72, 78.04, 76.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.02, 7.02, 5.2, -0.19, 0.53, 0.05, 1.52, 2.05, 3.4, 3.67, 1.03, 1.13, 1.81, 1.03, 0.51, 1.37, 0.27, 1.79, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/ntKYG1LdbV8_filtered.json b/annotations_filtered/ntKYG1LdbV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4911f6dd23e74d43dd67c41df81313f135c5d80f --- /dev/null +++ b/annotations_filtered/ntKYG1LdbV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.05], [33.0, 34.65], [41.0, 41.79], [46.0, 46.21], [47.0, 48.57]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [1.05, 1.65, 0.79, 0.21, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/ntQrC5iclmI_filtered.json b/annotations_filtered/ntQrC5iclmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba00a717bc6368218a9cf92b251b5051f0ef5c6c --- /dev/null +++ b/annotations_filtered/ntQrC5iclmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [3.0, 3.69], [6.0, 6.93], [7.0, 8.18], [11.0, 10.69], [16.0, 20.16], [22.0, 23.58], [24.0, 25.17], [27.0, 27.23], [29.0, 29.64], [33.0, 32.93], [34.0, 35.19], [37.0, 38.69], [40.0, 41.23], [42.0, 42.2], [48.0, 48.34], [50.0, 51.11], [62.0, 62.31], [68.0, 68.5], [69.0, 69.69], [73.0, 73.52], [76.0, 76.96], [82.0, 81.94], [82.0, 82.21], [85.0, 85.06], [86.0, 86.51], [91.0, 91.2], [94.0, 95.18], [96.0, 96.18], [105.0, 117.02], [124.0, 126.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.77, 47.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.88], ["didgeridoo", 25.54], ["speech", 25.43]], [["speech", 35.21], ["music", 26.63], ["guitar", 7.13]]], "duration": [0.84, 0.69, 0.93, 1.18, -0.31, 4.16, 1.58, 1.17, 0.23, 0.64, -0.07, 1.19, 1.69, 1.23, 0.2, 0.34, 1.11, 0.31, 0.5, 0.69, 0.52, 0.96, -0.06, 0.21, 0.06, 0.51, 0.2, 1.18, 0.18, 12.02, 2.76]} \ No newline at end of file diff --git a/annotations_filtered/ntgrRUML2ic_filtered.json b/annotations_filtered/ntgrRUML2ic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29f1333cdfe18561a35fef7cf54c223ca97d84e7 --- /dev/null +++ b/annotations_filtered/ntgrRUML2ic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.01], [6.0, 7.42], [9.0, 10.74], [14.0, 15.47], [17.0, 17.17], [20.0, 22.06], [25.0, 25.83], [28.0, 29.13], [34.0, 35.46], [38.0, 37.93], [40.0, 40.95], [42.0, 46.65], [55.0, 55.11], [59.0, 58.9], [59.0, 59.86], [66.0, 66.83], [68.0, 68.45], [69.0, 69.2], [69.0, 69.69], [89.0, 89.83], [99.0, 98.9], [103.0, 103.74], [111.0, 111.7], [113.0, 113.53], [135.0, 135.67], [144.0, 145.15], [151.0, 151.78], [154.0, 154.48], [156.0, 155.76], [156.0, 157.0], [158.0, 159.09], [162.0, 162.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 1.42, 1.74, 1.47, 0.17, 2.06, 0.83, 1.13, 1.46, -0.07, 0.95, 4.65, 0.11, -0.1, 0.86, 0.83, 0.45, 0.2, 0.69, 0.83, -0.1, 0.74, 0.7, 0.53, 0.67, 1.15, 0.78, 0.48, -0.24, 1.0, 1.09, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/ntirWguFrfM_filtered.json b/annotations_filtered/ntirWguFrfM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e43a3040777f911bd8e6192cf8fe0e0fed5007bd --- /dev/null +++ b/annotations_filtered/ntirWguFrfM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [4.0, 4.82], [8.0, 8.06], [10.0, 10.86], [13.0, 12.85], [27.0, 33.44], [40.0, 40.44], [45.0, 45.72], [46.0, 46.67], [77.0, 77.35], [80.0, 82.19], [84.0, 88.3], [90.0, 97.14], [99.0, 100.57], [107.0, 107.84], [110.0, 111.21], [115.0, 115.45], [121.0, 121.88], [123.0, 123.48], [125.0, 126.0], [134.0, 137.59], [143.0, 149.47], [152.0, 157.01], [161.0, 171.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.64, 0.0, 0.0, 0.0, 0.0, 94.52, 55.11, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.43, 36.55, 35.18, 38.42], "audiomae_on_audioset": [null, null, null, null, null, [["livestock, farm animals, working animals", 41.26], ["cattle, bovinae", 21.27], ["moo", 16.62]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 18.84], ["cattle, bovinae", 8.3], ["moo", 8.24]], [["music", 48.32], ["whale vocalization", 17.09], ["howl", 4.55]], [["music", 40.95], ["speech", 8.45], ["explosion", 7.4]]], "duration": [0.43, 0.82, 0.06, 0.86, -0.15, 6.44, 0.44, 0.72, 0.67, 0.35, 2.19, 4.3, 7.14, 1.57, 0.84, 1.21, 0.45, 0.88, 0.48, 1.0, 3.59, 6.47, 5.01, 10.96]} \ No newline at end of file diff --git a/annotations_filtered/ntnqp7-SG7k_filtered.json b/annotations_filtered/ntnqp7-SG7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4c7e03785dd5bf070e0c2bf2b2d586f49215277 --- /dev/null +++ b/annotations_filtered/ntnqp7-SG7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.07], [6.0, 9.04], [11.0, 13.44], [14.0, 14.59], [16.0, 29.42], [31.0, 30.94], [32.0, 36.34], [37.0, 47.85], [49.0, 48.84], [50.0, 55.09], [56.0, 61.69], [65.0, 67.44], [68.0, 71.12], [73.0, 72.87], [74.0, 77.77], [79.0, 82.02], [83.0, 86.43], [87.0, 87.84], [89.0, 89.55], [91.0, 91.98], [93.0, 95.27], [96.0, 105.97], [107.0, 110.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.54, 80.64, 99.56, 0.0, 94.37, 0.0, 97.33, 89.01, 0.0, 96.89, 83.88, 74.13, 88.1, 0.0, 82.97, 94.95, 91.64, 0.0, 0.0, 0.0, 87.37, 90.6, 79.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.07, 3.04, 2.44, 0.59, 13.42, -0.06, 4.34, 10.85, -0.16, 5.09, 5.69, 2.44, 3.12, -0.13, 3.77, 3.02, 3.43, 0.84, 0.55, 0.98, 2.27, 9.97, 3.13]} \ No newline at end of file diff --git a/annotations_filtered/ntsuIs20RW0_filtered.json b/annotations_filtered/ntsuIs20RW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d07c9ecf02589856cea1082471a86424e2465c1 --- /dev/null +++ b/annotations_filtered/ntsuIs20RW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [5.0, 6.99], [13.0, 16.11], [23.0, 23.13], [25.0, 26.42], [28.0, 29.66], [34.0, 34.65], [35.0, 35.73], [41.0, 41.59], [43.0, 45.18], [48.0, 49.32], [51.0, 51.56], [55.0, 55.59], [58.0, 59.68], [63.0, 65.69], [67.0, 67.58], [75.0, 75.14], [77.0, 80.11], [81.0, 81.7], [106.0, 106.08], [112.0, 112.5], [115.0, 115.13], [124.0, 123.77], [124.0, 124.31], [131.0, 131.85], [142.0, 142.96], [150.0, 152.9], [158.0, 157.79], [163.0, 163.0], [167.0, 168.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 0.0, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0, 35.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.05, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 63.14], ["drum machine", 4.28], ["musical instrument", 2.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.78], ["speech", 14.85], ["synthesizer", 5.91]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 1.99, 3.11, 0.13, 1.42, 1.66, 0.65, 0.73, 0.59, 2.18, 1.32, 0.56, 0.59, 1.68, 2.69, 0.58, 0.14, 3.11, 0.7, 0.08, 0.5, 0.13, -0.23, 0.31, 0.85, 0.96, 2.9, -0.21, 0.0, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/nuPd4L7_0uQ_filtered.json b/annotations_filtered/nuPd4L7_0uQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4905850885b484878388e641ce42e5149f376153 --- /dev/null +++ b/annotations_filtered/nuPd4L7_0uQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.74], [8.0, 9.05], [17.0, 17.41], [22.0, 24.98], [26.0, 26.84], [29.0, 29.05], [31.0, 31.08], [31.0, 32.36], [39.0, 40.8], [43.0, 43.09], [45.0, 45.71], [48.0, 48.57], [50.0, 49.86], [51.0, 51.63], [53.0, 54.08], [55.0, 58.28], [63.0, 68.62], [71.0, 71.32], [76.0, 77.09], [78.0, 86.75], [88.0, 88.01], [88.0, 96.45], [99.0, 128.92], [130.0, 131.08]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false], "silence_prob": [32.78, 0.0, 0.0, 32.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.68, 30.76, 0.0, 0.0, 30.05, 0.0, 30.07, 30.62, 0.0], "audiomae_on_audioset": [[["music", 40.08], ["cattle, bovinae", 5.66], ["didgeridoo", 5.46]], null, null, [["music", 37.06], ["mains hum", 18.48], ["hum", 12.85]], null, null, null, null, null, null, null, null, null, null, null, [["music", 44.15], ["didgeridoo", 7.54], ["noise", 6.18]], [["throbbing", 36.44], ["music", 32.74], ["hum", 11.09]], null, null, [["music", 68.08], ["speech", 11.54], ["electronic music", 3.73]], null, [["music", 37.09], ["speech", 17.31], ["electronic music", 6.14]], [["music", 32.46], ["reverberation", 10.71], ["synthesizer", 7.38]], null], "duration": [2.74, 1.05, 0.41, 2.98, 0.84, 0.05, 0.08, 1.36, 1.8, 0.09, 0.71, 0.57, -0.14, 0.63, 1.08, 3.28, 5.62, 0.32, 1.09, 8.75, 0.01, 8.45, 29.92, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/nuVY83HU5Mw_filtered.json b/annotations_filtered/nuVY83HU5Mw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf35612a71a4934f9724e9c55fd6218e7c83e982 --- /dev/null +++ b/annotations_filtered/nuVY83HU5Mw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.05], [4.0, 16.01], [17.0, 17.34], [19.0, 27.95], [28.0, 27.99], [28.0, 28.02], [28.0, 28.05], [28.0, 28.46], [34.0, 48.98], [56.0, 62.78], [64.0, 64.98], [70.0, 71.66], [75.0, 92.67], [93.0, 110.79], [115.0, 119.3]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 32.06, 0.0, 31.03, 0.0, 0.0, 0.0, 0.0, 31.29, 36.51, 0.0, 0.0, 33.9, 32.16, 30.23], "audiomae_on_audioset": [null, [["speech", 52.8], ["music", 19.13], ["sidetone", 3.52]], null, [["music", 51.56], ["brass instrument", 6.65], ["trombone", 5.26]], null, null, null, null, [["music", 87.5], ["brass instrument", 2.61], ["musical instrument", 2.34]], [["music", 47.94], ["theremin", 10.73], ["musical instrument", 10.01]], null, null, [["music", 59.22], ["synthesizer", 13.12], ["musical instrument", 6.91]], [["music", 54.57], ["brass instrument", 9.84], ["musical instrument", 9.59]], [["music", 37.09], ["echo", 9.87], ["didgeridoo", 7.32]]], "duration": [0.05, 12.01, 0.34, 8.95, -0.01, 0.02, 0.05, 0.46, 14.98, 6.78, 0.98, 1.66, 17.67, 17.79, 4.3]} \ No newline at end of file diff --git a/annotations_filtered/nuVzF_r0kHQ_filtered.json b/annotations_filtered/nuVzF_r0kHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..061fab451e8301fa2dd697f75bb2fa1380d309c0 --- /dev/null +++ b/annotations_filtered/nuVzF_r0kHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.62], [12.0, 15.89], [17.0, 32.61], [33.0, 53.06], [54.0, 57.7], [61.0, 63.04], [65.0, 70.06], [73.0, 77.35], [78.0, 82.04]], "keep_status": [false, false, false, true, false, false, false, false, false], "silence_prob": [64.86, 99.31, 82.97, 38.59, 97.73, 71.29, 82.07, 86.45, 99.87], "audiomae_on_audioset": [null, null, null, [["hum", 18.07], ["hammer", 9.5], ["fly, housefly", 8.7]], null, null, null, null, null], "duration": [2.62, 3.89, 15.61, 20.06, 3.7, 2.04, 5.06, 4.35, 4.04]} \ No newline at end of file diff --git a/annotations_filtered/nudL_t9u78o_filtered.json b/annotations_filtered/nudL_t9u78o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38f0766aec91806cda192cf5242f2b0cdc6e212d --- /dev/null +++ b/annotations_filtered/nudL_t9u78o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.79], [11.0, 10.86], [11.0, 10.96], [11.0, 11.03], [11.0, 11.06], [11.0, 48.74], [58.0, 78.0], [80.0, 97.63], [100.0, 100.55], [101.0, 108.06], [108.0, 108.36], [108.0, 111.77], [114.0, 145.27], [146.0, 159.34], [160.0, 164.39], [169.0, 175.69], [176.0, 175.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.57, 33.49, 0.0, 34.35, 0.0, 28.99, 0.0, 43.35, 99.84, 31.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 60.56], ["mains hum", 15.18], ["music", 14.24]], [["whale vocalization", 37.45], ["music", 36.98], ["electronic music", 4.49]], null, [["hum", 45.9], ["mains hum", 24.97], ["music", 16.41]], null, [["music", 36.59], ["noise", 14.47], ["speech", 10.94]], null, [["music", 49.06], ["sonar", 9.34], ["singing bowl", 5.33]], null, [["music", 60.06], ["theremin", 5.86], ["hum", 4.66]], null], "duration": [-0.21, -0.14, -0.04, 0.03, 0.06, 37.74, 20.0, 17.63, 0.55, 7.06, 0.36, 3.77, 31.27, 13.34, 4.39, 6.69, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/nukRk0WMspo_filtered.json b/annotations_filtered/nukRk0WMspo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9234153fc8709f475a2895e45bdba64ef2c722f3 --- /dev/null +++ b/annotations_filtered/nukRk0WMspo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.91], [13.0, 14.05], [17.0, 17.09], [21.0, 20.97], [22.0, 22.38], [24.0, 24.26], [29.0, 29.74], [31.0, 31.83], [32.0, 32.51], [38.0, 39.12], [58.0, 60.84], [62.0, 69.21], [70.0, 73.03], [74.0, 77.21], [80.0, 84.06], [86.0, 87.29], [88.0, 90.24], [108.0, 108.41], [112.0, 112.97], [116.0, 119.8], [120.0, 121.93], [122.0, 125.54], [129.0, 129.83], [132.0, 135.08], [137.0, 138.28], [146.0, 146.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 90.6, 74.13, 92.64, 64.52, 0.0, 72.01, 0.0, 0.0, 100.0, 0.0, 85.9, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.09, 1.05, 0.09, -0.03, 0.38, 0.26, 0.74, 0.83, 0.51, 1.12, 2.84, 7.21, 3.03, 3.21, 4.06, 1.29, 2.24, 0.41, 0.97, 3.8, 1.93, 3.54, 0.83, 3.08, 1.28, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/nur4g4r1LN4_filtered.json b/annotations_filtered/nur4g4r1LN4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ac856fe674b7787498768db90635358e18045cd --- /dev/null +++ b/annotations_filtered/nur4g4r1LN4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 55.54], [56.0, 57.77], [59.0, 65.77], [68.0, 69.01], [69.0, 113.81], [115.0, 121.02], [122.0, 140.76], [141.0, 144.69], [146.0, 165.59]], "keep_status": [true, false, true, false, false, true, true, true, true], "silence_prob": [29.65, 0.0, 30.65, 0.0, 0.0, 29.22, 31.13, 30.53, 30.87], "audiomae_on_audioset": [[["animal", 8.95], ["hum", 6.94], ["heart sounds, heartbeat", 5.58]], null, [["arrow", 9.66], ["insect", 6.27], ["explosion", 6.25]], null, null, [["rumble", 39.19], ["speech", 14.1], ["hum", 7.12]], [["squish", 15.2], ["snake", 10.35], ["gurgling", 5.59]], [["speech", 39.66], ["whale vocalization", 7.66], ["rumble", 5.75]], [["whale vocalization", 19.57], ["gurgling", 9.37], ["white noise", 7.58]]], "duration": [24.54, 1.77, 6.77, 1.01, 44.81, 6.02, 18.76, 3.69, 19.59]} \ No newline at end of file diff --git a/annotations_filtered/nvAZrrDwecI_filtered.json b/annotations_filtered/nvAZrrDwecI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45e4f6f850577c7531bf07becce518459a7c68fc --- /dev/null +++ b/annotations_filtered/nvAZrrDwecI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [8.0, 11.04], [12.0, 13.68], [15.0, 15.28], [19.0, 18.76], [29.0, 30.45], [31.0, 31.87], [35.0, 35.8], [39.0, 39.8], [41.0, 40.78], [43.0, 43.7], [46.0, 49.98], [51.0, 52.22], [57.0, 60.84], [61.0, 61.86], [65.0, 66.31], [67.0, 67.2], [73.0, 73.79], [78.0, 79.44], [84.0, 85.36], [86.0, 88.6], [90.0, 91.15], [92.0, 92.87], [96.0, 96.53], [97.0, 111.42], [113.0, 112.77], [113.0, 113.14], [114.0, 115.16], [115.0, 116.41], [116.0, 120.7], [124.0, 124.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.3, 0.0, 74.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 60.23, 0.0, 0.0, 0.0, 0.0, 48.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.61], ["music", 20.98], ["hum", 5.9]], null], "duration": [0.34, 3.04, 1.68, 0.28, -0.24, 1.45, 0.87, 0.8, 0.8, -0.22, 0.7, 3.98, 1.22, 3.84, 0.86, 1.31, 0.2, 0.79, 1.44, 1.36, 2.6, 1.15, 0.87, 0.53, 14.42, -0.23, 0.14, 1.16, 1.41, 4.7, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/nvFln5J-6uY_filtered.json b/annotations_filtered/nvFln5J-6uY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cd118886a3d949fa8781eafaa3b2cbd1b576c0e --- /dev/null +++ b/annotations_filtered/nvFln5J-6uY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.37], [10.0, 11.26], [12.0, 13.09], [15.0, 15.4], [17.0, 17.78], [18.0, 19.67], [22.0, 22.52], [23.0, 23.68], [27.0, 27.21], [28.0, 28.76], [30.0, 31.67], [35.0, 37.35], [39.0, 39.5], [44.0, 46.67], [49.0, 49.44], [63.0, 62.99], [63.0, 65.67], [67.0, 67.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [70.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.22, 0.0, 66.63, 0.0, 0.0, 47.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 37.43], ["speech", 29.91], ["hum", 8.37]], null], "duration": [3.37, 1.26, 1.09, 0.4, 0.78, 1.67, 0.52, 0.68, 0.21, 0.76, 1.67, 2.35, 0.5, 2.67, 0.44, -0.01, 2.67, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/nvdBfpA8r4o_filtered.json b/annotations_filtered/nvdBfpA8r4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c07275d606de2ddc08962be2d5697244ec884e7d --- /dev/null +++ b/annotations_filtered/nvdBfpA8r4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.82], [17.0, 18.35], [20.0, 31.6], [33.0, 41.82], [44.0, 51.49], [53.0, 56.22], [57.0, 58.58], [60.0, 68.05], [70.0, 73.16], [74.0, 130.87], [132.0, 132.24], [134.0, 136.56], [138.0, 138.45], [140.0, 141.34], [142.0, 144.02], [145.0, 146.58], [147.0, 147.63], [149.0, 150.99], [154.0, 154.36], [155.0, 156.03], [157.0, 157.99], [161.0, 161.69], [163.0, 164.37], [165.0, 167.66], [169.0, 169.69], [172.0, 172.44], [173.0, 176.79], [178.0, 181.5], [183.0, 183.34], [184.0, 186.36], [190.0, 192.37], [194.0, 194.46], [195.0, 202.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.96, 92.8, 100.0, 99.71, 0.0, 98.1, 99.98, 0.0, 0.0, 99.97, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.59, 0.0, 0.0, 95.37, 74.92, 0.0, 69.47, 73.82, 0.0, 81.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 25.09], ["boing", 19.24], ["sidetone", 6.8]], null, null, null, null, null, null, null, null, null], "duration": [0.82, 1.35, 11.6, 8.82, 7.49, 3.22, 1.58, 8.05, 3.16, 56.87, 0.24, 2.56, 0.45, 1.34, 2.02, 1.58, 0.63, 1.99, 0.36, 1.03, 0.99, 0.69, 1.37, 2.66, 0.69, 0.44, 3.79, 3.5, 0.34, 2.36, 2.37, 0.46, 7.34]} \ No newline at end of file diff --git a/annotations_filtered/nvldRH4OC_k_filtered.json b/annotations_filtered/nvldRH4OC_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..294d914ae7669f49166eafb3e72c9344ba129a94 --- /dev/null +++ b/annotations_filtered/nvldRH4OC_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.64], [18.0, 18.4], [31.0, 37.18], [37.0, 54.45]], "keep_status": [false, false, true, false], "silence_prob": [31.85, 0.0, 29.63, 29.92], "audiomae_on_audioset": [[["music", 39.1], ["boing", 20.45], ["speech", 18.52]], null, [["hum", 34.87], ["music", 16.79], ["mains hum", 16.09]], [["speech", 39.32], ["music", 30.31], ["synthesizer", 6.86]]], "duration": [3.64, 0.4, 6.18, 17.45]} \ No newline at end of file diff --git a/annotations_filtered/nwQ5zHdDFng_filtered.json b/annotations_filtered/nwQ5zHdDFng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f03b83fb00541387987488a6f9c41d3ebe94caa6 --- /dev/null +++ b/annotations_filtered/nwQ5zHdDFng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.53], [38.0, 37.89], [38.0, 38.97], [44.0, 57.48], [59.0, 66.39], [67.0, 67.51], [68.0, 69.36], [71.0, 71.52], [72.0, 72.52], [74.0, 74.43], [77.0, 78.31], [79.0, 79.64], [81.0, 82.21], [83.0, 83.67], [86.0, 87.39], [88.0, 88.53], [93.0, 95.15], [96.0, 97.93], [99.0, 100.45], [102.0, 102.69], [103.0, 104.45], [105.0, 107.08], [107.0, 122.89]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 44.75, 35.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.07, 0.0, 0.0, 0.0, 0.0, 31.88, 42.3], "audiomae_on_audioset": [null, null, null, [["animal", 8.4], ["bouncing", 7.49], ["rowboat, canoe, kayak", 7.31]], [["speech", 44.4], ["radio", 33.32], ["noise", 3.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.79], ["echo", 8.86], ["didgeridoo", 7.86]], [["speech", 76.22], ["radio", 15.79], ["sidetone", 2.39]]], "duration": [0.53, -0.11, 0.97, 13.48, 7.39, 0.51, 1.36, 0.52, 0.52, 0.43, 1.31, 0.64, 1.21, 0.67, 1.39, 0.53, 2.15, 1.93, 1.45, 0.69, 1.45, 2.08, 15.89]} \ No newline at end of file diff --git a/annotations_filtered/nwrLvq5W58o_filtered.json b/annotations_filtered/nwrLvq5W58o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..808572335bb2c72fe6dc2b03f1e551609db15aaa --- /dev/null +++ b/annotations_filtered/nwrLvq5W58o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.62], [11.0, 16.28], [17.0, 16.97], [18.0, 18.84], [27.0, 27.18], [28.0, 33.91], [43.0, 43.97], [47.0, 48.36], [49.0, 48.59], [49.0, 49.0], [54.0, 55.8], [56.0, 57.91], [64.0, 64.3], [67.0, 68.28], [71.0, 109.93], [111.0, 112.36], [113.0, 134.38], [137.0, 137.44], [139.0, 139.38], [141.0, 143.85], [145.0, 145.49], [146.0, 149.49], [151.0, 155.31], [157.0, 161.42], [165.0, 165.11], [169.0, 169.59]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 29.43, 0.0, 0.0, 0.0, 32.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.63, 0.0, 0.0, 29.55, 0.0, 31.39, 30.88, 31.93, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 61.69], ["speech", 18.75], ["sound effect", 2.92]], null, null, null, [["music", 13.9], ["cattle, bovinae", 9.0], ["speech", 8.88]], null, null, null, null, null, null, null, null, null, null, [["music", 83.59], ["theremin", 2.47], ["scary music", 1.54]], null, null, [["music", 30.71], ["sound effect", 10.95], ["speech", 10.21]], null, [["music", 52.76], ["throbbing", 22.35], ["hum", 4.42]], [["whack, thwack", 32.93], ["music", 29.09], ["thunk", 6.15]], [["whack, thwack", 38.41], ["music", 24.84], ["fly, housefly", 7.26]], null, null], "duration": [0.62, 5.28, -0.03, 0.84, 0.18, 5.91, 0.97, 1.36, -0.41, 0.0, 1.8, 1.91, 0.3, 1.28, 38.93, 1.36, 21.38, 0.44, 0.38, 2.85, 0.49, 3.49, 4.31, 4.42, 0.11, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/nwt-V8xfwkQ_filtered.json b/annotations_filtered/nwt-V8xfwkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ed540f1de616005525fd6350a859fb678a213cb --- /dev/null +++ b/annotations_filtered/nwt-V8xfwkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.83], [11.0, 12.06], [13.0, 60.89], [62.0, 62.48], [63.0, 77.94], [79.0, 108.43], [111.0, 124.55], [125.0, 155.61], [156.0, 156.63]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [32.3, 0.0, 0.0, 0.0, 29.5, 29.63, 30.73, 0.0, 0.0], "audiomae_on_audioset": [[["music", 75.46], ["hum", 7.12], ["throbbing", 3.44]], null, null, null, [["speech", 72.9], ["music", 6.87], ["outside, rural or natural", 2.46]], [["hum", 43.82], ["throbbing", 12.0], ["mains hum", 11.98]], [["whack, thwack", 46.34], ["speech", 14.85], ["whip", 12.59]], null, null], "duration": [2.83, 1.06, 47.89, 0.48, 14.94, 29.43, 13.55, 30.61, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/nx002D9N6qU_filtered.json b/annotations_filtered/nx002D9N6qU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2806280ae5013ccd4e0cd761933d72775af64e06 --- /dev/null +++ b/annotations_filtered/nx002D9N6qU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 34.64], [36.0, 42.94], [44.0, 60.13], [63.0, 63.26], [63.0, 66.07], [68.0, 71.41], [73.0, 75.41], [77.0, 81.53], [83.0, 96.67]], "keep_status": [false, true, true, false, true, false, true, true, false], "silence_prob": [48.74, 46.22, 31.55, 0.0, 31.77, 39.09, 35.52, 32.77, 33.7], "audiomae_on_audioset": [[["throbbing", 45.08], ["music", 21.89], ["hum", 9.65]], [["music", 38.94], ["throbbing", 21.98], ["hum", 3.98]], [["music", 33.47], ["trombone", 11.82], ["brass instrument", 8.66]], null, [["music", 36.64], ["musical instrument", 9.86], ["brass instrument", 6.68]], [["music", 66.8], ["musical instrument", 10.3], ["classical music", 1.9]], [["music", 20.95], ["musical instrument", 17.09], ["speech", 7.71]], [["music", 38.69], ["speech", 21.38], ["theremin", 4.38]], [["music", 52.34], ["brass instrument", 20.02], ["musical instrument", 7.36]]], "duration": [17.64, 6.94, 16.13, 0.26, 3.07, 3.41, 2.41, 4.53, 13.67]} \ No newline at end of file diff --git a/annotations_filtered/nxHTPahkN6M_filtered.json b/annotations_filtered/nxHTPahkN6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e9148243ba9f287c9627e7970bc893b532a2851 --- /dev/null +++ b/annotations_filtered/nxHTPahkN6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [4.0, 8.41], [10.0, 11.28], [13.0, 13.74], [15.0, 15.63], [17.0, 19.41], [22.0, 23.03], [24.0, 25.37], [27.0, 27.09], [44.0, 45.62], [47.0, 49.55], [50.0, 51.54], [53.0, 53.67], [54.0, 55.65], [68.0, 67.63], [69.0, 70.21], [90.0, 90.68], [92.0, 93.95], [98.0, 98.64], [101.0, 103.45], [105.0, 109.41], [110.0, 110.94], [115.0, 117.22], [123.0, 123.6], [125.0, 127.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.17, 0.0, 0.0, 0.0, 54.9, 0.0, 0.0, 0.0, 0.0, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.27, 82.97, 0.0, 87.74, 0.0, 50.21], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, 4.41, 1.28, 0.74, 0.63, 2.41, 1.03, 1.37, 0.09, 1.62, 2.55, 1.54, 0.67, 1.65, -0.37, 1.21, 0.68, 1.95, 0.64, 2.45, 4.41, 0.94, 2.22, 0.6, 2.21]} \ No newline at end of file diff --git a/annotations_filtered/nxRZisFQdTE_filtered.json b/annotations_filtered/nxRZisFQdTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef81936cc35036f663750857326dcdaed2a3f7c1 --- /dev/null +++ b/annotations_filtered/nxRZisFQdTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.2], [11.0, 11.48], [15.0, 16.41], [24.0, 24.29], [29.0, 37.93], [40.0, 40.81], [42.0, 42.94], [45.0, 47.87], [59.0, 59.78], [67.0, 68.17], [72.0, 72.54], [89.0, 92.75], [97.0, 101.46], [102.0, 103.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.72, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 94.07, 36.67, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 75.49], ["speech", 11.44], ["throbbing", 2.77]], null, null, null, null, null, null, null, [["speech", 57.11], ["whale vocalization", 3.9], ["cheering", 3.1]], null], "duration": [1.2, 0.48, 1.41, 0.29, 8.93, 0.81, 0.94, 2.87, 0.78, 1.17, 0.54, 3.75, 4.46, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/nxTEOyfchP8_filtered.json b/annotations_filtered/nxTEOyfchP8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a80a915f1ed65996db70b704baf0f381982974b --- /dev/null +++ b/annotations_filtered/nxTEOyfchP8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.19], [20.0, 27.31], [28.0, 28.71], [31.0, 32.1], [33.0, 33.52], [35.0, 40.24], [46.0, 46.89], [49.0, 52.34], [54.0, 54.68], [61.0, 81.09], [82.0, 82.54], [83.0, 82.86], [88.0, 91.93], [93.0, 95.27], [101.0, 100.9], [103.0, 103.57], [104.0, 106.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [71.0, 84.98, 0.0, 0.0, 0.0, 90.6, 0.0, 100.0, 0.0, 33.71, 0.0, 0.0, 76.7, 69.47, 0.0, 0.0, 49.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 74.5], ["music", 11.48], ["noise", 2.39]], null, null, null, null, null, null, [["music", 43.75], ["speech", 32.69], ["hum", 2.16]]], "duration": [3.19, 7.31, 0.71, 1.1, 0.52, 5.24, 0.89, 3.34, 0.68, 20.09, 0.54, -0.14, 3.93, 2.27, -0.1, 0.57, 2.03]} \ No newline at end of file diff --git a/annotations_filtered/nxWj-7FF4CI_filtered.json b/annotations_filtered/nxWj-7FF4CI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/nxWj-7FF4CI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/nxc6kwBYFSM_filtered.json b/annotations_filtered/nxc6kwBYFSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b805fbb024b092425487d82e9929bbcfa8338e8 --- /dev/null +++ b/annotations_filtered/nxc6kwBYFSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 22.5], [40.0, 41.0], [42.0, 43.31], [43.0, 51.88], [60.0, 61.97], [69.0, 69.25], [74.0, 75.05], [76.0, 77.85], [83.0, 85.99], [98.0, 98.58], [101.0, 101.55], [105.0, 109.65], [113.0, 115.43], [116.0, 116.5], [126.0, 128.39]], "keep_status": [true, false, false, true, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [30.48, 0.0, 0.0, 31.5, 0.0, 0.0, 0.0, 0.0, 29.7, 0.0, 0.0, 29.54, 36.02, 0.0, 30.74], "audiomae_on_audioset": [[["whale vocalization", 58.02], ["livestock, farm animals, working animals", 4.71], ["moo", 2.64]], null, null, [["speech", 22.41], ["didgeridoo", 9.4], ["fart", 8.1]], null, null, null, null, [["groan", 14.35], ["whale vocalization", 13.34], ["screaming", 13.27]], null, null, [["speech", 49.34], ["groan", 10.42], ["screaming", 7.09]], [["cattle, bovinae", 46.21], ["livestock, farm animals, working animals", 26.15], ["moo", 14.46]], null, [["fart", 18.54], ["beatboxing", 11.65], ["groan", 8.27]]], "duration": [2.5, 1.0, 1.31, 8.88, 1.97, 0.25, 1.05, 1.85, 2.99, 0.58, 0.55, 4.65, 2.43, 0.5, 2.39]} \ No newline at end of file diff --git a/annotations_filtered/nxdpR5oyCOs_filtered.json b/annotations_filtered/nxdpR5oyCOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4602f5b0689655bfc75a63973e7b24f612be2204 --- /dev/null +++ b/annotations_filtered/nxdpR5oyCOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.53], [34.0, 34.45], [56.0, 60.03], [76.0, 75.96], [78.0, 79.14]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 32.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 22.32], ["moo", 14.59], ["livestock, farm animals, working animals", 8.75]], null, null], "duration": [0.53, 0.45, 4.03, -0.04, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/nxmaYsZjnXo_filtered.json b/annotations_filtered/nxmaYsZjnXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c33e65509716dd26144b46c3fd2dee1b98652d8a --- /dev/null +++ b/annotations_filtered/nxmaYsZjnXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.36], [9.0, 12.07], [14.0, 16.14], [16.0, 17.22], [21.0, 22.01], [24.0, 24.34], [25.0, 31.87], [35.0, 44.68], [49.0, 52.12], [56.0, 56.64], [58.0, 62.36], [64.0, 63.93], [65.0, 67.1], [68.0, 88.67], [91.0, 92.52], [95.0, 96.18], [98.0, 98.47], [99.0, 100.35], [101.0, 102.07], [103.0, 103.72], [105.0, 105.83], [107.0, 108.45], [110.0, 111.0], [114.0, 116.01], [120.0, 120.93], [122.0, 123.2], [125.0, 125.85], [128.0, 130.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.9, 98.1, 99.91, 0.0, 0.0, 0.0, 97.92, 99.05, 100.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0, 99.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.36, 3.07, 2.14, 1.22, 1.01, 0.34, 6.87, 9.68, 3.12, 0.64, 4.36, -0.07, 2.1, 20.67, 1.52, 1.18, 0.47, 1.35, 1.07, 0.72, 0.83, 1.45, 1.0, 2.01, 0.93, 1.2, 0.85, 2.06]} \ No newline at end of file diff --git a/annotations_filtered/nxvXYa6n0pY_filtered.json b/annotations_filtered/nxvXYa6n0pY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce897ec26166461dae8ae0513cc1508d83faa4eb --- /dev/null +++ b/annotations_filtered/nxvXYa6n0pY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.33], [8.0, 9.02], [11.0, 11.13], [16.0, 17.61], [20.0, 21.39], [22.0, 22.86], [24.0, 27.97], [30.0, 30.4], [33.0, 34.7], [36.0, 51.8], [53.0, 55.58], [57.0, 58.97], [60.0, 65.23], [69.0, 74.53], [77.0, 77.33], [78.0, 78.8], [82.0, 83.32], [85.0, 88.92], [91.0, 92.21], [94.0, 94.37], [98.0, 98.56], [100.0, 100.43], [106.0, 107.49], [109.0, 110.27], [114.0, 116.36], [118.0, 118.59], [120.0, 121.32], [124.0, 124.14], [130.0, 129.96], [136.0, 138.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.71, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 50.66, 94.52, 0.0, 52.27, 31.1, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 80.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 24.9], ["gunshot, gunfire", 19.12], ["machine gun", 15.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.33, 1.02, 0.13, 1.61, 1.39, 0.86, 3.97, 0.4, 1.7, 15.8, 2.58, 1.97, 5.23, 5.53, 0.33, 0.8, 1.32, 3.92, 1.21, 0.37, 0.56, 0.43, 1.49, 1.27, 2.36, 0.59, 1.32, 0.14, -0.04, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/nyKJeXDoqnw_filtered.json b/annotations_filtered/nyKJeXDoqnw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3b1c3e6dae189703bed3b1556b06e2acc1b9ca4 --- /dev/null +++ b/annotations_filtered/nyKJeXDoqnw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.03], [7.0, 8.11], [9.0, 9.63], [12.0, 12.95], [14.0, 15.11], [17.0, 18.13], [19.0, 19.57], [22.0, 21.79], [23.0, 22.65], [26.0, 27.72], [28.0, 28.92], [34.0, 35.97], [38.0, 39.21], [39.0, 40.0], [42.0, 42.6], [43.0, 44.0], [46.0, 46.8], [49.0, 49.62], [50.0, 50.52], [52.0, 52.98], [56.0, 55.75], [57.0, 57.6], [58.0, 59.78], [60.0, 61.03], [62.0, 63.37], [64.0, 67.12], [71.0, 72.67], [76.0, 77.31], [79.0, 81.5], [84.0, 86.54], [89.0, 95.84], [98.0, 99.12], [115.0, 116.31], [117.0, 119.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 99.56, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.03, 1.11, 0.63, 0.95, 1.11, 1.13, 0.57, -0.21, -0.35, 1.72, 0.92, 1.97, 1.21, 1.0, 0.6, 1.0, 0.8, 0.62, 0.52, 0.98, -0.25, 0.6, 1.78, 1.03, 1.37, 3.12, 1.67, 1.31, 2.5, 2.54, 6.84, 1.12, 1.31, 2.47]} \ No newline at end of file diff --git a/annotations_filtered/nyMtN_aHC_8_filtered.json b/annotations_filtered/nyMtN_aHC_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcf54069975b5ee9fa7395002e539aa6f7e9dcea --- /dev/null +++ b/annotations_filtered/nyMtN_aHC_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [8.0, 11.84], [12.0, 14.45], [15.0, 15.99], [17.0, 22.6], [23.0, 23.87], [26.0, 26.45], [29.0, 30.08], [31.0, 31.82], [33.0, 33.24], [34.0, 35.04], [37.0, 37.4], [38.0, 45.03], [46.0, 46.35], [48.0, 48.76], [50.0, 50.97], [52.0, 53.22], [53.0, 55.63], [56.0, 56.84], [58.0, 59.24], [62.0, 62.46], [63.0, 63.91], [65.0, 66.07], [68.0, 68.4], [70.0, 72.33], [73.0, 74.78], [76.0, 78.26], [79.0, 80.33], [81.0, 82.43], [84.0, 84.28], [85.0, 85.9], [87.0, 88.35], [89.0, 90.49], [91.0, 92.26], [93.0, 94.63], [95.0, 96.52], [97.0, 98.39], [99.0, 101.09], [102.0, 105.73], [106.0, 107.03], [108.0, 108.3], [110.0, 110.83], [112.0, 113.02], [115.0, 118.47], [122.0, 122.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 53.34, 72.9, 0.0, 60.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.31, 0.0, 0.0, 0.0, 0.0, 46.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.52, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 80.11, 0.0, 0.0, 0.0, 0.0, 48.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 38.82], ["radio", 15.74], ["telephone", 5.94]], null, null, null, null, null, null, [["speech", 54.86], ["dial tone", 12.93], ["tuning fork", 10.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 36.74], ["radio", 17.12], ["hum", 8.15]], null], "duration": [0.51, 3.84, 2.45, 0.99, 5.6, 0.87, 0.45, 1.08, 0.82, 0.24, 1.04, 0.4, 7.03, 0.35, 0.76, 0.97, 1.22, 2.63, 0.84, 1.24, 0.46, 0.91, 1.07, 0.4, 2.33, 1.78, 2.26, 1.33, 1.43, 0.28, 0.9, 1.35, 1.49, 1.26, 1.63, 1.52, 1.39, 2.09, 3.73, 1.03, 0.3, 0.83, 1.02, 3.47, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/nyn04CxGBLs_filtered.json b/annotations_filtered/nyn04CxGBLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f4ec81f81cbcc65a3862b282cb7f877152bb0e0 --- /dev/null +++ b/annotations_filtered/nyn04CxGBLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 54.8]], "keep_status": [false], "silence_prob": [33.8], "audiomae_on_audioset": [[["hum", 49.39], ["mains hum", 18.89], ["music", 7.26]]], "duration": [5.8]} \ No newline at end of file diff --git a/annotations_filtered/nzjEYhUtRGc_filtered.json b/annotations_filtered/nzjEYhUtRGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbab43185faa9b9f711ee7d7bc0d3d92a773f5f1 --- /dev/null +++ b/annotations_filtered/nzjEYhUtRGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.92], [6.0, 6.81], [10.0, 31.85], [35.0, 38.69], [41.0, 52.89], [53.0, 67.96], [69.0, 69.26], [70.0, 129.56]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [55.81, 0.0, 32.58, 33.41, 32.64, 32.11, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 37.67], ["speech", 18.13], ["throbbing", 16.95]], [["music", 31.31], ["speech", 23.89], ["breaking", 18.95]], [["music", 39.13], ["speech", 30.89], ["smash, crash", 11.36]], [["music", 56.45], ["throbbing", 11.49], ["hum", 4.89]], null, null], "duration": [3.92, 0.81, 21.85, 3.69, 11.89, 14.96, 0.26, 59.56]} \ No newline at end of file diff --git a/annotations_filtered/nzz_3bQHyiY_filtered.json b/annotations_filtered/nzz_3bQHyiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62b47a1e20e86a3773e1da9da17a2ee9ebc2c752 --- /dev/null +++ b/annotations_filtered/nzz_3bQHyiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 34.86], [36.0, 38.23], [40.0, 110.74], [111.0, 131.89], [132.0, 131.94]], "keep_status": [false, false, false, true, false], "silence_prob": [32.01, 97.22, 0.0, 35.7, 0.0], "audiomae_on_audioset": [[["music", 37.17], ["hum", 25.15], ["mains hum", 16.23]], null, null, [["speech", 17.83], ["music", 17.33], ["rumble", 15.02]], null], "duration": [24.86, 2.23, 70.74, 20.89, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/o-0PQaLy0lc_filtered.json b/annotations_filtered/o-0PQaLy0lc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22ccebfda16ca002c424a5c5fee7f12d9e11ff8f --- /dev/null +++ b/annotations_filtered/o-0PQaLy0lc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.48], [10.0, 10.74], [12.0, 13.34], [17.0, 27.94], [29.0, 32.07], [35.0, 35.23], [38.0, 38.31], [40.0, 40.68], [41.0, 49.05], [50.0, 52.54], [53.0, 53.64], [54.0, 56.59], [74.0, 83.57], [84.0, 85.29], [92.0, 99.17], [101.0, 101.73], [103.0, 103.45], [104.0, 105.63], [117.0, 117.07], [117.0, 120.09], [129.0, 130.44], [133.0, 133.37], [134.0, 134.87], [135.0, 135.8], [139.0, 145.61], [146.0, 147.56], [152.0, 152.71], [160.0, 160.79], [162.0, 162.24], [165.0, 165.96], [167.0, 167.83], [175.0, 175.66], [178.0, 183.36], [184.0, 189.01], [193.0, 194.21], [198.0, 198.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 77.03, 81.0, 0.0, 0.0, 0.0, 34.82, 49.78, 0.0, 51.82, 65.79, 0.0, 63.74, 0.0, 0.0, 0.0, 0.0, 44.34, 0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 95.37, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 36.38], ["boing", 21.79], ["speech", 13.63]], [["speech", 61.55], ["music", 21.16], ["sidetone", 1.26]], null, null, null, null, null, null, null, null, null, [["speech", 36.43], ["music", 19.48], ["snicker", 5.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.74, 1.34, 10.94, 3.07, 0.23, 0.31, 0.68, 8.05, 2.54, 0.64, 2.59, 9.57, 1.29, 7.17, 0.73, 0.45, 1.63, 0.07, 3.09, 1.44, 0.37, 0.87, 0.8, 6.61, 1.56, 0.71, 0.79, 0.24, 0.96, 0.83, 0.66, 5.36, 5.01, 1.21, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/o-6E3Hd2OW0_filtered.json b/annotations_filtered/o-6E3Hd2OW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee49ed42355364dde2ea14b4f8b69291e6052c1e --- /dev/null +++ b/annotations_filtered/o-6E3Hd2OW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 36.15], [37.0, 63.88], [68.0, 67.86], [75.0, 116.33], [118.0, 121.07], [126.0, 127.3], [128.0, 133.03]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [38.88, 37.03, 0.0, 0.0, 30.0, 0.0, 31.93], "audiomae_on_audioset": [[["music", 34.23], ["hum", 22.22], ["mains hum", 17.6]], [["hum", 43.11], ["music", 19.12], ["throbbing", 17.78]], null, null, [["explosion", 24.11], ["burst, pop", 11.95], ["whack, thwack", 9.87]], null, [["insect", 35.47], ["fly, housefly", 24.8], ["speech", 11.17]]], "duration": [6.15, 26.88, -0.14, 41.33, 3.07, 1.3, 5.03]} \ No newline at end of file diff --git a/annotations_filtered/o-Hcz6we0mk_filtered.json b/annotations_filtered/o-Hcz6we0mk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..507fb61e87584231496bbe3ecb5f65fd4a1f2bc3 --- /dev/null +++ b/annotations_filtered/o-Hcz6we0mk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[80.0, 82.58], [83.0, 83.13], [83.0, 93.48], [96.0, 117.59], [118.0, 127.53]], "keep_status": [true, false, true, true, true], "silence_prob": [40.52, 0.0, 32.77, 35.12, 38.36], "audiomae_on_audioset": [[["speech", 54.24], ["music", 9.16], ["whale vocalization", 6.06]], null, [["speech", 43.36], ["whimper", 9.68], ["explosion", 8.82]], [["music", 11.31], ["noise", 10.09], ["effects unit", 7.47]], [["music", 20.04], ["speech", 15.4], ["boing", 10.94]]], "duration": [2.58, 0.13, 10.48, 21.59, 9.53]} \ No newline at end of file diff --git a/annotations_filtered/o-OKsTWIVxk_filtered.json b/annotations_filtered/o-OKsTWIVxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..547062b6f0e71e0455a0fd50948eaa3443c24858 --- /dev/null +++ b/annotations_filtered/o-OKsTWIVxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.18], [12.0, 17.14], [19.0, 19.28], [34.0, 33.71], [34.0, 33.74], [37.0, 36.83], [47.0, 47.21], [49.0, 49.67], [61.0, 65.16], [69.0, 70.87], [73.0, 85.41], [86.0, 86.8], [100.0, 100.6], [101.0, 101.24], [103.0, 103.74], [105.0, 105.29], [114.0, 114.88], [117.0, 117.07], [126.0, 125.81], [129.0, 129.78], [141.0, 141.24], [142.0, 143.75], [144.0, 144.68], [151.0, 151.07]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.92, 0.0, 30.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 37.47], ["hum", 16.85], ["mains hum", 14.57]], null, null, null, null, null, null, [["sidetone", 37.03], ["music", 34.33], ["speech", 11.38]], null, [["music", 77.34], ["boing", 3.31], ["synthesizer", 3.23]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.18, 5.14, 0.28, -0.29, -0.26, -0.17, 0.21, 0.67, 4.16, 1.87, 12.41, 0.8, 0.6, 0.24, 0.74, 0.29, 0.88, 0.07, -0.19, 0.78, 0.24, 1.75, 0.68, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/o-_ochO9CFQ_filtered.json b/annotations_filtered/o-_ochO9CFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eace1008a72ceae8fc77ac43d047f6c72ce5fb65 --- /dev/null +++ b/annotations_filtered/o-_ochO9CFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [3.0, 3.54], [16.0, 16.9], [27.0, 31.82], [33.0, 34.67], [36.0, 39.26], [42.0, 42.57], [44.0, 44.79], [46.0, 47.48], [49.0, 49.4], [54.0, 54.4], [56.0, 56.76], [58.0, 57.96], [60.0, 60.3], [61.0, 61.62], [62.0, 64.64], [65.0, 66.16], [70.0, 70.75], [71.0, 74.09], [76.0, 75.88], [76.0, 77.75], [81.0, 87.93], [89.0, 90.51], [92.0, 94.36], [95.0, 98.02], [99.0, 104.52], [106.0, 128.9], [130.0, 168.66], [170.0, 172.69], [176.0, 178.41], [179.0, 179.66], [181.0, 182.43], [184.0, 188.74], [191.0, 195.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.59, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 99.05, 0.0, 0.0, 97.0, 0.0, 99.52, 99.21, 99.96, 94.95, 0.0, 88.28, 99.92, 0.0, 0.0, 81.89, 61.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 0.54, 0.9, 4.82, 1.67, 3.26, 0.57, 0.79, 1.48, 0.4, 0.4, 0.76, -0.04, 0.3, 0.62, 2.64, 1.16, 0.75, 3.09, -0.12, 1.75, 6.93, 1.51, 2.36, 3.02, 5.52, 22.9, 38.66, 2.69, 2.41, 0.66, 1.43, 4.74, 4.13]} \ No newline at end of file diff --git a/annotations_filtered/o-cA_1F05bU_filtered.json b/annotations_filtered/o-cA_1F05bU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12acb35a878ca506bfaefcbb984e586cfee2c6da --- /dev/null +++ b/annotations_filtered/o-cA_1F05bU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.64], [5.0, 6.56], [8.0, 8.16], [10.0, 11.03], [12.0, 13.15], [14.0, 20.14], [21.0, 27.21], [29.0, 29.39], [32.0, 33.67], [35.0, 35.24], [38.0, 38.45], [44.0, 47.58], [49.0, 50.13], [54.0, 54.85], [56.0, 56.83], [58.0, 58.33], [60.0, 60.44], [62.0, 64.44], [66.0, 65.94], [67.0, 83.78], [84.0, 84.38], [86.0, 91.42], [92.0, 102.27], [103.0, 111.37], [122.0, 131.68], [140.0, 142.59]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 30.3, 0.0, 0.0, 0.0, 0.0, 61.37, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 54.23, 0.0, 52.45, 48.14, 31.95, 50.71, 91.3], "audiomae_on_audioset": [null, null, null, null, null, null, [["explosion", 29.28], ["burst, pop", 26.23], ["speech", 13.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.66], ["electric shaver, electric razor", 21.52], ["hum", 12.87]], [["speech", 29.08], ["explosion", 18.85], ["burst, pop", 9.34]], null, null], "duration": [1.64, 1.56, 0.16, 1.03, 1.15, 6.14, 6.21, 0.39, 1.67, 0.24, 0.45, 3.58, 1.13, 0.85, 0.83, 0.33, 0.44, 2.44, -0.06, 16.78, 0.38, 5.42, 10.27, 8.37, 9.68, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/o-e8eejeHLA_filtered.json b/annotations_filtered/o-e8eejeHLA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af50d1aec82dab5e97af1d35a6f4400ac1ecdba8 --- /dev/null +++ b/annotations_filtered/o-e8eejeHLA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 46.13], [47.0, 48.17], [55.0, 55.32], [57.0, 57.65], [59.0, 59.24], [60.0, 62.5], [63.0, 64.23], [65.0, 69.11], [70.0, 70.21], [70.0, 70.77], [71.0, 74.63], [77.0, 77.18], [78.0, 78.38], [80.0, 80.43], [83.0, 83.74], [84.0, 84.7], [86.0, 86.04], [87.0, 87.39], [90.0, 96.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 51.34, 0.0, 0.0, 61.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.83], ["synthesizer", 15.69], ["noise", 12.47]]], "duration": [35.13, 1.17, 0.32, 0.65, 0.24, 2.5, 1.23, 4.11, 0.21, 0.77, 3.63, 0.18, 0.38, 0.43, 0.74, 0.7, 0.04, 0.39, 6.01]} \ No newline at end of file diff --git a/annotations_filtered/o-iPiN_YHjY_filtered.json b/annotations_filtered/o-iPiN_YHjY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1fcfeea8414b5d32056586dd87e3a86c893203dc --- /dev/null +++ b/annotations_filtered/o-iPiN_YHjY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.63], [6.0, 9.17], [12.0, 13.41], [18.0, 19.57], [24.0, 25.32], [27.0, 28.21], [29.0, 30.15], [31.0, 32.41], [34.0, 36.44], [37.0, 39.97], [44.0, 45.89], [47.0, 49.22], [52.0, 53.32], [54.0, 55.07], [57.0, 57.99], [59.0, 60.99], [66.0, 67.73], [69.0, 70.21], [72.0, 73.92], [75.0, 78.21], [80.0, 82.14], [83.0, 85.73], [87.0, 91.03], [92.0, 94.27], [96.0, 102.54], [105.0, 106.35], [109.0, 112.92], [114.0, 119.26], [121.0, 123.47], [124.0, 128.44], [131.0, 134.74], [136.0, 139.87], [141.0, 145.89], [147.0, 151.55], [152.0, 155.07], [156.0, 156.41], [157.0, 157.57], [166.0, 170.88]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, true, true, false, false, false], "silence_prob": [0.0, 60.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.29, 47.5, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 99.68, 48.39, 73.51, 44.46, 65.91, 0.0, 58.55, 49.22, 57.4, 41.28, 56.25, 47.27, 45.59, 43.48, 31.87, 0.0, 0.0, 29.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 22.52], ["hum", 19.64], ["mains hum", 6.71]], null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 52.66], ["speech", 16.99], ["dial tone", 10.03]], null, [["mains hum", 27.23], ["hum", 26.3], ["sidetone", 19.88]], null, null, null, [["music", 28.37], ["hum", 25.28], ["speech", 9.54]], null, [["music", 52.86], ["speech", 30.46], ["effects unit", 3.11]], null, [["music", 20.04], ["effects unit", 18.47], ["speech", 11.11]], [["music", 43.9], ["hum", 18.1], ["throbbing", 5.25]], [["music", 35.32], ["hum", 18.74], ["throbbing", 8.53]], [["music", 45.81], ["theremin", 15.09], ["sitar", 4.17]], null, null, [["music", 47.41], ["didgeridoo", 21.62], ["mains hum", 7.07]]], "duration": [1.63, 3.17, 1.41, 1.57, 1.32, 1.21, 1.15, 1.41, 2.44, 2.97, 1.89, 2.22, 1.32, 1.07, 0.99, 1.99, 1.73, 1.21, 1.92, 3.21, 2.14, 2.73, 4.03, 2.27, 6.54, 1.35, 3.92, 5.26, 2.47, 4.44, 3.74, 3.87, 4.89, 4.55, 3.07, 0.41, 0.57, 4.88]} \ No newline at end of file diff --git a/annotations_filtered/o-kmndqHfF0_filtered.json b/annotations_filtered/o-kmndqHfF0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..461273a30e4947570a3408b0b9ce0b6b5d9c4265 --- /dev/null +++ b/annotations_filtered/o-kmndqHfF0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [11.0, 10.98], [21.0, 21.98], [28.0, 28.44], [29.0, 30.37], [33.0, 33.32], [33.0, 33.37], [38.0, 40.2], [42.0, 47.63], [50.0, 51.0], [54.0, 54.77], [56.0, 56.42], [58.0, 59.39], [60.0, 62.83], [65.0, 64.96], [69.0, 69.82], [71.0, 71.81], [75.0, 75.22], [77.0, 77.25], [80.0, 80.87], [81.0, 81.9], [83.0, 86.81], [88.0, 89.04], [90.0, 90.44], [91.0, 92.47], [93.0, 93.58], [95.0, 96.48], [98.0, 100.99], [103.0, 104.3], [104.0, 105.16], [107.0, 109.0], [113.0, 113.68], [116.0, 122.32], [126.0, 129.73], [130.0, 130.5], [132.0, 132.49], [135.0, 136.19], [137.0, 140.76], [141.0, 143.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.36, 74.29, 0.0, 0.0, 0.0, 0.0, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 69.07, 0.0, 96.04, 50.71, 0.0, 0.0, 0.0, 96.54, 99.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 83.17], ["telephone", 2.61], ["inside, small room", 1.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, -0.02, 0.98, 0.44, 1.37, 0.32, 0.37, 2.2, 5.63, 1.0, 0.77, 0.42, 1.39, 2.83, -0.04, 0.82, 0.81, 0.22, 0.25, 0.87, 0.9, 3.81, 1.04, 0.44, 1.47, 0.58, 1.48, 2.99, 1.3, 1.16, 2.0, 0.68, 6.32, 3.73, 0.5, 0.49, 1.19, 3.76, 2.28]} \ No newline at end of file diff --git a/annotations_filtered/o07ecRzkLuM_filtered.json b/annotations_filtered/o07ecRzkLuM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..841373c48d1fe3edf50c3645a7ee74eb62bade6f --- /dev/null +++ b/annotations_filtered/o07ecRzkLuM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.87], [13.0, 14.86], [18.0, 19.79], [20.0, 19.82], [20.0, 22.79], [35.0, 36.37], [43.0, 43.31], [46.0, 46.13], [51.0, 51.09], [54.0, 55.63], [60.0, 60.4], [62.0, 62.77], [64.0, 64.94], [66.0, 68.15], [69.0, 69.99], [74.0, 74.82], [76.0, 76.49], [77.0, 77.82], [79.0, 79.84], [83.0, 82.88], [83.0, 86.97], [93.0, 95.13], [96.0, 96.35], [103.0, 105.33], [106.0, 105.66], [111.0, 118.1], [121.0, 121.39]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false], "silence_prob": [36.7, 0.0, 0.0, 0.0, 40.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.44, 30.98, 0.0, 55.67, 0.0, 39.91, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 57.46], ["cattle, bovinae", 20.87], ["moo", 10.21]], null, null, null, [["bee, wasp, etc.", 23.23], ["fly, housefly", 13.95], ["livestock, farm animals, working animals", 13.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.32], ["moo", 12.13], ["cattle, bovinae", 8.41]], [["speech", 23.13], ["cattle, bovinae", 12.72], ["fart", 8.59]], null, null, null, [["speech", 21.85], ["music", 20.01], ["mains hum", 13.43]], null], "duration": [3.87, 1.86, 1.79, -0.18, 2.79, 1.37, 0.31, 0.13, 0.09, 1.63, 0.4, 0.77, 0.94, 2.15, 0.99, 0.82, 0.49, 0.82, 0.84, -0.12, 3.97, 2.13, 0.35, 2.33, -0.34, 7.1, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/o0wTt_xDlpk_filtered.json b/annotations_filtered/o0wTt_xDlpk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45a249280bfba7a9fa4a114e7327f3bc324866a6 --- /dev/null +++ b/annotations_filtered/o0wTt_xDlpk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[145.0, 146.82], [148.0, 149.22], [151.0, 152.66]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [1.82, 1.22, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/o1DgvimHOvw_filtered.json b/annotations_filtered/o1DgvimHOvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1fe7a14489ee7347005e644de36e52c70741ce2d --- /dev/null +++ b/annotations_filtered/o1DgvimHOvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.28], [9.0, 11.69], [20.0, 19.8], [22.0, 24.16], [25.0, 32.73], [34.0, 38.79], [46.0, 47.01], [48.0, 51.0], [52.0, 52.1], [54.0, 56.66], [57.0, 57.65], [58.0, 58.62], [63.0, 65.99], [71.0, 71.96], [73.0, 73.47], [74.0, 74.68], [76.0, 76.28], [77.0, 78.85], [80.0, 81.97], [83.0, 82.9], [83.0, 84.52], [88.0, 88.99], [94.0, 94.59], [97.0, 98.42], [101.0, 102.36], [107.0, 109.65], [110.0, 117.78], [120.0, 121.66], [124.0, 124.34], [126.0, 126.91], [128.0, 130.71], [133.0, 133.91], [145.0, 145.66], [150.0, 150.62], [158.0, 158.35], [162.0, 162.8], [164.0, 165.84], [168.0, 168.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [73.51, 41.66, 0.0, 87.19, 53.16, 50.51, 0.0, 70.44, 0.0, 32.61, 0.0, 0.0, 34.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.68, 39.99, 0.0, 0.0, 0.0, 35.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 54.82], ["sine wave", 12.7], ["burping, eructation", 10.4]], null, null, null, null, null, null, null, [["speech", 87.54], ["inside, small room", 1.27], ["telephone", 1.02]], null, null, [["speech", 44.75], ["animal", 4.11], ["whale vocalization", 3.96]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.78], ["sine wave", 11.92], ["chirp tone", 7.52]], [["speech", 31.61], ["music", 17.42], ["chirp tone", 7.74]], null, null, null, [["speech", 69.96], ["music", 7.43], ["beatboxing", 4.51]], null, null, null, null, null, null, null], "duration": [2.28, 2.69, -0.2, 2.16, 7.73, 4.79, 1.01, 3.0, 0.1, 2.66, 0.65, 0.62, 2.99, 0.96, 0.47, 0.68, 0.28, 1.85, 1.97, -0.1, 1.52, 0.99, 0.59, 1.42, 1.36, 2.65, 7.78, 1.66, 0.34, 0.91, 2.71, 0.91, 0.66, 0.62, 0.35, 0.8, 1.84, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/o1Izq-E3o7Y_filtered.json b/annotations_filtered/o1Izq-E3o7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..393343c04bf3e203fa03a2c6c5fa2752c9606610 --- /dev/null +++ b/annotations_filtered/o1Izq-E3o7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.01], [13.0, 14.08], [15.0, 20.41], [21.0, 26.05], [27.0, 38.67], [39.0, 40.71], [46.0, 45.96], [50.0, 72.79], [73.0, 76.84], [78.0, 79.07], [80.0, 95.25], [99.0, 99.82], [100.0, 106.98], [110.0, 111.79], [119.0, 121.74], [123.0, 124.07], [130.0, 173.55], [174.0, 174.5]], "keep_status": [true, false, false, true, true, false, false, false, true, false, false, false, true, false, true, false, false, false], "silence_prob": [30.85, 0.0, 41.98, 34.32, 32.84, 0.0, 0.0, 32.5, 30.88, 0.0, 30.89, 0.0, 30.88, 0.0, 33.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 30.07], ["trombone", 22.87], ["brass instrument", 16.07]], null, [["foghorn", 67.56], ["music", 8.61], ["echo", 2.17]], [["music", 34.57], ["foghorn", 9.9], ["gong", 5.96]], [["gong", 33.17], ["music", 27.59], ["hum", 4.37]], null, null, [["music", 60.9], ["theremin", 11.95], ["musical instrument", 7.95]], [["speech", 29.3], ["echo", 20.87], ["outside, urban or manmade", 2.61]], null, [["music", 60.8], ["echo", 5.85], ["gong", 3.89]], null, [["speech", 37.25], ["music", 16.62], ["echo", 4.3]], null, [["music", 21.52], ["throbbing", 15.99], ["hum", 13.93]], null, null, null], "duration": [8.01, 1.08, 5.41, 5.05, 11.67, 1.71, -0.04, 22.79, 3.84, 1.07, 15.25, 0.82, 6.98, 1.79, 2.74, 1.07, 43.55, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/o1JgvBy3_cA_filtered.json b/annotations_filtered/o1JgvBy3_cA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43437562184bb326857aa3e6e7496a97ce9ad8bb --- /dev/null +++ b/annotations_filtered/o1JgvBy3_cA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.8], [10.0, 11.35], [14.0, 65.58], [67.0, 73.65], [75.0, 75.54], [77.0, 90.29]], "keep_status": [false, false, false, false, false, false], "silence_prob": [31.71, 0.0, 0.0, 30.77, 0.0, 31.72], "audiomae_on_audioset": [[["moo", 36.14], ["cattle, bovinae", 31.14], ["livestock, farm animals, working animals", 13.19]], null, null, [["music", 47.12], ["throbbing", 13.57], ["mains hum", 11.52]], null, [["music", 30.77], ["hum", 23.44], ["throbbing", 17.58]]], "duration": [4.8, 1.35, 51.58, 6.65, 0.54, 13.29]} \ No newline at end of file diff --git a/annotations_filtered/o1RMSG4bnrg_filtered.json b/annotations_filtered/o1RMSG4bnrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2b12149865c182d0cf0597075ebd189dca0092d --- /dev/null +++ b/annotations_filtered/o1RMSG4bnrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.16], [8.0, 8.67], [9.0, 11.74], [12.0, 13.27], [14.0, 15.31], [16.0, 16.75], [18.0, 20.46], [23.0, 23.19], [26.0, 27.03], [29.0, 31.04], [32.0, 32.63], [33.0, 34.35], [37.0, 38.69], [46.0, 47.95], [49.0, 49.17], [52.0, 53.72], [55.0, 56.3], [59.0, 60.59], [61.0, 66.45], [67.0, 68.74], [70.0, 70.75], [73.0, 74.33], [75.0, 75.68], [77.0, 77.41], [78.0, 79.24], [81.0, 83.86], [85.0, 85.53], [88.0, 87.78], [89.0, 90.1], [91.0, 91.88], [96.0, 96.26], [99.0, 99.08], [100.0, 100.82], [111.0, 112.72], [115.0, 117.29], [120.0, 123.31], [129.0, 133.41], [142.0, 153.67], [155.0, 154.99], [156.0, 156.57], [157.0, 157.82], [159.0, 159.16], [160.0, 160.78], [163.0, 163.09], [167.0, 167.88], [171.0, 171.21], [172.0, 171.96], [174.0, 174.75], [178.0, 178.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.02, 0.0, 0.0, 0.0, 97.11, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.37, 32.91, 30.81, 80.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 67.1], ["sidetone", 3.84], ["vehicle", 3.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.01], ["radio", 6.66], ["mains hum", 5.84]], null, null, null, null, null, null, null, null, null, [["gunshot, gunfire", 26.19], ["burst, pop", 8.82], ["explosion", 6.07]], [["noise", 7.91], ["firecracker", 7.65], ["gunshot, gunfire", 7.51]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.67, 2.74, 1.27, 1.31, 0.75, 2.46, 0.19, 1.03, 2.04, 0.63, 1.35, 1.69, 1.95, 0.17, 1.72, 1.3, 1.59, 5.45, 1.74, 0.75, 1.33, 0.68, 0.41, 1.24, 2.86, 0.53, -0.22, 1.1, 0.88, 0.26, 0.08, 0.82, 1.72, 2.29, 3.31, 4.41, 11.67, -0.01, 0.57, 0.82, 0.16, 0.78, 0.09, 0.88, 0.21, -0.04, 0.75, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/o1SrrJNjIh8_filtered.json b/annotations_filtered/o1SrrJNjIh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc71bdaac3785edb1daed2fb8d008e021aade852 --- /dev/null +++ b/annotations_filtered/o1SrrJNjIh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [4.0, 3.82], [6.0, 6.42], [8.0, 8.72], [13.0, 13.9], [16.0, 17.19], [18.0, 18.74], [24.0, 25.95], [28.0, 28.8], [30.0, 30.82], [31.0, 32.36], [33.0, 33.37], [34.0, 34.77], [36.0, 35.99], [37.0, 38.97], [40.0, 40.46], [41.0, 42.53], [44.0, 44.83], [45.0, 52.91], [55.0, 57.77], [61.0, 67.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.96, 37.01, 30.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 53.11], ["livestock, farm animals, working animals", 9.16], ["moo", 7.82]], [["speech", 38.79], ["outside, rural or natural", 5.26], ["field recording", 5.14]], [["speech", 35.33], ["livestock, farm animals, working animals", 9.26], ["cattle, bovinae", 5.42]]], "duration": [0.54, -0.18, 0.42, 0.72, 0.9, 1.19, 0.74, 1.95, 0.8, 0.82, 1.36, 0.37, 0.77, -0.01, 1.97, 0.46, 1.53, 0.83, 7.91, 2.77, 6.53]} \ No newline at end of file diff --git a/annotations_filtered/o1_U-Iem8fA_filtered.json b/annotations_filtered/o1_U-Iem8fA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..270cf084c971f7e8b027e8b86e317607f3dd4cfa --- /dev/null +++ b/annotations_filtered/o1_U-Iem8fA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.32], [24.0, 26.65], [28.0, 32.26], [36.0, 45.59], [49.0, 61.96], [64.0, 86.81], [91.0, 105.9], [108.0, 125.04], [126.0, 125.85], [127.0, 134.99]], "keep_status": [false, true, true, false, true, false, false, true, false, true], "silence_prob": [0.0, 30.3, 30.08, 30.68, 30.01, 30.08, 31.09, 31.08, 0.0, 31.17], "audiomae_on_audioset": [null, [["music", 32.71], ["boom", 8.2], ["cacophony", 5.77]], [["music", 25.0], ["hum", 20.09], ["throbbing", 15.32]], [["music", 59.32], ["cacophony", 13.45], ["synthesizer", 5.85]], [["music", 48.82], ["synthesizer", 7.48], ["theremin", 5.93]], [["music", 44.34], ["cacophony", 19.9], ["throbbing", 10.88]], [["sidetone", 54.9], ["music", 22.33], ["hum", 5.56]], [["music", 15.85], ["hum", 14.47], ["speech", 8.08]], null, [["music", 47.85], ["synthesizer", 7.71], ["cacophony", 6.29]]], "duration": [1.32, 2.65, 4.26, 9.59, 12.96, 22.81, 14.9, 17.04, -0.15, 7.99]} \ No newline at end of file diff --git a/annotations_filtered/o1nS19OOD-U_filtered.json b/annotations_filtered/o1nS19OOD-U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16b6141b3f461eb31c99109f277a6eee9c7036ae --- /dev/null +++ b/annotations_filtered/o1nS19OOD-U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.84], [13.0, 15.72], [17.0, 17.29], [19.0, 19.97], [22.0, 23.46], [24.0, 24.31], [27.0, 29.02], [35.0, 38.52], [44.0, 45.1], [46.0, 47.76], [49.0, 49.77], [50.0, 52.19], [53.0, 55.32], [56.0, 56.42], [57.0, 58.4], [59.0, 60.93], [65.0, 66.58], [67.0, 69.77], [73.0, 73.75], [75.0, 75.74], [77.0, 79.19], [82.0, 82.46], [84.0, 86.0], [89.0, 89.34], [93.0, 94.07], [96.0, 97.41], [99.0, 100.67], [102.0, 104.79], [108.0, 120.5], [125.0, 126.08]], "keep_status": [true, true, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.6, 37.3, 0.0, 0.0, 0.0, 0.0, 52.33, 49.27, 0.0, 0.0, 0.0, 39.58, 82.43, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 0.0, 55.67, 0.0, 62.27, 0.0, 0.0, 0.0, 0.0, 53.91, 50.21, 0.0], "audiomae_on_audioset": [[["hum", 32.55], ["music", 17.96], ["throbbing", 12.55]], [["music", 38.12], ["mains hum", 11.71], ["speech", 10.04]], null, null, null, null, null, [["music", 27.69], ["hum", 15.69], ["mains hum", 4.69]], null, null, null, [["speech", 24.97], ["hum", 24.84], ["mains hum", 17.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.84, 2.72, 0.29, 0.97, 1.46, 0.31, 2.02, 3.52, 1.1, 1.76, 0.77, 2.19, 2.32, 0.42, 1.4, 1.93, 1.58, 2.77, 0.75, 0.74, 2.19, 0.46, 2.0, 0.34, 1.07, 1.41, 1.67, 2.79, 12.5, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/o2J59hT1Vto_filtered.json b/annotations_filtered/o2J59hT1Vto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32e6b26ea8be7d749e46be30cdf4bd2571dedb97 --- /dev/null +++ b/annotations_filtered/o2J59hT1Vto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.89], [11.0, 12.78], [14.0, 14.93], [15.0, 16.53], [17.0, 17.76], [19.0, 20.04], [21.0, 21.79], [22.0, 23.6], [25.0, 25.37], [26.0, 27.09], [28.0, 29.79], [31.0, 33.18], [34.0, 62.26], [63.0, 64.54], [65.0, 69.8], [73.0, 77.28], [79.0, 85.09], [89.0, 89.21], [91.0, 92.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.54, 71.14, 0.0, 95.51, 77.87, 64.41, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.89, 1.78, 0.93, 1.53, 0.76, 1.04, 0.79, 1.6, 0.37, 1.09, 1.79, 2.18, 28.26, 1.54, 4.8, 4.28, 6.09, 0.21, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/o2VM3B_izXw_filtered.json b/annotations_filtered/o2VM3B_izXw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc307e5ce4579ad5a22993b1542ca3cff741ad1e --- /dev/null +++ b/annotations_filtered/o2VM3B_izXw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.92], [21.0, 21.79], [24.0, 23.8], [25.0, 25.46], [26.0, 26.57], [32.0, 33.49], [35.0, 36.49], [37.0, 37.56], [38.0, 38.99], [43.0, 43.9], [51.0, 51.7], [52.0, 52.05], [52.0, 53.28], [54.0, 55.0], [56.0, 57.15], [59.0, 64.77], [82.0, 82.19], [86.0, 87.2], [90.0, 91.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 68.0], ["explosion", 11.72], ["burst, pop", 5.48]], null, null, null], "duration": [0.92, 0.79, -0.2, 0.46, 0.57, 1.49, 1.49, 0.56, 0.99, 0.9, 0.7, 0.05, 1.28, 1.0, 1.15, 5.77, 0.19, 1.2, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/o2oR9qYeySU_filtered.json b/annotations_filtered/o2oR9qYeySU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d20146273019737e2c11c688198e839e802e060 --- /dev/null +++ b/annotations_filtered/o2oR9qYeySU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.48], [6.0, 16.23], [19.0, 26.74], [27.0, 36.51], [40.0, 42.35], [43.0, 50.38], [52.0, 64.03], [64.0, 71.24], [76.0, 124.09], [125.0, 126.37]], "keep_status": [false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 35.92, 74.76, 57.32, 73.36, 36.25, 59.51, 86.45, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 21.74], ["hum", 12.34], ["mains hum", 9.97]], null, null, null, [["animal", 23.58], ["livestock, farm animals, working animals", 19.04], ["moo", 18.85]], null, null, null, null], "duration": [0.48, 10.23, 7.74, 9.51, 2.35, 7.38, 12.03, 7.24, 48.09, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/o2vw_iYBAyY_filtered.json b/annotations_filtered/o2vw_iYBAyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4339f9492b6de53c9844b52577dd8cd414a7384 --- /dev/null +++ b/annotations_filtered/o2vw_iYBAyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.81], [2.0, 2.59], [4.0, 3.82], [5.0, 9.44], [9.0, 10.93], [14.0, 15.3], [17.0, 24.51], [25.0, 26.15], [27.0, 32.83], [33.0, 47.04], [49.0, 53.32], [55.0, 55.54], [58.0, 68.84], [69.0, 84.81], [86.0, 91.27], [93.0, 93.88], [95.0, 95.15], [99.0, 99.4], [101.0, 101.28], [106.0, 109.66], [111.0, 111.72], [113.0, 114.13], [117.0, 118.1], [119.0, 119.58], [120.0, 121.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.61, 0.0, 0.0, 41.87, 0.0, 61.57, 43.66, 34.27, 0.0, 37.77, 49.78, 47.98, 0.0, 0.0, 0.0, 0.0, 36.83, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 38.25], ["speech", 31.11], ["fly, housefly", 2.87]], null, null, [["fly, housefly", 33.88], ["mosquito", 20.25], ["insect", 18.19]], null, null, [["whale vocalization", 45.15], ["music", 32.17], ["speech", 2.07]], [["foghorn", 42.44], ["music", 19.59], ["speech", 4.16]], null, [["music", 48.77], ["speech", 9.25], ["theremin", 6.79]], [["whale vocalization", 68.81], ["music", 20.38], ["rowboat, canoe, kayak", 1.17]], [["speech", 43.15], ["frog", 11.96], ["music", 10.8]], null, null, null, null, [["frog", 27.35], ["speech", 24.15], ["mosquito", 7.72]], null, null, null, null, null], "duration": [0.81, 0.59, -0.18, 4.44, 1.93, 1.3, 7.51, 1.15, 5.83, 14.04, 4.32, 0.54, 10.84, 15.81, 5.27, 0.88, 0.15, 0.4, 0.28, 3.66, 0.72, 1.13, 1.1, 0.58, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/o2wFqjb9AU0_filtered.json b/annotations_filtered/o2wFqjb9AU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c13d767a25613527d4c962dd031c9e04e51f1078 --- /dev/null +++ b/annotations_filtered/o2wFqjb9AU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.56], [11.0, 11.97], [14.0, 16.38], [17.0, 17.9], [21.0, 22.22], [23.0, 27.33], [30.0, 31.35], [33.0, 44.44], [46.0, 46.28], [47.0, 50.26], [51.0, 52.81], [56.0, 56.02], [60.0, 65.3], [67.0, 67.37], [74.0, 74.61], [76.0, 77.72], [78.0, 80.0], [88.0, 88.35], [95.0, 95.01], [96.0, 96.45], [97.0, 98.78], [100.0, 100.72], [102.0, 102.69], [106.0, 107.1], [112.0, 113.14], [114.0, 114.96], [116.0, 117.31], [119.0, 119.2], [120.0, 120.85], [123.0, 123.67], [130.0, 131.08], [133.0, 133.81], [136.0, 140.29], [141.0, 142.6], [143.0, 144.31], [146.0, 147.99], [149.0, 149.98], [151.0, 152.04], [153.0, 154.5], [157.0, 164.76], [166.0, 167.0], [168.0, 177.5], [178.0, 178.51]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [38.04, 0.0, 97.92, 0.0, 0.0, 97.0, 0.0, 63.31, 0.0, 63.21, 0.0, 0.0, 69.47, 0.0, 0.0, 0.0, 84.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.16, 0.0, 32.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 27.16], ["music", 19.08], ["crying, sobbing", 7.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 28.26], ["music", 20.29], ["mains hum", 14.98]], null], "duration": [6.56, 0.97, 2.38, 0.9, 1.22, 4.33, 1.35, 11.44, 0.28, 3.26, 1.81, 0.02, 5.3, 0.37, 0.61, 1.72, 2.0, 0.35, 0.01, 0.45, 1.78, 0.72, 0.69, 1.1, 1.14, 0.96, 1.31, 0.2, 0.85, 0.67, 1.08, 0.81, 4.29, 1.6, 1.31, 1.99, 0.98, 1.04, 1.5, 7.76, 1.0, 9.5, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/o2wVetrydrY_filtered.json b/annotations_filtered/o2wVetrydrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0683cfb5ef7c99452a315c095dfd6ee5bdacdc82 --- /dev/null +++ b/annotations_filtered/o2wVetrydrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 3.16], [7.0, 21.95], [25.0, 29.15], [32.0, 51.85], [52.0, 54.46], [59.0, 62.28], [65.0, 67.19], [72.0, 73.36], [83.0, 83.1], [92.0, 97.95], [101.0, 107.89], [110.0, 110.47], [112.0, 112.94], [116.0, 117.46], [119.0, 127.47]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, true], "silence_prob": [38.51, 33.16, 30.31, 32.34, 31.2, 31.03, 30.78, 0.0, 0.0, 30.76, 32.44, 0.0, 0.0, 0.0, 46.09], "audiomae_on_audioset": [[["music", 59.12], ["didgeridoo", 9.28], ["theremin", 5.61]], [["music", 87.19], ["musical instrument", 1.75], ["effects unit", 1.65]], [["music", 28.71], ["livestock, farm animals, working animals", 23.83], ["moo", 17.89]], [["cattle, bovinae", 33.3], ["music", 26.97], ["moo", 21.44]], [["music", 48.79], ["hum", 8.79], ["throbbing", 6.07]], [["music", 77.18], ["musical instrument", 3.37], ["synthesizer", 1.19]], [["music", 68.9], ["didgeridoo", 3.99], ["musical instrument", 2.73]], null, null, [["music", 37.14], ["moo", 8.46], ["cattle, bovinae", 7.31]], [["music", 61.54], ["didgeridoo", 8.42], ["theremin", 6.25]], null, null, null, [["music", 30.07], ["speech", 18.27], ["sidetone", 13.64]]], "duration": [3.16, 14.95, 4.15, 19.85, 2.46, 3.28, 2.19, 1.36, 0.1, 5.95, 6.89, 0.47, 0.94, 1.46, 8.47]} \ No newline at end of file diff --git a/annotations_filtered/o2xprwwIMXM_filtered.json b/annotations_filtered/o2xprwwIMXM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15d01f2419f9228870e99a90112e50227807c814 --- /dev/null +++ b/annotations_filtered/o2xprwwIMXM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.07], [8.0, 10.17], [15.0, 16.12], [17.0, 17.88], [18.0, 19.8], [23.0, 23.04], [30.0, 30.59], [32.0, 33.4], [39.0, 40.47], [45.0, 49.94], [50.0, 51.7], [52.0, 53.0], [56.0, 56.74], [58.0, 59.78], [62.0, 63.26], [69.0, 70.95], [72.0, 76.82], [77.0, 78.65], [80.0, 80.62], [83.0, 83.12], [87.0, 100.97], [103.0, 104.26], [105.0, 108.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 88.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 0.0, 0.0, 0.0, 32.73, 0.0, 77.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 62.19], ["hum", 8.3], ["ambient music", 8.19]], null, null], "duration": [0.07, 2.17, 1.12, 0.88, 1.8, 0.04, 0.59, 1.4, 1.47, 4.94, 1.7, 1.0, 0.74, 1.78, 1.26, 1.95, 4.82, 1.65, 0.62, 0.12, 13.97, 1.26, 3.26]} \ No newline at end of file diff --git a/annotations_filtered/o36m-2TPwck_filtered.json b/annotations_filtered/o36m-2TPwck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3c187d7398812b8f427f8be73fdc8e024b1428c --- /dev/null +++ b/annotations_filtered/o36m-2TPwck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 18.96], [20.0, 30.72], [32.0, 47.83], [52.0, 54.67], [55.0, 55.59], [56.0, 56.91], [57.0, 58.11], [61.0, 72.05], [73.0, 76.91], [78.0, 106.19], [109.0, 138.43]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [56.63, 61.27, 63.31, 97.73, 0.0, 0.0, 0.0, 97.43, 65.2, 38.32, 45.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 31.37], ["throbbing", 19.6], ["music", 17.73]], [["animal", 16.49], ["shofar", 14.73], ["whale vocalization", 10.86]]], "duration": [10.96, 10.72, 15.83, 2.67, 0.59, 0.91, 1.11, 11.05, 3.91, 28.19, 29.43]} \ No newline at end of file diff --git a/annotations_filtered/o3aqMjrFf5k_filtered.json b/annotations_filtered/o3aqMjrFf5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7926d38ddf4e49d3d06231c413c43f100345909 --- /dev/null +++ b/annotations_filtered/o3aqMjrFf5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.37], [11.0, 10.83], [15.0, 14.57], [15.0, 14.61]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [1.37, -0.17, -0.43, -0.39]} \ No newline at end of file diff --git a/annotations_filtered/o3s4QiK4MSM_filtered.json b/annotations_filtered/o3s4QiK4MSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d0065eff5b7bc818752b43024d82bc272f9ac30 --- /dev/null +++ b/annotations_filtered/o3s4QiK4MSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.73], [7.0, 21.3], [24.0, 40.0], [42.0, 42.09], [43.0, 43.6], [44.0, 44.61], [46.0, 46.16], [47.0, 48.24], [51.0, 52.57], [53.0, 55.02], [60.0, 65.42], [71.0, 71.88], [74.0, 74.85], [76.0, 76.2], [78.0, 78.21], [79.0, 80.5], [85.0, 88.53], [92.0, 95.05], [96.0, 97.83], [99.0, 99.79], [100.0, 134.94], [136.0, 147.85], [149.0, 150.2]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 32.92, 46.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 50.26, 0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 57.32, 0.0, 0.0, 0.0, 40.38, 0.0], "audiomae_on_audioset": [null, [["speech", 56.67], ["throbbing", 11.58], ["stomach rumble", 3.43]], [["hum", 41.23], ["throbbing", 15.2], ["mains hum", 9.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.96], ["boing", 12.25], ["speech", 9.0]], null, null, null, null, [["music", 47.17], ["didgeridoo", 34.04], ["musical instrument", 2.85]], null], "duration": [1.73, 14.3, 16.0, 0.09, 0.6, 0.61, 0.16, 1.24, 1.57, 2.02, 5.42, 0.88, 0.85, 0.2, 0.21, 1.5, 3.53, 3.05, 1.83, 0.79, 34.94, 11.85, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/o3sj7nGzC64_filtered.json b/annotations_filtered/o3sj7nGzC64_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5aa29909c1a1033921ad2e02c2186815e94e498 --- /dev/null +++ b/annotations_filtered/o3sj7nGzC64_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[64.0, 65.01], [67.0, 75.0], [76.0, 81.14], [84.0, 90.05], [92.0, 99.17], [100.0, 106.35], [109.0, 110.34], [113.0, 114.52], [116.0, 116.85], [118.0, 119.47], [121.0, 121.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 69.61, 65.91, 61.97, 97.64, 32.5, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["theremin", 75.97], ["music", 16.88], ["synthesizer", 1.88]], null, null, null, null, null], "duration": [1.01, 8.0, 5.14, 6.05, 7.17, 6.35, 1.34, 1.52, 0.85, 1.47, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/o3uf4YSwY9I_filtered.json b/annotations_filtered/o3uf4YSwY9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32af783f29bba7ee3eadc15bc80208ec85810c81 --- /dev/null +++ b/annotations_filtered/o3uf4YSwY9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [23.0, 23.48], [27.0, 28.19], [34.0, 35.28], [37.0, 37.96], [38.0, 39.58], [40.0, 42.15], [43.0, 44.05], [46.0, 46.21], [53.0, 53.08], [53.0, 53.32], [54.0, 54.73], [63.0, 64.83], [68.0, 69.72], [71.0, 71.61], [81.0, 81.5], [83.0, 83.3], [86.0, 89.83], [91.0, 91.84], [97.0, 97.06], [103.0, 104.23], [110.0, 110.51], [112.0, 112.73], [120.0, 121.53], [123.0, 123.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 0.48, 1.19, 1.28, 0.96, 1.58, 2.15, 1.05, 0.21, 0.08, 0.32, 0.73, 1.83, 1.72, 0.61, 0.5, 0.3, 3.83, 0.84, 0.06, 1.23, 0.51, 0.73, 1.53, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/o3vv1SPEv1c_filtered.json b/annotations_filtered/o3vv1SPEv1c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b3706fe42acc93ce3eba54a417720ac5ebc141e --- /dev/null +++ b/annotations_filtered/o3vv1SPEv1c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.32], [4.0, 7.38], [9.0, 11.06], [12.0, 14.4], [17.0, 17.17], [20.0, 21.59], [30.0, 33.2], [38.0, 38.64], [43.0, 42.75], [50.0, 50.52], [53.0, 52.79], [59.0, 58.72], [65.0, 65.01], [72.0, 72.33], [85.0, 87.13], [88.0, 88.72], [91.0, 92.25], [93.0, 94.58], [97.0, 97.68], [103.0, 104.95], [116.0, 115.96], [117.0, 117.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.66, 69.47, 66.76, 0.0, 0.0, 53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 3.38, 2.06, 2.4, 0.17, 1.59, 3.2, 0.64, -0.25, 0.52, -0.21, -0.28, 0.01, 0.33, 2.13, 0.72, 1.25, 1.58, 0.68, 1.95, -0.04, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/o3w6MouV4NE_filtered.json b/annotations_filtered/o3w6MouV4NE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea99f083092a9503296c42abedfbbcac5cbb96b1 --- /dev/null +++ b/annotations_filtered/o3w6MouV4NE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 19.08], [20.0, 24.16], [25.0, 36.85], [38.0, 63.54], [64.0, 63.61], [64.0, 64.54], [66.0, 79.57]], "keep_status": [false, false, true, false, false, false, true], "silence_prob": [74.13, 98.1, 43.51, 31.9, 0.0, 0.0, 34.48], "audiomae_on_audioset": [null, null, [["music", 38.66], ["whale vocalization", 14.98], ["hum", 13.04]], [["music", 57.69], ["scary music", 11.9], ["hum", 7.18]], null, null, [["speech", 23.25], ["animal", 22.28], ["whale vocalization", 14.76]]], "duration": [19.08, 4.16, 11.85, 25.54, -0.39, 0.54, 13.57]} \ No newline at end of file diff --git a/annotations_filtered/o3ya6zEv3eM_filtered.json b/annotations_filtered/o3ya6zEv3eM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87edc9a5ce70cf14afbe10c47d80c85d2b3e5218 --- /dev/null +++ b/annotations_filtered/o3ya6zEv3eM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.84], [24.0, 43.8], [46.0, 93.77], [102.0, 114.67], [120.0, 120.28], [122.0, 121.8], [122.0, 122.76], [132.0, 132.71], [133.0, 150.5], [151.0, 151.56], [156.0, 158.16], [162.0, 161.65], [167.0, 167.36], [172.0, 172.94]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.85, 0.0, 30.26, 0.0, 0.0, 0.0, 0.0, 27.89, 0.0, 33.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 26.68], ["hum", 24.69], ["throbbing", 14.07]], null, [["music", 69.17], ["throbbing", 10.19], ["hum", 6.33]], null, null, null, null, [["music", 73.4], ["electronic music", 12.93], ["hum", 3.17]], null, [["radio", 33.81], ["speech", 30.59], ["sidetone", 25.38]], null, null, null], "duration": [0.84, 19.8, 47.77, 12.67, 0.28, -0.2, 0.76, 0.71, 17.5, 0.56, 2.16, -0.35, 0.36, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/o4ARk91_ptU_filtered.json b/annotations_filtered/o4ARk91_ptU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b26ead05096d27237226c6d9aedcc8216b3de2e8 --- /dev/null +++ b/annotations_filtered/o4ARk91_ptU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.5], [6.0, 8.7], [9.0, 32.29], [36.0, 90.49], [92.0, 101.92], [103.0, 104.52]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 100.0, 37.39, 0.0, 44.49, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 49.74], ["speech", 26.12], ["fly, housefly", 3.07]], null, [["fart", 25.33], ["fly, housefly", 10.57], ["grunt", 9.53]], null], "duration": [1.5, 2.7, 23.29, 54.49, 9.92, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/o4UVXgAzYb0_filtered.json b/annotations_filtered/o4UVXgAzYb0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bc22f2d2f06dfc0bba6e2e4704c4815aea61eeb --- /dev/null +++ b/annotations_filtered/o4UVXgAzYb0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.65], [5.0, 13.07], [14.0, 16.17], [17.0, 18.98], [22.0, 21.91], [25.0, 29.37], [31.0, 31.68], [34.0, 35.67], [36.0, 39.63], [41.0, 50.25], [51.0, 67.78], [71.0, 97.53], [98.0, 97.56], [98.0, 97.6], [105.0, 105.39]], "keep_status": [false, true, false, false, false, true, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 47.94, 95.78, 0.0, 0.0, 48.74, 0.0, 0.0, 88.28, 33.32, 30.34, 30.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 25.86], ["hum", 9.16], ["slosh", 8.37]], null, null, null, [["music", 20.21], ["roaring cats (lions, tigers)", 17.24], ["animal", 7.34]], null, null, null, [["music", 57.65], ["speech", 16.52], ["whack, thwack", 5.4]], [["music", 56.43], ["speech", 2.56], ["boing", 2.3]], [["music", 47.98], ["speech", 11.01], ["whip", 10.95]], null, null, null], "duration": [0.65, 8.07, 2.17, 1.98, -0.09, 4.37, 0.68, 1.67, 3.63, 9.25, 16.78, 26.53, -0.44, -0.4, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/o4lq3SOB8sw_filtered.json b/annotations_filtered/o4lq3SOB8sw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da5f633869d783b22efe941092eed431bdfe4aec --- /dev/null +++ b/annotations_filtered/o4lq3SOB8sw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.04], [11.0, 41.32], [42.0, 43.51], [44.0, 44.74], [47.0, 50.99], [53.0, 54.19], [60.0, 60.24], [67.0, 67.46], [67.0, 67.49], [68.0, 67.61], [70.0, 71.17], [73.0, 83.25], [86.0, 85.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 49.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.23, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 38.7], ["throbbing", 23.97], ["hum", 18.46]], null, null, null, null, null, null, [["music", 58.04], ["throbbing", 15.0], ["hum", 10.18]], null], "duration": [0.04, 30.32, 1.51, 0.74, 3.99, 1.19, 0.24, 0.46, 0.49, -0.39, 1.17, 10.25, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/o5CBItcNkFs_filtered.json b/annotations_filtered/o5CBItcNkFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51e072e36970d52b38614ad28ae21d496bb4c716 --- /dev/null +++ b/annotations_filtered/o5CBItcNkFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 50.41], [51.0, 98.96], [100.0, 103.57], [106.0, 107.15]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 43.98, 0.0], "audiomae_on_audioset": [null, null, [["fart", 21.25], ["speech", 15.54], ["livestock, farm animals, working animals", 10.34]], null], "duration": [0.41, 47.96, 3.57, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/o5FT3IGXtAk_filtered.json b/annotations_filtered/o5FT3IGXtAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1501e4d6cd735490ce851a1e1ae20143765223ca --- /dev/null +++ b/annotations_filtered/o5FT3IGXtAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.88], [7.0, 9.05], [13.0, 18.15], [19.0, 19.47], [20.0, 21.2], [27.0, 28.29], [31.0, 31.85], [38.0, 38.55], [40.0, 41.18], [45.0, 46.45], [49.0, 48.9], [52.0, 52.02], [57.0, 57.89], [67.0, 67.36], [69.0, 69.28], [77.0, 77.36], [79.0, 79.81], [80.0, 81.01], [81.0, 82.51], [83.0, 83.73], [84.0, 84.89], [87.0, 86.95], [89.0, 90.76], [94.0, 95.44], [97.0, 99.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.2, 50.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.44], "audiomae_on_audioset": [null, [["speech", 35.21], ["sidetone", 26.28], ["radio", 19.03]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.12, 2.05, 5.15, 0.47, 1.2, 1.29, 0.85, 0.55, 1.18, 1.45, -0.1, 0.02, 0.89, 0.36, 0.28, 0.36, 0.81, 1.01, 1.51, 0.73, 0.89, -0.05, 1.76, 1.44, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/o69EA3eSDf0_filtered.json b/annotations_filtered/o69EA3eSDf0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4be5e2a96c1bcb0a58357015472b878bd386dc0c --- /dev/null +++ b/annotations_filtered/o69EA3eSDf0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.45], [6.0, 5.66], [9.0, 11.96], [18.0, 19.35], [20.0, 21.19], [22.0, 24.09], [26.0, 27.43], [33.0, 34.5], [35.0, 36.48], [42.0, 42.87], [47.0, 47.58], [50.0, 50.31], [54.0, 55.53], [57.0, 57.74], [59.0, 60.4], [62.0, 62.43], [65.0, 66.01], [66.0, 67.1], [67.0, 72.79], [74.0, 75.57], [85.0, 88.97], [91.0, 92.08], [92.0, 95.44], [97.0, 98.07], [100.0, 100.63], [104.0, 105.41], [106.0, 107.57], [110.0, 111.23], [112.0, 114.86], [117.0, 118.39], [120.0, 120.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 99.92, 0.0, 0.0, 94.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.73, 0.0, 42.11, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 32.88, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 89.93], ["fart", 1.35], ["inside, small room", 1.11]], null, [["speech", 51.53], ["hum", 13.24], ["mains hum", 3.53]], null, null, null, null, null, null, null, [["busy signal", 27.57], ["synthetic singing", 5.01], ["sine wave", 3.48]], null, null], "duration": [0.45, -0.34, 2.96, 1.35, 1.19, 2.09, 1.43, 1.5, 1.48, 0.87, 0.58, 0.31, 1.53, 0.74, 1.4, 0.43, 1.01, 1.1, 5.79, 1.57, 3.97, 1.08, 3.44, 1.07, 0.63, 1.41, 1.57, 1.23, 2.86, 1.39, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/o6FUdj0_fGY_filtered.json b/annotations_filtered/o6FUdj0_fGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1458bb85b2da82fb9215aacc3fc76c0e5508de44 --- /dev/null +++ b/annotations_filtered/o6FUdj0_fGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[74.0, 74.19], [97.0, 99.39], [113.0, 116.41], [116.0, 116.53], [117.0, 122.84], [124.0, 125.91], [131.0, 131.45], [142.0, 143.28]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 32.4, 64.41, 0.0, 50.11, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 25.35], ["animal", 12.22], ["grunt", 11.25]], null, null, null, null, null, null], "duration": [0.19, 2.39, 3.41, 0.53, 5.84, 1.91, 0.45, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/o6Jkz5TQv84_filtered.json b/annotations_filtered/o6Jkz5TQv84_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6208bb50292741066dc96233a9bd16200fdb368 --- /dev/null +++ b/annotations_filtered/o6Jkz5TQv84_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.92], [15.0, 15.53], [19.0, 18.93], [29.0, 29.86], [31.0, 31.68], [33.0, 35.58], [36.0, 40.2], [46.0, 46.03], [48.0, 47.98], [49.0, 53.1], [64.0, 66.26], [69.0, 70.95], [77.0, 77.16], [87.0, 87.91], [90.0, 90.48], [101.0, 104.04], [105.0, 108.51], [115.0, 116.24], [119.0, 120.14], [126.0, 126.99], [131.0, 134.16], [135.0, 139.9], [149.0, 149.96], [152.0, 163.71], [164.0, 165.03], [168.0, 172.47]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 66.03, 40.71, 0.0, 0.0, 30.91, 31.48, 0.0, 0.0, 0.0, 0.0, 32.21, 35.2, 0.0, 0.0, 0.0, 38.26, 30.28, 0.0, 32.68, 0.0, 30.01], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 35.02], ["music", 20.99], ["throbbing", 14.97]], null, null, [["electric shaver, electric razor", 30.24], ["mains hum", 16.06], ["hum", 12.9]], [["music", 50.16], ["throbbing", 16.14], ["hum", 11.91]], null, null, null, null, [["music", 46.27], ["throbbing", 16.89], ["hum", 14.14]], [["music", 41.47], ["throbbing", 24.27], ["hum", 14.58]], null, null, null, [["throbbing", 37.41], ["music", 36.47], ["hum", 9.69]], [["hum", 45.06], ["throbbing", 14.87], ["mains hum", 13.49]], null, [["music", 53.26], ["throbbing", 19.87], ["hum", 12.4]], null, [["speech", 35.18], ["music", 12.48], ["hum", 7.9]]], "duration": [1.92, 0.53, -0.07, 0.86, 0.68, 2.58, 4.2, 0.03, -0.02, 4.1, 2.26, 1.95, 0.16, 0.91, 0.48, 3.04, 3.51, 1.24, 1.14, 0.99, 3.16, 4.9, 0.96, 11.71, 1.03, 4.47]} \ No newline at end of file diff --git a/annotations_filtered/o6MDdOWCCT8_filtered.json b/annotations_filtered/o6MDdOWCCT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ba11f6a4aeffe8b73aad45e0610bafbec9b3ece --- /dev/null +++ b/annotations_filtered/o6MDdOWCCT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.6], [12.0, 15.4], [16.0, 16.85], [17.0, 18.03], [18.0, 18.81], [19.0, 21.32], [24.0, 24.17], [35.0, 34.87], [40.0, 41.44], [45.0, 44.76], [110.0, 110.0], [111.0, 112.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.89, 0.0, 0.0, 0.0, 34.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 48.09], ["music", 27.51], ["boing", 12.4]], null, null, null, [["sidetone", 46.6], ["speech", 21.29], ["music", 17.02]], null, null, null, null, null, null], "duration": [1.6, 3.4, 0.85, 1.03, 0.81, 2.32, 0.17, -0.13, 1.44, -0.24, 0.0, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/o6TYEHyv00Y_filtered.json b/annotations_filtered/o6TYEHyv00Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3acc6a35dba8e5450958a16220617e8a6eb38628 --- /dev/null +++ b/annotations_filtered/o6TYEHyv00Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.38], [30.0, 30.6], [33.0, 33.27], [35.0, 35.65], [39.0, 39.63], [40.0, 41.57]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.38, 0.6, 0.27, 0.65, 0.63, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/o6hrLFJq63E_filtered.json b/annotations_filtered/o6hrLFJq63E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2052a9f3b54e53c6f671d06c76c7ca687ffe497c --- /dev/null +++ b/annotations_filtered/o6hrLFJq63E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.97], [29.0, 29.93], [32.0, 34.1], [53.0, 54.01], [54.0, 54.11], [60.0, 60.81], [62.0, 63.69], [81.0, 81.78], [93.0, 93.82], [104.0, 104.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 0.93, 2.1, 1.01, 0.11, 0.81, 1.69, 0.78, 0.82, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/o6synmrDXqU_filtered.json b/annotations_filtered/o6synmrDXqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e351d2716cdc6d6aacb1f1c38c2ccaa3cbd00258 --- /dev/null +++ b/annotations_filtered/o6synmrDXqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.69], [8.0, 8.46], [26.0, 28.0], [37.0, 39.65], [40.0, 39.68], [40.0, 40.85], [51.0, 51.39], [53.0, 55.24], [59.0, 59.64], [60.0, 60.79], [74.0, 74.58], [79.0, 79.07], [95.0, 101.49], [111.0, 112.01], [113.0, 113.64], [116.0, 116.16], [120.0, 120.34], [122.0, 122.25], [128.0, 133.27], [133.0, 133.49], [134.0, 137.13], [140.0, 141.1], [141.0, 141.18], [144.0, 146.21], [150.0, 164.19]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 71.72, 49.09, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 0.0, 0.0, 29.84, 0.0, 0.0, 0.0, 0.0, 0.0, 29.72, 0.0, 29.35, 0.0, 0.0, 29.8, 29.57], "audiomae_on_audioset": [null, null, null, [["music", 40.32], ["speech", 23.87], ["theremin", 2.85]], null, null, null, null, null, null, null, null, [["music", 68.21], ["singing", 5.88], ["male singing", 5.86]], null, null, null, null, null, [["music", 56.49], ["singing", 5.89], ["musical instrument", 2.77]], null, [["fly, housefly", 18.85], ["music", 12.13], ["insect", 12.04]], null, null, [["boing", 38.93], ["music", 18.97], ["thunk", 10.42]], [["music", 64.5], ["singing", 3.67], ["pop music", 1.71]]], "duration": [0.69, 0.46, 2.0, 2.65, -0.32, 0.85, 0.39, 2.24, 0.64, 0.79, 0.58, 0.07, 6.49, 1.01, 0.64, 0.16, 0.34, 0.25, 5.27, 0.49, 3.13, 1.1, 0.18, 2.21, 14.19]} \ No newline at end of file diff --git a/annotations_filtered/o6zEapyz33o_filtered.json b/annotations_filtered/o6zEapyz33o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..209d12250a97b9f854d227e07bfad64eabbaeb54 --- /dev/null +++ b/annotations_filtered/o6zEapyz33o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.18], [9.0, 10.88], [14.0, 14.07], [15.0, 15.82], [16.0, 17.24], [22.0, 24.09], [24.0, 31.99], [33.0, 33.2], [34.0, 38.57], [39.0, 41.86], [44.0, 45.57], [46.0, 47.85]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 49.27, 53.59, 0.0, 63.74, 35.33, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["sidetone", 45.59], ["speech", 14.99], ["radio", 9.89]], null, null, null, [["speech", 25.65], ["music", 12.95], ["bee, wasp, etc.", 8.39]], null, null], "duration": [0.18, 1.88, 0.07, 0.82, 1.24, 2.09, 7.99, 0.2, 4.57, 2.86, 1.57, 1.85]} \ No newline at end of file diff --git a/annotations_filtered/o7WSgC9oGic_filtered.json b/annotations_filtered/o7WSgC9oGic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e20df844cdee61dd806168dde05a3103b4e9aa90 --- /dev/null +++ b/annotations_filtered/o7WSgC9oGic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.62], [12.0, 12.82], [15.0, 16.19], [18.0, 18.12], [20.0, 20.16], [21.0, 20.93], [23.0, 26.45], [27.0, 28.41], [31.0, 31.55], [33.0, 34.3], [37.0, 38.53], [40.0, 47.55], [50.0, 60.29], [62.0, 71.56], [75.0, 75.05], [79.0, 80.89], [82.0, 100.8], [102.0, 103.47], [104.0, 105.81], [112.0, 113.43], [115.0, 118.08], [121.0, 120.92], [124.0, 140.73], [143.0, 142.94], [147.0, 147.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.13, 0.0, 0.0, 0.0, 0.0, 94.37, 94.52, 93.29, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 34.94, 0.0, 37.24, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 77.15], ["baby laughter", 4.67], ["laughter", 2.99]], null, [["speech", 28.52], ["whack, thwack", 9.17], ["door", 8.66]], null, null], "duration": [0.62, 0.82, 1.19, 0.12, 0.16, -0.07, 3.45, 1.41, 0.55, 1.3, 1.53, 7.55, 10.29, 9.56, 0.05, 1.89, 18.8, 1.47, 1.81, 1.43, 3.08, -0.08, 16.73, -0.06, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/o7_kf3hUg30_filtered.json b/annotations_filtered/o7_kf3hUg30_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee31c9959f213a5f98191aa83dba61834fdcb076 --- /dev/null +++ b/annotations_filtered/o7_kf3hUg30_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.35], [19.0, 27.94], [34.0, 35.72], [37.0, 66.36], [69.0, 74.12], [75.0, 76.27], [76.0, 76.5]], "keep_status": [false, true, false, true, false, false, false], "silence_prob": [0.0, 28.78, 0.0, 29.5, 94.66, 0.0, 0.0], "audiomae_on_audioset": [null, [["race car, auto racing", 16.98], ["music", 10.97], ["car", 10.46]], null, [["music", 25.25], ["wild animals", 17.55], ["roaring cats (lions, tigers)", 13.45]], null, null, null], "duration": [0.35, 8.94, 1.72, 29.36, 5.12, 1.27, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/o7zebTh4tHo_filtered.json b/annotations_filtered/o7zebTh4tHo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e5c5c54575778b08fc6cbebf8b32b0b13154c1e --- /dev/null +++ b/annotations_filtered/o7zebTh4tHo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.71], [22.0, 22.79], [25.0, 25.44], [27.0, 27.16], [29.0, 42.85], [45.0, 49.27], [50.0, 51.43], [53.0, 56.98]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.15, 62.99, 0.0, 99.52], "audiomae_on_audioset": [null, null, null, null, [["electric shaver, electric razor", 22.13], ["breaking", 11.03], ["music", 6.87]], null, null, null], "duration": [1.71, 0.79, 0.44, 0.16, 13.85, 4.27, 1.43, 3.98]} \ No newline at end of file diff --git a/annotations_filtered/o8A2gIt799I_filtered.json b/annotations_filtered/o8A2gIt799I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9784948bc3c19923fa262b4fd611e68fac829fa --- /dev/null +++ b/annotations_filtered/o8A2gIt799I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 25.98], [27.0, 27.7], [28.0, 29.88], [31.0, 75.07], [79.0, 80.35], [85.0, 88.97], [89.0, 92.62], [93.0, 113.76], [116.0, 115.57], [117.0, 117.05], [118.0, 125.44]], "keep_status": [false, false, false, false, false, true, false, true, false, false, true], "silence_prob": [79.76, 0.0, 0.0, 0.0, 0.0, 38.17, 67.51, 45.36, 0.0, 0.0, 41.56], "audiomae_on_audioset": [null, null, null, null, null, [["music", 17.96], ["effects unit", 12.31], ["distortion", 5.17]], null, [["livestock, farm animals, working animals", 22.34], ["cattle, bovinae", 19.43], ["moo", 13.74]], null, null, [["speech", 47.06], ["music", 18.7], ["sound effect", 3.0]]], "duration": [18.98, 0.7, 1.88, 44.07, 1.35, 3.97, 3.62, 20.76, -0.43, 0.05, 7.44]} \ No newline at end of file diff --git a/annotations_filtered/o8ETRMZt6kg_filtered.json b/annotations_filtered/o8ETRMZt6kg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78737c7298fd406bdb8c4c2736076b5d19b8e3c7 --- /dev/null +++ b/annotations_filtered/o8ETRMZt6kg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.87], [8.0, 9.27], [10.0, 10.57], [12.0, 12.82], [15.0, 16.21], [20.0, 19.68], [20.0, 21.74], [22.0, 30.87], [33.0, 33.62], [38.0, 39.14], [41.0, 40.9], [42.0, 44.42], [46.0, 48.73], [50.0, 50.82], [51.0, 52.62], [56.0, 57.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 70.86, 59.86, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.13, 1.27, 0.57, 0.82, 1.21, -0.32, 1.74, 8.87, 0.62, 1.14, -0.1, 2.42, 2.73, 0.82, 1.62, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/o9-cFlOdXn8_filtered.json b/annotations_filtered/o9-cFlOdXn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a113604cab9580466dba884005bfd9057c55a472 --- /dev/null +++ b/annotations_filtered/o9-cFlOdXn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.78], [10.0, 14.55], [19.0, 40.9], [41.0, 55.53], [59.0, 60.05], [61.0, 60.88], [62.0, 62.92], [63.0, 71.85], [75.0, 75.27], [78.0, 90.91], [94.0, 97.93], [98.0, 107.74], [116.0, 120.45], [122.0, 128.12], [129.0, 131.55]], "keep_status": [true, true, true, false, false, false, false, false, false, true, true, true, false, true, true], "silence_prob": [30.23, 37.17, 36.4, 34.31, 0.0, 0.0, 0.0, 31.97, 0.0, 30.16, 30.21, 40.38, 55.53, 42.6, 44.87], "audiomae_on_audioset": [[["speech", 39.79], ["music", 19.8], ["hum", 4.82]], [["speech", 31.12], ["thunk", 17.18], ["music", 12.76]], [["rumble", 22.41], ["hum", 20.45], ["speech", 18.76]], [["hum", 43.03], ["mains hum", 32.37], ["music", 4.99]], null, null, null, [["music", 45.99], ["didgeridoo", 20.12], ["speech", 13.6]], null, [["explosion", 20.34], ["speech", 15.44], ["burst, pop", 10.07]], [["speech", 21.3], ["whale vocalization", 19.84], ["music", 10.01]], [["speech", 32.05], ["animal", 17.9], ["music", 12.32]], null, [["music", 39.11], ["whale vocalization", 11.0], ["hum", 5.84]], [["music", 43.98], ["mains hum", 8.35], ["hum", 7.78]]], "duration": [4.78, 4.55, 21.9, 14.53, 1.05, -0.12, 0.92, 8.85, 0.27, 12.91, 3.93, 9.74, 4.45, 6.12, 2.55]} \ No newline at end of file diff --git a/annotations_filtered/o94LScznlmY_filtered.json b/annotations_filtered/o94LScznlmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3899bd58f28959bf3cfbfe42a6c76083e3f008de --- /dev/null +++ b/annotations_filtered/o94LScznlmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.61], [11.0, 11.92], [14.0, 14.64], [17.0, 17.9], [19.0, 19.99], [26.0, 27.06], [34.0, 73.97], [76.0, 77.11], [81.0, 88.45], [91.0, 91.29], [92.0, 96.94], [99.0, 108.41], [110.0, 114.03], [115.0, 115.26], [118.0, 118.83], [126.0, 131.73], [136.0, 146.84], [152.0, 153.59]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.12, 0.0, 41.3, 31.6, 44.01, 0.0, 0.0, 31.61, 30.84, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 46.19], ["fly, housefly", 7.17], ["whack, thwack", 6.44]], null, [["speech", 41.82], ["music", 37.49], ["coin (dropping)", 1.25]], [["music", 25.46], ["explosion", 11.68], ["hum", 7.06]], [["fly, housefly", 13.83], ["moo", 12.84], ["cattle, bovinae", 11.46]], null, null, [["music", 16.75], ["moo", 14.29], ["cattle, bovinae", 7.92]], [["speech", 52.77], ["buzz", 6.93], ["music", 5.05]], null], "duration": [0.61, 0.92, 0.64, 0.9, 0.99, 1.06, 39.97, 1.11, 7.45, 0.29, 4.94, 9.41, 4.03, 0.26, 0.83, 5.73, 10.84, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/o9dLO77OSao_filtered.json b/annotations_filtered/o9dLO77OSao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81c37caf3571ee6fce33774cc7c6b403e63e46fe --- /dev/null +++ b/annotations_filtered/o9dLO77OSao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.34], [18.0, 19.55], [21.0, 22.71], [24.0, 26.7], [27.0, 29.15], [32.0, 33.2], [35.0, 35.24], [39.0, 40.14], [43.0, 45.0], [46.0, 47.46], [48.0, 49.18], [50.0, 50.41], [51.0, 52.19], [54.0, 55.41], [56.0, 57.06], [60.0, 63.21], [64.0, 65.18], [66.0, 66.36], [67.0, 68.72], [70.0, 72.1], [74.0, 74.48], [77.0, 78.61], [82.0, 83.15], [88.0, 88.5], [110.0, 112.04], [124.0, 125.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 67.38, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 1.55, 1.71, 2.7, 2.15, 1.2, 0.24, 1.14, 2.0, 1.46, 1.18, 0.41, 1.19, 1.41, 1.06, 3.21, 1.18, 0.36, 1.72, 2.1, 0.48, 1.61, 1.15, 0.5, 2.04, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/o9splceYBXQ_filtered.json b/annotations_filtered/o9splceYBXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e50f27a2bd4fdc425eb41caf8b83956f86778733 --- /dev/null +++ b/annotations_filtered/o9splceYBXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[88.0, 90.98], [92.0, 94.41], [95.0, 98.54], [99.0, 101.24]], "keep_status": [false, true, false, true], "silence_prob": [55.6, 36.05, 50.56, 32.01], "audiomae_on_audioset": [null, [["speech", 42.71], ["stomach rumble", 11.7], ["rowboat, canoe, kayak", 4.16]], null, [["speech", 12.35], ["vehicle", 4.95], ["radio", 4.38]]], "duration": [2.98, 2.41, 3.54, 2.24]} \ No newline at end of file diff --git a/annotations_filtered/o9zfxe4JVlQ_filtered.json b/annotations_filtered/o9zfxe4JVlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f799a27cb643ad432a453091b6c9d28b357bcebb --- /dev/null +++ b/annotations_filtered/o9zfxe4JVlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [3.0, 3.92], [5.0, 8.51], [11.0, 11.16], [18.0, 19.53], [22.0, 22.55], [23.0, 23.46], [26.0, 27.28], [28.0, 28.97], [31.0, 31.75], [34.0, 35.04], [38.0, 38.38], [40.0, 42.15], [43.0, 51.11], [53.0, 52.89], [55.0, 56.86], [57.0, 57.75], [58.0, 64.05], [68.0, 70.6], [75.0, 75.29], [78.0, 91.56], [95.0, 94.74], [98.0, 105.12], [106.0, 107.2], [108.0, 108.65], [110.0, 113.83], [114.0, 114.24], [115.0, 116.36], [119.0, 123.26], [124.0, 125.56], [127.0, 126.87], [128.0, 128.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 44.57, 0.0, 0.0, 0.0, 32.63, 32.94, 0.0, 33.78, 0.0, 33.94, 0.0, 0.0, 33.03, 0.0, 0.0, 32.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 33.15], ["cattle, bovinae", 18.52], ["livestock, farm animals, working animals", 10.97]], null, null, null, [["speech", 50.1], ["fart", 20.03], ["sound effect", 2.73]], [["boing", 74.54], ["speech", 5.9], ["whack, thwack", 2.8]], null, [["boing", 36.69], ["speech", 30.37], ["fart", 4.92]], null, [["boing", 32.89], ["animal", 11.79], ["speech", 10.88]], null, null, [["speech", 54.21], ["sidetone", 20.43], ["fart", 2.61]], null, null, [["boing", 39.04], ["speech", 35.72], ["thunk", 8.44]], null, null, null], "duration": [1.01, 0.92, 3.51, 0.16, 1.53, 0.55, 0.46, 1.28, 0.97, 0.75, 1.04, 0.38, 2.15, 8.11, -0.11, 1.86, 0.75, 6.05, 2.6, 0.29, 13.56, -0.26, 7.12, 1.2, 0.65, 3.83, 0.24, 1.36, 4.26, 1.56, -0.13, 0.02]} \ No newline at end of file diff --git a/annotations_filtered/oA-dHypOn9M_filtered.json b/annotations_filtered/oA-dHypOn9M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..290e8d545db8040306d209e67dd846d4dd768b14 --- /dev/null +++ b/annotations_filtered/oA-dHypOn9M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 147.82]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [143.82]} \ No newline at end of file diff --git a/annotations_filtered/oAFVhwUVJt4_filtered.json b/annotations_filtered/oAFVhwUVJt4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b08d2eb8ebd85387341461a2a2a26f2cc8b7d71 --- /dev/null +++ b/annotations_filtered/oAFVhwUVJt4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.96], [7.0, 9.41], [10.0, 13.51], [17.0, 20.68], [22.0, 25.95], [29.0, 33.39], [37.0, 38.04], [39.0, 40.42], [41.0, 42.08], [43.0, 44.14], [47.0, 51.93], [53.0, 53.91], [54.0, 55.14], [58.0, 59.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 69.34, 59.07, 99.92, 99.82, 99.96, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 2.41, 3.51, 3.68, 3.95, 4.39, 1.04, 1.42, 1.08, 1.14, 4.93, 0.91, 1.14, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/oAJYONuey_8_filtered.json b/annotations_filtered/oAJYONuey_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c41c6ec7c9282a45e9446a380b8765ee3c8d053c --- /dev/null +++ b/annotations_filtered/oAJYONuey_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [3.0, 3.33], [5.0, 6.22], [12.0, 13.54], [14.0, 15.11], [16.0, 17.52], [19.0, 20.16], [26.0, 27.14], [29.0, 29.98], [32.0, 33.12], [41.0, 41.94], [44.0, 44.83], [50.0, 50.8], [52.0, 53.0], [55.0, 55.36], [61.0, 61.4], [66.0, 66.95], [76.0, 76.81], [84.0, 84.64], [87.0, 88.5], [89.0, 90.22], [97.0, 98.25], [105.0, 107.0], [112.0, 113.02], [116.0, 116.67], [117.0, 117.78], [125.0, 125.86], [128.0, 129.9], [134.0, 135.48], [136.0, 137.2], [139.0, 140.49], [142.0, 143.5], [145.0, 146.48], [152.0, 152.52], [153.0, 153.27], [155.0, 155.21], [159.0, 161.08], [164.0, 168.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.51, 45.21], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.79], ["hum", 8.6], ["throbbing", 5.68]]], "duration": [0.83, 0.33, 1.22, 1.54, 1.11, 1.52, 1.16, 1.14, 0.98, 1.12, 0.94, 0.83, 0.8, 1.0, 0.36, 0.4, 0.95, 0.81, 0.64, 1.5, 1.22, 1.25, 2.0, 1.02, 0.67, 0.78, 0.86, 1.9, 1.48, 1.2, 1.49, 1.5, 1.48, 0.52, 0.27, 0.21, 2.08, 4.18]} \ No newline at end of file diff --git a/annotations_filtered/oARVdCyRT98_filtered.json b/annotations_filtered/oARVdCyRT98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7af70ae3eb2d5fd754f40351430c0337e47dc7b --- /dev/null +++ b/annotations_filtered/oARVdCyRT98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.02], [5.0, 5.64], [10.0, 10.05], [12.0, 13.51], [16.0, 17.02], [22.0, 22.86], [32.0, 33.88], [38.0, 38.47], [39.0, 40.71], [42.0, 42.77], [49.0, 49.79], [54.0, 54.94], [65.0, 67.76], [69.0, 69.94], [73.0, 73.5], [77.0, 77.52], [78.0, 79.25], [82.0, 84.01], [85.0, 85.31], [87.0, 86.86], [90.0, 92.08], [95.0, 96.08], [99.0, 100.58], [103.0, 102.83], [104.0, 106.05], [108.0, 113.14], [115.0, 115.38], [124.0, 125.44], [126.0, 127.18], [130.0, 130.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 33.17, 68.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["boing", 32.86], ["speech", 13.06], ["music", 9.02]], null, null, null, null, null], "duration": [2.02, 0.64, 0.05, 1.51, 1.02, 0.86, 1.88, 0.47, 1.71, 0.77, 0.79, 0.94, 2.76, 0.94, 0.5, 0.52, 1.25, 2.01, 0.31, -0.14, 2.08, 1.08, 1.58, -0.17, 2.05, 5.14, 0.38, 1.44, 1.18, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/oAb2_-uv41Y_filtered.json b/annotations_filtered/oAb2_-uv41Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78dd39dc855597180a180abc86cf716918c8fea4 --- /dev/null +++ b/annotations_filtered/oAb2_-uv41Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.59], [9.0, 9.14], [12.0, 12.21], [14.0, 15.74], [40.0, 40.47], [55.0, 55.71], [60.0, 61.28], [62.0, 64.17], [66.0, 68.57], [73.0, 73.6], [79.0, 85.68], [93.0, 94.39], [95.0, 96.06], [97.0, 99.72], [100.0, 101.28], [115.0, 116.4], [117.0, 118.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.83, 100.0, 0.0, 98.44, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.59, 0.14, 0.21, 1.74, 0.47, 0.71, 1.28, 2.17, 2.57, 0.6, 6.68, 1.39, 1.06, 2.72, 1.28, 1.4, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/oAheN_ARn1U_filtered.json b/annotations_filtered/oAheN_ARn1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0181f34aa657bc5e84f2e2844976c179b8dab952 --- /dev/null +++ b/annotations_filtered/oAheN_ARn1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 38.35], [46.0, 62.31], [63.0, 63.93], [64.0, 65.67], [66.0, 77.57], [78.0, 80.64], [81.0, 145.91], [148.0, 152.56], [154.0, 154.68]], "keep_status": [false, true, false, false, false, true, false, false, false], "silence_prob": [90.95, 34.61, 0.0, 0.0, 38.2, 39.74, 0.0, 98.36, 0.0], "audiomae_on_audioset": [null, [["music", 38.45], ["fart", 8.29], ["buzz", 5.57]], null, null, [["music", 52.79], ["fart", 15.06], ["fly, housefly", 4.36]], [["speech", 21.07], ["music", 10.03], ["hum", 8.28]], null, null, null], "duration": [18.35, 16.31, 0.93, 1.67, 11.57, 2.64, 64.91, 4.56, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/oAjKMLcDlfc_filtered.json b/annotations_filtered/oAjKMLcDlfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..050fc15cde29c2549aea6a0c23c26cfc3c20098e --- /dev/null +++ b/annotations_filtered/oAjKMLcDlfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.79], [5.0, 18.64], [20.0, 23.52], [24.0, 30.52], [34.0, 38.67], [48.0, 60.39], [64.0, 65.3], [69.0, 81.92], [83.0, 85.9], [87.0, 87.22], [87.0, 89.19], [94.0, 96.04], [98.0, 104.03], [105.0, 114.81], [120.0, 128.46], [131.0, 132.83]], "keep_status": [false, true, false, true, true, true, false, true, true, false, true, true, true, false, true, false], "silence_prob": [0.0, 29.71, 30.93, 29.48, 29.5, 29.53, 0.0, 29.89, 31.13, 0.0, 30.72, 29.56, 30.66, 29.99, 30.07, 0.0], "audiomae_on_audioset": [null, [["music", 25.36], ["mains hum", 18.58], ["hum", 15.45]], [["music", 60.46], ["didgeridoo", 7.7], ["noise", 6.25]], [["music", 19.2], ["tabla", 16.42], ["throbbing", 11.92]], [["hum", 17.69], ["music", 15.9], ["noise", 15.08]], [["music", 41.27], ["speech", 10.28], ["race car, auto racing", 5.38]], null, [["music", 15.03], ["moo", 7.96], ["fart", 6.2]], [["speech", 24.95], ["music", 18.27], ["meow", 6.64]], null, [["speech", 36.75], ["music", 13.75], ["crowd", 7.28]], [["music", 39.39], ["speech", 27.75], ["electronic music", 2.23]], [["music", 26.0], ["trombone", 12.6], ["musical instrument", 9.62]], [["cattle, bovinae", 40.86], ["moo", 23.01], ["livestock, farm animals, working animals", 10.28]], [["music", 34.71], ["theremin", 15.32], ["speech", 13.62]], null], "duration": [-0.21, 13.64, 3.52, 6.52, 4.67, 12.39, 1.3, 12.92, 2.9, 0.22, 2.19, 2.04, 6.03, 9.81, 8.46, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/oBURpv30IkA_filtered.json b/annotations_filtered/oBURpv30IkA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a91320c35089e9af0168bfb7a834ec7b7d4038e8 --- /dev/null +++ b/annotations_filtered/oBURpv30IkA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.19], [13.0, 14.79], [15.0, 15.8], [16.0, 16.71], [17.0, 17.81], [20.0, 20.21], [34.0, 33.83], [38.0, 37.79], [38.0, 38.52], [39.0, 39.21], [43.0, 43.39], [48.0, 48.54], [60.0, 61.25], [69.0, 71.63], [75.0, 75.52], [83.0, 83.62], [94.0, 93.9], [99.0, 100.95], [101.0, 102.54], [107.0, 107.4], [110.0, 110.44], [112.0, 114.78], [115.0, 118.42], [119.0, 119.79], [120.0, 119.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.17, 35.11, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.03], ["speech", 23.97], ["guitar", 8.55]], [["music", 62.24], ["guitar", 11.63], ["musical instrument", 9.96]], null, null], "duration": [0.19, 1.79, 0.8, 0.71, 0.81, 0.21, -0.17, -0.21, 0.52, 0.21, 0.39, 0.54, 1.25, 2.63, 0.52, 0.62, -0.1, 1.95, 1.54, 0.4, 0.44, 2.78, 3.42, 0.79, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/oBfLI1WWrAI_filtered.json b/annotations_filtered/oBfLI1WWrAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b04b432767b2a22eec2f2e47614444b996652bb4 --- /dev/null +++ b/annotations_filtered/oBfLI1WWrAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.62], [29.0, 29.79], [31.0, 32.51], [34.0, 35.5], [37.0, 38.15], [39.0, 40.66], [41.0, 54.7], [58.0, 69.53], [82.0, 84.4], [85.0, 84.97], [98.0, 98.93], [100.0, 125.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.63, 43.45, 46.47, 0.0, 0.0, 37.78], "audiomae_on_audioset": [null, null, null, null, null, null, [["theremin", 35.2], ["music", 24.92], ["synthesizer", 11.8]], [["music", 59.09], ["ambient music", 8.03], ["theremin", 5.38]], [["music", 45.45], ["foghorn", 23.95], ["brass instrument", 6.5]], null, null, [["music", 69.74], ["musical instrument", 9.8], ["didgeridoo", 3.42]]], "duration": [1.62, 0.79, 1.51, 1.5, 1.15, 1.66, 13.7, 11.53, 2.4, -0.03, 0.93, 25.78]} \ No newline at end of file diff --git a/annotations_filtered/oBoPQUIowHY_filtered.json b/annotations_filtered/oBoPQUIowHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4b81ce077b59163d1972df28282288e4edec270 --- /dev/null +++ b/annotations_filtered/oBoPQUIowHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.9], [30.0, 30.72], [38.0, 39.21], [57.0, 56.61], [57.0, 59.39], [61.0, 63.64], [81.0, 84.06], [91.0, 91.52], [92.0, 93.65], [94.0, 95.4], [96.0, 96.72], [97.0, 101.92], [103.0, 105.78], [107.0, 107.89], [108.0, 110.93], [117.0, 117.44], [125.0, 127.48], [134.0, 138.37], [155.0, 156.47]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 46.9, 66.63, 40.93, 0.0, 0.0, 0.0, 0.0, 68.54, 81.0, 0.0, 59.96, 0.0, 78.72, 75.88, 0.0], "audiomae_on_audioset": [null, null, null, null, [["cowbell", 19.59], ["sheep", 8.27], ["bleat", 6.23]], null, [["speech", 54.47], ["hum", 8.7], ["mains hum", 7.04]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.1, 0.72, 1.21, -0.39, 2.39, 2.64, 3.06, 0.52, 1.65, 1.4, 0.72, 4.92, 2.78, 0.89, 2.93, 0.44, 2.48, 4.37, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/oBtG0gj6MxA_filtered.json b/annotations_filtered/oBtG0gj6MxA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1ad19dc4f0c4f70b0b58a15385b165f47ffb9e1 --- /dev/null +++ b/annotations_filtered/oBtG0gj6MxA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.19], [9.0, 9.8], [19.0, 20.9], [21.0, 26.05], [27.0, 28.21], [30.0, 38.75], [40.0, 40.41], [41.0, 48.25], [50.0, 54.7], [65.0, 66.06], [71.0, 71.46], [73.0, 98.86], [99.0, 100.06], [100.0, 112.01]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.93, 0.0, 31.01, 0.0, 30.91, 34.0, 0.0, 0.0, 31.6, 0.0, 30.59], "audiomae_on_audioset": [null, null, null, [["music", 80.91], ["theremin", 3.41], ["musical instrument", 2.86]], null, [["music", 29.22], ["hum", 27.13], ["throbbing", 26.71]], null, [["music", 45.93], ["speech", 16.6], ["boing", 10.09]], [["music", 40.16], ["theremin", 10.7], ["wind instrument, woodwind instrument", 7.97]], null, null, [["music", 77.51], ["didgeridoo", 6.29], ["throbbing", 2.06]], null, [["music", 72.98], ["buzz", 3.3], ["reggae", 2.07]]], "duration": [0.19, 0.8, 1.9, 5.05, 1.21, 8.75, 0.41, 7.25, 4.7, 1.06, 0.46, 25.86, 1.06, 12.01]} \ No newline at end of file diff --git a/annotations_filtered/oCDk1jDXZnM_filtered.json b/annotations_filtered/oCDk1jDXZnM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1321f3d4376aef2d75e389044ec149814d8f1ef2 --- /dev/null +++ b/annotations_filtered/oCDk1jDXZnM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.13], [8.0, 9.76], [11.0, 12.83], [14.0, 15.09], [18.0, 21.24], [23.0, 23.16], [26.0, 29.05], [30.0, 31.21], [33.0, 33.83], [36.0, 41.03], [42.0, 43.83]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 53.04, 0.0, 0.0, 34.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["sidetone", 22.29], ["frog", 9.21], ["hum", 8.08]], null], "duration": [1.13, 1.76, 1.83, 1.09, 3.24, 0.16, 3.05, 1.21, 0.83, 5.03, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/oCE8jHLJe3g_filtered.json b/annotations_filtered/oCE8jHLJe3g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58b58dab68fa4d82bb23869823930b400fe05763 --- /dev/null +++ b/annotations_filtered/oCE8jHLJe3g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 39.56], [43.0, 74.07]], "keep_status": [true, false], "silence_prob": [30.67, 0.0], "audiomae_on_audioset": [[["music", 39.96], ["didgeridoo", 14.58], ["speech", 7.16]], null], "duration": [11.56, 31.07]} \ No newline at end of file diff --git a/annotations_filtered/oCHEAaCGj7k_filtered.json b/annotations_filtered/oCHEAaCGj7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da77d50c1cc2bc273b70deb4310b5669c5cf282e --- /dev/null +++ b/annotations_filtered/oCHEAaCGj7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.89], [7.0, 11.3], [14.0, 19.77], [21.0, 22.74], [23.0, 26.15], [29.0, 29.27], [31.0, 31.28], [32.0, 33.84], [34.0, 35.51], [43.0, 43.83], [45.0, 45.06], [46.0, 46.04], [49.0, 51.19], [52.0, 51.88]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [46.19, 38.28, 38.75, 0.0, 57.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.28, 0.0], "audiomae_on_audioset": [[["music", 68.7], ["ambient music", 10.98], ["electronic music", 2.15]], [["music", 28.96], ["hum", 22.35], ["throbbing", 16.8]], [["music", 44.73], ["hum", 8.7], ["synthesizer", 8.22]], null, null, null, null, null, null, null, null, null, [["music", 33.16], ["speech", 17.99], ["foghorn", 14.06]], null], "duration": [3.89, 4.3, 5.77, 1.74, 3.15, 0.27, 0.28, 1.84, 1.51, 0.83, 0.06, 0.04, 2.19, -0.12]} \ No newline at end of file diff --git a/annotations_filtered/oCjXFnr826Y_filtered.json b/annotations_filtered/oCjXFnr826Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fdc385b7f6c18024f7ac9260129b6111fc2d04b --- /dev/null +++ b/annotations_filtered/oCjXFnr826Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.16], [11.0, 12.24], [14.0, 20.56], [21.0, 24.21], [26.0, 25.95], [28.0, 29.35], [36.0, 36.63], [38.0, 38.13], [41.0, 40.88], [42.0, 42.9], [47.0, 49.81], [51.0, 53.79], [56.0, 57.89], [59.0, 60.24], [73.0, 75.34], [76.0, 78.49], [83.0, 87.49], [89.0, 89.95], [91.0, 91.94], [92.0, 94.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.96, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 100.0, 95.23, 44.57, 0.0, 0.0, 62.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.26], ["thunk", 29.14], ["door", 3.81]], null, null, null], "duration": [1.16, 1.24, 6.56, 3.21, -0.05, 1.35, 0.63, 0.13, -0.12, 0.9, 2.81, 2.79, 1.89, 1.24, 2.34, 2.49, 4.49, 0.95, 0.94, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/oCq7TUmVmt8_filtered.json b/annotations_filtered/oCq7TUmVmt8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eace1898e976c3f95618b92627c706af23eaba18 --- /dev/null +++ b/annotations_filtered/oCq7TUmVmt8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.93], [14.0, 14.55], [18.0, 18.76], [20.0, 20.65], [22.0, 23.52], [25.0, 32.58], [34.0, 35.58], [38.0, 38.57], [40.0, 41.01], [44.0, 44.51], [46.0, 48.61], [51.0, 62.99], [65.0, 66.88], [68.0, 69.25], [72.0, 86.76], [88.0, 90.78], [92.0, 93.07], [95.0, 114.88], [117.0, 123.67], [125.0, 127.06], [128.0, 130.18], [133.0, 134.52], [135.0, 136.27], [138.0, 138.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 47.08, 0.0, 0.0, 0.0, 0.0, 35.11, 47.23, 0.0, 0.0, 55.25, 46.79, 0.0, 43.4, 70.3, 53.4, 35.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 57.33], ["musical instrument", 8.58], ["wind instrument, woodwind instrument", 8.48]], null, null, null, null, [["music", 28.13], ["speech", 26.45], ["sidetone", 26.29]], [["music", 39.16], ["brass instrument", 12.65], ["trombone", 7.88]], null, null, null, [["music", 42.47], ["musical instrument", 6.31], ["effects unit", 4.3]], null, [["music", 53.84], ["musical instrument", 6.26], ["didgeridoo", 4.06]], null, null, [["music", 34.73], ["didgeridoo", 25.03], ["speech", 6.43]], null, null, null], "duration": [0.93, 0.55, 0.76, 0.65, 1.52, 7.58, 1.58, 0.57, 1.01, 0.51, 2.61, 11.99, 1.88, 1.25, 14.76, 2.78, 1.07, 19.88, 6.67, 2.06, 2.18, 1.52, 1.27, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/oD-1eCD7lkE_filtered.json b/annotations_filtered/oD-1eCD7lkE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2b19011f1fa0a45e181d8386dfa2d0868c26ccc --- /dev/null +++ b/annotations_filtered/oD-1eCD7lkE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.88], [15.0, 16.44], [19.0, 21.1], [23.0, 23.13], [24.0, 24.49], [27.0, 27.28], [29.0, 30.42], [34.0, 34.06], [36.0, 36.22], [43.0, 46.08], [47.0, 47.17], [50.0, 50.01], [53.0, 53.27], [56.0, 57.21], [59.0, 59.59], [60.0, 60.79], [80.0, 85.38], [87.0, 87.37], [91.0, 91.62], [96.0, 96.47], [106.0, 106.0], [107.0, 108.8], [110.0, 110.96], [113.0, 113.44], [116.0, 118.54], [123.0, 124.6], [125.0, 131.6], [133.0, 133.14], [135.0, 142.28], [146.0, 145.89], [148.0, 149.84], [154.0, 154.97], [157.0, 168.86], [171.0, 173.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 0.0, 31.78, 0.0, 71.57, 0.0, 0.0, 0.0, 29.59, 45.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 75.53], ["synthesizer", 4.08], ["theremin", 2.82]], null, null, null, null, null, [["speech", 70.95], ["explosion", 4.48], ["buzz", 3.74]], [["cattle, bovinae", 33.92], ["moo", 31.88], ["livestock, farm animals, working animals", 12.76]]], "duration": [-0.12, 1.44, 2.1, 0.13, 0.49, 0.28, 1.42, 0.06, 0.22, 3.08, 0.17, 0.01, 0.27, 1.21, 0.59, 0.79, 5.38, 0.37, 0.62, 0.47, 0.0, 1.8, 0.96, 0.44, 2.54, 1.6, 6.6, 0.14, 7.28, -0.11, 1.84, 0.97, 11.86, 2.57]} \ No newline at end of file diff --git a/annotations_filtered/oD4UHPNEZek_filtered.json b/annotations_filtered/oD4UHPNEZek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..062086bae7f8d8070d860c0077a44ac05d57ad3e --- /dev/null +++ b/annotations_filtered/oD4UHPNEZek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.58], [25.0, 39.04], [40.0, 41.23], [47.0, 47.98], [50.0, 51.34]], "keep_status": [true, false, false, false, false], "silence_prob": [46.12, 31.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 46.7], ["mains hum", 11.09], ["music", 10.14]], [["music", 46.63], ["hum", 24.13], ["buzz", 5.06]], null, null, null], "duration": [3.58, 14.04, 1.23, 0.98, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/oDA4sUtM9B8_filtered.json b/annotations_filtered/oDA4sUtM9B8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7c69c000e909a18d55ea9b48ea54d400af8d881 --- /dev/null +++ b/annotations_filtered/oDA4sUtM9B8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.7], [5.0, 5.24], [6.0, 7.06], [10.0, 32.24], [33.0, 57.62], [59.0, 76.54], [89.0, 89.36], [91.0, 125.95], [132.0, 136.31]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 50.76, 46.79, 45.14, 0.0, 0.0, 53.04], "audiomae_on_audioset": [null, null, null, null, [["music", 75.55], ["theremin", 2.57], ["musical instrument", 2.29]], [["music", 53.9], ["theremin", 33.77], ["musical instrument", 1.36]], null, null, null], "duration": [0.7, 0.24, 1.06, 22.24, 24.62, 17.54, 0.36, 34.95, 4.31]} \ No newline at end of file diff --git a/annotations_filtered/oDD1tW59Mjg_filtered.json b/annotations_filtered/oDD1tW59Mjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5ea222745ca140da3fea490cea9fd549ba3dfcd --- /dev/null +++ b/annotations_filtered/oDD1tW59Mjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.48], [6.0, 9.59], [14.0, 14.88], [17.0, 18.08], [19.0, 19.92], [22.0, 22.35], [26.0, 28.56], [37.0, 39.16], [42.0, 42.08], [50.0, 52.0], [53.0, 54.51], [64.0, 65.11], [66.0, 66.95], [84.0, 85.16], [86.0, 87.42], [100.0, 101.14], [103.0, 104.13], [105.0, 109.31], [110.0, 115.82], [123.0, 123.38], [124.0, 124.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.29, 0.0, 0.0, 0.0, 0.0, 55.6, 97.92, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 59.33, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 3.59, 0.88, 1.08, 0.92, 0.35, 2.56, 2.16, 0.08, 2.0, 1.51, 1.11, 0.95, 1.16, 1.42, 1.14, 1.13, 4.31, 5.82, 0.38, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/oDcNKpBgd_0_filtered.json b/annotations_filtered/oDcNKpBgd_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..895d264d1815d4958c9ed059cfc37bb524a457b6 --- /dev/null +++ b/annotations_filtered/oDcNKpBgd_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 40.37], [41.0, 74.31], [77.0, 86.31], [88.0, 105.31], [107.0, 107.77], [108.0, 155.68], [157.0, 156.93], [157.0, 157.79], [159.0, 159.48], [160.0, 169.91]], "keep_status": [true, false, true, true, false, false, false, false, false, true], "silence_prob": [27.97, 0.0, 28.15, 27.82, 0.0, 0.0, 0.0, 0.0, 0.0, 27.99], "audiomae_on_audioset": [[["music", 26.67], ["rumble", 9.25], ["sound effect", 4.64]], null, [["music", 32.03], ["grunt", 5.57], ["animal", 5.54]], [["music", 11.28], ["vehicle", 7.41], ["rumble", 4.89]], null, null, null, null, null, [["speech", 29.44], ["explosion", 6.75], ["whoosh, swoosh, swish", 5.65]]], "duration": [20.37, 33.31, 9.31, 17.31, 0.77, 47.68, -0.07, 0.79, 0.48, 9.91]} \ No newline at end of file diff --git a/annotations_filtered/oDeQU3l-JSg_filtered.json b/annotations_filtered/oDeQU3l-JSg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..577f3dbd7c5a1149d021a456458c81f633df50ba --- /dev/null +++ b/annotations_filtered/oDeQU3l-JSg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.86], [6.0, 7.79], [10.0, 15.08], [19.0, 26.62], [28.0, 28.59], [40.0, 40.27], [44.0, 49.54], [50.0, 50.28], [54.0, 54.65], [67.0, 68.42], [71.0, 71.83], [81.0, 81.82], [86.0, 95.59], [99.0, 104.9], [107.0, 107.45], [110.0, 111.55], [113.0, 113.32], [115.0, 129.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 58.22, 48.48, 0.0, 0.0, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 32.77, 41.4, 0.0, 0.0, 0.0, 31.49], "audiomae_on_audioset": [null, null, null, [["music", 48.54], ["didgeridoo", 16.62], ["knock", 11.7]], null, null, null, null, null, null, null, null, [["cattle, bovinae", 17.27], ["moo", 12.11], ["livestock, farm animals, working animals", 9.16]], [["electric shaver, electric razor", 19.19], ["speech", 17.75], ["fly, housefly", 8.51]], null, null, null, [["music", 35.15], ["sheep", 8.59], ["boing", 6.99]]], "duration": [0.86, 1.79, 5.08, 7.62, 0.59, 0.27, 5.54, 0.28, 0.65, 1.42, 0.83, 0.82, 9.59, 5.9, 0.45, 1.55, 0.32, 14.54]} \ No newline at end of file diff --git a/annotations_filtered/oDjuY9KCsI8_filtered.json b/annotations_filtered/oDjuY9KCsI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ddb58b3ed326e514af7439afc317b1b75c02489 --- /dev/null +++ b/annotations_filtered/oDjuY9KCsI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.76], [5.0, 5.02], [6.0, 6.56], [11.0, 11.43], [20.0, 20.06], [31.0, 32.24], [35.0, 35.8], [38.0, 38.94], [43.0, 43.34], [68.0, 68.17], [75.0, 74.66], [79.0, 79.89], [83.0, 83.12], [87.0, 87.62], [89.0, 89.46], [90.0, 91.35], [92.0, 91.96], [93.0, 93.83], [99.0, 106.46], [107.0, 108.35], [124.0, 124.77], [126.0, 127.06], [129.0, 129.37], [131.0, 132.33], [134.0, 134.59], [135.0, 137.44], [138.0, 139.31], [142.0, 142.75], [143.0, 149.81], [150.0, 151.28], [152.0, 153.6], [155.0, 156.27], [157.0, 158.67], [166.0, 167.04], [169.0, 170.19], [173.0, 174.09], [177.0, 180.66], [182.0, 186.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.64, 0.0, 0.0, 51.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.04, 68.28], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, 0.02, 0.56, 0.43, 0.06, 1.24, 0.8, 0.94, 0.34, 0.17, -0.34, 0.89, 0.12, 0.62, 0.46, 1.35, -0.04, 0.83, 7.46, 1.35, 0.77, 1.06, 0.37, 1.33, 0.59, 2.44, 1.31, 0.75, 6.81, 1.28, 1.6, 1.27, 1.67, 1.04, 1.19, 1.09, 3.66, 4.65]} \ No newline at end of file diff --git a/annotations_filtered/oEFPcljAXgs_filtered.json b/annotations_filtered/oEFPcljAXgs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4d291d18b8a7ee6512b5098dbbbbaf59b33b439 --- /dev/null +++ b/annotations_filtered/oEFPcljAXgs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.74], [8.0, 11.47], [12.0, 13.93], [26.0, 25.89], [29.0, 30.2], [32.0, 33.94], [36.0, 36.51], [40.0, 41.34], [42.0, 59.04], [60.0, 63.51], [64.0, 64.61], [68.0, 68.52], [69.0, 72.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 57.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.63, 51.82, 0.0, 0.0, 69.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.74, 3.47, 1.93, -0.11, 1.2, 1.94, 0.51, 1.34, 17.04, 3.51, 0.61, 0.52, 3.12]} \ No newline at end of file diff --git a/annotations_filtered/oEHayxH_YT8_filtered.json b/annotations_filtered/oEHayxH_YT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8dafcc4ee18283df8cb7c4691a8650270d0e493b --- /dev/null +++ b/annotations_filtered/oEHayxH_YT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 26.1], [26.0, 57.67], [60.0, 72.52], [74.0, 75.73], [76.0, 80.79], [81.0, 102.3], [105.0, 106.89], [108.0, 114.44], [116.0, 118.4], [119.0, 128.28], [129.0, 139.38], [140.0, 140.34], [141.0, 142.89], [146.0, 146.37]], "keep_status": [true, false, false, false, false, true, false, true, true, true, false, false, false, false], "silence_prob": [30.19, 0.0, 50.36, 0.0, 49.36, 39.01, 0.0, 47.98, 47.5, 47.74, 32.87, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 22.62], ["hum", 15.57], ["throbbing", 14.13]], null, null, null, [["hum", 35.49], ["mains hum", 21.29], ["music", 17.06]], [["music", 31.07], ["hum", 19.1], ["synthesizer", 10.39]], null, [["hum", 25.31], ["throbbing", 17.69], ["music", 17.34]], [["music", 45.05], ["hum", 7.99], ["mains hum", 3.88]], [["speech", 20.83], ["mains hum", 18.86], ["hum", 18.07]], [["hum", 53.68], ["mains hum", 16.84], ["throbbing", 9.36]], null, null, null], "duration": [14.1, 31.67, 12.52, 1.73, 4.79, 21.3, 1.89, 6.44, 2.4, 9.28, 10.38, 0.34, 1.89, 0.37]} \ No newline at end of file diff --git a/annotations_filtered/oEUB2LSsbe8_filtered.json b/annotations_filtered/oEUB2LSsbe8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b81cb5dfa06ba62f858b28599b3bcb7a826b8ac --- /dev/null +++ b/annotations_filtered/oEUB2LSsbe8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 16.65], [23.0, 24.02], [26.0, 26.42], [28.0, 29.89], [35.0, 37.5], [40.0, 40.46], [41.0, 41.66], [42.0, 60.98], [70.0, 70.01], [73.0, 73.67], [76.0, 76.89], [78.0, 78.9], [81.0, 82.58], [84.0, 84.43], [91.0, 93.23], [95.0, 96.25], [101.0, 100.67], [113.0, 114.4], [116.0, 116.97], [118.0, 122.67]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [32.77, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0, 56.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.64, 0.0, 0.0, 0.0, 0.0, 35.52], "audiomae_on_audioset": [[["speech", 29.4], ["radio", 14.66], ["hum", 14.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["telephone", 8.59], ["whale vocalization", 7.25], ["vehicle", 5.64]], null, null, null, null, [["bee, wasp, etc.", 34.45], ["fly, housefly", 26.66], ["insect", 24.33]]], "duration": [13.65, 1.02, 0.42, 1.89, 2.5, 0.46, 0.66, 18.98, 0.01, 0.67, 0.89, 0.9, 1.58, 0.43, 2.23, 1.25, -0.33, 1.4, 0.97, 4.67]} \ No newline at end of file diff --git a/annotations_filtered/oEddtexPCso_filtered.json b/annotations_filtered/oEddtexPCso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2aea6158bd5ce1c504fc1de3829c69d78cb4d508 --- /dev/null +++ b/annotations_filtered/oEddtexPCso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 35.61], [43.0, 43.9], [51.0, 52.08], [56.0, 56.27], [57.0, 57.72], [65.0, 65.08], [68.0, 73.36], [74.0, 74.7], [76.0, 76.55], [77.0, 85.16], [87.0, 87.34], [91.0, 91.27], [92.0, 94.9], [98.0, 97.53], [98.0, 100.31], [102.0, 103.99], [113.0, 114.61], [117.0, 123.99], [124.0, 126.86], [130.0, 141.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.71, 0.0, 0.0, 31.48, 0.0, 0.0, 38.35, 0.0, 35.75, 0.0, 0.0, 35.37, 34.61, 31.38], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 53.79], ["fart", 25.43], ["music", 6.05]], null, null, [["speech", 58.52], ["music", 18.85], ["electric shaver, electric razor", 2.99]], null, null, [["music", 44.4], ["speech", 33.73], ["synthesizer", 3.94]], null, [["speech", 30.63], ["music", 20.96], ["sound effect", 5.44]], null, null, [["speech", 41.52], ["music", 28.72], ["telephone bell ringing", 6.01]], [["music", 36.52], ["mains hum", 13.12], ["hum", 7.91]], [["mains hum", 52.19], ["hum", 36.52], ["music", 4.92]]], "duration": [0.61, 0.9, 1.08, 0.27, 0.72, 0.08, 5.36, 0.7, 0.55, 8.16, 0.34, 0.27, 2.9, -0.47, 2.31, 1.99, 1.61, 6.99, 2.86, 11.45]} \ No newline at end of file diff --git a/annotations_filtered/oEtIf_2mzJc_filtered.json b/annotations_filtered/oEtIf_2mzJc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2dbbe9fd001a27b9bce1797f8022418487fa473a --- /dev/null +++ b/annotations_filtered/oEtIf_2mzJc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.27], [5.0, 5.32], [10.0, 11.4], [12.0, 12.41], [16.0, 18.37], [23.0, 23.79], [30.0, 30.62], [36.0, 39.55], [40.0, 42.62], [46.0, 46.43], [49.0, 50.9], [52.0, 54.65], [58.0, 60.1], [65.0, 65.06], [66.0, 66.61], [67.0, 67.17], [75.0, 74.76], [85.0, 85.06], [86.0, 87.07], [89.0, 88.79], [90.0, 90.76], [92.0, 92.37], [95.0, 95.22], [96.0, 96.77], [128.0, 129.2], [133.0, 132.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 88.1, 99.88, 0.0, 0.0, 99.94, 73.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 0.32, 1.4, 0.41, 2.37, 0.79, 0.62, 3.55, 2.62, 0.43, 1.9, 2.65, 2.1, 0.06, 0.61, 0.17, -0.24, 0.06, 1.07, -0.21, 0.76, 0.37, 0.22, 0.77, 1.2, -0.07]} \ No newline at end of file diff --git a/annotations_filtered/oFwbpFJpQbg_filtered.json b/annotations_filtered/oFwbpFJpQbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03a8fc1ff571c9aa0f0edc4f6364ed0cb01b0cd1 --- /dev/null +++ b/annotations_filtered/oFwbpFJpQbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.31], [26.0, 32.66], [44.0, 45.15], [55.0, 80.11], [82.0, 82.04], [82.0, 82.14], [82.0, 87.88], [90.0, 90.83]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.14, 0.0, 29.99, 0.0, 0.0, 30.32, 0.0], "audiomae_on_audioset": [null, [["cattle, bovinae", 33.33], ["livestock, farm animals, working animals", 28.44], ["moo", 14.04]], null, [["music", 68.08], ["bleat", 4.6], ["sheep", 3.3]], null, null, [["music", 53.63], ["speech", 10.45], ["didgeridoo", 8.67]], null], "duration": [0.31, 6.66, 1.15, 25.11, 0.04, 0.14, 5.88, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/oG-MKxVWwi4_filtered.json b/annotations_filtered/oG-MKxVWwi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e345fdcfc3b6ee7f6fc30ec40707b26d61f9bdcf --- /dev/null +++ b/annotations_filtered/oG-MKxVWwi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.03], [12.0, 13.0], [20.0, 20.07], [22.0, 22.49], [26.0, 28.59], [29.0, 31.58], [32.0, 32.86], [34.0, 35.4], [38.0, 38.75], [40.0, 40.9], [66.0, 66.85], [68.0, 71.05], [75.0, 75.76], [77.0, 78.31], [83.0, 85.65], [87.0, 87.71], [90.0, 90.39], [94.0, 95.2], [97.0, 115.21], [117.0, 118.93], [127.0, 129.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 68.15, 57.81, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 76.04, 0.0, 0.0, 0.0, 70.3, 0.0, 60.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 1.0, 0.07, 0.49, 2.59, 2.58, 0.86, 1.4, 0.75, 0.9, 0.85, 3.05, 0.76, 1.31, 2.65, 0.71, 0.39, 1.2, 18.21, 1.93, 2.17]} \ No newline at end of file diff --git a/annotations_filtered/oG58-Vs838M_filtered.json b/annotations_filtered/oG58-Vs838M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da89112eee3c2b8331d4b85d6285bb37c550a4c8 --- /dev/null +++ b/annotations_filtered/oG58-Vs838M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.13], [17.0, 17.56], [25.0, 29.57], [30.0, 29.64], [30.0, 29.69], [30.0, 29.81], [30.0, 43.28], [50.0, 53.94], [55.0, 56.57], [58.0, 58.7], [89.0, 91.44], [93.0, 93.65], [105.0, 105.27], [106.0, 107.72], [109.0, 110.15], [112.0, 113.41], [116.0, 116.72], [123.0, 123.52]], "keep_status": [true, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.55, 0.0, 32.97, 0.0, 0.0, 0.0, 46.47, 41.66, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.94], ["synthesizer", 13.93], ["effects unit", 8.2]], null, [["hum", 23.59], ["throbbing", 16.89], ["whale vocalization", 12.96]], null, null, null, [["speech", 43.55], ["buzz", 8.95], ["bee, wasp, etc.", 7.91]], [["speech", 34.55], ["music", 22.46], ["mains hum", 3.55]], null, null, null, null, null, null, null, null, null, null], "duration": [9.13, 0.56, 4.57, -0.36, -0.31, -0.19, 13.28, 3.94, 1.57, 0.7, 2.44, 0.65, 0.27, 1.72, 1.15, 1.41, 0.72, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/oG5vsPJ5Tos_filtered.json b/annotations_filtered/oG5vsPJ5Tos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfaf179f5e7028a380c4e36900e06cc5faba1fac --- /dev/null +++ b/annotations_filtered/oG5vsPJ5Tos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 37.25], [38.0, 65.52], [68.0, 69.09], [70.0, 70.5], [74.0, 75.32], [76.0, 81.8], [85.0, 86.24], [87.0, 90.39], [93.0, 93.14], [94.0, 100.41], [101.0, 103.01], [103.0, 104.55], [110.0, 110.22], [113.0, 116.26], [117.0, 117.85]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.53, 0.0, 0.0, 0.0, 39.35, 0.0, 46.94, 0.0, 55.89, 83.16, 0.0, 0.0, 84.62, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 31.62], ["speech", 25.25], ["hum", 6.17]], null, [["speech", 27.17], ["sidetone", 11.32], ["music", 7.58]], null, null, null, null, null, null, null], "duration": [1.25, 27.52, 1.09, 0.5, 1.32, 5.8, 1.24, 3.39, 0.14, 6.41, 2.01, 1.55, 0.22, 3.26, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/oGV14YsOvWo_filtered.json b/annotations_filtered/oGV14YsOvWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a49df3333498ef55fa2294e6a87c190687ed1c66 --- /dev/null +++ b/annotations_filtered/oGV14YsOvWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [3.0, 9.19], [10.0, 16.01], [18.0, 20.66], [27.0, 28.85], [29.0, 29.62], [32.0, 32.37], [33.0, 36.76], [47.0, 53.67], [58.0, 60.32], [67.0, 99.62], [100.0, 101.63], [102.0, 106.73], [107.0, 116.09], [117.0, 120.09], [121.0, 123.57], [124.0, 129.22], [136.0, 136.46], [137.0, 139.06], [141.0, 149.28]], "keep_status": [false, false, true, true, false, false, false, true, true, true, false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 38.23, 34.49, 34.59, 0.0, 0.0, 0.0, 32.63, 32.97, 33.16, 0.0, 0.0, 73.51, 74.29, 48.35, 59.77, 51.6, 0.0, 34.68, 31.78], "audiomae_on_audioset": [null, [["music", 59.9], ["boing", 16.0], ["speech", 10.71]], [["music", 32.99], ["boing", 18.17], ["wind instrument, woodwind instrument", 17.21]], [["music", 38.41], ["fly, housefly", 8.0], ["sidetone", 7.79]], null, null, null, [["boing", 17.19], ["cattle, bovinae", 16.74], ["music", 13.04]], [["whack, thwack", 26.41], ["music", 23.18], ["quack", 5.98]], [["moo", 37.44], ["cattle, bovinae", 16.33], ["livestock, farm animals, working animals", 16.1]], null, null, null, null, [["speech", 26.45], ["music", 11.59], ["wail, moan", 10.82]], null, null, null, [["speech", 23.94], ["music", 19.82], ["crowd", 7.4]], [["sidetone", 26.7], ["music", 20.27], ["speech", 12.58]]], "duration": [0.35, 6.19, 6.01, 2.66, 1.85, 0.62, 0.37, 3.76, 6.67, 2.32, 32.62, 1.63, 4.73, 9.09, 3.09, 2.57, 5.22, 0.46, 2.06, 8.28]} \ No newline at end of file diff --git a/annotations_filtered/oGxBx8RzzrM_filtered.json b/annotations_filtered/oGxBx8RzzrM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78547eb9246c4c19bf30afef41fb8a4fe3b8592f --- /dev/null +++ b/annotations_filtered/oGxBx8RzzrM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.09], [5.0, 6.15], [10.0, 9.76], [10.0, 10.76], [12.0, 17.29], [19.0, 24.95], [27.0, 28.27], [30.0, 30.82], [32.0, 33.99], [36.0, 41.45], [45.0, 51.7], [66.0, 72.3], [73.0, 73.45], [73.0, 75.05], [88.0, 94.39], [99.0, 143.33], [149.0, 148.69], [149.0, 151.16], [153.0, 158.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 45.43, 59.24, 0.0, 0.0, 0.0, 38.17, 31.7, 31.02, 0.0, 31.16, 30.89, 0.0, 0.0, 31.23, 36.96], "audiomae_on_audioset": [null, null, null, null, [["music", 52.29], ["speech", 21.3], ["boing", 6.43]], null, null, null, null, [["speech", 56.74], ["music", 16.33], ["synthesizer", 4.4]], [["music", 66.71], ["speech", 7.82], ["cattle, bovinae", 3.04]], [["music", 83.37], ["swing music", 3.62], ["funk", 1.42]], null, [["music", 51.26], ["speech", 5.21], ["musical instrument", 3.72]], [["music", 71.82], ["singing", 3.06], ["sampler", 2.01]], null, null, [["music", 55.29], ["singing", 8.09], ["synthesizer", 3.15]], [["music", 42.19], ["speech", 9.42], ["sidetone", 7.71]]], "duration": [0.09, 1.15, -0.24, 0.76, 5.29, 5.95, 1.27, 0.82, 1.99, 5.45, 6.7, 6.3, 0.45, 2.05, 6.39, 44.33, -0.31, 2.16, 5.21]} \ No newline at end of file diff --git a/annotations_filtered/oH-kAHKtbTE_filtered.json b/annotations_filtered/oH-kAHKtbTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84673b966d7c2cb260c250f727aeb50cee1b2e76 --- /dev/null +++ b/annotations_filtered/oH-kAHKtbTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.95], [7.0, 7.43], [10.0, 17.36], [19.0, 23.77], [25.0, 27.78], [29.0, 30.52], [31.0, 35.16], [36.0, 38.4], [50.0, 52.74], [53.0, 66.48], [67.0, 89.88], [92.0, 94.68], [95.0, 95.84], [97.0, 104.97], [108.0, 109.02], [113.0, 151.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 66.39, 90.25, 79.24, 0.0, 83.7, 79.41, 96.77, 82.43, 82.97, 46.79, 0.0, 55.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["dog", 27.03], ["bow-wow", 11.43], ["domestic animals, pets", 8.82]], null, null, null, null], "duration": [1.95, 0.43, 7.36, 4.77, 2.78, 1.52, 4.16, 2.4, 2.74, 13.48, 22.88, 2.68, 0.84, 7.97, 1.02, 38.16]} \ No newline at end of file diff --git a/annotations_filtered/oHJVJ_MEyQI_filtered.json b/annotations_filtered/oHJVJ_MEyQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b6a41faa34b9b297f08fd88bb2e672d237b6c5b --- /dev/null +++ b/annotations_filtered/oHJVJ_MEyQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 33.35], [38.0, 63.73], [64.0, 66.51], [67.0, 73.6], [74.0, 77.19], [78.0, 80.62], [81.0, 86.22], [87.0, 99.79]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 31.92, 41.42, 37.14, 34.72, 37.13, 31.55, 31.52], "audiomae_on_audioset": [null, [["throbbing", 22.51], ["hum", 20.76], ["music", 8.13]], [["gong", 43.24], ["music", 30.77], ["musical instrument", 4.19]], [["music", 75.66], ["guitar", 8.15], ["musical instrument", 3.69]], [["music", 85.27], ["guitar", 5.64], ["musical instrument", 3.03]], [["music", 79.12], ["musical instrument", 3.64], ["guitar", 3.3]], [["music", 83.19], ["guitar", 6.01], ["musical instrument", 3.41]], [["music", 86.49], ["guitar", 4.96], ["effects unit", 2.31]]], "duration": [1.35, 25.73, 2.51, 6.6, 3.19, 2.62, 5.22, 12.79]} \ No newline at end of file diff --git a/annotations_filtered/oHOnldgbjy8_filtered.json b/annotations_filtered/oHOnldgbjy8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c86ea2ca2877db20cf4d88281e6aaac0349b3d08 --- /dev/null +++ b/annotations_filtered/oHOnldgbjy8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.92], [14.0, 62.77], [65.0, 113.54], [117.0, 117.51], [118.0, 117.61]], "keep_status": [true, false, false, false, false], "silence_prob": [38.42, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 46.51], ["throbbing", 10.35], ["music", 10.15]], null, null, null, null], "duration": [5.92, 48.77, 48.54, 0.51, -0.39]} \ No newline at end of file diff --git a/annotations_filtered/oHyebwN9XXU_filtered.json b/annotations_filtered/oHyebwN9XXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad63e55ed50c7a42f36779af14edbe3c84cfcb1d --- /dev/null +++ b/annotations_filtered/oHyebwN9XXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[72.0, 75.39], [90.0, 91.35], [93.0, 98.1], [99.0, 101.6]], "keep_status": [true, false, false, true], "silence_prob": [46.05, 0.0, 42.37, 34.21], "audiomae_on_audioset": [[["music", 32.44], ["sidetone", 21.14], ["speech", 15.65]], null, [["music", 34.24], ["hum", 25.35], ["throbbing", 11.86]], [["music", 53.7], ["mains hum", 8.65], ["hum", 4.57]]], "duration": [3.39, 1.35, 5.1, 2.6]} \ No newline at end of file diff --git a/annotations_filtered/oIEtwZK04wM_filtered.json b/annotations_filtered/oIEtwZK04wM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9679fa3cb225e7d6405ada998394171e7adc524e --- /dev/null +++ b/annotations_filtered/oIEtwZK04wM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.56], [7.0, 9.37], [11.0, 11.31], [16.0, 16.92], [17.0, 23.77], [27.0, 28.41], [37.0, 37.08], [38.0, 38.77], [39.0, 39.8], [42.0, 42.06], [42.0, 45.1], [55.0, 60.39], [65.0, 68.52], [71.0, 73.2], [75.0, 76.4], [82.0, 102.0], [107.0, 111.3], [115.0, 116.16], [129.0, 137.59], [142.0, 142.23], [143.0, 143.8], [152.0, 152.66], [153.0, 153.32], [158.0, 158.45], [159.0, 159.49], [160.0, 168.76], [169.0, 169.42], [174.0, 176.37], [179.0, 182.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 91.47, 0.0, 0.0, 33.91, 0.0, 0.0, 0.0, 0.0, 0.0, 35.13, 36.49, 38.68, 39.18, 0.0, 31.22, 38.25, 0.0, 32.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.06, 0.0, 54.1, 100.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 55.44], ["cattle, bovinae", 8.4], ["moo", 7.29]], null, null, null, null, null, [["boing", 54.03], ["music", 17.72], ["speech", 8.37]], [["music", 64.35], ["speech", 12.17], ["musical instrument", 4.41]], [["music", 53.94], ["speech", 22.18], ["boing", 4.77]], [["music", 59.55], ["musical instrument", 8.05], ["didgeridoo", 4.87]], null, [["music", 49.64], ["speech", 19.66], ["outside, rural or natural", 2.28]], [["speech", 47.68], ["music", 21.75], ["explosion", 5.53]], null, [["music", 83.81], ["synthesizer", 2.59], ["sampler", 1.93]], null, null, null, null, null, null, [["speech", 45.92], ["music", 39.41], ["musical instrument", 3.26]], null, null, null], "duration": [0.56, 2.37, 0.31, 0.92, 6.77, 1.41, 0.08, 0.77, 0.8, 0.06, 3.1, 5.39, 3.52, 2.2, 1.4, 20.0, 4.3, 1.16, 8.59, 0.23, 0.8, 0.66, 0.32, 0.45, 0.49, 8.76, 0.42, 2.37, 3.68]} \ No newline at end of file diff --git a/annotations_filtered/oISBveQNkzA_filtered.json b/annotations_filtered/oISBveQNkzA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..082d071fb0aac1d5416c003ff5ad38d3bf734032 --- /dev/null +++ b/annotations_filtered/oISBveQNkzA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 40.05], [44.0, 45.12], [50.0, 53.86], [56.0, 59.56], [66.0, 74.19], [78.0, 93.45], [95.0, 136.71]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [29.88, 0.0, 28.42, 27.94, 28.27, 28.93, 0.0], "audiomae_on_audioset": [[["singing bowl", 24.31], ["music", 17.97], ["ambient music", 17.65]], null, [["music", 57.28], ["theremin", 8.56], ["synthesizer", 8.21]], [["music", 60.41], ["didgeridoo", 10.73], ["musical instrument", 4.08]], [["music", 55.91], ["didgeridoo", 23.31], ["musical instrument", 4.66]], [["didgeridoo", 66.28], ["music", 23.16], ["musical instrument", 1.06]], null], "duration": [16.05, 1.12, 3.86, 3.56, 8.19, 15.45, 41.71]} \ No newline at end of file diff --git a/annotations_filtered/oIjgZ-i9v_k_filtered.json b/annotations_filtered/oIjgZ-i9v_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ac4f9b508b421cbc7e257e4ae7acc51dc7d9d28 --- /dev/null +++ b/annotations_filtered/oIjgZ-i9v_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.03], [8.0, 8.21], [27.0, 40.49], [43.0, 57.43], [58.0, 64.05], [66.0, 71.42], [72.0, 71.54], [72.0, 71.81], [72.0, 90.42], [94.0, 117.75], [122.0, 122.88]], "keep_status": [false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 60.42, 41.81, 35.98, 36.89, 0.0, 0.0, 37.93, 39.33, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 20.33], ["music", 14.63], ["croak", 10.11]], [["music", 29.18], ["speech", 20.47], ["didgeridoo", 9.39]], [["speech", 37.03], ["music", 14.64], ["moo", 7.95]], null, null, [["speech", 55.14], ["music", 15.12], ["buzz", 4.28]], [["music", 57.81], ["sonar", 12.1], ["frog", 2.33]], null], "duration": [0.03, 0.21, 13.49, 14.43, 6.05, 5.42, -0.46, -0.19, 18.42, 23.75, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/oIlpo2mj_qk_filtered.json b/annotations_filtered/oIlpo2mj_qk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..731ae801ecdd3b0b044437fedfe6b5c06b7713cb --- /dev/null +++ b/annotations_filtered/oIlpo2mj_qk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.91], [12.0, 15.36], [17.0, 19.58], [21.0, 45.33], [47.0, 48.09], [51.0, 53.62], [55.0, 58.35], [60.0, 61.05], [64.0, 65.28], [66.0, 81.03], [82.0, 82.19], [85.0, 86.24], [92.0, 101.73], [103.0, 104.63], [106.0, 108.97]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [74.44, 70.3, 83.7, 68.8, 0.0, 82.07, 30.38, 0.0, 0.0, 32.92, 0.0, 0.0, 33.03, 0.0, 76.37], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 51.43], ["breaking", 8.73], ["fusillade", 4.71]], null, null, [["music", 68.03], ["electronic music", 3.59], ["breaking", 2.94]], null, null, [["music", 57.62], ["hum", 5.28], ["breaking", 4.67]], null, null], "duration": [2.91, 3.36, 2.58, 24.33, 1.09, 2.62, 3.35, 1.05, 1.28, 15.03, 0.19, 1.24, 9.73, 1.63, 2.97]} \ No newline at end of file diff --git a/annotations_filtered/oIu0P3gXxsI_filtered.json b/annotations_filtered/oIu0P3gXxsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7dc2ac3cc347a5496c49808bb519909102dfc7b3 --- /dev/null +++ b/annotations_filtered/oIu0P3gXxsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.5], [18.0, 19.26], [20.0, 22.06], [25.0, 25.96], [28.0, 28.88], [31.0, 31.56], [32.0, 32.24], [42.0, 42.18], [44.0, 46.18], [49.0, 49.23], [50.0, 50.41], [51.0, 51.56], [58.0, 58.24], [67.0, 67.88], [69.0, 68.81], [71.0, 71.27], [72.0, 72.35], [73.0, 73.68], [79.0, 79.69], [93.0, 92.75], [97.0, 99.0], [112.0, 112.72]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 47.58, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0], "audiomae_on_audioset": [null, null, [["music", 45.14], ["speech", 17.51], ["throbbing", 4.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.26, 2.06, 0.96, 0.88, 0.56, 0.24, 0.18, 2.18, 0.23, 0.41, 0.56, 0.24, 0.88, -0.19, 0.27, 0.35, 0.68, 0.69, -0.25, 2.0, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/oJ3bzg-Tvt4_filtered.json b/annotations_filtered/oJ3bzg-Tvt4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/oJ3bzg-Tvt4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/oJFKZnePh3k_filtered.json b/annotations_filtered/oJFKZnePh3k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..617e652fbf5a0b5005962b755ee2503195589e6a --- /dev/null +++ b/annotations_filtered/oJFKZnePh3k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 18.86], [21.0, 27.8], [31.0, 41.57], [42.0, 41.61], [42.0, 41.64], [42.0, 41.94], [42.0, 42.04], [43.0, 42.94]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [30.58, 31.1, 30.45, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.84], ["throbbing", 18.48], ["hum", 3.56]], [["hum", 19.77], ["throbbing", 17.39], ["mains hum", 9.92]], [["music", 50.01], ["speech", 32.97], ["vehicle", 1.47]], null, null, null, null, null], "duration": [13.86, 6.8, 10.57, -0.39, -0.36, -0.06, 0.04, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/oK1X8SfGMs8_filtered.json b/annotations_filtered/oK1X8SfGMs8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd367b1a4c39a717aab6490b6ec907a2c212a256 --- /dev/null +++ b/annotations_filtered/oK1X8SfGMs8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.96], [5.0, 6.12], [6.0, 6.76], [8.0, 14.08], [14.0, 20.06], [21.0, 21.69], [24.0, 24.65], [26.0, 26.96], [32.0, 50.79], [51.0, 52.03], [54.0, 62.33], [64.0, 66.6], [67.0, 67.41], [69.0, 68.91], [70.0, 70.24], [73.0, 72.67], [75.0, 76.0], [80.0, 80.28], [85.0, 84.82], [86.0, 86.98], [89.0, 88.72], [89.0, 89.95], [92.0, 92.33], [93.0, 93.02], [94.0, 95.69], [97.0, 98.24], [99.0, 99.91]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.05, 35.08, 0.0, 0.0, 0.0, 33.39, 0.0, 46.22, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["electric shaver, electric razor", 98.25], ["inside, small room", 0.6], ["electric toothbrush", 0.28]], [["boing", 24.54], ["speech", 12.25], ["frog", 9.78]], null, null, null, [["electric shaver, electric razor", 19.81], ["speech", 11.68], ["livestock, farm animals, working animals", 10.97]], null, [["fart", 70.38], ["effects unit", 2.88], ["music", 1.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.04, 1.12, 0.76, 6.08, 6.06, 0.69, 0.65, 0.96, 18.79, 1.03, 8.33, 2.6, 0.41, -0.09, 0.24, -0.33, 1.0, 0.28, -0.18, 0.98, -0.28, 0.95, 0.33, 0.02, 1.69, 1.24, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/oK1zfJausVM_filtered.json b/annotations_filtered/oK1zfJausVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90c08e620881ba7f4882abb09b12fbfa8a5a76e0 --- /dev/null +++ b/annotations_filtered/oK1zfJausVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.16], [10.0, 12.75], [13.0, 13.8], [16.0, 17.42], [21.0, 21.59], [22.0, 22.71], [23.0, 24.09], [24.0, 24.27], [25.0, 25.34], [27.0, 28.16], [29.0, 30.15], [32.0, 31.99], [34.0, 34.6], [39.0, 41.27], [43.0, 44.47], [47.0, 48.42], [49.0, 62.99], [64.0, 67.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 89.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.43, 0.0, 0.0, 29.47, 99.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.71], ["speech", 18.98], ["didgeridoo", 1.99]], null, null, [["whip", 47.34], ["music", 12.05], ["speech", 10.07]], null], "duration": [0.16, 2.75, 0.8, 1.42, 0.59, 0.71, 1.09, 0.27, 0.34, 1.16, 1.15, -0.01, 0.6, 2.27, 1.47, 1.42, 13.99, 3.71]} \ No newline at end of file diff --git a/annotations_filtered/oK4FZ3ks17M_filtered.json b/annotations_filtered/oK4FZ3ks17M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0217e4ed3c452a5229862b0ee47fa6f9c2b3e884 --- /dev/null +++ b/annotations_filtered/oK4FZ3ks17M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.36], [9.0, 10.72], [12.0, 12.72], [13.0, 16.46], [20.0, 21.32], [23.0, 23.35], [32.0, 33.44], [35.0, 35.4], [42.0, 42.43], [51.0, 51.66], [54.0, 56.08], [57.0, 58.48], [60.0, 62.14], [69.0, 69.21], [73.0, 73.65], [79.0, 78.8], [83.0, 83.47], [86.0, 88.82], [95.0, 98.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.91, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 1.72, 0.72, 3.46, 1.32, 0.35, 1.44, 0.4, 0.43, 0.66, 2.08, 1.48, 2.14, 0.21, 0.65, -0.2, 0.47, 2.82, 3.66]} \ No newline at end of file diff --git a/annotations_filtered/oKCF_TzQ6Pk_filtered.json b/annotations_filtered/oKCF_TzQ6Pk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2233ebb2fde03f9b6859057bfdee93472dd891a1 --- /dev/null +++ b/annotations_filtered/oKCF_TzQ6Pk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.04], [10.0, 10.4], [23.0, 30.43], [38.0, 39.18], [41.0, 42.13], [44.0, 45.32], [47.0, 47.98], [50.0, 51.43], [55.0, 60.05], [64.0, 69.52], [70.0, 89.04], [91.0, 91.91], [96.0, 97.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.56, 30.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["buzz", 22.4], ["rumble", 18.11], ["sonar", 7.19]], null, null], "duration": [0.04, 0.4, 7.43, 1.18, 1.13, 1.32, 0.98, 1.43, 5.05, 5.52, 19.04, 0.91, 1.85]} \ No newline at end of file diff --git a/annotations_filtered/oKXV-XQzUrY_filtered.json b/annotations_filtered/oKXV-XQzUrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..507eeba179282cbecbbf2da94a076bf57b1e304b --- /dev/null +++ b/annotations_filtered/oKXV-XQzUrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.77], [7.0, 7.08], [8.0, 8.18], [9.0, 9.73], [11.0, 11.77], [16.0, 16.04], [21.0, 38.53], [48.0, 51.16], [66.0, 66.55], [68.0, 74.63], [78.0, 78.26], [83.0, 89.21], [95.0, 95.23], [97.0, 98.12], [99.0, 99.33], [102.0, 103.25], [104.0, 104.26], [105.0, 107.49], [110.0, 114.54], [118.0, 119.01], [122.0, 124.06], [124.0, 126.25]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.02, 54.5, 0.0, 47.98, 0.0, 44.34, 0.0, 0.0, 0.0, 0.0, 0.0, 65.91, 100.0, 0.0, 100.0, 43.13], "audiomae_on_audioset": [null, null, null, null, null, null, [["livestock, farm animals, working animals", 29.55], ["music", 21.96], ["cattle, bovinae", 15.85]], null, null, [["livestock, farm animals, working animals", 26.49], ["cowbell", 20.02], ["sheep", 16.22]], null, [["music", 49.18], ["speech", 13.43], ["singing", 2.48]], null, null, null, null, null, null, null, null, null, [["speech", 43.07], ["music", 30.47], ["theremin", 4.18]]], "duration": [0.77, 0.08, 0.18, 0.73, 0.77, 0.04, 17.53, 3.16, 0.55, 6.63, 0.26, 6.21, 0.23, 1.12, 0.33, 1.25, 0.26, 2.49, 4.54, 1.01, 2.06, 2.25]} \ No newline at end of file diff --git a/annotations_filtered/oKYBGq7pt3M_filtered.json b/annotations_filtered/oKYBGq7pt3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3eb80a49ff2cd801ae2252f030fec6a1a4491d6e --- /dev/null +++ b/annotations_filtered/oKYBGq7pt3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.69], [26.0, 26.49], [37.0, 37.08], [37.0, 37.88], [51.0, 56.07], [58.0, 58.65], [59.0, 67.09], [67.0, 67.12], [87.0, 87.49], [88.0, 88.45], [89.0, 94.29], [97.0, 108.77]], "keep_status": [true, false, false, false, true, false, true, false, false, false, true, false], "silence_prob": [36.06, 0.0, 0.0, 0.0, 35.38, 0.0, 33.38, 0.0, 0.0, 0.0, 42.35, 32.98], "audiomae_on_audioset": [[["music", 24.83], ["speech", 23.05], ["mantra", 2.72]], null, null, null, [["mosquito", 19.14], ["fly, housefly", 17.02], ["speech", 9.69]], null, [["cattle, bovinae", 25.17], ["moo", 21.1], ["speech", 16.04]], null, null, null, [["music", 31.98], ["moo", 18.86], ["cattle, bovinae", 17.17]], [["speech", 42.72], ["music", 27.11], ["buzz", 3.4]]], "duration": [2.69, 0.49, 0.08, 0.88, 5.07, 0.65, 8.09, 0.12, 0.49, 0.45, 5.29, 11.77]} \ No newline at end of file diff --git a/annotations_filtered/oKmBIC6X6Fs_filtered.json b/annotations_filtered/oKmBIC6X6Fs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdb70c645005c5537fcc4a6c29c29b81c9cf117d --- /dev/null +++ b/annotations_filtered/oKmBIC6X6Fs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.48], [14.0, 15.38], [18.0, 20.31], [21.0, 26.64], [28.0, 42.01], [43.0, 44.34], [46.0, 47.6], [49.0, 51.7], [57.0, 58.94], [60.0, 61.57], [66.0, 68.01], [70.0, 70.65], [73.0, 77.06], [85.0, 85.46], [106.0, 109.26], [111.0, 114.1]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [36.87, 0.0, 34.05, 35.44, 37.46, 0.0, 0.0, 100.0, 0.0, 0.0, 98.73, 0.0, 63.1, 0.0, 99.36, 34.32], "audiomae_on_audioset": [[["music", 36.18], ["musical instrument", 17.9], ["guitar", 7.14]], null, [["music", 50.02], ["musical instrument", 12.96], ["keyboard (musical)", 9.98]], [["music", 53.38], ["musical instrument", 22.41], ["guitar", 3.14]], [["music", 50.32], ["musical instrument", 13.08], ["piano", 6.11]], null, null, null, null, null, null, null, null, null, null, [["speech", 47.83], ["breaking", 15.66], ["coin (dropping)", 3.71]]], "duration": [11.48, 1.38, 2.31, 5.64, 14.01, 1.34, 1.6, 2.7, 1.94, 1.57, 2.01, 0.65, 4.06, 0.46, 3.26, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/oLIwz9gn00g_filtered.json b/annotations_filtered/oLIwz9gn00g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e0d3b3ad7a21a4d151653261f0d5c041adbf354 --- /dev/null +++ b/annotations_filtered/oLIwz9gn00g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.83], [4.0, 10.59], [11.0, 12.16], [14.0, 14.57], [18.0, 18.96], [20.0, 21.86], [22.0, 22.54], [24.0, 24.41], [26.0, 27.24], [29.0, 29.02], [31.0, 32.51], [36.0, 36.32], [38.0, 37.56], [38.0, 41.77], [44.0, 49.38], [52.0, 51.97], [58.0, 58.7], [61.0, 64.45], [66.0, 66.73], [69.0, 71.0], [71.0, 71.88], [74.0, 80.05], [81.0, 82.11], [86.0, 88.2], [90.0, 90.59], [93.0, 93.45], [95.0, 98.05], [101.0, 102.41], [104.0, 104.89], [106.0, 105.83], [107.0, 107.49], [113.0, 114.03], [116.0, 117.66], [119.0, 119.3], [120.0, 120.55], [121.0, 123.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 36.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.11, 47.98, 0.0, 0.0, 89.9, 0.0, 93.6, 0.0, 93.45, 0.0, 72.6, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.15], "audiomae_on_audioset": [null, [["speech", 54.91], ["sidetone", 33.91], ["telephone", 2.95]], null, null, null, null, null, null, null, null, null, null, null, [["frog", 26.93], ["speech", 21.91], ["music", 7.77]], [["sine wave", 30.38], ["hum", 16.31], ["sidetone", 11.52]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.54], ["radio", 6.73], ["smash, crash", 5.12]]], "duration": [1.83, 6.59, 1.16, 0.57, 0.96, 1.86, 0.54, 0.41, 1.24, 0.02, 1.51, 0.32, -0.44, 3.77, 5.38, -0.03, 0.7, 3.45, 0.73, 2.0, 0.88, 6.05, 1.11, 2.2, 0.59, 0.45, 3.05, 1.41, 0.89, -0.17, 0.49, 1.03, 1.66, 0.3, 0.55, 2.97]} \ No newline at end of file diff --git a/annotations_filtered/oLJ7246t3-c_filtered.json b/annotations_filtered/oLJ7246t3-c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35b4df6829618f85420cf3df30ef9f43f15bb26c --- /dev/null +++ b/annotations_filtered/oLJ7246t3-c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.45], [6.0, 6.05], [6.0, 9.27], [12.0, 13.09], [17.0, 18.3], [19.0, 20.56], [21.0, 23.08], [24.0, 25.73], [27.0, 31.89], [33.0, 34.1], [38.0, 39.18], [42.0, 43.87], [46.0, 48.66], [50.0, 66.65], [68.0, 68.5], [69.0, 70.66], [73.0, 72.99], [74.0, 74.88], [77.0, 77.18], [78.0, 79.79], [81.0, 80.84], [85.0, 85.6], [87.0, 88.67], [90.0, 91.23], [93.0, 93.61], [96.0, 98.2], [101.0, 102.46], [104.0, 104.35], [109.0, 111.33], [113.0, 113.68], [115.0, 115.62], [119.0, 156.78], [157.0, 164.67], [166.0, 167.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.05, 0.0, 92.97, 0.0, 0.0, 0.0, 99.16, 0.0, 97.54, 0.0, 0.0, 0.0, 99.4, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 97.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.45, 0.05, 3.27, 1.09, 1.3, 1.56, 2.08, 1.73, 4.89, 1.1, 1.18, 1.87, 2.66, 16.65, 0.5, 1.66, -0.01, 0.88, 0.18, 1.79, -0.16, 0.6, 1.67, 1.23, 0.61, 2.2, 1.46, 0.35, 2.33, 0.68, 0.62, 37.78, 7.67, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/oLPTh_DaPa8_filtered.json b/annotations_filtered/oLPTh_DaPa8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6f677c332e018670863f76d7bf627099a6b97b7 --- /dev/null +++ b/annotations_filtered/oLPTh_DaPa8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.92], [9.0, 10.89], [12.0, 14.1], [15.0, 14.84], [15.0, 16.46], [17.0, 17.49], [19.0, 20.26], [25.0, 25.76], [27.0, 26.92], [31.0, 31.9], [33.0, 33.17], [35.0, 37.84], [40.0, 40.15], [47.0, 47.53], [52.0, 52.91], [56.0, 56.73], [61.0, 63.41], [64.0, 72.84], [74.0, 89.92], [92.0, 92.38], [93.0, 95.35], [104.0, 106.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.52, 99.99, 0.0, 99.21, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.92, 1.89, 2.1, -0.16, 1.46, 0.49, 1.26, 0.76, -0.08, 0.9, 0.17, 2.84, 0.15, 0.53, 0.91, 0.73, 2.41, 8.84, 15.92, 0.38, 2.35, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/oLQ5NOAIAw0_filtered.json b/annotations_filtered/oLQ5NOAIAw0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb92c4fd5890ddc601eb3b196fc81e351dd2cba6 --- /dev/null +++ b/annotations_filtered/oLQ5NOAIAw0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.59], [14.0, 14.81], [22.0, 22.52], [24.0, 25.32], [26.0, 27.82], [31.0, 32.1], [38.0, 38.77], [39.0, 39.99], [48.0, 49.05], [50.0, 51.04], [53.0, 54.24], [60.0, 60.79], [61.0, 62.51], [119.0, 121.64], [128.0, 128.66], [130.0, 130.5], [131.0, 130.77], [132.0, 132.76], [134.0, 135.68], [136.0, 136.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.59, 0.81, 0.52, 1.32, 1.82, 1.1, 0.77, 0.99, 1.05, 1.04, 1.24, 0.79, 1.51, 2.64, 0.66, 0.5, -0.23, 0.76, 1.68, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/oLQsS64Mgjg_filtered.json b/annotations_filtered/oLQsS64Mgjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ccb766b520ec5efcf0e61a8b7ea8972f5a6d091 --- /dev/null +++ b/annotations_filtered/oLQsS64Mgjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.15], [6.0, 7.97], [13.0, 13.14], [18.0, 18.71], [28.0, 28.34], [29.0, 28.75], [29.0, 32.24], [33.0, 33.88], [35.0, 35.46], [39.0, 40.88], [51.0, 53.37], [59.0, 59.14], [60.0, 60.56], [63.0, 65.35], [67.0, 69.16], [72.0, 73.3], [74.0, 74.56], [76.0, 76.79], [78.0, 78.71], [80.0, 80.77], [86.0, 86.16], [87.0, 87.81], [89.0, 90.51], [91.0, 93.16], [94.0, 95.22], [100.0, 100.85], [109.0, 109.48], [110.0, 109.9], [115.0, 115.23], [116.0, 117.31], [123.0, 123.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.53, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 0.0, 0.0, 58.89, 0.0, 0.0, 47.01, 41.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.61], ["guitar", 13.64], ["musical instrument", 8.6]], [["music", 25.66], ["speech", 21.59], ["musical instrument", 4.65]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.15, 1.97, 0.14, 0.71, 0.34, -0.25, 3.24, 0.88, 0.46, 1.88, 2.37, 0.14, 0.56, 2.35, 2.16, 1.3, 0.56, 0.79, 0.71, 0.77, 0.16, 0.81, 1.51, 2.16, 1.22, 0.85, 0.48, -0.1, 0.23, 1.31, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/oLUmNV0tmMo_filtered.json b/annotations_filtered/oLUmNV0tmMo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bed686d33d25455175b7f37defba309c466c75e --- /dev/null +++ b/annotations_filtered/oLUmNV0tmMo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.22], [21.0, 25.84], [26.0, 28.32], [36.0, 47.95], [54.0, 53.87], [54.0, 60.05], [63.0, 85.08], [85.0, 87.99], [90.0, 112.95], [114.0, 143.33], [144.0, 158.85], [160.0, 160.93], [168.0, 171.73]], "keep_status": [false, false, true, false, false, true, false, true, false, false, false, false, true], "silence_prob": [37.34, 35.82, 35.29, 33.92, 0.0, 34.93, 37.98, 38.83, 37.49, 35.0, 40.82, 0.0, 34.23], "audiomae_on_audioset": [[["music", 52.83], ["buzz", 10.41], ["electric shaver, electric razor", 7.78]], [["music", 60.1], ["brass instrument", 5.28], ["foghorn", 5.09]], [["moo", 26.86], ["cattle, bovinae", 25.46], ["livestock, farm animals, working animals", 9.42]], [["music", 82.17], ["electronic music", 5.9], ["dubstep", 1.32]], null, [["speech", 18.66], ["throbbing", 15.74], ["music", 15.28]], [["music", 49.46], ["throbbing", 32.14], ["hum", 6.35]], [["music", 39.14], ["mosquito", 11.7], ["boing", 11.01]], [["moo", 29.38], ["cattle, bovinae", 22.17], ["music", 18.89]], [["music", 65.32], ["throbbing", 10.66], ["hum", 3.51]], [["music", 59.19], ["synthesizer", 20.57], ["theremin", 2.82]], null, [["music", 39.96], ["hum", 11.47], ["electronic music", 5.68]]], "duration": [4.22, 4.84, 2.32, 11.95, -0.13, 6.05, 22.08, 2.99, 22.95, 29.33, 14.85, 0.93, 3.73]} \ No newline at end of file diff --git a/annotations_filtered/oLnrsZa4EqQ_filtered.json b/annotations_filtered/oLnrsZa4EqQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2951e0d45cb77d23c5002a6fe44acb307c199a0 --- /dev/null +++ b/annotations_filtered/oLnrsZa4EqQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.07], [4.0, 4.06], [5.0, 7.7], [10.0, 10.44], [14.0, 19.18], [20.0, 22.69], [24.0, 25.98], [27.0, 27.38], [27.0, 29.66], [32.0, 34.25], [35.0, 70.19], [71.0, 71.61], [72.0, 78.19], [79.0, 79.83], [82.0, 103.27], [105.0, 136.26], [138.0, 138.5], [140.0, 140.37], [143.0, 143.46], [144.0, 145.47], [147.0, 147.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 86.09, 0.0, 95.23, 99.44, 0.0, 0.0, 84.98, 98.93, 0.0, 0.0, 38.3, 0.0, 30.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.37], ["speech", 21.27], ["hum", 6.27]], null, [["music", 47.22], ["hum", 14.54], ["effects unit", 6.34]], null, null, null, null, null, null], "duration": [1.07, 0.06, 2.7, 0.44, 5.18, 2.69, 1.98, 0.38, 2.66, 2.25, 35.19, 0.61, 6.19, 0.83, 21.27, 31.26, 0.5, 0.37, 0.46, 1.47, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/oMH9kIyIl1I_filtered.json b/annotations_filtered/oMH9kIyIl1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ace4faf5f2025ddf89e849d0f3b2f6fa0c73ec48 --- /dev/null +++ b/annotations_filtered/oMH9kIyIl1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.09], [25.0, 36.73], [39.0, 38.69], [39.0, 46.74], [52.0, 56.88], [60.0, 70.92], [75.0, 78.97], [83.0, 86.95], [94.0, 95.35]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 30.66, 0.0, 29.41, 29.67, 29.56, 29.64, 29.64, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 43.25], ["cattle, bovinae", 29.36], ["moo", 18.82]], null, [["music", 79.26], ["hum", 3.17], ["cacophony", 2.79]], [["music", 81.6], ["cacophony", 3.75], ["musical instrument", 1.43]], [["music", 80.19], ["rock music", 2.34], ["musical instrument", 2.27]], [["music", 57.24], ["hum", 7.97], ["mains hum", 5.06]], [["music", 58.29], ["throbbing", 5.49], ["hum", 4.97]], null], "duration": [0.09, 11.73, -0.31, 7.74, 4.88, 10.92, 3.97, 3.95, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/oMLjP2ajXvs_filtered.json b/annotations_filtered/oMLjP2ajXvs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c502c9f4469d9ecf1bfb33197920db75b3e1a36 --- /dev/null +++ b/annotations_filtered/oMLjP2ajXvs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 45.67], [51.0, 57.1], [58.0, 74.38], [79.0, 83.39], [90.0, 94.04]], "keep_status": [true, true, false, false, false], "silence_prob": [32.41, 38.31, 32.87, 33.11, 32.55], "audiomae_on_audioset": [[["music", 31.05], ["synthesizer", 24.13], ["theremin", 12.39]], [["fly, housefly", 34.44], ["insect", 20.41], ["vehicle", 11.24]], [["fly, housefly", 32.73], ["insect", 30.57], ["bee, wasp, etc.", 18.8]], [["speech", 79.9], ["radio", 4.23], ["music", 1.58]], [["insect", 32.4], ["fly, housefly", 31.53], ["bee, wasp, etc.", 6.81]]], "duration": [14.67, 6.1, 16.38, 4.39, 4.04]} \ No newline at end of file diff --git a/annotations_filtered/oMWqB05lpRU_filtered.json b/annotations_filtered/oMWqB05lpRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d6966eb6c0a0cc8a147c8a119d871d3a133715b --- /dev/null +++ b/annotations_filtered/oMWqB05lpRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.18], [9.0, 71.36], [73.0, 99.08], [99.0, 110.94], [112.0, 124.23], [125.0, 125.86], [127.0, 129.41], [132.0, 131.79]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 29.85, 29.5, 29.56, 0.0, 32.43, 0.0], "audiomae_on_audioset": [null, null, [["music", 61.62], ["throbbing", 20.11], ["hum", 4.31]], [["music", 47.89], ["throbbing", 34.52], ["electronic music", 5.25]], [["vehicle", 15.42], ["music", 11.42], ["hum", 10.13]], null, [["music", 76.63], ["throbbing", 3.22], ["musical instrument", 2.53]], null], "duration": [0.18, 62.36, 26.08, 11.94, 12.23, 0.86, 2.41, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/oMpgPQbRt8U_filtered.json b/annotations_filtered/oMpgPQbRt8U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9db586aeea07fe9586f1c7c8b61bf09b6af89ba --- /dev/null +++ b/annotations_filtered/oMpgPQbRt8U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.94], [32.0, 36.27], [48.0, 55.19], [60.0, 61.18], [65.0, 65.06], [67.0, 68.23]], "keep_status": [false, false, false, false, false, false], "silence_prob": [87.55, 69.2, 61.37, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [4.94, 4.27, 7.19, 1.18, 0.06, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/oMt4F9ELo3U_filtered.json b/annotations_filtered/oMt4F9ELo3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29aa7447bff986a1fa76ba92293fe26dd9575fd4 --- /dev/null +++ b/annotations_filtered/oMt4F9ELo3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.75], [11.0, 12.58], [22.0, 21.74], [24.0, 24.73], [25.0, 24.76], [25.0, 25.17], [25.0, 26.32], [28.0, 29.49], [30.0, 37.49], [41.0, 41.17], [43.0, 43.06], [45.0, 44.78], [46.0, 46.26], [51.0, 50.85], [53.0, 54.4], [58.0, 59.19], [64.0, 72.66], [73.0, 74.55], [78.0, 84.38], [85.0, 85.85], [89.0, 91.4], [91.0, 91.44], [101.0, 101.87], [123.0, 125.96], [139.0, 142.21], [147.0, 149.17], [153.0, 155.26], [157.0, 157.6], [161.0, 161.33], [162.0, 162.73], [168.0, 168.0], [168.0, 170.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 41.48, 0.0, 60.6, 0.0, 0.0, 30.36, 29.66, 29.61, 51.34, 0.0, 0.0, 0.0, 0.0, 36.12], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 66.93], ["fly, housefly", 7.26], ["bee, wasp, etc.", 3.41]], null, null, null, null, [["cattle, bovinae", 31.44], ["moo", 25.4], ["speech", 23.51]], [["speech", 59.57], ["electric shaver, electric razor", 5.07], ["vehicle", 4.9]], [["livestock, farm animals, working animals", 17.21], ["cattle, bovinae", 15.17], ["insect", 12.55]], null, null, null, null, null, [["sidetone", 38.57], ["speech", 28.37], ["music", 16.31]]], "duration": [0.75, 1.58, -0.26, 0.73, -0.24, 0.17, 1.32, 1.49, 7.49, 0.17, 0.06, -0.22, 0.26, -0.15, 1.4, 1.19, 8.66, 1.55, 6.38, 0.85, 2.4, 0.44, 0.87, 2.96, 3.21, 2.17, 2.26, 0.6, 0.33, 0.73, 0.0, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/oMx6C31dCeo_filtered.json b/annotations_filtered/oMx6C31dCeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9f303e04ee3d1b5bf6b3371eb704dba7a795c5e --- /dev/null +++ b/annotations_filtered/oMx6C31dCeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.3], [4.0, 4.48], [32.0, 34.7], [43.0, 46.57], [48.0, 48.83], [49.0, 49.47], [51.0, 54.77], [58.0, 59.14], [59.0, 63.0], [69.0, 71.52], [72.0, 88.59], [97.0, 99.81], [100.0, 101.02], [109.0, 110.61], [113.0, 114.83], [116.0, 117.75], [119.0, 120.65], [122.0, 122.5], [127.0, 128.28]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 58.3, 51.6, 0.0, 0.0, 37.54, 0.0, 36.23, 61.77, 45.05, 38.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["keys jangling", 43.84], ["breaking", 26.79], ["hum", 8.73]], null, [["telephone", 26.8], ["speech", 21.95], ["busy signal", 12.35]], null, [["speech", 36.52], ["music", 11.62], ["chirp tone", 8.29]], [["music", 39.0], ["grunt", 12.06], ["speech", 4.64]], null, null, null, null, null, null, null], "duration": [0.3, 0.48, 2.7, 3.57, 0.83, 0.47, 3.77, 1.14, 4.0, 2.52, 16.59, 2.81, 1.02, 1.61, 1.83, 1.75, 1.65, 0.5, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/oN2S394WfuU_filtered.json b/annotations_filtered/oN2S394WfuU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9909406ca12d85aec34a9443af68b7a96ec821b3 --- /dev/null +++ b/annotations_filtered/oN2S394WfuU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.24], [26.0, 26.77], [28.0, 28.21], [30.0, 30.84], [43.0, 43.56], [52.0, 53.23], [57.0, 58.43], [58.0, 58.46], [71.0, 73.43], [91.0, 93.29], [93.0, 95.93], [97.0, 101.06], [102.0, 124.12], [125.0, 128.02], [129.0, 136.26], [137.0, 136.88], [137.0, 137.22]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 30.9, 30.56, 36.3, 55.31, 100.0, 99.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 34.73], ["ambient music", 11.43], ["gong", 6.54]], [["music", 35.56], ["gong", 25.51], ["ambient music", 14.46]], [["gong", 51.68], ["music", 22.82], ["electronic music", 6.69]], null, null, null, null, null], "duration": [0.24, 0.77, 0.21, 0.84, 0.56, 1.23, 1.43, 0.46, 2.43, 2.29, 2.93, 4.06, 22.12, 3.02, 7.26, -0.12, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/oN832LNaq4w_filtered.json b/annotations_filtered/oN832LNaq4w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b62778623c4b5f439815b8aa3662347feb407477 --- /dev/null +++ b/annotations_filtered/oN832LNaq4w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 29.34], [32.0, 32.0], [34.0, 39.43], [41.0, 41.23], [42.0, 47.88], [48.0, 49.08], [51.0, 60.0], [61.0, 61.59], [62.0, 63.37], [64.0, 67.31], [68.0, 68.76], [69.0, 69.97], [71.0, 74.76], [76.0, 77.5], [79.0, 79.46], [80.0, 80.94], [82.0, 84.35], [86.0, 86.53], [89.0, 89.13], [90.0, 93.09], [94.0, 95.77], [96.0, 108.85], [110.0, 110.74], [112.0, 115.48], [116.0, 116.26], [117.0, 125.73]], "keep_status": [true, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [32.87, 0.0, 30.15, 0.0, 36.07, 0.0, 30.72, 0.0, 0.0, 32.18, 0.0, 0.0, 31.99, 0.0, 0.0, 0.0, 38.8, 0.0, 0.0, 64.52, 0.0, 88.46, 0.0, 100.0, 0.0, 38.15], "audiomae_on_audioset": [[["speech", 29.06], ["hum", 15.11], ["throbbing", 4.32]], null, [["smash, crash", 16.07], ["whack, thwack", 7.45], ["radio", 5.72]], null, [["speech", 62.36], ["beatboxing", 13.03], ["sidetone", 8.49]], null, [["speech", 33.57], ["whack, thwack", 12.68], ["creak", 5.1]], null, null, [["frog", 16.66], ["noise", 15.91], ["fart", 11.52]], null, null, [["beatboxing", 64.38], ["fart", 5.92], ["speech", 4.39]], null, null, null, [["radio", 12.39], ["frog", 10.74], ["speech", 10.73]], null, null, null, null, null, null, null, null, [["speech", 77.0], ["radio", 5.45], ["whack, thwack", 4.88]]], "duration": [21.34, 0.0, 5.43, 0.23, 5.88, 1.08, 9.0, 0.59, 1.37, 3.31, 0.76, 0.97, 3.76, 1.5, 0.46, 0.94, 2.35, 0.53, 0.13, 3.09, 1.77, 12.85, 0.74, 3.48, 0.26, 8.73]} \ No newline at end of file diff --git a/annotations_filtered/oNGklu1muXI_filtered.json b/annotations_filtered/oNGklu1muXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75953514f8962b4dd2b0b73cf76df0ac772d3218 --- /dev/null +++ b/annotations_filtered/oNGklu1muXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.51], [16.0, 16.07], [21.0, 21.36], [24.0, 24.85], [27.0, 27.04], [28.0, 34.38], [36.0, 36.61], [39.0, 41.86], [42.0, 43.98], [48.0, 48.27], [49.0, 50.43], [58.0, 58.21], [60.0, 60.78], [61.0, 61.59], [62.0, 70.53], [73.0, 73.95]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 37.51, 0.0, 46.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.91, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 42.8], ["music", 34.75], ["sidetone", 2.54]], null, [["music", 32.1], ["speech", 17.91], ["pulse", 9.79]], null, null, null, null, null, null, [["speech", 47.52], ["music", 14.5], ["hum", 5.05]], null], "duration": [1.51, 0.07, 0.36, 0.85, 0.04, 6.38, 0.61, 2.86, 1.98, 0.27, 1.43, 0.21, 0.78, 0.59, 8.53, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/oNWAiWBup2Q_filtered.json b/annotations_filtered/oNWAiWBup2Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c548673f8d29910127b20f9cd1fac705774d6d4 --- /dev/null +++ b/annotations_filtered/oNWAiWBup2Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.67], [15.0, 15.11], [38.0, 38.4], [47.0, 53.89], [56.0, 58.31], [62.0, 62.94], [66.0, 66.5], [68.0, 68.08], [72.0, 83.29], [88.0, 87.84], [90.0, 92.74], [95.0, 108.19], [109.0, 109.59], [110.0, 111.37], [114.0, 115.18], [116.0, 118.39], [120.0, 123.89], [126.0, 127.79], [129.0, 131.14], [131.0, 147.23], [150.0, 154.5], [159.0, 159.02], [164.0, 174.28], [177.0, 184.47], [186.0, 187.08], [206.0, 217.41]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.63, 51.55, 0.0, 0.0, 0.0, 34.04, 0.0, 30.01, 32.91, 0.0, 0.0, 0.0, 35.32, 39.52, 0.0, 34.98, 34.02, 35.0, 0.0, 33.95, 33.88, 0.0, 35.82], "audiomae_on_audioset": [null, null, null, [["music", 53.26], ["didgeridoo", 11.05], ["hum", 9.82]], null, null, null, null, [["music", 31.5], ["speech", 25.39], ["vehicle", 7.66]], null, [["speech", 17.7], ["motorcycle", 11.2], ["sidetone", 8.43]], [["music", 56.5], ["throbbing", 8.71], ["hum", 5.41]], null, null, null, [["music", 47.43], ["theremin", 22.08], ["speech", 2.74]], [["music", 42.95], ["hum", 9.13], ["theremin", 8.24]], null, [["speech", 35.05], ["music", 9.85], ["vehicle", 6.48]], [["hum", 26.37], ["buzz", 16.75], ["music", 16.19]], [["music", 60.79], ["synthesizer", 7.26], ["hum", 5.11]], null, [["music", 81.28], ["synthesizer", 1.62], ["musical instrument", 1.59]], [["music", 41.47], ["speech", 23.26], ["hum", 7.5]], null, [["music", 65.39], ["hum", 9.59], ["throbbing", 6.57]]], "duration": [0.67, 0.11, 0.4, 6.89, 2.31, 0.94, 0.5, 0.08, 11.29, -0.16, 2.74, 13.19, 0.59, 1.37, 1.18, 2.39, 3.89, 1.79, 2.14, 16.23, 4.5, 0.02, 10.28, 7.47, 1.08, 11.41]} \ No newline at end of file diff --git a/annotations_filtered/oNiW2ftWINg_filtered.json b/annotations_filtered/oNiW2ftWINg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48c85367d2fb9ea223553585f949e44b59df70db --- /dev/null +++ b/annotations_filtered/oNiW2ftWINg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [8.0, 8.87], [9.0, 9.56], [11.0, 17.19], [18.0, 18.86], [21.0, 20.98], [23.0, 24.26], [26.0, 27.08], [30.0, 43.75], [47.0, 47.76], [56.0, 57.18], [58.0, 67.36], [68.0, 70.55], [71.0, 72.01], [75.0, 76.57], [78.0, 79.84], [81.0, 85.01], [86.0, 87.24], [87.0, 89.94], [91.0, 91.61], [92.0, 93.26], [97.0, 98.68], [100.0, 104.21], [105.0, 107.05], [109.0, 114.78], [118.0, 119.57], [123.0, 124.21], [126.0, 126.79], [130.0, 131.16], [132.0, 143.21], [144.0, 149.08], [150.0, 154.35], [155.0, 164.34], [165.0, 166.9], [168.0, 171.95], [174.0, 175.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.6, 0.0, 0.0, 0.0, 0.0, 53.4, 0.0, 0.0, 59.59, 85.9, 0.0, 0.0, 0.0, 84.43, 0.0, 56.4, 0.0, 0.0, 0.0, 44.78, 90.25, 73.51, 0.0, 0.0, 0.0, 0.0, 73.82, 88.46, 65.09, 33.05, 0.0, 98.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.03], ["didgeridoo", 20.28], ["music", 13.6]], null, null, null, null, null, null, null, null, null, [["speech", 45.65], ["sidetone", 8.01], ["music", 7.53]], null, null, null], "duration": [0.56, 0.87, 0.56, 6.19, 0.86, -0.02, 1.26, 1.08, 13.75, 0.76, 1.18, 9.36, 2.55, 1.01, 1.57, 1.84, 4.01, 1.24, 2.94, 0.61, 1.26, 1.68, 4.21, 2.05, 5.78, 1.57, 1.21, 0.79, 1.16, 11.21, 5.08, 4.35, 9.34, 1.9, 3.95, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/oNmhgpAGlBs_filtered.json b/annotations_filtered/oNmhgpAGlBs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa3e834cc3634194c62bf301179564348b584eca --- /dev/null +++ b/annotations_filtered/oNmhgpAGlBs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 18.62], [19.0, 34.65], [38.0, 41.08], [43.0, 44.93], [46.0, 47.16], [52.0, 52.69], [57.0, 57.79], [58.0, 62.48], [65.0, 65.28], [67.0, 68.45], [69.0, 70.26], [71.0, 71.85], [72.0, 72.69], [77.0, 77.92], [79.0, 82.51], [83.0, 83.64], [85.0, 84.96], [86.0, 87.29], [88.0, 88.47], [89.0, 99.06], [99.0, 99.66], [100.0, 101.9], [109.0, 110.22], [122.0, 122.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 99.99, 99.95, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.62, 15.65, 3.08, 1.93, 1.16, 0.69, 0.79, 4.48, 0.28, 1.45, 1.26, 0.85, 0.69, 0.92, 3.51, 0.64, -0.04, 1.29, 0.47, 10.06, 0.66, 1.9, 1.22, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/oNoOFf527GU_filtered.json b/annotations_filtered/oNoOFf527GU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa47b7c4acd1a31ef73fe7d6bacff700e33c9efa --- /dev/null +++ b/annotations_filtered/oNoOFf527GU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.63], [7.0, 9.8], [12.0, 12.82], [17.0, 18.12], [19.0, 19.84], [32.0, 32.9], [42.0, 44.47], [48.0, 48.98], [65.0, 65.96], [68.0, 69.23], [73.0, 73.99], [80.0, 81.13], [82.0, 86.19], [89.0, 92.26], [94.0, 94.07], [94.0, 94.1], [94.0, 94.2], [96.0, 100.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [76.2, 90.25, 0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 46.72, 96.17, 0.0, 0.0, 0.0, 98.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 40.85], ["radio", 24.71], ["whale vocalization", 14.92]], null, null, null, null, null], "duration": [3.63, 2.8, 0.82, 1.12, 0.84, 0.9, 2.47, 0.98, 0.96, 1.23, 0.99, 1.13, 4.19, 3.26, 0.07, 0.1, 0.2, 4.55]} \ No newline at end of file diff --git a/annotations_filtered/oNpeuCWJgCc_filtered.json b/annotations_filtered/oNpeuCWJgCc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0448572e2d17a267d56d1cfeb9c5a677353ef1c6 --- /dev/null +++ b/annotations_filtered/oNpeuCWJgCc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.6], [11.0, 11.53], [12.0, 13.76], [17.0, 18.47], [27.0, 32.51], [36.0, 36.98], [40.0, 44.63], [48.0, 59.53], [62.0, 62.92], [64.0, 64.93], [66.0, 73.26], [75.0, 82.54], [86.0, 86.95], [90.0, 91.44], [100.0, 102.19], [107.0, 107.1], [107.0, 111.57], [113.0, 113.76], [115.0, 118.29], [121.0, 122.64]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [30.19, 0.0, 0.0, 0.0, 31.74, 0.0, 30.83, 31.0, 0.0, 0.0, 31.54, 31.45, 0.0, 0.0, 39.75, 0.0, 42.67, 0.0, 30.64, 0.0], "audiomae_on_audioset": [[["music", 41.0], ["speech", 13.48], ["fly, housefly", 8.44]], null, null, null, [["music", 50.83], ["percussion", 4.17], ["musical instrument", 3.66]], null, [["music", 55.67], ["cattle, bovinae", 6.64], ["moo", 4.81]], [["music", 70.7], ["musical instrument", 3.8], ["music of latin america", 2.28]], null, null, [["music", 68.63], ["music of latin america", 3.1], ["musical instrument", 2.44]], [["music", 69.86], ["musical instrument", 4.45], ["swing music", 1.64]], null, null, [["music", 36.78], ["sidetone", 22.94], ["didgeridoo", 10.18]], null, [["music", 53.25], ["didgeridoo", 19.75], ["speech", 4.26]], null, [["music", 61.28], ["cacophony", 9.58], ["cheering", 2.13]], null], "duration": [5.6, 0.53, 1.76, 1.47, 5.51, 0.98, 4.63, 11.53, 0.92, 0.93, 7.26, 7.54, 0.95, 1.44, 2.19, 0.1, 4.57, 0.76, 3.29, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/oNuGwa5Kd8E_filtered.json b/annotations_filtered/oNuGwa5Kd8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..843912143b67fa449cdf36b51cc76b057a058c4a --- /dev/null +++ b/annotations_filtered/oNuGwa5Kd8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.73], [24.0, 24.27], [26.0, 26.6], [31.0, 31.68], [33.0, 33.57], [34.0, 34.84], [37.0, 40.17], [41.0, 41.91], [43.0, 43.38], [44.0, 45.03], [49.0, 49.01], [56.0, 56.66], [71.0, 71.52], [73.0, 73.57], [74.0, 74.88], [76.0, 76.81], [77.0, 79.2], [83.0, 83.64], [91.0, 90.76], [93.0, 96.53], [100.0, 111.13], [113.0, 115.86], [124.0, 125.73], [127.0, 129.52], [133.0, 135.21], [137.0, 138.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.57, 0.0, 0.0, 37.07, 35.26, 82.07, 0.0, 43.38, 30.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 61.35], ["musical instrument", 8.55], ["didgeridoo", 3.88]], null, null, null, null, null, null, null, null, null, [["speech", 47.36], ["music", 11.13], ["didgeridoo", 4.83]], null, null, [["music", 35.74], ["speech", 19.49], ["pulse", 11.98]], [["hum", 25.49], ["music", 25.42], ["speech", 18.2]], null, null, [["music", 28.03], ["speech", 25.24], ["hum", 8.52]], [["speech", 50.26], ["fart", 12.56], ["boing", 11.86]], null], "duration": [-0.27, 0.27, 0.6, 0.68, 0.57, 0.84, 3.17, 0.91, 0.38, 1.03, 0.01, 0.66, 0.52, 0.57, 0.88, 0.81, 2.2, 0.64, -0.24, 3.53, 11.13, 2.86, 1.73, 2.52, 2.21, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/oOFm9UaRuik_filtered.json b/annotations_filtered/oOFm9UaRuik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a70fd952199a06f9e01b8550461e0327bae5410d --- /dev/null +++ b/annotations_filtered/oOFm9UaRuik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.07], [7.0, 7.53], [11.0, 12.06], [17.0, 17.95], [27.0, 27.24], [30.0, 30.23], [32.0, 35.13], [41.0, 41.12], [53.0, 52.79], [54.0, 57.03], [60.0, 61.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13, 0.0, 0.0, 71.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.07, 0.53, 1.06, 0.95, 0.24, 0.23, 3.13, 0.12, -0.21, 3.03, 1.67]} \ No newline at end of file diff --git a/annotations_filtered/oOWl14GlJx4_filtered.json b/annotations_filtered/oOWl14GlJx4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b5c2d094317ac0303fd1d07bcdce424f06eef63 --- /dev/null +++ b/annotations_filtered/oOWl14GlJx4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.08], [7.0, 9.14], [13.0, 15.11], [16.0, 17.61], [19.0, 97.95], [100.0, 101.29], [103.0, 102.74], [104.0, 106.51], [108.0, 110.02], [111.0, 111.82], [113.0, 123.11]], "keep_status": [false, true, true, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 30.63, 31.58, 0.0, 0.0, 0.0, 0.0, 31.62, 32.9, 0.0, 44.23], "audiomae_on_audioset": [null, [["owl", 17.76], ["throbbing", 13.7], ["hoot", 10.08]], [["music", 18.74], ["hum", 14.09], ["explosion", 10.07]], null, null, null, null, [["wind instrument, woodwind instrument", 23.14], ["foghorn", 21.11], ["speech", 19.0]], [["mains hum", 22.82], ["hum", 12.35], ["throbbing", 7.08]], null, [["speech", 16.63], ["hum", 12.44], ["animal", 7.51]]], "duration": [1.08, 2.14, 2.11, 1.61, 78.95, 1.29, -0.26, 2.51, 2.02, 0.82, 10.11]} \ No newline at end of file diff --git a/annotations_filtered/oOp7Q_xw94I_filtered.json b/annotations_filtered/oOp7Q_xw94I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d6796bfef8b3a9acef0ab6a7a188bec2abc06e7 --- /dev/null +++ b/annotations_filtered/oOp7Q_xw94I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.72], [27.0, 26.82], [30.0, 30.62], [45.0, 50.36], [51.0, 52.51], [58.0, 60.61], [62.0, 64.74], [83.0, 83.56], [88.0, 91.27], [103.0, 106.54], [108.0, 108.65], [110.0, 110.02], [122.0, 123.21]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.58, 0.0, 37.27, 31.74, 0.0, 35.24, 57.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 37.45], ["music", 26.91], ["didgeridoo", 6.59]], null, [["music", 38.37], ["foghorn", 26.6], ["brass instrument", 7.44]], [["music", 25.05], ["double bass", 11.3], ["cello", 10.3]], null, [["foghorn", 37.47], ["speech", 25.13], ["music", 3.51]], null, null, null, null], "duration": [-0.28, -0.18, 0.62, 5.36, 1.51, 2.61, 2.74, 0.56, 3.27, 3.54, 0.65, 0.02, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/oPOqdtLP8XM_filtered.json b/annotations_filtered/oPOqdtLP8XM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c177411da9d08a14bf71583b958611b289da23f9 --- /dev/null +++ b/annotations_filtered/oPOqdtLP8XM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.91], [6.0, 7.16], [10.0, 13.22], [14.0, 16.09], [17.0, 18.27], [22.0, 23.7], [26.0, 27.8], [32.0, 32.91], [34.0, 35.77], [38.0, 41.61], [43.0, 45.62], [48.0, 49.03], [50.0, 51.07], [53.0, 53.0], [54.0, 54.68], [56.0, 57.21], [67.0, 68.74], [70.0, 71.85], [73.0, 74.07], [77.0, 77.16], [80.0, 81.43], [85.0, 85.77], [90.0, 91.15], [92.0, 92.38], [106.0, 107.92], [108.0, 109.39], [112.0, 112.19], [116.0, 117.0], [123.0, 123.53], [126.0, 127.79], [129.0, 129.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.91, 1.16, 3.22, 2.09, 1.27, 1.7, 1.8, 0.91, 1.77, 3.61, 2.62, 1.03, 1.07, 0.0, 0.68, 1.21, 1.74, 1.85, 1.07, 0.16, 1.43, 0.77, 1.15, 0.38, 1.92, 1.39, 0.19, 1.0, 0.53, 1.79, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/oPS8-oRvVh4_filtered.json b/annotations_filtered/oPS8-oRvVh4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3daac953e5d0c551c2317a5f1ddf1d31b1e9e4b --- /dev/null +++ b/annotations_filtered/oPS8-oRvVh4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 57.3]], "keep_status": [true], "silence_prob": [29.32], "audiomae_on_audioset": [[["mains hum", 18.51], ["hum", 12.63], ["music", 9.6]]], "duration": [16.3]} \ No newline at end of file diff --git a/annotations_filtered/oQAY2uslGuI_filtered.json b/annotations_filtered/oQAY2uslGuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bfc204d9cc2305de8f61ea82b0c168b7f66bb1e --- /dev/null +++ b/annotations_filtered/oQAY2uslGuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 12.97], [15.0, 24.07], [29.0, 29.37], [29.0, 39.93], [40.0, 41.93], [50.0, 50.7]], "keep_status": [false, false, false, false, false, false], "silence_prob": [34.77, 34.43, 0.0, 32.35, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 58.71], ["grunt", 7.15], ["music", 6.51]], [["speech", 42.6], ["burping, eructation", 17.32], ["grunt", 12.3]], null, [["speech", 78.85], ["speech synthesizer", 3.1], ["music", 2.45]], null, null], "duration": [7.97, 9.07, 0.37, 10.93, 1.93, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/oQIubudKQQE_filtered.json b/annotations_filtered/oQIubudKQQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa90740e0017062d9819120477738c4c8cd00c33 --- /dev/null +++ b/annotations_filtered/oQIubudKQQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.23], [9.0, 8.67], [10.0, 13.41], [15.0, 20.98], [23.0, 23.43], [24.0, 25.86], [27.0, 29.73], [35.0, 35.75], [39.0, 39.65], [40.0, 40.32], [40.0, 40.95], [42.0, 42.13], [43.0, 44.07], [52.0, 53.3], [59.0, 62.43], [69.0, 70.53], [72.0, 72.84], [74.0, 75.19], [76.0, 77.09], [82.0, 85.82], [89.0, 91.05], [92.0, 95.25], [98.0, 99.96], [108.0, 108.95], [111.0, 113.36], [114.0, 115.79], [124.0, 125.04], [128.0, 128.36], [133.0, 133.14], [134.0, 143.88], [146.0, 149.37], [150.0, 150.69], [155.0, 156.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 83.7, 69.34, 0.0, 0.0, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 0.0, 99.4, 99.62, 99.98, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 97.11, 93.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, -0.33, 3.41, 5.98, 0.43, 1.86, 2.73, 0.75, 0.65, 0.32, 0.95, 0.13, 1.07, 1.3, 3.43, 1.53, 0.84, 1.19, 1.09, 3.82, 2.05, 3.25, 1.96, 0.95, 2.36, 1.79, 1.04, 0.36, 0.14, 9.88, 3.37, 0.69, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/oQjMZTetuEg_filtered.json b/annotations_filtered/oQjMZTetuEg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a4269fa7c09c8ea66b3e87f2d178b7d9099826b --- /dev/null +++ b/annotations_filtered/oQjMZTetuEg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.39], [3.0, 3.48], [15.0, 17.0], [37.0, 36.93], [57.0, 57.7], [59.0, 59.0], [61.0, 67.83], [82.0, 83.24], [86.0, 89.51], [92.0, 94.42], [98.0, 101.53], [106.0, 111.65], [115.0, 116.13], [125.0, 128.87], [131.0, 132.85], [139.0, 139.21], [142.0, 142.33], [152.0, 155.02], [158.0, 158.89]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 41.01, 0.0, 0.0, 0.0, 34.7, 0.0, 28.97, 30.35, 30.18, 30.13, 0.0, 29.37, 0.0, 0.0, 0.0, 41.26, 0.0], "audiomae_on_audioset": [null, null, [["music", 22.8], ["speech", 12.78], ["thunk", 11.63]], null, null, null, [["speech", 54.39], ["music", 38.72], ["boing", 2.06]], null, [["music", 57.86], ["vehicle", 5.68], ["skidding", 4.27]], [["music", 70.0], ["throbbing", 7.91], ["hum", 6.77]], [["music", 65.97], ["speech", 4.5], ["throbbing", 4.28]], [["livestock, farm animals, working animals", 32.13], ["cattle, bovinae", 17.96], ["moo", 13.92]], null, [["music", 66.69], ["boom", 3.08], ["throbbing", 2.99]], null, null, null, [["music", 35.32], ["foghorn", 8.78], ["mains hum", 6.29]], null], "duration": [0.39, 0.48, 2.0, -0.07, 0.7, 0.0, 6.83, 1.24, 3.51, 2.42, 3.53, 5.65, 1.13, 3.87, 1.85, 0.21, 0.33, 3.02, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/oR1-UFrcZ0k_filtered.json b/annotations_filtered/oR1-UFrcZ0k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c60f23db05ee4a32ae356249c0302947a76c6587 --- /dev/null +++ b/annotations_filtered/oR1-UFrcZ0k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 19.26], [21.0, 20.83], [25.0, 31.45], [32.0, 60.29], [61.0, 93.23]], "keep_status": [true, false, false, false, false], "silence_prob": [31.26, 0.0, 31.19, 31.53, 0.0], "audiomae_on_audioset": [[["music", 27.3], ["mains hum", 17.44], ["hum", 11.9]], null, [["music", 68.96], ["speech", 5.55], ["trombone", 3.97]], [["music", 63.02], ["musical instrument", 3.84], ["fart", 3.76]], null], "duration": [3.26, -0.17, 6.45, 28.29, 32.23]} \ No newline at end of file diff --git a/annotations_filtered/oR3h33DSGPM_filtered.json b/annotations_filtered/oR3h33DSGPM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f549e248c5c0ecb7efb5113c2098b50f77debed --- /dev/null +++ b/annotations_filtered/oR3h33DSGPM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.04], [14.0, 23.36], [28.0, 40.96], [47.0, 47.8], [49.0, 50.18], [55.0, 55.75], [57.0, 57.32], [58.0, 58.4], [66.0, 66.51], [72.0, 72.57], [87.0, 86.81], [88.0, 89.75], [93.0, 92.7], [97.0, 98.64], [100.0, 102.19], [119.0, 120.53], [127.0, 128.19], [135.0, 136.59], [138.0, 138.65], [140.0, 141.52]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.8, 41.3, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 68.66], ["hum", 7.47], ["music", 6.46]], [["music", 26.49], ["speech", 19.41], ["didgeridoo", 9.6]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.04, 9.36, 12.96, 0.8, 1.18, 0.75, 0.32, 0.4, 0.51, 0.57, -0.19, 1.75, -0.3, 1.64, 2.19, 1.53, 1.19, 1.59, 0.65, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/oRKbez1LpWU_filtered.json b/annotations_filtered/oRKbez1LpWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2b4aea0e0e2a14e35fc5ee059c450ff816bc2cc --- /dev/null +++ b/annotations_filtered/oRKbez1LpWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.24], [7.0, 9.66], [12.0, 14.49], [16.0, 17.42], [18.0, 18.28], [18.0, 20.65], [21.0, 21.3], [22.0, 23.57], [35.0, 35.04], [35.0, 35.77], [44.0, 47.63], [52.0, 52.54], [57.0, 57.42], [77.0, 79.37], [80.0, 80.38], [81.0, 81.04], [83.0, 85.08], [89.0, 89.48], [101.0, 101.65], [105.0, 105.7], [112.0, 113.34], [116.0, 116.56], [123.0, 125.32], [137.0, 137.27], [147.0, 146.97], [149.0, 150.55], [172.0, 171.98], [173.0, 172.76], [177.0, 177.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [98.86, 85.35, 99.21, 0.0, 0.0, 51.94, 0.0, 0.0, 0.0, 0.0, 53.16, 0.0, 0.0, 57.72, 0.0, 0.0, 31.37, 0.0, 0.0, 0.0, 0.0, 0.0, 32.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 24.79], ["cattle, bovinae", 21.32], ["moo", 16.72]], null, null, null, null, null, [["speech", 56.03], ["laughter", 4.05], ["whimper", 4.03]], null, null, null, null, null, null], "duration": [3.24, 2.66, 2.49, 1.42, 0.28, 2.65, 0.3, 1.57, 0.04, 0.77, 3.63, 0.54, 0.42, 2.37, 0.38, 0.04, 2.08, 0.48, 0.65, 0.7, 1.34, 0.56, 2.32, 0.27, -0.03, 1.55, -0.02, -0.24, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/oRRupV-lwbU_filtered.json b/annotations_filtered/oRRupV-lwbU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e88969a5d246d33c2717e83be340cd915b65cf80 --- /dev/null +++ b/annotations_filtered/oRRupV-lwbU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.34], [9.0, 10.03], [13.0, 19.85], [21.0, 25.03], [28.0, 29.24], [32.0, 33.08], [35.0, 35.72], [44.0, 45.82], [49.0, 50.99], [52.0, 53.38], [55.0, 55.56], [59.0, 58.99], [63.0, 63.24], [65.0, 66.51], [74.0, 74.8], [82.0, 82.53], [83.0, 82.93], [84.0, 86.1], [87.0, 88.16], [91.0, 92.48]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.97, 0.0, 36.98, 33.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0], "audiomae_on_audioset": [[["boing", 60.89], ["music", 9.47], ["speech", 7.5]], null, [["speech", 43.39], ["explosion", 8.17], ["screaming", 6.97]], [["boing", 26.81], ["speech", 14.22], ["cattle, bovinae", 9.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.34, 1.03, 6.85, 4.03, 1.24, 1.08, 0.72, 1.82, 1.99, 1.38, 0.56, -0.01, 0.24, 1.51, 0.8, 0.53, -0.07, 2.1, 1.16, 1.48]} \ No newline at end of file diff --git a/annotations_filtered/oRe8EuewinY_filtered.json b/annotations_filtered/oRe8EuewinY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91c63a0d4108613e095d25eba3ab7fac53a8ee26 --- /dev/null +++ b/annotations_filtered/oRe8EuewinY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.75], [28.0, 28.61], [35.0, 35.56], [37.0, 37.89], [39.0, 39.72], [40.0, 41.67], [44.0, 44.9], [47.0, 47.48], [49.0, 49.45], [51.0, 51.38], [52.0, 53.97], [55.0, 57.21], [58.0, 59.53], [61.0, 85.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 29.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.49], ["didgeridoo", 14.08], ["theremin", 11.45]]], "duration": [1.75, 0.61, 0.56, 0.89, 0.72, 1.67, 0.9, 0.48, 0.45, 0.38, 1.97, 2.21, 1.53, 24.77]} \ No newline at end of file diff --git a/annotations_filtered/oRh8qQyIngg_filtered.json b/annotations_filtered/oRh8qQyIngg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9febc99e5c8b2b718df5e0998b0055189e44b6b5 --- /dev/null +++ b/annotations_filtered/oRh8qQyIngg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.99], [8.0, 8.67], [14.0, 65.5], [66.0, 65.55], [66.0, 66.82], [70.0, 74.83], [83.0, 84.5], [89.0, 91.12], [92.0, 98.47], [108.0, 108.97], [111.0, 116.02], [118.0, 117.88], [119.0, 127.14]], "keep_status": [true, false, false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [30.82, 0.0, 0.0, 0.0, 0.0, 30.54, 0.0, 31.87, 30.89, 0.0, 31.48, 0.0, 33.74], "audiomae_on_audioset": [[["music", 27.64], ["noise", 25.61], ["synthesizer", 7.88]], null, null, null, null, [["cattle, bovinae", 31.14], ["moo", 27.03], ["livestock, farm animals, working animals", 21.14]], null, [["foghorn", 31.73], ["music", 22.61], ["speech", 14.49]], [["speech", 43.51], ["sidetone", 21.38], ["music", 10.78]], null, [["music", 24.8], ["speech", 19.21], ["throbbing", 9.26]], null, [["music", 43.61], ["noise", 7.54], ["sidetone", 6.65]]], "duration": [4.99, 0.67, 51.5, -0.45, 0.82, 4.83, 1.5, 2.12, 6.47, 0.97, 5.02, -0.12, 8.14]} \ No newline at end of file diff --git a/annotations_filtered/oS6AtbHHjSo_filtered.json b/annotations_filtered/oS6AtbHHjSo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56fcaa94a1e698a2d658c4f57b9a364d407c40ca --- /dev/null +++ b/annotations_filtered/oS6AtbHHjSo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 15.11], [16.0, 21.76], [24.0, 24.63], [28.0, 42.94], [51.0, 54.75]], "keep_status": [true, true, false, true, false], "silence_prob": [30.11, 30.39, 0.0, 30.24, 30.24], "audiomae_on_audioset": [[["speech", 42.74], ["music", 16.64], ["vehicle", 2.96]], [["speech", 34.77], ["music", 21.87], ["cacophony", 4.33]], null, [["music", 12.29], ["whack, thwack", 10.69], ["speech", 9.23]], [["music", 54.21], ["speech", 18.75], ["throbbing", 5.31]]], "duration": [10.11, 5.76, 0.63, 14.94, 3.75]} \ No newline at end of file diff --git a/annotations_filtered/oS_Iap5D9jQ_filtered.json b/annotations_filtered/oS_Iap5D9jQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab0bbddb877ab91f8f7af999df796188ac250cb9 --- /dev/null +++ b/annotations_filtered/oS_Iap5D9jQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.68], [8.0, 9.02], [12.0, 92.37], [93.0, 108.36], [111.0, 112.82], [114.0, 117.81], [119.0, 119.99], [121.0, 123.87], [125.0, 148.27], [154.0, 156.9], [159.0, 163.78], [164.0, 165.89], [167.0, 168.05], [168.0, 168.79], [170.0, 186.27], [186.0, 186.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [86.45, 0.0, 0.0, 95.51, 0.0, 96.54, 0.0, 96.54, 83.16, 93.76, 88.64, 0.0, 0.0, 0.0, 95.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.68, 1.02, 80.37, 15.36, 1.82, 3.81, 0.99, 2.87, 23.27, 2.9, 4.78, 1.89, 1.05, 0.79, 16.27, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/oSc-5smBhRQ_filtered.json b/annotations_filtered/oSc-5smBhRQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7956586d939171d0157bbe23b58d7e24816f7907 --- /dev/null +++ b/annotations_filtered/oSc-5smBhRQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.11], [9.0, 9.9], [11.0, 13.88], [16.0, 16.19], [20.0, 19.79], [38.0, 39.11], [40.0, 40.37], [43.0, 43.36], [45.0, 45.17], [46.0, 46.04], [55.0, 55.56], [57.0, 56.79], [57.0, 57.2], [60.0, 60.42], [69.0, 69.42], [77.0, 77.8], [80.0, 81.03], [83.0, 85.5], [87.0, 90.46], [93.0, 92.69], [93.0, 94.61], [102.0, 103.28], [109.0, 109.73], [111.0, 112.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.44, 54.1, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.11, 0.9, 2.88, 0.19, -0.21, 1.11, 0.37, 0.36, 0.17, 0.04, 0.56, -0.21, 0.2, 0.42, 0.42, 0.8, 1.03, 2.5, 3.46, -0.31, 1.61, 1.28, 0.73, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/oSpMQ0WtrSs_filtered.json b/annotations_filtered/oSpMQ0WtrSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51b86d5daf7fae3c30050b0a15dec1012cd7c89c --- /dev/null +++ b/annotations_filtered/oSpMQ0WtrSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.74], [34.0, 36.46], [41.0, 40.59], [41.0, 41.54], [49.0, 49.45], [53.0, 52.84], [54.0, 56.0], [57.0, 65.92], [67.0, 68.47], [72.0, 73.31], [83.0, 83.49], [84.0, 85.7], [87.0, 87.49], [97.0, 101.24], [116.0, 117.98], [124.0, 124.7], [126.0, 126.71]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [38.56, 100.0, 0.0, 0.0, 0.0, 0.0, 96.42, 49.18, 0.0, 0.0, 0.0, 0.0, 0.0, 44.34, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 34.51], ["moo", 10.62], ["livestock, farm animals, working animals", 8.02]], null, null, null, null, null, null, [["speech", 73.52], ["thunk", 8.63], ["thump, thud", 1.68]], null, null, null, null, null, [["music", 33.48], ["speech", 25.04], ["didgeridoo", 5.42]], null, null, null], "duration": [4.74, 2.46, -0.41, 0.54, 0.45, -0.16, 2.0, 8.92, 1.47, 1.31, 0.49, 1.7, 0.49, 4.24, 1.98, 0.7, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/oSvVjh93suI_filtered.json b/annotations_filtered/oSvVjh93suI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef4e4cb93e82d0c3f49b9c3258444c533e7644f8 --- /dev/null +++ b/annotations_filtered/oSvVjh93suI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 47.88], [48.0, 48.78], [52.0, 52.27], [57.0, 58.21], [59.0, 71.15], [72.0, 72.62], [76.0, 77.35], [78.0, 77.97], [78.0, 78.51], [83.0, 83.12], [84.0, 84.81], [88.0, 88.13], [93.0, 93.51], [96.0, 96.36], [100.0, 100.74], [104.0, 111.75], [117.0, 125.0], [125.0, 128.29], [132.0, 135.62], [143.0, 143.33], [144.0, 149.59], [153.0, 154.01], [157.0, 162.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 69.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.96, 59.96, 73.51, 81.17, 0.0, 93.45, 0.0, 98.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.78, 0.27, 1.21, 12.15, 0.62, 1.35, -0.03, 0.51, 0.12, 0.81, 0.13, 0.51, 0.36, 0.74, 7.75, 8.0, 3.29, 3.62, 0.33, 5.59, 1.01, 5.68]} \ No newline at end of file diff --git a/annotations_filtered/oT_RsXOPjTs_filtered.json b/annotations_filtered/oT_RsXOPjTs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8984d49d1d338a5793691f16214d80c9be37c8e0 --- /dev/null +++ b/annotations_filtered/oT_RsXOPjTs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 52.79], [55.0, 56.71], [67.0, 67.29], [70.0, 69.84], [78.0, 78.54], [81.0, 81.87], [83.0, 83.79], [84.0, 85.28], [86.0, 86.85], [88.0, 89.43], [91.0, 93.29], [95.0, 118.13], [120.0, 121.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.7, 43.03, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["frog", 21.53], ["gurgling", 13.04], ["whale vocalization", 12.01]], null], "duration": [1.79, 1.71, 0.29, -0.16, 0.54, 0.87, 0.79, 1.28, 0.85, 1.43, 2.29, 23.13, 1.95]} \ No newline at end of file diff --git a/annotations_filtered/oToIYlwJY9I_filtered.json b/annotations_filtered/oToIYlwJY9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..043d80d6c134150fc6bda1e7ca3f91aaf52ef451 --- /dev/null +++ b/annotations_filtered/oToIYlwJY9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.27], [4.0, 4.11], [6.0, 9.58], [14.0, 16.11], [18.0, 18.06], [18.0, 19.65], [24.0, 33.42], [34.0, 35.33], [39.0, 39.72], [40.0, 40.34], [41.0, 41.88], [45.0, 59.48], [66.0, 107.06], [108.0, 111.62], [116.0, 117.96], [122.0, 124.6], [128.0, 133.2], [137.0, 137.62], [141.0, 146.89], [147.0, 149.12]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.14, 33.76, 0.0, 0.0, 31.32, 0.0, 0.0, 0.0, 0.0, 32.29, 0.0, 41.34, 0.0, 38.14, 33.95, 0.0, 37.27, 35.5], "audiomae_on_audioset": [null, null, [["music", 49.87], ["speech", 6.1], ["moo", 5.89]], [["music", 74.84], ["speech", 5.36], ["electronic music", 2.94]], null, null, [["music", 78.63], ["speech", 6.9], ["cattle, bovinae", 3.08]], null, null, null, null, [["music", 80.54], ["musical instrument", 2.65], ["didgeridoo", 2.19]], null, [["music", 66.45], ["guitar", 4.12], ["bass guitar", 3.83]], null, [["music", 67.9], ["singing", 3.79], ["dubstep", 3.22]], [["music", 81.41], ["singing", 1.45], ["musical instrument", 0.84]], null, [["music", 65.57], ["bass guitar", 7.55], ["guitar", 5.03]], [["music", 66.7], ["musical instrument", 2.98], ["guitar", 2.87]]], "duration": [1.27, 0.11, 3.58, 2.11, 0.06, 1.65, 9.42, 1.33, 0.72, 0.34, 0.88, 14.48, 41.06, 3.62, 1.96, 2.6, 5.2, 0.62, 5.89, 2.12]} \ No newline at end of file diff --git a/annotations_filtered/oTx_o5B0J1Q_filtered.json b/annotations_filtered/oTx_o5B0J1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41b6b21c810f0866bc9af0fe492be3be87b20076 --- /dev/null +++ b/annotations_filtered/oTx_o5B0J1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.94], [7.0, 7.94], [14.0, 13.78], [20.0, 22.28], [24.0, 23.82], [28.0, 39.97], [45.0, 45.47], [46.0, 47.49], [49.0, 53.05], [54.0, 54.06], [58.0, 61.69], [68.0, 70.53], [74.0, 75.09], [76.0, 77.63], [84.0, 84.86], [86.0, 87.22], [91.0, 91.71], [92.0, 93.38], [111.0, 112.29], [115.0, 115.28], [117.0, 118.77]], "keep_status": [false, false, false, true, false, true, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 49.4, 0.0, 32.17, 0.0, 0.0, 48.44, 0.0, 99.92, 43.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 8.66], ["hum", 8.35], ["music", 8.01]], null, [["speech", 25.72], ["music", 24.83], ["vehicle", 4.35]], null, null, [["speech", 26.57], ["fly, housefly", 5.16], ["bee, wasp, etc.", 5.03]], null, null, [["whale vocalization", 22.52], ["music", 16.87], ["didgeridoo", 5.39]], null, null, null, null, null, null, null, null, null], "duration": [0.94, 0.94, -0.22, 2.28, -0.18, 11.97, 0.47, 1.49, 4.05, 0.06, 3.69, 2.53, 1.09, 1.63, 0.86, 1.22, 0.71, 1.38, 1.29, 0.28, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/oTzTcic-1qs_filtered.json b/annotations_filtered/oTzTcic-1qs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75317ec5aab1406367f80e9d78da956928ef699f --- /dev/null +++ b/annotations_filtered/oTzTcic-1qs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.62], [30.0, 30.52], [39.0, 38.77], [42.0, 42.2], [45.0, 46.08], [51.0, 51.11], [54.0, 53.79], [54.0, 55.27], [56.0, 57.13], [57.0, 57.54], [59.0, 58.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 0.52, -0.23, 0.2, 1.08, 0.11, -0.21, 1.27, 1.13, 0.54, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/oUKw4qcGHZs_filtered.json b/annotations_filtered/oUKw4qcGHZs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b317ac65f4269b8e3a8151e2627cc070ba79b4b2 --- /dev/null +++ b/annotations_filtered/oUKw4qcGHZs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[93.0, 95.89], [96.0, 144.22], [148.0, 148.22], [150.0, 154.41], [155.0, 160.03], [164.0, 165.0]], "keep_status": [false, false, false, false, false, false], "silence_prob": [85.17, 0.0, 0.0, 73.06, 51.6, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [2.89, 48.22, 0.22, 4.41, 5.03, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/oUQ9ZKUt2XQ_filtered.json b/annotations_filtered/oUQ9ZKUt2XQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7dd826d57d632e016f1b0345fb898c957818135b --- /dev/null +++ b/annotations_filtered/oUQ9ZKUt2XQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.2], [21.0, 21.49], [22.0, 22.59], [28.0, 29.47], [30.0, 31.87], [32.0, 35.24], [43.0, 44.34], [45.0, 46.67], [47.0, 54.99], [57.0, 60.56], [63.0, 65.13], [66.0, 67.04], [69.0, 72.86], [77.0, 77.62], [97.0, 97.73], [98.0, 112.99], [113.0, 119.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.13, 0.0, 0.0, 0.0, 0.0, 98.44, 0.0, 0.0, 100.0, 99.56, 100.0, 0.0, 100.0, 0.0, 0.0, 92.97, 67.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.2, 0.49, 0.59, 1.47, 1.87, 3.24, 1.34, 1.67, 7.99, 3.56, 2.13, 1.04, 3.86, 0.62, 0.73, 14.99, 6.42]} \ No newline at end of file diff --git a/annotations_filtered/oUXPpeE2pv4_filtered.json b/annotations_filtered/oUXPpeE2pv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4207773c0a815c8cc0eacc066b6c3e72820b4115 --- /dev/null +++ b/annotations_filtered/oUXPpeE2pv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 30.01], [32.0, 32.1], [37.0, 41.25], [42.0, 42.26], [44.0, 142.72], [144.0, 155.39]], "keep_status": [false, false, true, false, false, true], "silence_prob": [33.5, 0.0, 33.1, 0.0, 0.0, 39.28], "audiomae_on_audioset": [[["speech", 43.25], ["music", 21.42], ["buzz", 13.62]], null, [["chant", 23.07], ["music", 15.57], ["hum", 15.0]], null, null, [["music", 20.98], ["insect", 20.41], ["fly, housefly", 18.93]]], "duration": [19.01, 0.1, 4.25, 0.26, 98.72, 11.39]} \ No newline at end of file diff --git a/annotations_filtered/oUleBi3j0o8_filtered.json b/annotations_filtered/oUleBi3j0o8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71c5cd97fc84060353e67e01a3a1a4e5d7356f11 --- /dev/null +++ b/annotations_filtered/oUleBi3j0o8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 16.61], [21.0, 66.48], [70.0, 76.76], [81.0, 88.25], [91.0, 105.85], [106.0, 124.82], [128.0, 128.58]], "keep_status": [true, false, true, true, true, false, false], "silence_prob": [29.02, 0.0, 29.37, 28.67, 28.73, 28.85, 0.0], "audiomae_on_audioset": [[["music", 28.2], ["speech", 15.43], ["cattle, bovinae", 5.66]], null, [["music", 49.63], ["cacophony", 7.45], ["fart", 5.5]], [["music", 33.54], ["buzz", 10.39], ["hum", 7.9]], [["mains hum", 14.57], ["hum", 12.81], ["speech", 9.0]], [["music", 86.29], ["cacophony", 2.47], ["throbbing", 2.21]], null], "duration": [8.61, 45.48, 6.76, 7.25, 14.85, 18.82, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/oUo_8mKGHvY_filtered.json b/annotations_filtered/oUo_8mKGHvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b0cd8ab02a0b4f4c9c3a5d6fee393b1cc362407 --- /dev/null +++ b/annotations_filtered/oUo_8mKGHvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.61], [12.0, 12.38], [19.0, 19.75], [35.0, 34.86], [41.0, 41.64], [45.0, 46.3], [80.0, 81.01], [83.0, 83.59], [85.0, 86.16], [87.0, 87.49], [88.0, 89.61], [90.0, 90.61], [102.0, 103.38], [105.0, 105.17], [109.0, 109.9], [113.0, 113.02], [120.0, 121.37], [122.0, 123.38], [124.0, 127.08], [127.0, 127.92], [131.0, 131.11], [133.0, 132.87], [136.0, 136.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 0.38, 0.75, -0.14, 0.64, 1.3, 1.01, 0.59, 1.16, 0.49, 1.61, 0.61, 1.38, 0.17, 0.9, 0.02, 1.37, 1.38, 3.08, 0.92, 0.11, -0.13, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/oUpzcxwFI6o_filtered.json b/annotations_filtered/oUpzcxwFI6o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3fd852a02e732372e098a7a2f3f7a85c4161bf6d --- /dev/null +++ b/annotations_filtered/oUpzcxwFI6o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.92], [9.0, 13.24], [16.0, 16.48], [22.0, 26.27], [27.0, 29.0], [30.0, 31.51], [37.0, 37.71], [40.0, 40.81], [43.0, 44.1], [47.0, 47.87], [50.0, 51.53], [54.0, 55.68], [57.0, 57.11], [58.0, 60.0], [62.0, 62.82], [66.0, 67.32], [69.0, 72.4], [73.0, 74.19], [75.0, 81.33], [82.0, 98.29], [99.0, 100.3], [101.0, 113.93], [121.0, 124.7], [125.0, 125.24], [132.0, 132.24], [132.0, 132.38], [132.0, 136.22], [138.0, 140.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 84.8, 0.0, 96.66, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 92.64, 0.0, 54.23, 84.25, 0.0, 38.79, 42.3, 0.0, 0.0, 0.0, 39.49, 34.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 75.59], ["bass guitar", 4.18], ["hum", 2.04]], [["music", 71.05], ["bass guitar", 6.15], ["guitar", 5.37]], null, null, null, [["music", 53.62], ["bass guitar", 7.86], ["plucked string instrument", 5.65]], [["music", 68.24], ["ambient music", 4.72], ["new-age music", 4.35]]], "duration": [0.92, 4.24, 0.48, 4.27, 2.0, 1.51, 0.71, 0.81, 1.1, 0.87, 1.53, 1.68, 0.11, 2.0, 0.82, 1.32, 3.4, 1.19, 6.33, 16.29, 1.3, 12.93, 3.7, 0.24, 0.24, 0.38, 4.22, 2.64]} \ No newline at end of file diff --git a/annotations_filtered/oVLfIoIujHE_filtered.json b/annotations_filtered/oVLfIoIujHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0780bf8586f9e64816cfa4ce1cf89286a54cf05 --- /dev/null +++ b/annotations_filtered/oVLfIoIujHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 56.61], [66.0, 66.55], [68.0, 71.81], [73.0, 74.43], [76.0, 77.8], [79.0, 85.14], [86.0, 97.33], [99.0, 101.88], [103.0, 109.58], [112.0, 113.29], [116.0, 119.84], [125.0, 125.52], [126.0, 126.49], [128.0, 128.29], [129.0, 130.4], [132.0, 134.42]], "keep_status": [false, false, false, false, false, false, true, true, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 53.78, 0.0, 0.0, 40.31, 35.18, 39.15, 45.95, 0.0, 33.35, 0.0, 0.0, 0.0, 0.0, 36.87], "audiomae_on_audioset": [null, null, null, null, null, [["music", 73.61], ["hum", 5.11], ["musical instrument", 4.23]], [["music", 58.87], ["musical instrument", 5.41], ["speech", 4.97]], [["music", 26.47], ["speech", 5.75], ["musical instrument", 3.14]], [["music", 43.35], ["effects unit", 14.19], ["speech", 5.39]], null, [["music", 23.17], ["sheep", 14.49], ["bleat", 11.14]], null, null, null, null, [["music", 44.14], ["didgeridoo", 16.59], ["mantra", 6.44]]], "duration": [40.61, 0.55, 3.81, 1.43, 1.8, 6.14, 11.33, 2.88, 6.58, 1.29, 3.84, 0.52, 0.49, 0.29, 1.4, 2.42]} \ No newline at end of file diff --git a/annotations_filtered/oW7IadnQblg_filtered.json b/annotations_filtered/oW7IadnQblg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21a5b4c06a9f0cb11b8f41f45dea864908e2cc4f --- /dev/null +++ b/annotations_filtered/oW7IadnQblg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.64], [11.0, 12.06], [24.0, 27.11], [28.0, 41.67], [42.0, 43.66], [46.0, 51.65], [52.0, 53.27], [54.0, 57.32], [58.0, 59.19], [63.0, 65.92], [69.0, 69.9], [73.0, 73.92], [76.0, 77.9], [84.0, 93.6], [95.0, 95.55], [97.0, 97.31], [98.0, 99.91], [102.0, 102.3], [104.0, 110.03]], "keep_status": [false, false, true, true, false, true, false, true, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 32.69, 34.06, 0.0, 33.22, 0.0, 40.02, 0.0, 33.59, 0.0, 0.0, 0.0, 33.17, 0.0, 0.0, 0.0, 0.0, 31.95], "audiomae_on_audioset": [null, null, [["crowd", 26.78], ["cheering", 14.75], ["speech", 9.1]], [["crowd", 23.59], ["cheering", 13.92], ["cattle, bovinae", 12.45]], null, [["livestock, farm animals, working animals", 40.14], ["cattle, bovinae", 13.6], ["moo", 13.45]], null, [["hum", 22.51], ["whale vocalization", 13.58], ["speech", 13.41]], null, [["speech", 15.32], ["livestock, farm animals, working animals", 9.88], ["cattle, bovinae", 5.78]], null, null, null, [["music", 62.14], ["throbbing", 7.44], ["electronic music", 5.68]], null, null, null, null, [["music", 13.95], ["explosion", 9.52], ["sound effect", 8.12]]], "duration": [0.64, 1.06, 3.11, 13.67, 1.66, 5.65, 1.27, 3.32, 1.19, 2.92, 0.9, 0.92, 1.9, 9.6, 0.55, 0.31, 1.91, 0.3, 6.03]} \ No newline at end of file diff --git a/annotations_filtered/oWBYpwZ5-AM_filtered.json b/annotations_filtered/oWBYpwZ5-AM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fbef9f6ec4c98f7e6a1ee74a9a1e0fa5eacbd2f --- /dev/null +++ b/annotations_filtered/oWBYpwZ5-AM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [6.0, 6.59], [7.0, 8.21], [9.0, 10.0], [13.0, 14.01], [15.0, 18.49], [20.0, 20.29], [21.0, 22.96], [25.0, 26.67], [28.0, 31.41]], "keep_status": [false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.15, 0.0, 0.0, 0.0, 53.65], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 36.05], ["mains hum", 16.74], ["hum", 15.84]], null, null, null, null], "duration": [0.63, 0.59, 1.21, 1.0, 1.01, 3.49, 0.29, 1.96, 1.67, 3.41]} \ No newline at end of file diff --git a/annotations_filtered/oWSIUe5wYvc_filtered.json b/annotations_filtered/oWSIUe5wYvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..359100c211baea495259a4ebd917655647edd693 --- /dev/null +++ b/annotations_filtered/oWSIUe5wYvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.3], [11.0, 13.49], [17.0, 60.84], [61.0, 107.81], [109.0, 112.23], [114.0, 126.32]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 60.51, 0.0, 0.0, 100.0, 83.16], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.3, 2.49, 43.84, 46.81, 3.23, 12.32]} \ No newline at end of file diff --git a/annotations_filtered/oWjtcWh-gyI_filtered.json b/annotations_filtered/oWjtcWh-gyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1be8c24d4637a2a48e76219b8c4fb85f15df4cf0 --- /dev/null +++ b/annotations_filtered/oWjtcWh-gyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.88], [13.0, 13.59], [16.0, 20.71], [28.0, 29.15], [34.0, 35.75], [36.0, 37.05], [46.0, 53.47], [58.0, 57.92], [59.0, 59.1], [59.0, 60.08], [61.0, 68.47], [89.0, 89.6], [90.0, 90.22], [92.0, 94.07], [96.0, 96.69], [100.0, 121.44], [125.0, 125.44], [127.0, 132.8], [134.0, 135.21], [135.0, 138.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 30.33, 0.0, 0.0, 0.0, 34.01, 0.0, 0.0, 0.0, 35.26, 0.0, 0.0, 41.91, 0.0, 31.05, 0.0, 33.87, 0.0, 32.39], "audiomae_on_audioset": [null, null, [["music", 48.52], ["speech", 35.27], ["electronic music", 2.74]], null, null, null, [["music", 55.83], ["mains hum", 11.57], ["hum", 7.53]], null, null, null, [["music", 56.43], ["didgeridoo", 7.12], ["hum", 5.58]], null, null, [["music", 34.97], ["throbbing", 12.9], ["speech", 11.85]], null, [["electric shaver, electric razor", 33.84], ["speech", 29.83], ["buzz", 11.27]], null, [["speech", 80.84], ["hum", 1.73], ["vehicle", 1.54]], null, [["breaking", 18.43], ["cattle, bovinae", 12.97], ["moo", 11.44]]], "duration": [-0.12, 0.59, 4.71, 1.15, 1.75, 1.05, 7.47, -0.08, 0.1, 1.08, 7.47, 0.6, 0.22, 2.07, 0.69, 21.44, 0.44, 5.8, 1.21, 3.2]} \ No newline at end of file diff --git a/annotations_filtered/oWr69u4tLoc_filtered.json b/annotations_filtered/oWr69u4tLoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58eebf4150c0c9beb0bf1675c3156ea377e89bd6 --- /dev/null +++ b/annotations_filtered/oWr69u4tLoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [4.0, 4.06], [6.0, 6.89], [7.0, 9.46], [11.0, 12.07], [14.0, 14.5], [18.0, 18.06], [20.0, 23.77], [37.0, 44.47], [45.0, 46.03], [49.0, 53.76], [58.0, 58.92], [60.0, 63.88], [65.0, 65.84], [68.0, 69.04], [70.0, 71.31]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.98, 0.0, 0.0, 0.0, 53.4, 71.14, 0.0, 59.68, 0.0, 65.55, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 51.39], ["livestock, farm animals, working animals", 5.02], ["moo", 4.3]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 0.06, 0.89, 2.46, 1.07, 0.5, 0.06, 3.77, 7.47, 1.03, 4.76, 0.92, 3.88, 0.84, 1.04, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/oWuYilt9hX8_filtered.json b/annotations_filtered/oWuYilt9hX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7688426d55698208c496dd88b971955bd6b7be4 --- /dev/null +++ b/annotations_filtered/oWuYilt9hX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.79], [31.0, 31.58], [36.0, 36.86], [42.0, 42.09], [43.0, 43.07], [44.0, 44.91], [46.0, 46.63], [49.0, 49.35], [55.0, 55.14], [56.0, 57.62], [59.0, 58.95], [69.0, 72.69], [78.0, 81.8], [86.0, 87.05], [90.0, 90.51], [106.0, 113.24], [127.0, 127.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 97.83, 0.0, 0.0, 49.87, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["crushing", 57.86], ["music", 12.74], ["creak", 4.58]], null], "duration": [0.79, 0.58, 0.86, 0.09, 0.07, 0.91, 0.63, 0.35, 0.14, 1.62, -0.05, 3.69, 3.8, 1.05, 0.51, 7.24, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/oX3PL_u2LbQ_filtered.json b/annotations_filtered/oX3PL_u2LbQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fcf77441f917578bea0a19b00093b31a8f47f43 --- /dev/null +++ b/annotations_filtered/oX3PL_u2LbQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.22], [3.0, 4.06], [5.0, 5.37], [8.0, 8.24], [9.0, 11.64], [15.0, 15.58], [20.0, 20.78], [22.0, 22.96], [26.0, 26.97], [29.0, 29.93], [31.0, 31.68], [32.0, 33.02], [35.0, 36.32], [37.0, 38.6], [40.0, 40.51], [51.0, 51.22], [75.0, 75.78], [90.0, 91.88], [93.0, 94.05], [95.0, 95.47], [99.0, 99.1], [103.0, 104.31], [109.0, 109.26], [112.0, 112.78], [119.0, 119.03], [130.0, 130.96], [132.0, 137.2], [139.0, 139.95], [141.0, 141.39], [142.0, 144.22], [145.0, 145.25], [146.0, 159.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 99.52, 0.0, 45.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.81], ["music", 29.92], ["hum", 8.12]]], "duration": [1.22, 1.06, 0.37, 0.24, 2.64, 0.58, 0.78, 0.96, 0.97, 0.93, 0.68, 1.02, 1.32, 1.6, 0.51, 0.22, 0.78, 1.88, 1.05, 0.47, 0.1, 1.31, 0.26, 0.78, 0.03, 0.96, 5.2, 0.95, 0.39, 2.22, 0.25, 13.29]} \ No newline at end of file diff --git a/annotations_filtered/oXDyQju8my4_filtered.json b/annotations_filtered/oXDyQju8my4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2612448cd9e4ca121c10293440f0ad121de4123 --- /dev/null +++ b/annotations_filtered/oXDyQju8my4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.58], [10.0, 11.7], [21.0, 22.18], [27.0, 27.82], [31.0, 31.45], [39.0, 40.59], [41.0, 41.79], [44.0, 43.87], [45.0, 48.12], [48.0, 50.26], [51.0, 52.07], [55.0, 55.46], [59.0, 61.35], [62.0, 63.19], [64.0, 64.3], [66.0, 70.6], [73.0, 76.3], [92.0, 91.84], [95.0, 96.52], [97.0, 98.22], [99.0, 99.64], [105.0, 105.93], [111.0, 111.7], [114.0, 114.12], [116.0, 116.41], [117.0, 117.46], [119.0, 120.01], [123.0, 126.05]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.48, 41.95, 0.0, 0.0, 99.76, 0.0, 0.0, 37.73, 31.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["radio", 20.83], ["fart", 12.08], ["speech", 10.42]], [["speech", 42.61], ["music", 9.08], ["hum", 4.99]], null, null, null, null, null, [["hum", 22.4], ["mains hum", 22.3], ["music", 13.01]], [["music", 37.26], ["speech", 16.8], ["musical instrument", 5.34]], null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 52.19], ["moo", 37.95], ["livestock, farm animals, working animals", 4.17]]], "duration": [2.58, 1.7, 1.18, 0.82, 0.45, 1.59, 0.79, -0.13, 3.12, 2.26, 1.07, 0.46, 2.35, 1.19, 0.3, 4.6, 3.3, -0.16, 1.52, 1.22, 0.64, 0.93, 0.7, 0.12, 0.41, 0.46, 1.01, 3.05]} \ No newline at end of file diff --git a/annotations_filtered/oXMUkgWoMlQ_filtered.json b/annotations_filtered/oXMUkgWoMlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4647b52e8b44b2c31ae1a2892d2a198d0535534c --- /dev/null +++ b/annotations_filtered/oXMUkgWoMlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.21], [4.0, 4.53], [5.0, 20.06], [30.0, 30.0], [37.0, 36.9], [38.0, 49.91], [50.0, 51.7], [53.0, 60.12]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.56, 0.0, 0.0, 55.18, 0.0, 50.61], "audiomae_on_audioset": [null, null, [["hum", 39.03], ["mains hum", 35.2], ["music", 9.88]], null, null, null, null, null], "duration": [1.21, 0.53, 15.06, 0.0, -0.1, 11.91, 1.7, 7.12]} \ No newline at end of file diff --git a/annotations_filtered/oXpKBkMq_OM_filtered.json b/annotations_filtered/oXpKBkMq_OM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85fca763c0c3dde4ce2335a7a47272fc09295c52 --- /dev/null +++ b/annotations_filtered/oXpKBkMq_OM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 26.18], [27.0, 27.26], [29.0, 58.36]], "keep_status": [false, false, true], "silence_prob": [72.75, 0.0, 32.79], "audiomae_on_audioset": [null, null, [["music", 21.87], ["whack, thwack", 16.41], ["speech", 15.43]]], "duration": [6.18, 0.26, 29.36]} \ No newline at end of file diff --git a/annotations_filtered/oY0IQEEQ35g_filtered.json b/annotations_filtered/oY0IQEEQ35g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4950d22fea4ed8bb8077555f1ba2d4851ea826ea --- /dev/null +++ b/annotations_filtered/oY0IQEEQ35g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.12], [6.0, 6.13], [11.0, 12.87], [20.0, 20.12], [21.0, 21.68], [25.0, 28.04], [30.0, 39.92], [40.0, 41.13], [42.0, 55.93], [57.0, 57.5], [60.0, 91.62], [93.0, 110.76], [119.0, 141.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 92.8, 97.22, 0.0, 45.36, 0.0, 0.0, 36.43, 39.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["gong", 40.72], ["hum", 20.92], ["mains hum", 14.13]], null, null, [["music", 40.24], ["throbbing", 11.29], ["noise", 9.9]], [["music", 66.08], ["throbbing", 5.68], ["hum", 4.23]]], "duration": [1.12, 0.13, 1.87, 0.12, 0.68, 3.04, 9.92, 1.13, 13.93, 0.5, 31.62, 17.76, 22.32]} \ No newline at end of file diff --git a/annotations_filtered/oY0spjrKFdM_filtered.json b/annotations_filtered/oY0spjrKFdM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..653b11ffa4cf08116bf72ca61d4a11dea69b80c8 --- /dev/null +++ b/annotations_filtered/oY0spjrKFdM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.13], [11.0, 12.68], [17.0, 16.98], [24.0, 24.54], [34.0, 35.14], [38.0, 38.8], [45.0, 44.91], [46.0, 47.01], [59.0, 59.78], [61.0, 61.84], [67.0, 67.22], [71.0, 71.07], [72.0, 130.79], [133.0, 137.22], [142.0, 142.5], [148.0, 148.58], [160.0, 161.16], [164.0, 164.61], [167.0, 168.07], [175.0, 176.13], [180.0, 186.06], [187.0, 187.81], [191.0, 191.52], [198.0, 207.35], [208.0, 209.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.35, 0.0, 0.0, 31.21, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["brass instrument", 26.51], ["music", 24.26], ["trombone", 11.83]], null, null, null, null, null, null, [["music", 85.14], ["foghorn", 2.71], ["theremin", 1.08]], null, null, [["music", 74.86], ["boing", 4.4], ["theremin", 2.16]], null], "duration": [0.13, 1.68, -0.02, 0.54, 1.14, 0.8, -0.09, 1.01, 0.78, 0.84, 0.22, 0.07, 58.79, 4.22, 0.5, 0.58, 1.16, 0.61, 1.07, 1.13, 6.06, 0.81, 0.52, 9.35, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/oY1tp2HG06w_filtered.json b/annotations_filtered/oY1tp2HG06w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d18f2f6395142a0f0402cb9c55902665f95ed70 --- /dev/null +++ b/annotations_filtered/oY1tp2HG06w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.58], [8.0, 18.89], [20.0, 23.4], [25.0, 35.21], [37.0, 38.38], [41.0, 45.2], [53.0, 53.59], [57.0, 57.59], [58.0, 59.36], [60.0, 61.21], [67.0, 68.91], [70.0, 71.68], [76.0, 76.59], [78.0, 78.12], [78.0, 83.07], [83.0, 84.25], [85.0, 98.58], [100.0, 100.79], [104.0, 104.3], [105.0, 106.15], [107.0, 108.18], [110.0, 111.11], [112.0, 114.59], [117.0, 119.16], [121.0, 122.3], [124.0, 124.87], [128.0, 130.27], [136.0, 136.59], [143.0, 144.24], [147.0, 149.37], [151.0, 161.15], [166.0, 167.61], [169.0, 170.06], [171.0, 171.76], [178.0, 178.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 51.99, 64.52, 67.89, 0.0, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.57, 0.0, 66.15, 0.0, 0.0, 0.0, 0.0, 0.0, 43.1, 52.27, 0.0, 0.0, 39.28, 0.0, 0.0, 99.93, 32.66, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 77.43], ["sidetone", 3.12], ["dial tone", 2.75]], null, null, null, [["speech", 24.02], ["music", 5.02], ["buzz", 2.98]], null, null, null, [["music", 38.76], ["domestic animals, pets", 9.33], ["animal", 7.47]], null, null, null, null], "duration": [0.58, 10.89, 3.4, 10.21, 1.38, 4.2, 0.59, 0.59, 1.36, 1.21, 1.91, 1.68, 0.59, 0.12, 5.07, 1.25, 13.58, 0.79, 0.3, 1.15, 1.18, 1.11, 2.59, 2.16, 1.3, 0.87, 2.27, 0.59, 1.24, 2.37, 10.15, 1.61, 1.06, 0.76, 0.12]} \ No newline at end of file diff --git a/annotations_filtered/oY31D4QSB-Y_filtered.json b/annotations_filtered/oY31D4QSB-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2dbdb3c675500878b624396fedb1469f3bcd00a2 --- /dev/null +++ b/annotations_filtered/oY31D4QSB-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.08], [13.0, 18.98], [21.0, 21.88], [22.0, 21.96], [26.0, 28.93], [31.0, 35.82], [37.0, 43.92], [44.0, 77.16], [78.0, 85.11], [89.0, 106.66], [108.0, 114.37], [116.0, 116.01], [118.0, 118.84], [119.0, 121.26], [122.0, 124.8]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [98.8, 32.22, 0.0, 0.0, 70.44, 62.27, 50.26, 0.0, 33.68, 32.17, 32.58, 0.0, 0.0, 58.89, 64.86], "audiomae_on_audioset": [null, [["speech", 34.21], ["music", 23.36], ["outside, rural or natural", 3.38]], null, null, null, null, null, null, [["music", 59.86], ["noise", 19.02], ["cacophony", 2.33]], [["music", 48.34], ["noise", 14.12], ["cacophony", 5.06]], [["whale vocalization", 63.88], ["music", 13.89], ["mosquito", 2.46]], null, null, null, null], "duration": [3.08, 5.98, 0.88, -0.04, 2.93, 4.82, 6.92, 33.16, 7.11, 17.66, 6.37, 0.01, 0.84, 2.26, 2.8]} \ No newline at end of file diff --git a/annotations_filtered/oY7QReO1WOQ_filtered.json b/annotations_filtered/oY7QReO1WOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e77e080b176f546692373df582ebe7103c719cb1 --- /dev/null +++ b/annotations_filtered/oY7QReO1WOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.22], [9.0, 12.88], [18.0, 18.42], [22.0, 26.43], [31.0, 32.1], [37.0, 36.81], [38.0, 40.34], [49.0, 48.9], [60.0, 60.71]], "keep_status": [false, true, false, true, false, false, true, false, false], "silence_prob": [0.0, 33.35, 0.0, 31.75, 0.0, 0.0, 29.2, 0.0, 0.0], "audiomae_on_audioset": [null, [["gong", 29.96], ["hum", 18.64], ["speech", 14.43]], null, [["thunk", 19.74], ["crack", 18.72], ["breaking", 16.26]], null, null, [["speech", 34.76], ["beatboxing", 10.96], ["thump, thud", 5.81]], null, null], "duration": [1.22, 3.88, 0.42, 4.43, 1.1, -0.19, 2.34, -0.1, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/oYcKftzUS_Y_filtered.json b/annotations_filtered/oYcKftzUS_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66680e13ac8082f94827d64850e0a0893ce44e14 --- /dev/null +++ b/annotations_filtered/oYcKftzUS_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.52], [12.0, 12.83], [17.0, 18.1], [20.0, 19.72], [23.0, 24.43], [26.0, 26.65], [28.0, 28.95], [31.0, 31.23], [32.0, 35.78], [38.0, 39.58], [41.0, 42.21], [44.0, 45.98], [48.0, 49.77], [52.0, 55.97], [57.0, 58.7], [59.0, 60.69], [65.0, 66.6], [68.0, 69.35], [70.0, 71.98], [73.0, 74.11], [75.0, 78.04], [79.0, 80.67], [82.0, 83.32], [85.0, 90.61], [91.0, 94.39], [95.0, 97.06], [98.0, 98.78], [101.0, 102.34], [104.0, 107.38], [111.0, 113.8], [120.0, 122.01], [125.0, 129.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 99.31, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.83, 1.1, -0.28, 1.43, 0.65, 0.95, 0.23, 3.78, 1.58, 1.21, 1.98, 1.77, 3.97, 1.7, 1.69, 1.6, 1.35, 1.98, 1.11, 3.04, 1.67, 1.32, 5.61, 3.39, 2.06, 0.78, 1.34, 3.38, 2.8, 2.01, 4.63]} \ No newline at end of file diff --git a/annotations_filtered/oYet52yPgu0_filtered.json b/annotations_filtered/oYet52yPgu0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c158709677b87a31090fda1e7f3ffc57decdac44 --- /dev/null +++ b/annotations_filtered/oYet52yPgu0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 69.94], [70.0, 70.53], [74.0, 78.24], [80.0, 80.96], [92.0, 91.93], [92.0, 95.57], [101.0, 101.9], [103.0, 103.3], [106.0, 106.88]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.86, 0.0, 0.0, 36.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 36.23], ["mains hum", 32.1], ["throbbing", 4.46]], null, null, [["speech", 40.45], ["music", 31.29], ["quack", 7.1]], null, null, null], "duration": [-0.06, 0.53, 4.24, 0.96, -0.07, 3.57, 0.9, 0.3, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/oYx2teRxnvw_filtered.json b/annotations_filtered/oYx2teRxnvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc0a34a9775ce3716354c0b7035c36c83afdf865 --- /dev/null +++ b/annotations_filtered/oYx2teRxnvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.44], [15.0, 20.41], [22.0, 23.18], [24.0, 26.01], [29.0, 29.71], [38.0, 39.09], [43.0, 43.93], [49.0, 49.45], [51.0, 51.51], [53.0, 54.23], [56.0, 56.51], [57.0, 62.8], [65.0, 66.19], [70.0, 70.93], [72.0, 72.67], [75.0, 75.66], [79.0, 79.64], [83.0, 82.98], [84.0, 84.69], [87.0, 87.59], [90.0, 92.69], [93.0, 94.39], [95.0, 96.18], [97.0, 97.38], [98.0, 101.06], [102.0, 103.79], [105.0, 107.65], [108.0, 114.07], [120.0, 120.23], [127.0, 126.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 99.99, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.07, 0.0, 0.0, 0.0, 99.97, 0.0, 91.47, 83.7, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.44, 5.41, 1.18, 2.01, 0.71, 1.09, 0.93, 0.45, 0.51, 1.23, 0.51, 5.8, 1.19, 0.93, 0.67, 0.66, 0.64, -0.02, 0.69, 0.59, 2.69, 1.39, 1.18, 0.38, 3.06, 1.79, 2.65, 6.07, 0.23, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/oZ1Mz78d3wI_filtered.json b/annotations_filtered/oZ1Mz78d3wI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a53c52c6a4edcd2b3606e5c06a3c03ff37ef37e --- /dev/null +++ b/annotations_filtered/oZ1Mz78d3wI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 38.47], [39.0, 42.7], [43.0, 66.9], [67.0, 66.93], [69.0, 72.1], [75.0, 75.05], [77.0, 78.07], [81.0, 84.96], [85.0, 100.21], [101.0, 102.56], [104.0, 104.68], [107.0, 123.3], [125.0, 125.88], [127.0, 150.72], [151.0, 154.18], [157.0, 168.89]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, true, false, false, true, false], "silence_prob": [32.77, 31.01, 31.83, 0.0, 38.75, 0.0, 0.0, 40.92, 33.77, 0.0, 0.0, 39.18, 0.0, 32.48, 41.93, 35.47], "audiomae_on_audioset": [[["music", 77.05], ["throbbing", 3.53], ["hum", 1.96]], [["music", 35.19], ["singing", 7.17], ["chant", 6.74]], [["music", 55.09], ["throbbing", 5.6], ["synthesizer", 4.55]], null, [["music", 72.9], ["synthesizer", 6.33], ["pulse", 2.27]], null, null, [["music", 19.25], ["noise", 15.28], ["livestock, farm animals, working animals", 6.77]], [["music", 80.55], ["synthesizer", 3.19], ["noise", 2.58]], null, null, [["music", 29.41], ["fly, housefly", 18.23], ["insect", 9.52]], null, [["music", 77.84], ["groan", 4.35], ["carnatic music", 2.24]], [["music", 39.26], ["hum", 10.21], ["theremin", 9.22]], [["music", 58.07], ["theremin", 16.93], ["ambient music", 4.0]]], "duration": [24.47, 3.7, 23.9, -0.07, 3.1, 0.05, 1.07, 3.96, 15.21, 1.56, 0.68, 16.3, 0.88, 23.72, 3.18, 11.89]} \ No newline at end of file diff --git a/annotations_filtered/oZ28XpWmN00_filtered.json b/annotations_filtered/oZ28XpWmN00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..740813c2ac6c493f5e5b9499b2be913af49cc4d9 --- /dev/null +++ b/annotations_filtered/oZ28XpWmN00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.59], [8.0, 8.33], [12.0, 12.51], [21.0, 21.46], [31.0, 32.86], [36.0, 36.29], [42.0, 58.53], [59.0, 58.85], [60.0, 63.14], [64.0, 64.91], [66.0, 68.23], [71.0, 71.47], [76.0, 77.03], [80.0, 80.55], [82.0, 85.65], [96.0, 100.85], [106.0, 109.85], [112.0, 125.04]], "keep_status": [true, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, true, true], "silence_prob": [34.17, 0.0, 0.0, 0.0, 0.0, 0.0, 33.34, 0.0, 39.12, 0.0, 35.29, 0.0, 0.0, 0.0, 34.75, 34.63, 31.57, 32.03], "audiomae_on_audioset": [[["speech", 48.33], ["music", 17.43], ["hum", 3.79]], null, null, null, null, null, [["speech", 43.29], ["music", 28.56], ["buzz", 4.64]], null, [["speech", 28.29], ["hum", 15.36], ["mains hum", 11.76]], null, [["eruption", 22.67], ["music", 12.05], ["hum", 10.4]], null, null, null, [["speech", 15.42], ["eruption", 13.37], ["music", 10.89]], [["speech", 58.06], ["explosion", 10.38], ["eruption", 10.33]], [["speech", 33.64], ["music", 8.3], ["whack, thwack", 4.27]], [["music", 29.0], ["hum", 16.89], ["mains hum", 14.92]]], "duration": [3.59, 0.33, 0.51, 0.46, 1.86, 0.29, 16.53, -0.15, 3.14, 0.91, 2.23, 0.47, 1.03, 0.55, 3.65, 4.85, 3.85, 13.04]} \ No newline at end of file diff --git a/annotations_filtered/oZ868onS6YY_filtered.json b/annotations_filtered/oZ868onS6YY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/oZ868onS6YY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/oZEJTJSZQQs_filtered.json b/annotations_filtered/oZEJTJSZQQs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97c5f19b8dbc9db552bb877210ba67c5d4058280 --- /dev/null +++ b/annotations_filtered/oZEJTJSZQQs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.8], [6.0, 6.91], [8.0, 8.34], [12.0, 12.7], [19.0, 19.58], [22.0, 27.5], [28.0, 28.14], [35.0, 35.51], [42.0, 42.89], [44.0, 44.02], [47.0, 49.5], [50.0, 51.49], [52.0, 54.38], [58.0, 58.68], [66.0, 66.43], [71.0, 72.82], [80.0, 80.6], [81.0, 84.6], [88.0, 90.37], [91.0, 91.52], [102.0, 103.32], [105.0, 106.51], [109.0, 110.73], [113.0, 113.34], [115.0, 115.96], [120.0, 120.8], [124.0, 125.71], [137.0, 137.1], [140.0, 140.0], [146.0, 147.16], [150.0, 154.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 90.08, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 100.0, 77.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 0.91, 0.34, 0.7, 0.58, 5.5, 0.14, 0.51, 0.89, 0.02, 2.5, 1.49, 2.38, 0.68, 0.43, 1.82, 0.6, 3.6, 2.37, 0.52, 1.32, 1.51, 1.73, 0.34, 0.96, 0.8, 1.71, 0.1, 0.0, 1.16, 4.14]} \ No newline at end of file diff --git a/annotations_filtered/oZQ95ON2X-s_filtered.json b/annotations_filtered/oZQ95ON2X-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..445ea21d57fcc945c2060c195f0594c1b172d577 --- /dev/null +++ b/annotations_filtered/oZQ95ON2X-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.28], [8.0, 11.04], [22.0, 23.06], [24.0, 26.92], [29.0, 29.93], [31.0, 32.04], [41.0, 47.9], [50.0, 61.13], [62.0, 66.01], [70.0, 72.79], [74.0, 77.92], [88.0, 89.26], [91.0, 92.8], [95.0, 95.12], [109.0, 110.02], [111.0, 111.57], [112.0, 113.56], [115.0, 115.97], [116.0, 117.09], [118.0, 123.16], [124.0, 124.83], [127.0, 128.16], [131.0, 132.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.82, 0.0, 88.46, 0.0, 0.0, 69.07, 100.0, 100.0, 98.1, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 3.04, 1.06, 2.92, 0.93, 1.04, 6.9, 11.13, 4.01, 2.79, 3.92, 1.26, 1.8, 0.12, 1.02, 0.57, 1.56, 0.97, 1.09, 5.16, 0.83, 1.16, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/oZePQEUplJs_filtered.json b/annotations_filtered/oZePQEUplJs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ff6edc7e037dc9fa72e5d0ac8002e0d28ab0abe --- /dev/null +++ b/annotations_filtered/oZePQEUplJs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.05], [4.0, 4.97], [9.0, 15.58], [17.0, 18.89], [20.0, 24.16], [25.0, 26.4], [28.0, 28.75], [40.0, 42.38], [44.0, 43.83], [51.0, 52.73], [57.0, 59.29], [63.0, 65.1], [67.0, 74.39], [75.0, 79.44], [80.0, 84.64], [91.0, 90.91], [92.0, 92.74], [95.0, 95.32], [100.0, 103.0], [104.0, 105.87], [107.0, 108.21], [110.0, 110.67], [114.0, 115.94], [118.0, 120.29], [122.0, 125.39], [131.0, 132.0], [138.0, 139.65], [143.0, 143.83], [145.0, 145.89], [148.0, 149.15], [151.0, 153.01], [153.0, 153.15], [153.0, 153.2], [158.0, 158.25], [161.0, 162.33], [169.0, 170.23], [172.0, 174.18], [176.0, 179.68], [184.0, 184.91]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.84, 0.0, 32.28, 0.0, 0.0, 40.21, 0.0, 0.0, 62.78, 80.64, 42.81, 45.88, 40.29, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 90.6, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 32.51, 0.0, 0.0, 0.0, 0.0, 0.0, 73.51, 93.91, 0.0], "audiomae_on_audioset": [null, null, [["music", 56.62], ["speech", 11.51], ["radio", 9.56]], null, [["clip-clop", 12.48], ["hum", 11.84], ["horse", 10.68]], null, null, [["speech", 66.93], ["busy signal", 3.45], ["radio", 3.44]], null, null, null, null, [["speech", 44.33], ["sidetone", 15.51], ["radio", 10.32]], [["throbbing", 44.2], ["music", 16.13], ["hum", 7.28]], [["whale vocalization", 18.93], ["speech", 11.98], ["hum", 11.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.48], ["sidetone", 15.32], ["noise", 11.73]], null, null, null, null, null, null, null, null], "duration": [0.05, 0.97, 6.58, 1.89, 4.16, 1.4, 0.75, 2.38, -0.17, 1.73, 2.29, 2.1, 7.39, 4.44, 4.64, -0.09, 0.74, 0.32, 3.0, 1.87, 1.21, 0.67, 1.94, 2.29, 3.39, 1.0, 1.65, 0.83, 0.89, 1.15, 2.01, 0.15, 0.2, 0.25, 1.33, 1.23, 2.18, 3.68, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/oZlQMLXqw0g_filtered.json b/annotations_filtered/oZlQMLXqw0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f88c3718b9f0e792cb9d7b3186028c130744f1c --- /dev/null +++ b/annotations_filtered/oZlQMLXqw0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.37], [6.0, 8.26], [13.0, 13.27], [17.0, 18.84], [22.0, 22.45], [22.0, 23.67], [29.0, 30.48], [34.0, 34.28], [36.0, 54.13], [59.0, 59.09], [61.0, 62.07], [68.0, 69.04], [70.0, 70.55], [73.0, 74.12], [75.0, 75.54], [83.0, 84.38], [85.0, 85.67], [87.0, 90.32], [99.0, 99.22], [102.0, 101.76], [103.0, 105.14], [108.0, 109.19], [110.0, 111.33], [114.0, 114.44], [115.0, 116.41], [117.0, 125.34], [126.0, 126.87], [128.0, 130.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.13, 0.0, 0.0, 55.89, 0.0, 0.0, 0.0, 0.0, 36.93, 0.0, 36.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.78], ["harp", 31.12], ["musical instrument", 11.24]], null, [["music", 34.88], ["harp", 21.56], ["musical instrument", 17.4]]], "duration": [0.37, 2.26, 0.27, 1.84, 0.45, 1.67, 1.48, 0.28, 18.13, 0.09, 1.07, 1.04, 0.55, 1.12, 0.54, 1.38, 0.67, 3.32, 0.22, -0.24, 2.14, 1.19, 1.33, 0.44, 1.41, 8.34, 0.87, 2.81]} \ No newline at end of file diff --git a/annotations_filtered/oZu2JfM2Aq8_filtered.json b/annotations_filtered/oZu2JfM2Aq8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4321130cf24860ab4a5e43d4b0a9d5b9c9792c70 --- /dev/null +++ b/annotations_filtered/oZu2JfM2Aq8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.84], [13.0, 24.49], [26.0, 29.98], [31.0, 32.54], [33.0, 33.25], [41.0, 41.07], [48.0, 48.86], [51.0, 54.26], [55.0, 58.01], [61.0, 62.77], [63.0, 64.37], [66.0, 67.86], [71.0, 71.93], [73.0, 74.29], [83.0, 84.38], [92.0, 92.72], [95.0, 96.28], [97.0, 98.59], [100.0, 100.82], [103.0, 104.33], [105.0, 106.22], [107.0, 107.99], [110.0, 111.35], [112.0, 113.21], [114.0, 114.34], [119.0, 119.67], [122.0, 123.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [46.33, 75.07, 58.55, 0.0, 0.0, 0.0, 0.0, 50.06, 46.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["sidetone", 77.47], ["speech", 10.06], ["hum", 2.04]], null, null, null, null, null, null, null, [["speech", 67.03], ["sidetone", 6.26], ["sonar", 6.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.84, 11.49, 3.98, 1.54, 0.25, 0.07, 0.86, 3.26, 3.01, 1.77, 1.37, 1.86, 0.93, 1.29, 1.38, 0.72, 1.28, 1.59, 0.82, 1.33, 1.22, 0.99, 1.35, 1.21, 0.34, 0.67, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/oZzS9hBwaqg_filtered.json b/annotations_filtered/oZzS9hBwaqg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fb2e08d5803401361486ab6faff3c3cfb19701c --- /dev/null +++ b/annotations_filtered/oZzS9hBwaqg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.61], [10.0, 11.92], [13.0, 14.03], [15.0, 16.7], [20.0, 23.03], [24.0, 24.51], [25.0, 27.09], [29.0, 32.32], [34.0, 40.44], [42.0, 44.93], [47.0, 74.63], [77.0, 137.69], [138.0, 138.45]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [60.7, 0.0, 0.0, 0.0, 56.55, 0.0, 51.71, 46.94, 51.82, 49.78, 32.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 42.53], ["mains hum", 21.92], ["music", 19.89]], null, [["hum", 23.05], ["music", 17.8], ["mains hum", 7.86]], [["throbbing", 40.25], ["hum", 23.63], ["music", 16.59]], null, null], "duration": [3.61, 1.92, 1.03, 1.7, 3.03, 0.51, 2.09, 3.32, 6.44, 2.93, 27.63, 60.69, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/o_3BdeGhzrs_filtered.json b/annotations_filtered/o_3BdeGhzrs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a778f5b69050fd4910476b12b5b1abcab92db9a --- /dev/null +++ b/annotations_filtered/o_3BdeGhzrs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.8], [19.0, 20.48], [23.0, 43.16], [44.0, 55.44], [62.0, 72.98], [76.0, 145.98], [149.0, 155.9], [156.0, 156.63], [157.0, 157.91], [161.0, 184.57]], "keep_status": [false, false, false, false, true, false, true, false, false, false], "silence_prob": [30.51, 0.0, 30.43, 29.71, 29.85, 0.0, 31.35, 0.0, 0.0, 29.98], "audiomae_on_audioset": [[["speech", 39.54], ["music", 19.98], ["vehicle", 13.11]], null, [["music", 63.92], ["vehicle", 5.91], ["car", 5.03]], [["music", 50.91], ["throbbing", 10.5], ["hum", 9.85]], [["music", 54.92], ["electronic music", 5.48], ["hum", 4.85]], null, [["insect", 30.72], ["fly, housefly", 25.11], ["music", 12.49]], null, null, [["music", 42.68], ["throbbing", 22.27], ["hum", 14.69]]], "duration": [8.8, 1.48, 20.16, 11.44, 10.98, 69.98, 6.9, 0.63, 0.91, 23.57]} \ No newline at end of file diff --git a/annotations_filtered/o_49_kbx9yA_filtered.json b/annotations_filtered/o_49_kbx9yA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f482b75ab3a54c19010a615eabfd1936b525a709 --- /dev/null +++ b/annotations_filtered/o_49_kbx9yA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.65], [3.0, 3.55], [5.0, 7.16], [9.0, 10.76], [12.0, 14.4], [15.0, 17.29], [20.0, 24.27], [26.0, 27.55], [29.0, 33.0], [35.0, 48.64], [49.0, 50.52], [52.0, 64.96], [66.0, 67.46], [69.0, 79.59], [81.0, 81.67], [84.0, 103.62], [105.0, 115.62], [116.0, 116.63], [118.0, 121.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 96.77, 0.0, 99.85, 98.8, 91.81, 0.0, 89.36, 87.37, 0.0, 95.09, 0.0, 70.86, 0.0, 84.25, 82.97, 0.0, 93.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 0.55, 2.16, 1.76, 2.4, 2.29, 4.27, 1.55, 4.0, 13.64, 1.52, 12.96, 1.46, 10.59, 0.67, 19.62, 10.62, 0.63, 3.69]} \ No newline at end of file diff --git a/annotations_filtered/o_6VSJ_RjkE_filtered.json b/annotations_filtered/o_6VSJ_RjkE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28262155af8c433e7a4aa14494e1987f03dc4780 --- /dev/null +++ b/annotations_filtered/o_6VSJ_RjkE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.9], [5.0, 5.0], [5.0, 5.86], [13.0, 13.58], [15.0, 15.57]], "keep_status": [false, false, false, false, false], "silence_prob": [92.15, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [2.9, 0.0, 0.86, 0.58, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/o_N-H_5Pvu8_filtered.json b/annotations_filtered/o_N-H_5Pvu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e5846495e862b949daa17adc895d9f11fee62b6 --- /dev/null +++ b/annotations_filtered/o_N-H_5Pvu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.92], [9.0, 11.33], [12.0, 13.26], [15.0, 16.82], [20.0, 21.39], [22.0, 22.05], [23.0, 23.63], [25.0, 26.64], [28.0, 46.52], [47.0, 49.17], [50.0, 50.06], [51.0, 52.74], [55.0, 96.53], [100.0, 100.52], [101.0, 101.7], [103.0, 102.98], [104.0, 106.62], [107.0, 109.58], [110.0, 110.78]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 65.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.64, 35.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.6, 40.41, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["mains hum", 27.47], ["hum", 18.81], ["radio", 14.92]], [["sidetone", 42.96], ["speech", 16.63], ["hum", 13.91]], null, null, null, null, null, null, null, [["hum", 35.6], ["mains hum", 15.11], ["livestock, farm animals, working animals", 3.85]], null], "duration": [0.92, 2.33, 1.26, 1.82, 1.39, 0.05, 0.63, 1.64, 18.52, 2.17, 0.06, 1.74, 41.53, 0.52, 0.7, -0.02, 2.62, 2.58, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/o_vwPlWTrgo_filtered.json b/annotations_filtered/o_vwPlWTrgo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d8f8ffacdf9de47465eb3ef551bd600c8a946d7 --- /dev/null +++ b/annotations_filtered/o_vwPlWTrgo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.39], [14.0, 16.75], [19.0, 19.33], [22.0, 28.51], [29.0, 28.9], [29.0, 29.07], [29.0, 34.94], [39.0, 58.09], [59.0, 60.96], [62.0, 63.73], [64.0, 75.39], [76.0, 79.24], [84.0, 123.57], [127.0, 136.7], [137.0, 140.97]], "keep_status": [false, true, false, false, false, false, true, false, false, false, true, true, false, true, true], "silence_prob": [31.26, 34.22, 0.0, 30.81, 0.0, 0.0, 31.76, 30.21, 0.0, 0.0, 33.28, 37.8, 0.0, 32.79, 29.88], "audiomae_on_audioset": [[["music", 64.47], ["synthesizer", 7.22], ["musical instrument", 4.95]], [["speech", 34.99], ["music", 13.24], ["vehicle", 6.3]], null, [["speech", 38.36], ["music", 35.1], ["explosion", 2.71]], null, null, [["speech", 38.84], ["music", 19.77], ["gunshot, gunfire", 6.15]], [["speech", 41.58], ["music", 22.92], ["hum", 8.36]], null, null, [["music", 43.35], ["hum", 8.2], ["didgeridoo", 7.35]], [["music", 37.39], ["didgeridoo", 8.13], ["scary music", 5.25]], null, [["speech", 37.7], ["music", 13.15], ["buzz", 7.67]], [["music", 32.53], ["didgeridoo", 19.35], ["vehicle", 6.14]]], "duration": [9.39, 2.75, 0.33, 6.51, -0.1, 0.07, 5.94, 19.09, 1.96, 1.73, 11.39, 3.24, 39.57, 9.7, 3.97]} \ No newline at end of file diff --git a/annotations_filtered/o_yIykgKbeQ_filtered.json b/annotations_filtered/o_yIykgKbeQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..690e1c18d2370ac5f45b4cca816fc5739ad0eebe --- /dev/null +++ b/annotations_filtered/o_yIykgKbeQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.68], [7.0, 7.82], [10.0, 9.76], [11.0, 12.73], [14.0, 14.3], [15.0, 16.63], [17.0, 19.2], [21.0, 22.6], [28.0, 29.47], [34.0, 34.6], [38.0, 38.37], [40.0, 40.37], [42.0, 42.5], [43.0, 44.59], [46.0, 47.85], [49.0, 50.23], [51.0, 52.35], [54.0, 53.94], [55.0, 56.62], [60.0, 61.35], [62.0, 63.78], [65.0, 66.01], [69.0, 69.75], [75.0, 76.49], [77.0, 77.97], [80.0, 81.51], [84.0, 84.74], [86.0, 87.37], [88.0, 90.15], [91.0, 91.54], [93.0, 93.56], [95.0, 95.82], [97.0, 99.27], [103.0, 104.57], [106.0, 108.57], [110.0, 110.64], [113.0, 119.5], [120.0, 121.81], [124.0, 127.08]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.62, 0.0, 0.0, 0.0, 30.64, 0.0, 37.31, 0.0, 79.59, 0.0, 56.93], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 30.77], ["fly, housefly", 9.86], ["insect", 7.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 34.02], ["cattle, bovinae", 31.64], ["moo", 27.61]], null, null, null, [["cattle, bovinae", 21.34], ["moo", 14.21], ["livestock, farm animals, working animals", 12.48]], null, [["fly, housefly", 21.88], ["livestock, farm animals, working animals", 15.99], ["insect", 13.58]], null, null, null, null], "duration": [1.68, 0.82, -0.24, 1.73, 0.3, 1.63, 2.2, 1.6, 1.47, 0.6, 0.37, 0.37, 0.5, 1.59, 1.85, 1.23, 1.35, -0.06, 1.62, 1.35, 1.78, 1.01, 0.75, 1.49, 0.97, 1.51, 0.74, 1.37, 2.15, 0.54, 0.56, 0.82, 2.27, 1.57, 2.57, 0.64, 6.5, 1.81, 3.08]} \ No newline at end of file diff --git a/annotations_filtered/oaKjYmfK_Pw_filtered.json b/annotations_filtered/oaKjYmfK_Pw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..097e3229cb8ceef0117aedb6261c5e7bad422a45 --- /dev/null +++ b/annotations_filtered/oaKjYmfK_Pw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.32], [3.0, 9.78], [11.0, 11.43], [13.0, 13.42], [15.0, 16.07], [17.0, 19.82], [21.0, 22.22], [23.0, 23.41], [26.0, 27.43], [32.0, 32.63], [35.0, 35.21], [39.0, 39.72], [50.0, 51.49], [52.0, 54.63], [59.0, 59.49], [61.0, 62.24], [63.0, 64.03], [65.0, 66.21], [68.0, 68.49], [73.0, 76.69], [78.0, 79.89], [80.0, 83.54], [85.0, 85.92], [95.0, 96.58], [104.0, 113.43], [116.0, 118.18], [121.0, 120.95], [121.0, 121.1], [123.0, 127.94], [138.0, 139.21], [141.0, 141.2], [143.0, 143.14], [144.0, 146.23], [147.0, 153.3], [154.0, 156.09], [158.0, 170.41], [172.0, 173.28], [174.0, 174.82], [176.0, 177.11], [178.0, 181.9], [184.0, 189.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.17, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 0.0, 39.49, 0.0, 0.0, 97.33, 99.88, 0.0, 0.0, 58.38, 0.0, 0.0, 0.0, 75.39, 99.84, 99.36, 72.46, 0.0, 0.0, 0.0, 68.15, 69.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 26.7], ["speech", 19.92], ["music", 9.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 6.78, 0.43, 0.42, 1.07, 2.82, 1.22, 0.41, 1.43, 0.63, 0.21, 0.72, 1.49, 2.63, 0.49, 1.24, 1.03, 1.21, 0.49, 3.69, 1.89, 3.54, 0.92, 1.58, 9.43, 2.18, -0.05, 0.1, 4.94, 1.21, 0.2, 0.14, 2.23, 6.3, 2.09, 12.41, 1.28, 0.82, 1.11, 3.9, 5.57]} \ No newline at end of file diff --git a/annotations_filtered/oaVuVu5KXuE_filtered.json b/annotations_filtered/oaVuVu5KXuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8ec45713dab7df3253a70ed015819acd7a89b39 --- /dev/null +++ b/annotations_filtered/oaVuVu5KXuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.93], [11.0, 11.6], [12.0, 22.22], [23.0, 23.48], [25.0, 27.58], [29.0, 30.18], [31.0, 32.95], [33.0, 36.66], [37.0, 36.83], [38.0, 42.18], [44.0, 46.94], [48.0, 52.96], [54.0, 56.22], [57.0, 58.92], [60.0, 62.43], [64.0, 67.04], [71.0, 74.48], [76.0, 78.26], [80.0, 83.0], [85.0, 85.62], [86.0, 87.78], [89.0, 91.02], [93.0, 94.98], [96.0, 96.84], [98.0, 99.23], [100.0, 100.97], [102.0, 102.3], [103.0, 104.45], [106.0, 106.83], [108.0, 108.75], [109.0, 118.32], [121.0, 121.47], [123.0, 123.65], [125.0, 125.56], [128.0, 130.65], [131.0, 140.04], [142.0, 147.58], [149.0, 153.4], [155.0, 156.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.72, 0.0, 100.0, 0.0, 0.0, 29.96, 0.0, 35.47, 99.98, 42.72, 70.86, 0.0, 100.0, 100.0, 100.0, 47.05, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.89, 0.0, 0.0, 0.0, 100.0, 56.48, 100.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 91.78], ["fart", 1.59], ["hum", 0.86]], null, null, null, null, [["speech", 56.34], ["beatboxing", 33.64], ["vocal music", 0.92]], null, [["speech", 61.31], ["music", 5.79], ["sidetone", 4.42]], null, [["sine wave", 33.57], ["sidetone", 19.69], ["speech", 12.38]], null, null, null, null, null, [["tuning fork", 34.21], ["chirp tone", 20.71], ["speech", 20.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.93, 0.6, 10.22, 0.48, 2.58, 1.18, 1.95, 3.66, -0.17, 4.18, 2.94, 4.96, 2.22, 1.92, 2.43, 3.04, 3.48, 2.26, 3.0, 0.62, 1.78, 2.02, 1.98, 0.84, 1.23, 0.97, 0.3, 1.45, 0.83, 0.75, 9.32, 0.47, 0.65, 0.56, 2.65, 9.04, 5.58, 4.4, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/oaqTzvd4aq8_filtered.json b/annotations_filtered/oaqTzvd4aq8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6b022251062a66ac389f6c140ab33cc9b37e6bf --- /dev/null +++ b/annotations_filtered/oaqTzvd4aq8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.18], [21.0, 21.88], [28.0, 27.82], [32.0, 32.75], [39.0, 39.19], [46.0, 46.85], [55.0, 56.1], [58.0, 58.92], [63.0, 63.09], [67.0, 67.31], [69.0, 69.3], [73.0, 73.92], [85.0, 85.5], [90.0, 90.58], [100.0, 101.7], [103.0, 103.47], [105.0, 107.59], [110.0, 111.2], [118.0, 119.58], [121.0, 124.19]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [40.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.56, 0.0, 0.0, 31.59], "audiomae_on_audioset": [[["sidetone", 43.5], ["radio", 17.68], ["hum", 7.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.9], ["theremin", 8.36], ["musical instrument", 3.39]], null, null, [["music", 40.98], ["frog", 11.38], ["fly, housefly", 9.51]]], "duration": [2.18, 0.88, -0.18, 0.75, 0.19, 0.85, 1.1, 0.92, 0.09, 0.31, 0.3, 0.92, 0.5, 0.58, 1.7, 0.47, 2.59, 1.2, 1.58, 3.19]} \ No newline at end of file diff --git a/annotations_filtered/ob2QomOgStQ_filtered.json b/annotations_filtered/ob2QomOgStQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e4eba83b3d2d04d2d3c9997f19c663675e500c7 --- /dev/null +++ b/annotations_filtered/ob2QomOgStQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 117.59], [124.0, 124.17], [124.0, 135.57], [136.0, 156.19], [158.0, 169.43], [171.0, 204.42]], "keep_status": [false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 29.13, 29.54, 30.04, 0.0], "audiomae_on_audioset": [null, null, [["hum", 17.73], ["music", 14.71], ["throbbing", 14.43]], [["music", 50.2], ["hum", 6.58], ["speech", 4.94]], [["music", 65.18], ["synthesizer", 5.48], ["speech", 5.48]], null], "duration": [100.59, 0.17, 11.57, 20.19, 11.43, 33.42]} \ No newline at end of file diff --git a/annotations_filtered/obDVqhso9l4_filtered.json b/annotations_filtered/obDVqhso9l4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8fac23709ca41907da735250a32a2e2de8b535f --- /dev/null +++ b/annotations_filtered/obDVqhso9l4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 22.84], [24.0, 27.4], [30.0, 36.07], [37.0, 37.72], [43.0, 43.24], [45.0, 45.82], [47.0, 47.24], [57.0, 57.15]], "keep_status": [true, true, true, false, false, false, false, false], "silence_prob": [39.75, 37.85, 37.44, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["noise", 37.64], ["music", 16.52], ["hum", 8.98]], [["music", 32.56], ["wind chime", 7.74], ["effects unit", 7.31]], [["music", 36.15], ["livestock, farm animals, working animals", 13.33], ["didgeridoo", 8.13]], null, null, null, null, null], "duration": [13.84, 3.4, 6.07, 0.72, 0.24, 0.82, 0.24, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/ob_6XAhj_1U_filtered.json b/annotations_filtered/ob_6XAhj_1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22af92ece19cf9c06ad0bc09a9fbb2375325edb9 --- /dev/null +++ b/annotations_filtered/ob_6XAhj_1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.21], [2.0, 2.61], [5.0, 5.73], [10.0, 10.56], [15.0, 16.21], [21.0, 22.2], [23.0, 23.14], [23.0, 24.36], [50.0, 49.96], [60.0, 66.61], [69.0, 69.84], [71.0, 73.67], [74.0, 75.96], [78.0, 78.66], [89.0, 92.42], [99.0, 99.01], [102.0, 102.17], [105.0, 106.17], [108.0, 114.84], [124.0, 126.06], [129.0, 130.91], [133.0, 133.56], [135.0, 136.61], [140.0, 141.69], [142.0, 143.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.4, 0.0, 38.54, 0.0, 0.0, 38.0, 0.0, 0.0, 0.0, 35.64, 39.15, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 43.78], ["hum", 16.6], ["throbbing", 11.34]], null, [["music", 86.93], ["hum", 1.92], ["throbbing", 1.69]], null, null, [["music", 44.48], ["cattle, bovinae", 8.57], ["moo", 6.22]], null, null, null, [["music", 39.7], ["speech", 10.26], ["throbbing", 6.88]], [["music", 31.54], ["speech", 8.18], ["fly, housefly", 5.98]], null, null, null, null, null], "duration": [0.21, 0.61, 0.73, 0.56, 1.21, 1.2, 0.14, 1.36, -0.04, 6.61, 0.84, 2.67, 1.96, 0.66, 3.42, 0.01, 0.17, 1.17, 6.84, 2.06, 1.91, 0.56, 1.61, 1.69, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/obeGwYOdAPc_filtered.json b/annotations_filtered/obeGwYOdAPc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3814366b5075ce78d2ee74426455ef9b6cdde4d --- /dev/null +++ b/annotations_filtered/obeGwYOdAPc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [4.0, 4.28], [9.0, 8.88], [10.0, 10.29], [11.0, 12.82], [30.0, 30.82], [32.0, 37.05], [37.0, 38.35], [40.0, 45.01], [46.0, 62.72], [63.0, 68.45], [75.0, 75.52], [77.0, 85.77], [87.0, 90.29], [91.0, 91.45], [97.0, 100.43], [103.0, 107.42], [109.0, 113.22], [114.0, 116.9], [119.0, 120.29], [121.0, 137.4], [140.0, 150.2], [151.0, 155.28], [158.0, 160.0], [161.0, 161.38]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, false, true, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.66, 0.0, 66.39, 36.94, 70.16, 0.0, 50.31, 33.04, 0.0, 50.02, 45.43, 31.58, 45.21, 0.0, 33.2, 42.37, 52.33, 71.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 39.61], ["breaking", 18.8], ["whack, thwack", 11.43]], null, null, [["gunshot, gunfire", 19.57], ["speech", 13.85], ["whack, thwack", 7.89]], null, null, null, [["whack, thwack", 25.68], ["sound effect", 5.07], ["gunshot, gunfire", 4.72]], null, null, [["speech", 28.92], ["music", 22.0], ["throbbing", 13.65]], [["speech", 39.01], ["music", 25.38], ["burst, pop", 5.86]], [["speech", 38.99], ["music", 20.47], ["animal", 1.78]], null, [["speech", 59.65], ["music", 13.32], ["machine gun", 5.61]], [["whack, thwack", 52.59], ["hum", 10.05], ["thunk", 3.63]], null, null, null], "duration": [0.67, 0.28, -0.12, 0.29, 1.82, 0.82, 5.05, 1.35, 5.01, 16.72, 5.45, 0.52, 8.77, 3.29, 0.45, 3.43, 4.42, 4.22, 2.9, 1.29, 16.4, 10.2, 4.28, 2.0, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/obn9BZj6V-M_filtered.json b/annotations_filtered/obn9BZj6V-M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7261d2a4fb430b5b10fa07bbcc23a9e2109839d1 --- /dev/null +++ b/annotations_filtered/obn9BZj6V-M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.41], [5.0, 5.83], [9.0, 10.66], [15.0, 16.01], [18.0, 20.24], [24.0, 27.31], [29.0, 30.84], [33.0, 33.64], [37.0, 43.28], [45.0, 59.58], [61.0, 93.77], [95.0, 96.82], [98.0, 98.42], [100.0, 102.76], [106.0, 110.15], [115.0, 125.1], [127.0, 131.52], [135.0, 136.56], [139.0, 150.67], [153.0, 158.94], [161.0, 164.59], [167.0, 168.05], [170.0, 173.37], [175.0, 194.93], [196.0, 197.16], [198.0, 222.78], [223.0, 224.87], [225.0, 225.58], [227.0, 227.94], [229.0, 229.8]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, true, true, false, true, false, false, false, true, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 45.72, 52.16, 0.0, 0.0, 32.03, 28.78, 0.0, 0.0, 0.0, 30.66, 30.02, 30.77, 34.65, 0.0, 31.54, 30.2, 28.39, 0.0, 33.92, 28.9, 0.0, 28.95, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 29.83], ["singing bowl", 17.36], ["theremin", 10.22]], null, null, null, [["music", 37.93], ["whale vocalization", 13.49], ["synthesizer", 9.39]], [["speech", 62.94], ["music", 26.74], ["outside, rural or natural", 1.15]], null, null, null, [["speech", 15.56], ["foghorn", 14.88], ["civil defense siren", 9.51]], [["music", 36.29], ["fly, housefly", 7.13], ["mains hum", 7.06]], [["music", 46.71], ["theremin", 35.51], ["hum", 4.91]], [["music", 31.35], ["speech", 17.81], ["whale vocalization", 15.01]], null, [["music", 58.85], ["hum", 14.37], ["electronic music", 7.66]], [["mains hum", 26.84], ["hum", 26.81], ["music", 22.19]], [["music", 20.43], ["vehicle", 7.86], ["rumble", 7.57]], null, [["speech", 21.47], ["music", 16.32], ["civil defense siren", 9.71]], [["music", 66.79], ["theremin", 16.73], ["electronic music", 2.78]], null, [["music", 54.79], ["sound effect", 5.23], ["musical instrument", 3.48]], null, null, null, null], "duration": [0.41, 0.83, 1.66, 1.01, 2.24, 3.31, 1.84, 0.64, 6.28, 14.58, 32.77, 1.82, 0.42, 2.76, 4.15, 10.1, 4.52, 1.56, 11.67, 5.94, 3.59, 1.05, 3.37, 19.93, 1.16, 24.78, 1.87, 0.58, 0.94, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/obnODOdLD7k_filtered.json b/annotations_filtered/obnODOdLD7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c64d82a9186cf9e806e4e1aeaf407904ec98dde4 --- /dev/null +++ b/annotations_filtered/obnODOdLD7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.21], [7.0, 7.33], [10.0, 10.02], [16.0, 20.02], [27.0, 30.35], [36.0, 36.44], [39.0, 39.26], [42.0, 42.8], [44.0, 45.22], [45.0, 47.16], [49.0, 49.81], [50.0, 51.44], [52.0, 55.56], [56.0, 58.41], [62.0, 62.28], [63.0, 65.85], [68.0, 67.78], [71.0, 71.46], [72.0, 73.48], [75.0, 75.76], [77.0, 77.45], [78.0, 79.76], [81.0, 83.05], [85.0, 87.18], [89.0, 90.04], [90.0, 91.57], [98.0, 101.04], [101.0, 105.85], [106.0, 106.22], [106.0, 108.35], [109.0, 108.57], [109.0, 118.3], [119.0, 120.92], [121.0, 121.71]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.72, 46.97, 0.0, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 44.87, 73.21, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 99.97, 0.0, 0.0, 98.59, 71.0, 0.0, 66.76, 0.0, 61.87, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 85.12], ["whack, thwack", 5.9], ["thunk", 3.49]], [["radio", 23.39], ["frog", 12.99], ["livestock, farm animals, working animals", 10.66]], null, null, null, null, null, null, null, [["speech", 34.74], ["radio", 14.44], ["whale vocalization", 7.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.21, 0.33, 0.02, 4.02, 3.35, 0.44, 0.26, 0.8, 1.22, 2.16, 0.81, 1.44, 3.56, 2.41, 0.28, 2.85, -0.22, 0.46, 1.48, 0.76, 0.45, 1.76, 2.05, 2.18, 1.04, 1.57, 3.04, 4.85, 0.22, 2.35, -0.43, 9.3, 1.92, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/oc8Hm_t5BRo_filtered.json b/annotations_filtered/oc8Hm_t5BRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0dda91e20b9c0eeee55e89646827fde77b7c735 --- /dev/null +++ b/annotations_filtered/oc8Hm_t5BRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.56], [6.0, 9.39], [11.0, 37.18], [39.0, 47.39], [52.0, 62.19], [66.0, 66.56], [71.0, 79.78], [82.0, 91.18], [93.0, 93.88], [96.0, 96.25], [97.0, 99.45], [100.0, 109.04], [110.0, 130.77], [135.0, 134.76], [136.0, 153.15], [154.0, 154.3], [156.0, 158.57]], "keep_status": [false, true, true, false, true, false, true, true, false, false, false, true, true, false, false, false, true], "silence_prob": [53.78, 40.97, 29.79, 30.02, 29.13, 0.0, 29.83, 30.57, 0.0, 0.0, 33.92, 28.53, 28.64, 0.0, 28.54, 0.0, 28.58], "audiomae_on_audioset": [null, [["music", 40.56], ["throbbing", 9.61], ["hum", 9.39]], [["hum", 33.56], ["music", 25.7], ["rumble", 9.36]], [["mains hum", 39.02], ["hum", 33.54], ["speech", 13.7]], [["speech", 30.1], ["music", 11.71], ["vehicle", 9.66]], null, [["music", 24.76], ["hum", 20.79], ["mains hum", 16.86]], [["vehicle", 15.26], ["car", 13.97], ["race car, auto racing", 9.94]], null, null, [["hum", 37.94], ["throbbing", 27.59], ["music", 12.16]], [["music", 37.38], ["speech", 14.57], ["groan", 7.59]], [["animal", 27.7], ["roaring cats (lions, tigers)", 22.9], ["wild animals", 18.93]], null, [["vehicle", 52.04], ["car", 26.54], ["race car, auto racing", 6.04]], null, [["sheep", 29.41], ["bleat", 19.27], ["chant", 6.44]]], "duration": [2.56, 3.39, 26.18, 8.39, 10.19, 0.56, 8.78, 9.18, 0.88, 0.25, 2.45, 9.04, 20.77, -0.24, 17.15, 0.3, 2.57]} \ No newline at end of file diff --git a/annotations_filtered/oc8bWybEFFI_filtered.json b/annotations_filtered/oc8bWybEFFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41baa962a94d32db43d666ee174b2caf0933ee06 --- /dev/null +++ b/annotations_filtered/oc8bWybEFFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.62], [17.0, 17.59], [19.0, 19.45], [26.0, 29.64], [32.0, 43.31], [47.0, 48.81], [50.0, 56.94], [62.0, 62.19], [64.0, 64.61], [74.0, 93.88], [94.0, 96.63], [123.0, 124.82], [125.0, 125.79], [127.0, 127.52], [130.0, 130.55], [132.0, 132.81], [134.0, 135.63], [138.0, 138.21], [140.0, 140.05], [142.0, 142.67], [145.0, 149.93], [155.0, 156.2], [165.0, 168.64], [177.0, 177.31], [178.0, 178.61], [179.0, 180.23]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 94.66, 32.21, 0.0, 33.1, 0.0, 0.0, 30.16, 39.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.31, 0.0, 42.02, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["gong", 73.31], ["music", 13.63], ["hum", 2.81]], null, [["mosquito", 66.4], ["fly, housefly", 14.69], ["whip", 5.33]], null, null, [["whack, thwack", 17.83], ["mosquito", 6.97], ["groan", 6.95]], [["music", 38.87], ["sidetone", 31.35], ["speech", 6.67]], null, null, null, null, null, null, null, null, null, [["speech", 27.43], ["fly, housefly", 25.5], ["insect", 19.03]], null, [["fly, housefly", 27.72], ["speech", 15.1], ["insect", 14.47]], null, null, null], "duration": [0.62, 0.59, 0.45, 3.64, 11.31, 1.81, 6.94, 0.19, 0.61, 19.88, 2.63, 1.82, 0.79, 0.52, 0.55, 0.81, 1.63, 0.21, 0.05, 0.67, 4.93, 1.2, 3.64, 0.31, 0.61, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/ocDL_b6BRE4_filtered.json b/annotations_filtered/ocDL_b6BRE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17f314315ebe6f1dcdf60b890b21920bc8da07e9 --- /dev/null +++ b/annotations_filtered/ocDL_b6BRE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.08], [6.0, 7.87], [14.0, 14.15], [15.0, 15.9], [31.0, 33.17], [34.0, 35.65], [39.0, 39.07], [42.0, 44.04], [45.0, 47.07], [49.0, 49.81], [53.0, 53.3], [57.0, 57.6], [58.0, 60.72], [63.0, 71.85], [76.0, 78.63], [85.0, 86.58], [91.0, 92.33], [94.0, 95.77], [97.0, 99.5], [101.0, 106.84], [108.0, 109.19], [114.0, 114.49], [117.0, 116.9], [118.0, 118.44], [120.0, 120.77], [123.0, 124.39], [126.0, 128.6], [129.0, 128.63], [147.0, 149.99], [158.0, 158.62], [166.0, 166.46], [169.0, 170.83], [175.0, 178.29], [179.0, 184.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 73.06, 0.0, 0.0, 99.56, 67.89, 0.0, 0.0, 0.0, 73.51, 39.86, 91.98, 0.0, 0.0, 0.0, 77.7, 34.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.97, 0.0, 73.51, 0.0, 0.0, 0.0, 35.88, 90.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.99], ["wind instrument, woodwind instrument", 13.72], ["flute", 11.09]], null, null, null, null, null, [["music", 74.97], ["lullaby", 3.52], ["singing bowl", 3.06]], null, null, null, null, null, null, [["music", 63.67], ["theremin", 8.92], ["wind instrument, woodwind instrument", 2.86]], null, null, null, null, null, [["music", 48.16], ["theremin", 19.2], ["synthesizer", 4.37]], null], "duration": [0.08, 1.87, 0.15, 0.9, 2.17, 1.65, 0.07, 2.04, 2.07, 0.81, 0.3, 0.6, 2.72, 8.85, 2.63, 1.58, 1.33, 1.77, 2.5, 5.84, 1.19, 0.49, -0.1, 0.44, 0.77, 1.39, 2.6, -0.37, 2.99, 0.62, 0.46, 1.83, 3.29, 5.86]} \ No newline at end of file diff --git a/annotations_filtered/ocb7pXndlug_filtered.json b/annotations_filtered/ocb7pXndlug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ffd5bfff7ff8b86cf19aaff9137a26c386e35eb --- /dev/null +++ b/annotations_filtered/ocb7pXndlug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.33], [4.0, 14.44], [25.0, 25.93], [45.0, 72.35], [75.0, 76.35], [77.0, 81.01], [81.0, 84.62], [86.0, 88.05], [89.0, 93.85]], "keep_status": [false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 34.22, 0.0, 29.47, 0.0, 31.47, 36.72, 99.95, 82.43], "audiomae_on_audioset": [null, [["cattle, bovinae", 43.65], ["livestock, farm animals, working animals", 35.71], ["moo", 10.61]], null, [["speech", 38.23], ["explosion", 16.59], ["groan", 10.84]], null, [["crushing", 34.53], ["creak", 13.34], ["crack", 10.09]], [["chirp tone", 18.91], ["noise", 13.9], ["music", 8.33]], null, null], "duration": [0.33, 10.44, 0.93, 27.35, 1.35, 4.01, 3.62, 2.05, 4.85]} \ No newline at end of file diff --git a/annotations_filtered/oceYG6ogT_E_filtered.json b/annotations_filtered/oceYG6ogT_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e24390640130b096c8cb76278f6e43f93875d5a --- /dev/null +++ b/annotations_filtered/oceYG6ogT_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.49], [12.0, 12.43], [15.0, 19.65], [21.0, 21.73], [23.0, 23.72], [26.0, 27.58], [38.0, 39.28], [40.0, 40.78], [41.0, 42.42], [43.0, 43.21], [44.0, 44.29], [48.0, 49.42], [51.0, 51.92], [57.0, 57.06], [59.0, 59.39], [60.0, 60.05], [63.0, 63.12], [65.0, 65.57], [66.0, 67.66], [94.0, 94.49], [113.0, 114.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.49, 0.43, 4.65, 0.73, 0.72, 1.58, 1.28, 0.78, 1.42, 0.21, 0.29, 1.42, 0.92, 0.06, 0.39, 0.05, 0.12, 0.57, 1.66, 0.49, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/ocyplDqvhuo_filtered.json b/annotations_filtered/ocyplDqvhuo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14c2835ea03a66255dfb6d56410f576ef4ba489c --- /dev/null +++ b/annotations_filtered/ocyplDqvhuo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.38], [13.0, 14.66], [17.0, 18.47], [20.0, 20.26], [22.0, 23.14], [25.0, 25.79], [27.0, 28.17], [30.0, 30.62], [31.0, 32.29], [33.0, 34.11], [36.0, 49.4], [51.0, 52.3], [56.0, 56.93], [59.0, 63.66], [65.0, 65.8], [70.0, 71.02], [73.0, 75.02], [78.0, 79.86], [81.0, 81.33], [83.0, 86.19], [87.0, 89.68], [92.0, 95.18], [96.0, 96.45], [97.0, 97.95], [102.0, 103.33], [104.0, 106.03], [107.0, 115.05], [116.0, 116.75], [118.0, 120.68], [123.0, 125.04], [125.0, 127.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0, 0.0, 99.9, 0.0, 0.0, 99.36, 0.0, 0.0, 99.52, 99.4, 99.48, 0.0, 0.0, 0.0, 100.0, 99.1, 0.0, 99.48, 95.51, 99.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.38, 1.66, 1.47, 0.26, 1.14, 0.79, 1.17, 0.62, 1.29, 1.11, 13.4, 1.3, 0.93, 4.66, 0.8, 1.02, 2.02, 1.86, 0.33, 3.19, 2.68, 3.18, 0.45, 0.95, 1.33, 2.03, 8.05, 0.75, 2.68, 2.04, 2.26]} \ No newline at end of file diff --git a/annotations_filtered/od6IxUWPMcs_filtered.json b/annotations_filtered/od6IxUWPMcs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8df0706b5a6293ff03489b62ab0cdd28466d4db --- /dev/null +++ b/annotations_filtered/od6IxUWPMcs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.29], [13.0, 13.07], [17.0, 31.45], [35.0, 35.78], [38.0, 39.83], [41.0, 45.25], [51.0, 55.21], [57.0, 57.37], [66.0, 68.52], [70.0, 77.26], [80.0, 81.4], [85.0, 87.35], [93.0, 93.66], [97.0, 97.17], [101.0, 101.24], [104.0, 106.34], [108.0, 110.29], [143.0, 149.15], [152.0, 152.51], [158.0, 159.49], [163.0, 164.94], [166.0, 166.7], [168.0, 172.47]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 33.14, 0.0, 0.0, 79.41, 47.2, 0.0, 54.63, 47.39, 0.0, 48.52, 0.0, 0.0, 0.0, 55.89, 55.18, 43.15, 0.0, 0.0, 0.0, 0.0, 48.14], "audiomae_on_audioset": [null, null, [["throbbing", 38.45], ["hum", 36.44], ["music", 13.98]], null, null, null, [["sidetone", 48.42], ["hum", 18.01], ["mains hum", 10.15]], null, null, [["sidetone", 49.02], ["throbbing", 10.16], ["speech", 9.52]], null, [["hum", 41.76], ["mains hum", 16.76], ["whale vocalization", 8.36]], null, null, null, null, null, [["hum", 31.53], ["speech", 14.26], ["throbbing", 13.92]], null, null, null, null, [["speech", 16.85], ["radio", 11.11], ["hum", 10.98]]], "duration": [0.29, 0.07, 14.45, 0.78, 1.83, 4.25, 4.21, 0.37, 2.52, 7.26, 1.4, 2.35, 0.66, 0.17, 0.24, 2.34, 2.29, 6.15, 0.51, 1.49, 1.94, 0.7, 4.47]} \ No newline at end of file diff --git a/annotations_filtered/odEociFdDN4_filtered.json b/annotations_filtered/odEociFdDN4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c04dfa4422477158edf1fd3f57e44bd8a60f2c2 --- /dev/null +++ b/annotations_filtered/odEociFdDN4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.32], [8.0, 8.67], [9.0, 9.85], [10.0, 12.16], [19.0, 22.3], [23.0, 24.39], [29.0, 30.05], [33.0, 38.82], [41.0, 41.2], [43.0, 43.36], [45.0, 45.71], [50.0, 50.94], [52.0, 54.85], [58.0, 58.68], [63.0, 65.35], [66.0, 66.7], [68.0, 69.6], [71.0, 71.66], [72.0, 74.44], [76.0, 76.79], [78.0, 78.71], [82.0, 84.28], [85.0, 85.89], [87.0, 93.46], [99.0, 112.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 83.16, 85.35, 0.0, 0.0, 97.11, 0.0, 0.0, 0.0, 0.0, 92.31, 0.0, 98.99, 0.0, 0.0, 0.0, 86.09, 0.0, 0.0, 81.53, 0.0, 69.61, 60.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 0.67, 0.85, 2.16, 3.3, 1.39, 1.05, 5.82, 0.2, 0.36, 0.71, 0.94, 2.85, 0.68, 2.35, 0.7, 1.6, 0.66, 2.44, 0.79, 0.71, 2.28, 0.89, 6.46, 13.21]} \ No newline at end of file diff --git a/annotations_filtered/odNZhZSydNc_filtered.json b/annotations_filtered/odNZhZSydNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34f89f8bf32ac4aac5af5a5bbfd3f4ccb31f12b3 --- /dev/null +++ b/annotations_filtered/odNZhZSydNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.71], [4.0, 4.53], [9.0, 14.07], [15.0, 15.9], [18.0, 17.64], [19.0, 19.52], [22.0, 22.57], [24.0, 24.8], [26.0, 26.7], [28.0, 28.39], [31.0, 33.27], [35.0, 35.68], [37.0, 37.56], [42.0, 44.64], [45.0, 46.09], [48.0, 48.39], [54.0, 55.17], [59.0, 59.51], [61.0, 61.32], [66.0, 67.71], [68.0, 68.34], [69.0, 69.89], [78.0, 82.76], [85.0, 89.8], [98.0, 98.49], [99.0, 99.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 62.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 0.0, 37.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.56, 29.84, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["wood", 19.79], ["music", 17.7], ["electric shaver, electric razor", 7.01]], null, null, null, null, null, null, null, null, [["mains hum", 44.05], ["hum", 42.9], ["electric shaver, electric razor", 5.28]], [["music", 37.07], ["electric shaver, electric razor", 19.1], ["wail, moan", 5.52]], null, null], "duration": [-0.29, 0.53, 5.07, 0.9, -0.36, 0.52, 0.57, 0.8, 0.7, 0.39, 2.27, 0.68, 0.56, 2.64, 1.09, 0.39, 1.17, 0.51, 0.32, 1.71, 0.34, 0.89, 4.76, 4.8, 0.49, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/odUsOcEqT4g_filtered.json b/annotations_filtered/odUsOcEqT4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df28b1bf6c9753b286c7de2ab815d9d936c00a3e --- /dev/null +++ b/annotations_filtered/odUsOcEqT4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.78], [9.0, 9.04], [12.0, 12.78], [16.0, 19.11], [27.0, 29.71], [30.0, 30.27], [31.0, 31.68], [32.0, 33.1], [36.0, 36.46], [37.0, 40.22], [42.0, 56.57], [62.0, 62.63], [65.0, 66.34], [67.0, 69.03], [78.0, 77.55], [78.0, 78.41], [80.0, 83.22], [84.0, 85.01], [87.0, 87.86], [90.0, 94.59], [96.0, 96.92], [99.0, 99.5], [101.0, 100.89], [105.0, 105.95], [111.0, 113.21], [126.0, 126.86], [127.0, 127.58], [131.0, 134.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 59.07, 74.6, 0.0, 0.0, 0.0, 0.0, 57.48, 72.46, 0.0, 0.0, 51.94, 0.0, 0.0, 57.25, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 59.86, 0.0, 0.0, 97.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.78, 0.04, 0.78, 3.11, 2.71, 0.27, 0.68, 1.1, 0.46, 3.22, 14.57, 0.63, 1.34, 2.03, -0.45, 0.41, 3.22, 1.01, 0.86, 4.59, 0.92, 0.5, -0.11, 0.95, 2.21, 0.86, 0.58, 3.54]} \ No newline at end of file diff --git a/annotations_filtered/odrqxoaNPC0_filtered.json b/annotations_filtered/odrqxoaNPC0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d59f1d3602433da5ea4f85b8f800960e422abbf6 --- /dev/null +++ b/annotations_filtered/odrqxoaNPC0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.79], [14.0, 16.51], [18.0, 43.98], [45.0, 55.27], [56.0, 75.3], [77.0, 103.54], [106.0, 115.96], [116.0, 118.0], [119.0, 122.52]], "keep_status": [false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 99.62, 32.55, 37.34, 31.11, 31.81, 69.2, 87.55, 84.62], "audiomae_on_audioset": [null, null, [["speech", 56.07], ["music", 4.83], ["outside, rural or natural", 3.27]], [["speech", 47.34], ["music", 28.22], ["outside, urban or manmade", 2.01]], [["speech", 32.42], ["insect", 10.73], ["vehicle", 10.01]], [["music", 10.78], ["burst, pop", 6.31], ["smash, crash", 6.21]], null, null, null], "duration": [0.79, 2.51, 25.98, 10.27, 19.3, 26.54, 9.96, 2.0, 3.52]} \ No newline at end of file diff --git a/annotations_filtered/oeCRY2mdih8_filtered.json b/annotations_filtered/oeCRY2mdih8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39fa4711ade9803049aada7bf465c12f96970f3e --- /dev/null +++ b/annotations_filtered/oeCRY2mdih8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.26], [5.0, 4.73], [8.0, 10.61], [13.0, 14.45], [15.0, 16.6], [18.0, 19.41], [23.0, 25.64], [27.0, 28.43], [30.0, 30.86], [32.0, 33.98], [36.0, 36.58], [38.0, 38.25], [39.0, 40.09], [44.0, 60.66], [62.0, 69.3], [71.0, 71.36], [73.0, 73.09], [77.0, 81.62], [84.0, 85.8], [90.0, 91.3], [93.0, 96.3], [100.0, 100.2], [102.0, 104.14], [105.0, 106.47], [108.0, 108.55], [110.0, 109.97], [111.0, 111.6], [113.0, 119.62], [122.0, 122.67], [124.0, 130.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 96.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.32, 39.08, 0.0, 0.0, 49.97, 0.0, 0.0, 51.34, 0.0, 65.79, 0.0, 0.0, 0.0, 0.0, 51.44, 0.0, 40.57], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.89], ["frog", 19.47], ["musical instrument", 5.02]], [["music", 51.17], ["musical instrument", 5.72], ["animal", 3.42]], null, null, [["music", 60.35], ["musical instrument", 5.47], ["guitar", 3.31]], null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 23.59], ["noise", 8.24], ["crackle", 5.59]]], "duration": [0.26, -0.27, 2.61, 1.45, 1.6, 1.41, 2.64, 1.43, 0.86, 1.98, 0.58, 0.25, 1.09, 16.66, 7.3, 0.36, 0.09, 4.62, 1.8, 1.3, 3.3, 0.2, 2.14, 1.47, 0.55, -0.03, 0.6, 6.62, 0.67, 6.65]} \ No newline at end of file diff --git a/annotations_filtered/oeF5tq_zeqU_filtered.json b/annotations_filtered/oeF5tq_zeqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96886b61860237a2142711faf8f34de0c84bc628 --- /dev/null +++ b/annotations_filtered/oeF5tq_zeqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.51], [4.0, 16.51], [18.0, 20.36], [22.0, 23.72], [27.0, 26.84], [29.0, 33.12], [34.0, 38.31], [39.0, 39.78], [41.0, 44.0], [45.0, 52.1], [53.0, 57.23], [57.0, 58.38], [60.0, 62.06], [63.0, 63.9], [64.0, 66.46], [68.0, 72.23], [73.0, 74.04], [75.0, 75.2], [76.0, 80.77], [85.0, 93.26], [95.0, 95.93], [99.0, 102.81], [108.0, 111.67], [113.0, 114.05], [115.0, 149.91], [152.0, 159.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.16, 99.82, 0.0, 0.0, 65.79, 99.78, 0.0, 50.06, 73.67, 95.37, 0.0, 99.48, 0.0, 42.19, 94.37, 0.0, 0.0, 89.54, 88.28, 0.0, 95.37, 99.78, 0.0, 0.0, 57.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.06], ["singing bowl", 24.41], ["music", 9.72]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 12.51, 2.36, 1.72, -0.16, 4.12, 4.31, 0.78, 3.0, 7.1, 4.23, 1.38, 2.06, 0.9, 2.46, 4.23, 1.04, 0.2, 4.77, 8.26, 0.93, 3.81, 3.67, 1.05, 34.91, 7.16]} \ No newline at end of file diff --git a/annotations_filtered/oeQ4HWhPEdA_filtered.json b/annotations_filtered/oeQ4HWhPEdA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..533223871b1826228013c068e0ed4384130e7615 --- /dev/null +++ b/annotations_filtered/oeQ4HWhPEdA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.28], [23.0, 23.95], [31.0, 31.13], [48.0, 47.98], [59.0, 59.12], [64.0, 64.42], [80.0, 80.52]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.28, 0.95, 0.13, -0.02, 0.12, 0.42, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/oeW9lZBY-VM_filtered.json b/annotations_filtered/oeW9lZBY-VM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3831dfa4b8aaa4212f094a3050206f8a3ef73d6 --- /dev/null +++ b/annotations_filtered/oeW9lZBY-VM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.12], [6.0, 5.83], [12.0, 12.34], [17.0, 21.14], [26.0, 26.67], [30.0, 30.18], [46.0, 46.75], [51.0, 55.71], [56.0, 55.95], [57.0, 59.07], [60.0, 61.97], [72.0, 73.18], [74.0, 75.29], [85.0, 86.7], [95.0, 94.9], [98.0, 103.13], [107.0, 107.5], [108.0, 112.21], [113.0, 114.29], [117.0, 117.76], [123.0, 124.41], [127.0, 127.8], [133.0, 136.58], [138.0, 141.29], [143.0, 142.7], [145.0, 145.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 73.82, 0.0, 0.0, 0.0, 82.79, 0.0, 98.59, 0.0, 0.0, 0.0, 0.0, 0.0, 43.48, 0.0, 90.43, 0.0, 0.0, 0.0, 0.0, 99.21, 93.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mantra", 21.12], ["lullaby", 12.91], ["male singing", 10.44]], null, null, null, null, null, null, null, null, null, null], "duration": [0.12, -0.17, 0.34, 4.14, 0.67, 0.18, 0.75, 4.71, -0.05, 2.07, 1.97, 1.18, 1.29, 1.7, -0.1, 5.13, 0.5, 4.21, 1.29, 0.76, 1.41, 0.8, 3.58, 3.29, -0.3, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/oefn8TJ3_H8_filtered.json b/annotations_filtered/oefn8TJ3_H8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de8f7011013ba20ba3350c6568ff252194e2ae73 --- /dev/null +++ b/annotations_filtered/oefn8TJ3_H8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.23], [21.0, 24.43], [26.0, 26.59], [27.0, 30.2], [32.0, 33.12], [34.0, 37.23], [43.0, 44.54], [49.0, 51.29], [52.0, 52.35], [54.0, 54.92], [56.0, 59.85], [63.0, 68.25], [71.0, 73.01], [75.0, 76.3], [78.0, 80.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [61.08, 97.22, 0.0, 73.67, 0.0, 54.9, 0.0, 91.98, 0.0, 0.0, 87.55, 70.16, 92.31, 0.0, 89.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.23, 3.43, 0.59, 3.2, 1.12, 3.23, 1.54, 2.29, 0.35, 0.92, 3.85, 5.25, 2.01, 1.3, 2.32]} \ No newline at end of file diff --git a/annotations_filtered/oepaVuuBAtA_filtered.json b/annotations_filtered/oepaVuuBAtA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adaa7f1387a1ee52349f914d15806e60b4995e35 --- /dev/null +++ b/annotations_filtered/oepaVuuBAtA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [4.0, 4.77], [6.0, 7.94], [9.0, 10.35], [12.0, 14.52], [15.0, 15.97], [16.0, 17.15], [18.0, 18.98], [24.0, 25.56], [27.0, 27.65], [29.0, 29.56], [32.0, 32.66], [33.0, 34.8], [36.0, 38.11], [39.0, 40.31], [42.0, 44.47], [46.0, 47.6], [48.0, 49.27], [50.0, 51.63], [52.0, 53.16], [55.0, 55.66], [58.0, 58.51], [59.0, 60.17], [62.0, 63.51], [64.0, 65.11], [67.0, 67.9], [71.0, 71.68], [79.0, 79.86], [81.0, 80.89], [83.0, 88.35], [89.0, 90.53], [92.0, 92.42], [93.0, 93.66], [96.0, 96.43], [99.0, 99.71], [102.0, 102.73], [103.0, 106.89], [108.0, 108.55], [110.0, 111.11], [112.0, 113.22], [115.0, 116.01], [118.0, 119.28], [123.0, 123.16], [124.0, 124.83], [125.0, 126.69], [128.0, 128.22], [129.0, 132.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.54], "audiomae_on_audioset": [null, null, null, null, [["speech", 51.62], ["dial tone", 17.63], ["busy signal", 8.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 68.98], ["speech", 25.26], ["dial tone", 2.82]]], "duration": [0.52, 0.77, 1.94, 1.35, 2.52, 0.97, 1.15, 0.98, 1.56, 0.65, 0.56, 0.66, 1.8, 2.11, 1.31, 2.47, 1.6, 1.27, 1.63, 1.16, 0.66, 0.51, 1.17, 1.51, 1.11, 0.9, 0.68, 0.86, -0.11, 5.35, 1.53, 0.42, 0.66, 0.43, 0.71, 0.73, 3.89, 0.55, 1.11, 1.22, 1.01, 1.28, 0.16, 0.83, 1.69, 0.22, 3.58]} \ No newline at end of file diff --git a/annotations_filtered/oexJPg9rZqo_filtered.json b/annotations_filtered/oexJPg9rZqo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c13fe57e87a23d61541f6b25bee7d7d8834244a3 --- /dev/null +++ b/annotations_filtered/oexJPg9rZqo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 50.11], [53.0, 53.94], [55.0, 55.66], [57.0, 60.44], [63.0, 67.29], [71.0, 116.78], [120.0, 119.94], [122.0, 127.36]], "keep_status": [false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 29.11, 33.45, 0.0, 0.0, 29.64], "audiomae_on_audioset": [null, null, null, [["music", 31.42], ["throbbing", 9.22], ["speech", 6.98]], [["music", 40.95], ["speech", 18.44], ["sidetone", 5.63]], null, null, [["sidetone", 30.25], ["speech", 28.89], ["music", 9.7]]], "duration": [32.11, 0.94, 0.66, 3.44, 4.29, 45.78, -0.06, 5.36]} \ No newline at end of file diff --git a/annotations_filtered/oezKQEF0deY_filtered.json b/annotations_filtered/oezKQEF0deY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..710c9b50e409698f9a0eb4105e38c48af89fea2d --- /dev/null +++ b/annotations_filtered/oezKQEF0deY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.2], [11.0, 13.59], [15.0, 22.1], [23.0, 25.66], [27.0, 29.08], [30.0, 33.74], [35.0, 59.44], [64.0, 80.87]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [65.09, 65.2, 58.22, 90.95, 98.51, 96.17, 47.5, 39.11], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 17.82], ["speech", 16.69], ["noise", 11.14]], [["music", 66.62], ["tubular bells", 7.37], ["chime", 3.4]]], "duration": [2.2, 2.59, 7.1, 2.66, 2.08, 3.74, 24.44, 16.87]} \ No newline at end of file diff --git a/annotations_filtered/of7H9H_aPxg_filtered.json b/annotations_filtered/of7H9H_aPxg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c4262ddc9b60e2452e1cb767d625420432be7d5 --- /dev/null +++ b/annotations_filtered/of7H9H_aPxg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.1], [7.0, 7.2], [8.0, 8.36], [10.0, 32.58]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 32.69], "audiomae_on_audioset": [null, null, null, [["hum", 24.32], ["speech", 18.49], ["music", 17.69]]], "duration": [0.1, 0.2, 0.36, 22.58]} \ No newline at end of file diff --git a/annotations_filtered/ofIzQbTGQ2E_filtered.json b/annotations_filtered/ofIzQbTGQ2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f57e4648aedea94d223c1980217b1ef5f0f5621 --- /dev/null +++ b/annotations_filtered/ofIzQbTGQ2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.08], [8.0, 11.37], [13.0, 17.39], [18.0, 18.94], [20.0, 20.48], [21.0, 23.55], [24.0, 24.33], [25.0, 25.0], [27.0, 27.73], [30.0, 30.01], [34.0, 34.94], [38.0, 46.58], [49.0, 49.6], [51.0, 51.49], [53.0, 53.27], [54.0, 55.61], [60.0, 61.11], [64.0, 64.17], [65.0, 67.9], [70.0, 78.06], [79.0, 79.56], [81.0, 83.69], [84.0, 85.16], [85.0, 89.72], [95.0, 95.55], [96.0, 97.06], [97.0, 99.35], [100.0, 101.63], [103.0, 103.87], [105.0, 109.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [43.28, 74.6, 70.72, 0.0, 0.0, 50.21, 0.0, 0.0, 0.0, 0.0, 0.0, 76.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 93.91, 0.0, 78.21, 0.0, 54.3, 0.0, 0.0, 56.4, 0.0, 0.0, 42.24], "audiomae_on_audioset": [[["fly, housefly", 53.24], ["insect", 23.18], ["mosquito", 6.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.21], ["music", 17.24], ["inside, small room", 8.8]]], "duration": [2.08, 3.37, 4.39, 0.94, 0.48, 2.55, 0.33, 0.0, 0.73, 0.01, 0.94, 8.58, 0.6, 0.49, 0.27, 1.61, 1.11, 0.17, 2.9, 8.06, 0.56, 2.69, 1.16, 4.72, 0.55, 1.06, 2.35, 1.63, 0.87, 4.41]} \ No newline at end of file diff --git a/annotations_filtered/ofWdRHOZpV4_filtered.json b/annotations_filtered/ofWdRHOZpV4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/ofWdRHOZpV4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/ofYq-2TXzTs_filtered.json b/annotations_filtered/ofYq-2TXzTs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27ef2080b53ca7fbecedfc352ad13c2069fa8bb2 --- /dev/null +++ b/annotations_filtered/ofYq-2TXzTs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.55], [6.0, 12.12], [13.0, 15.82], [17.0, 18.84], [20.0, 19.72], [23.0, 23.92], [25.0, 26.64], [27.0, 30.67], [32.0, 34.65], [36.0, 38.06], [43.0, 43.43]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [36.5, 33.82, 33.38, 0.0, 0.0, 0.0, 0.0, 66.51, 40.68, 44.34, 0.0], "audiomae_on_audioset": [[["music", 41.95], ["hum", 14.23], ["throbbing", 6.83]], [["hum", 44.55], ["throbbing", 15.22], ["speech", 13.36]], [["music", 89.75], ["theremin", 2.3], ["electronic music", 1.01]], null, null, null, null, null, [["speech", 25.62], ["hum", 23.34], ["mains hum", 13.15]], [["music", 42.18], ["whale vocalization", 26.54], ["theremin", 12.42]], null], "duration": [3.55, 6.12, 2.82, 1.84, -0.28, 0.92, 1.64, 3.67, 2.65, 2.06, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/oflbCHWZCBU_filtered.json b/annotations_filtered/oflbCHWZCBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9e5fe578fbd8ecd73c4ea1d67623d8dda1c8cd8 --- /dev/null +++ b/annotations_filtered/oflbCHWZCBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.52], [5.0, 5.49], [7.0, 10.62], [11.0, 12.12], [15.0, 15.53], [17.0, 21.14], [24.0, 24.41], [26.0, 27.43], [28.0, 30.1], [31.0, 32.83], [34.0, 37.34], [39.0, 40.59], [42.0, 42.84], [44.0, 46.06], [46.0, 46.2], [46.0, 49.74], [55.0, 56.81], [61.0, 64.18], [66.0, 65.94], [66.0, 66.01], [67.0, 70.19], [71.0, 75.63], [77.0, 91.42], [94.0, 96.21], [97.0, 97.19], [101.0, 102.24], [103.0, 103.99], [106.0, 112.63], [113.0, 114.44], [119.0, 120.7], [126.0, 127.3], [132.0, 134.42], [137.0, 150.5], [155.0, 160.54], [164.0, 167.17], [169.0, 173.35], [180.0, 180.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.18, 0.0, 0.0, 90.43, 0.0, 0.0, 81.53, 0.0, 32.29, 0.0, 0.0, 31.98, 0.0, 31.17, 0.0, 31.3, 0.0, 0.0, 32.14, 31.16, 31.19, 42.48, 0.0, 0.0, 0.0, 36.04, 0.0, 0.0, 0.0, 31.74, 30.24, 30.25, 31.58, 31.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 76.72], ["guitar", 4.98], ["musical instrument", 4.4]], null, null, [["music", 65.76], ["guitar", 5.88], ["plucked string instrument", 4.42]], null, [["music", 71.19], ["boing", 8.47], ["speech", 5.29]], null, [["music", 74.74], ["bass guitar", 3.82], ["country", 2.08]], null, null, [["music", 73.4], ["guitar", 3.27], ["bass guitar", 3.23]], [["music", 48.92], ["musical instrument", 6.1], ["singing", 5.7]], [["music", 85.78], ["country", 2.04], ["musical instrument", 1.99]], [["music", 65.53], ["speech", 1.39], ["musical instrument", 1.23]], null, null, null, [["music", 68.03], ["speech", 3.74], ["musical instrument", 1.87]], null, null, null, [["music", 74.45], ["synthesizer", 4.1], ["musical instrument", 2.82]], [["music", 87.01], ["didgeridoo", 8.42], ["musical instrument", 0.74]], [["music", 76.12], ["didgeridoo", 4.44], ["livestock, farm animals, working animals", 3.16]], [["music", 71.64], ["speech", 3.07], ["guitar", 1.16]], [["music", 80.62], ["musical instrument", 2.26], ["bass guitar", 1.99]], null], "duration": [1.52, 0.49, 3.62, 1.12, 0.53, 4.14, 0.41, 1.43, 2.1, 1.83, 3.34, 1.59, 0.84, 2.06, 0.2, 3.74, 1.81, 3.18, -0.06, 0.01, 3.19, 4.63, 14.42, 2.21, 0.19, 1.24, 0.99, 6.63, 1.44, 1.7, 1.3, 2.42, 13.5, 5.54, 3.17, 4.35, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/oflnRQP6Woo_filtered.json b/annotations_filtered/oflnRQP6Woo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..907c8be30404ced43c5786ba600226a4fb80a2b8 --- /dev/null +++ b/annotations_filtered/oflnRQP6Woo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.75], [23.0, 27.06], [30.0, 33.22], [35.0, 36.85], [37.0, 82.71], [90.0, 90.42], [93.0, 113.22], [114.0, 117.14], [117.0, 118.52], [119.0, 119.7], [120.0, 120.88], [122.0, 122.22], [123.0, 129.03], [131.0, 136.83], [139.0, 144.8], [146.0, 146.13], [147.0, 149.96], [150.0, 151.07], [152.0, 152.36], [154.0, 156.78], [160.0, 171.85], [180.0, 179.56], [182.0, 186.87], [191.0, 191.64]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 36.67, 37.09, 0.0, 0.0, 0.0, 41.52, 39.41, 0.0, 0.0, 0.0, 0.0, 39.83, 62.68, 99.48, 0.0, 67.63, 0.0, 0.0, 34.8, 31.37, 0.0, 33.26, 0.0], "audiomae_on_audioset": [null, [["speech", 38.74], ["music", 21.15], ["hum", 9.43]], [["music", 43.74], ["throbbing", 9.89], ["hum", 9.66]], null, null, null, [["music", 59.43], ["hum", 15.23], ["throbbing", 6.18]], [["speech", 42.65], ["music", 39.68], ["synthesizer", 2.61]], null, null, null, null, [["music", 35.66], ["speech", 20.41], ["animal", 6.42]], null, null, null, null, null, null, [["music", 75.66], ["synthesizer", 7.67], ["musical instrument", 2.44]], [["music", 82.06], ["throbbing", 2.09], ["electronic music", 1.48]], null, [["music", 36.77], ["boing", 15.79], ["speech", 10.89]], null], "duration": [0.75, 4.06, 3.22, 1.85, 45.71, 0.42, 20.22, 3.14, 1.52, 0.7, 0.88, 0.22, 6.03, 5.83, 5.8, 0.13, 2.96, 1.07, 0.36, 2.78, 11.85, -0.44, 4.87, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/ofmssjTsGnE_filtered.json b/annotations_filtered/ofmssjTsGnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68a9b152e7d04497e87e16b1bae88fdf30ca5591 --- /dev/null +++ b/annotations_filtered/ofmssjTsGnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.41], [3.0, 3.96], [8.0, 8.29], [12.0, 11.99], [17.0, 18.32], [21.0, 21.49], [22.0, 22.72], [24.0, 24.51], [29.0, 29.13], [32.0, 32.68], [33.0, 33.89], [35.0, 36.31], [40.0, 40.58], [41.0, 41.79], [42.0, 43.02], [45.0, 46.92], [48.0, 48.61], [49.0, 49.81], [51.0, 51.92], [52.0, 52.81], [56.0, 56.08], [58.0, 58.53], [83.0, 83.47], [86.0, 87.69], [89.0, 90.12], [105.0, 105.95], [107.0, 108.63], [111.0, 114.96], [116.0, 116.46], [118.0, 120.16], [122.0, 128.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 99.96, 98.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, 0.96, 0.29, -0.01, 1.32, 0.49, 0.72, 0.51, 0.13, 0.68, 0.89, 1.31, 0.58, 0.79, 1.02, 1.92, 0.61, 0.81, 0.92, 0.81, 0.08, 0.53, 0.47, 1.69, 1.12, 0.95, 1.63, 3.96, 0.46, 2.16, 6.95]} \ No newline at end of file diff --git a/annotations_filtered/ofxfYinuKKc_filtered.json b/annotations_filtered/ofxfYinuKKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0acc27938bc4c1c4f38ebff0207b9e7101aca618 --- /dev/null +++ b/annotations_filtered/ofxfYinuKKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.91], [22.0, 22.3], [24.0, 24.04], [26.0, 26.3], [28.0, 28.32], [31.0, 31.99], [56.0, 55.71], [73.0, 73.48], [84.0, 88.28], [91.0, 91.08], [93.0, 93.5], [94.0, 95.32], [96.0, 98.15], [100.0, 100.79], [101.0, 101.87]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.49, 0.0, 0.0, 0.0, 52.22, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 49.73], ["hum", 8.82], ["theremin", 4.25]], null, null, null, null, null, null], "duration": [0.91, 0.3, 0.04, 0.3, 0.32, 0.99, -0.29, 0.48, 4.28, 0.08, 0.5, 1.32, 2.15, 0.79, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/og1c8h2UyE8_filtered.json b/annotations_filtered/og1c8h2UyE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5be7d5205f2fa6849269278ea75c5a09f83a4a1 --- /dev/null +++ b/annotations_filtered/og1c8h2UyE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 35.72], [39.0, 40.96], [44.0, 45.45], [51.0, 51.68], [54.0, 54.06], [55.0, 56.61], [58.0, 85.9], [88.0, 88.4], [89.0, 92.28], [96.0, 97.01], [99.0, 100.11], [101.0, 104.85], [107.0, 110.49], [114.0, 114.47], [122.0, 123.9], [125.0, 125.14], [126.0, 127.94]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [44.72, 0.0, 0.0, 0.0, 0.0, 0.0, 31.54, 0.0, 29.24, 0.0, 0.0, 31.41, 40.92, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.54], ["theremin", 6.35], ["percussion", 6.2]], null, null, null, null, null, [["hum", 43.98], ["music", 16.09], ["mains hum", 13.55]], null, [["music", 51.18], ["hum", 12.04], ["throbbing", 9.66]], null, null, [["throbbing", 35.71], ["hum", 26.96], ["music", 24.01]], [["music", 37.05], ["ambient music", 9.72], ["synthesizer", 8.75]], null, null, null, null], "duration": [2.72, 1.96, 1.45, 0.68, 0.06, 1.61, 27.9, 0.4, 3.28, 1.01, 1.11, 3.85, 3.49, 0.47, 1.9, 0.14, 1.94]} \ No newline at end of file diff --git a/annotations_filtered/og36vWGn5CU_filtered.json b/annotations_filtered/og36vWGn5CU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abb49a911a6a95d335b6c653027c2f4117f39f78 --- /dev/null +++ b/annotations_filtered/og36vWGn5CU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.34], [26.0, 27.9], [29.0, 32.53], [55.0, 55.66], [56.0, 56.64], [67.0, 67.8], [104.0, 105.38], [108.0, 110.25], [118.0, 118.5], [119.0, 118.72], [140.0, 140.56], [142.0, 142.06], [143.0, 143.85], [145.0, 148.04], [150.0, 149.61], [150.0, 151.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 1.9, 3.53, 0.66, 0.64, 0.8, 1.38, 2.25, 0.5, -0.28, 0.56, 0.06, 0.85, 3.04, -0.39, 1.48]} \ No newline at end of file diff --git a/annotations_filtered/ogUC0Fcvh7g_filtered.json b/annotations_filtered/ogUC0Fcvh7g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d1d34cbceff3332838a7efaf0c961d0b5167d1f --- /dev/null +++ b/annotations_filtered/ogUC0Fcvh7g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.59], [5.0, 6.79], [7.0, 8.28], [9.0, 9.56], [10.0, 16.88], [17.0, 22.5], [38.0, 38.55], [55.0, 54.84], [57.0, 57.55], [61.0, 61.82], [68.0, 68.74], [91.0, 91.35], [95.0, 95.45], [104.0, 106.2], [110.0, 109.75], [111.0, 111.38]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.42, 30.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.4, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["bee, wasp, etc.", 20.63], ["insect", 15.14], ["fly, housefly", 9.89]], [["fly, housefly", 37.81], ["insect", 31.99], ["mains hum", 9.52]], null, null, null, null, null, null, null, [["speech", 25.86], ["hum", 12.72], ["sidetone", 7.19]], null, null], "duration": [0.59, 1.79, 1.28, 0.56, 6.88, 5.5, 0.55, -0.16, 0.55, 0.82, 0.74, 0.35, 0.45, 2.2, -0.25, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/ogkh8GaUkBE_filtered.json b/annotations_filtered/ogkh8GaUkBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..671c3a814a78e99b7ea8c1345235a2aa7bb8a1d7 --- /dev/null +++ b/annotations_filtered/ogkh8GaUkBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.93], [6.0, 28.48], [29.0, 31.9], [32.0, 33.67], [34.0, 36.12], [39.0, 42.77], [44.0, 46.8], [55.0, 56.03], [57.0, 57.62], [65.0, 65.33], [66.0, 66.63], [67.0, 68.27]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.83, 73.06, 0.0, 35.95, 99.56, 74.44, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 49.44], ["theremin", 31.33], ["musical instrument", 4.72]], null, null, [["grunt", 27.6], ["groan", 21.59], ["livestock, farm animals, working animals", 18.48]], null, null, null, null, null, null, null], "duration": [0.93, 22.48, 2.9, 1.67, 2.12, 3.77, 2.8, 1.03, 0.62, 0.33, 0.63, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/oh3KwtatlkY_filtered.json b/annotations_filtered/oh3KwtatlkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ce971da82414bdd8d26c0b1eaadfbe3020ab1cc --- /dev/null +++ b/annotations_filtered/oh3KwtatlkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.13], [13.0, 13.02], [20.0, 21.69], [22.0, 22.91], [28.0, 28.68], [31.0, 31.35], [34.0, 34.74], [36.0, 36.22], [41.0, 40.93], [47.0, 46.84], [48.0, 49.4], [50.0, 51.65], [57.0, 56.94], [58.0, 58.63], [59.0, 63.04], [66.0, 67.95], [76.0, 82.39], [86.0, 86.98], [87.0, 87.02], [89.0, 89.04], [89.0, 91.39], [97.0, 104.48], [105.0, 107.27], [115.0, 115.33], [121.0, 121.53], [134.0, 138.32], [140.0, 141.03], [142.0, 143.23], [147.0, 148.1], [150.0, 150.47], [153.0, 153.54], [158.0, 158.62], [159.0, 159.54], [161.0, 161.22], [162.0, 163.19], [165.0, 165.32], [169.0, 168.79]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.69, 0.0, 41.1, 0.0, 0.0, 0.0, 30.56, 30.35, 32.62, 0.0, 0.0, 34.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 34.63], ["cattle, bovinae", 12.4], ["livestock, farm animals, working animals", 12.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 12.83], ["keys jangling", 9.58], ["glass", 6.83]], null, [["car", 23.55], ["keys jangling", 23.32], ["speech", 19.48]], null, null, null, [["music", 55.42], ["speech", 11.86], ["hip hop music", 4.42]], [["music", 51.3], ["speech", 14.28], ["throbbing", 4.92]], [["insect", 19.9], ["speech", 18.95], ["fly, housefly", 14.87]], null, null, [["speech", 85.77], ["hum", 4.9], ["throbbing", 1.55]], null, null, null, null, null, null, null, null, null, null, null], "duration": [4.13, 0.02, 1.69, 0.91, 0.68, 0.35, 0.74, 0.22, -0.07, -0.16, 1.4, 1.65, -0.06, 0.63, 4.04, 1.95, 6.39, 0.98, 0.02, 0.04, 2.39, 7.48, 2.27, 0.33, 0.53, 4.32, 1.03, 1.23, 1.1, 0.47, 0.54, 0.62, 0.54, 0.22, 1.19, 0.32, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/oh4GYHtq2hY_filtered.json b/annotations_filtered/oh4GYHtq2hY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28cf592a317fd8adbe18516b90fa8606eb5e56dd --- /dev/null +++ b/annotations_filtered/oh4GYHtq2hY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[100.0, 110.22]], "keep_status": [false], "silence_prob": [35.25], "audiomae_on_audioset": [[["music", 80.18], ["scary music", 7.83], ["soundtrack music", 1.62]]], "duration": [10.22]} \ No newline at end of file diff --git a/annotations_filtered/oh8pzfm5QF8_filtered.json b/annotations_filtered/oh8pzfm5QF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc9f2949ab843a59bb25406249a2665d80dded29 --- /dev/null +++ b/annotations_filtered/oh8pzfm5QF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.23], [9.0, 9.86], [12.0, 12.6], [16.0, 22.13], [26.0, 26.77], [30.0, 30.6], [35.0, 36.93], [38.0, 38.43], [41.0, 42.9], [63.0, 62.83], [73.0, 74.97], [77.0, 78.51], [79.0, 80.35], [81.0, 81.36], [83.0, 83.67], [84.0, 84.94], [88.0, 89.11], [92.0, 92.45], [93.0, 93.51], [103.0, 104.06], [107.0, 108.26], [113.0, 114.4], [116.0, 116.67], [118.0, 119.26]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 41.77], ["mains hum", 22.39], ["vehicle", 3.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 0.86, 0.6, 6.13, 0.77, 0.6, 1.93, 0.43, 1.9, -0.17, 1.97, 1.51, 1.35, 0.36, 0.67, 0.94, 1.11, 0.45, 0.51, 1.06, 1.26, 1.4, 0.67, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/ohMzC_1W0ZY_filtered.json b/annotations_filtered/ohMzC_1W0ZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe51cd8b9314346530649b6e683d57093816fe1e --- /dev/null +++ b/annotations_filtered/ohMzC_1W0ZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.68], [9.0, 11.67], [13.0, 13.56], [17.0, 23.03], [23.0, 34.47], [37.0, 40.73], [44.0, 47.38], [48.0, 58.53], [61.0, 63.53], [89.0, 94.51]], "keep_status": [false, false, false, true, true, false, true, false, false, false], "silence_prob": [50.26, 44.72, 0.0, 39.46, 37.63, 63.1, 48.65, 35.68, 54.56, 34.52], "audiomae_on_audioset": [null, [["music", 60.48], ["hum", 7.67], ["synthesizer", 4.35]], null, [["music", 42.35], ["speech", 11.45], ["didgeridoo", 9.14]], [["speech", 24.66], ["music", 21.44], ["livestock, farm animals, working animals", 5.65]], null, [["music", 57.16], ["animal", 4.92], ["quack", 4.91]], [["music", 60.84], ["speech", 22.27], ["synthesizer", 5.93]], null, [["music", 71.65], ["musical instrument", 3.88], ["didgeridoo", 2.9]]], "duration": [3.68, 2.67, 0.56, 6.03, 11.47, 3.73, 3.38, 10.53, 2.53, 5.51]} \ No newline at end of file diff --git a/annotations_filtered/ohgN4PexEv4_filtered.json b/annotations_filtered/ohgN4PexEv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e57152447d442aa1e116b97be76db926139adb4 --- /dev/null +++ b/annotations_filtered/ohgN4PexEv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.49], [8.0, 8.65], [10.0, 11.53], [13.0, 13.42], [16.0, 16.12], [19.0, 19.45], [20.0, 25.25], [31.0, 33.29], [35.0, 35.78], [43.0, 45.15], [54.0, 54.62], [57.0, 60.25], [64.0, 68.49], [80.0, 80.86], [82.0, 84.32], [87.0, 90.95], [93.0, 96.94], [97.0, 99.23], [101.0, 102.22], [105.0, 106.46], [109.0, 110.61], [122.0, 122.2], [124.0, 124.06], [126.0, 128.04], [130.0, 136.46], [144.0, 149.71], [161.0, 163.24], [165.0, 166.01], [167.0, 168.27], [173.0, 188.35], [191.0, 190.92], [191.0, 191.88], [194.0, 195.91], [196.0, 208.47], [211.0, 212.52], [214.0, 215.67], [217.0, 218.13], [220.0, 220.45], [222.0, 223.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 77.87, 0.0, 76.7, 0.0, 99.94, 100.0, 0.0, 100.0, 100.0, 99.99, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 95.64, 98.01, 99.76, 99.05, 0.0, 0.0, 87.92, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.49, 0.65, 1.53, 0.42, 0.12, 0.45, 5.25, 2.29, 0.78, 2.15, 0.62, 3.25, 4.49, 0.86, 2.32, 3.95, 3.94, 2.23, 1.22, 1.46, 1.61, 0.2, 0.06, 2.04, 6.46, 5.71, 2.24, 1.01, 1.27, 15.35, -0.08, 0.88, 1.91, 12.47, 1.52, 1.67, 1.13, 0.45, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/ohnhJ6gyLhk_filtered.json b/annotations_filtered/ohnhJ6gyLhk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29cc6edcd99ba01c362445fff50728d21262eb66 --- /dev/null +++ b/annotations_filtered/ohnhJ6gyLhk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.02], [8.0, 12.38], [14.0, 14.66], [15.0, 15.94], [17.0, 21.09], [24.0, 29.47], [31.0, 32.0], [34.0, 34.89], [37.0, 37.69], [39.0, 54.04], [64.0, 64.25], [65.0, 65.16], [66.0, 66.33], [67.0, 67.17], [68.0, 68.55], [72.0, 72.08], [73.0, 81.78], [82.0, 82.7], [86.0, 87.52], [88.0, 88.84], [95.0, 95.15], [96.0, 97.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 74.13, 0.0, 0.0, 93.6, 99.21, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 4.38, 0.66, 0.94, 4.09, 5.47, 1.0, 0.89, 0.69, 15.04, 0.25, 0.16, 0.33, 0.17, 0.55, 0.08, 8.78, 0.7, 1.52, 0.84, 0.15, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/ohnkD-gjNVQ_filtered.json b/annotations_filtered/ohnkD-gjNVQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a76a3680b7dc1b5cf220ea78a356a15ab26b257 --- /dev/null +++ b/annotations_filtered/ohnkD-gjNVQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.81], [11.0, 30.82], [32.0, 33.45], [37.0, 52.69], [53.0, 66.8], [68.0, 70.56], [71.0, 80.54], [82.0, 88.01], [89.0, 91.54], [92.0, 92.82], [95.0, 104.5]], "keep_status": [false, false, false, false, false, true, true, false, true, false, true], "silence_prob": [0.0, 28.89, 0.0, 31.31, 29.48, 30.01, 29.82, 29.1, 31.15, 0.0, 29.29], "audiomae_on_audioset": [null, [["music", 46.6], ["speech", 16.75], ["buzz", 9.0]], null, [["speech", 32.12], ["music", 31.99], ["buzz", 8.93]], [["music", 74.03], ["hum", 5.23], ["electronic music", 2.95]], [["music", 36.38], ["hum", 13.31], ["mains hum", 12.57]], [["music", 27.74], ["hum", 22.83], ["breaking", 10.92]], [["speech", 44.87], ["music", 18.43], ["explosion", 11.53]], [["music", 53.03], ["foghorn", 14.03], ["brass instrument", 2.86]], null, [["speech", 36.12], ["music", 19.4], ["hum", 9.62]]], "duration": [0.81, 19.82, 1.45, 15.69, 13.8, 2.56, 9.54, 6.01, 2.54, 0.82, 9.5]} \ No newline at end of file diff --git a/annotations_filtered/ohoPpyAG0zA_filtered.json b/annotations_filtered/ohoPpyAG0zA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87c0000c028c1d1f73a998211da06fb71484cd71 --- /dev/null +++ b/annotations_filtered/ohoPpyAG0zA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.98], [19.0, 19.38], [20.0, 20.88], [21.0, 22.86], [24.0, 24.09], [33.0, 33.08], [36.0, 95.77], [96.0, 107.0]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [33.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.56], "audiomae_on_audioset": [[["hum", 36.31], ["mains hum", 27.35], ["music", 22.48]], null, null, null, null, null, null, [["music", 48.23], ["speech", 31.99], ["hum", 3.15]]], "duration": [2.98, 0.38, 0.88, 1.86, 0.09, 0.08, 59.77, 11.0]} \ No newline at end of file diff --git a/annotations_filtered/ohz8_IafGwE_filtered.json b/annotations_filtered/ohz8_IafGwE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4eb6344ecbd13ec3e000b5789fc9d40b270504c5 --- /dev/null +++ b/annotations_filtered/ohz8_IafGwE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.22], [9.0, 8.67], [9.0, 9.71], [15.0, 20.49], [21.0, 22.76], [24.0, 25.93], [36.0, 37.23]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.22, -0.33, 0.71, 5.49, 1.76, 1.93, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/oiQPOmrEAxo_filtered.json b/annotations_filtered/oiQPOmrEAxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06ba077d92bd4d628a75e2145b0b7dbdf5d3c39f --- /dev/null +++ b/annotations_filtered/oiQPOmrEAxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.46], [10.0, 24.48], [28.0, 38.77], [43.0, 73.06], [73.0, 73.18], [73.0, 76.69], [79.0, 79.71], [82.0, 90.66], [91.0, 108.3], [108.0, 108.45], [109.0, 116.65], [120.0, 125.46], [127.0, 130.37], [132.0, 134.97], [136.0, 136.95], [137.0, 146.52], [149.0, 182.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 28.92, 29.15, 0.0, 0.0, 29.13, 0.0, 28.82, 28.93, 0.0, 31.36, 34.28, 31.26, 29.54, 0.0, 29.56, 0.0], "audiomae_on_audioset": [null, [["music", 64.88], ["speech", 6.65], ["hum", 5.12]], [["speech", 53.12], ["music", 33.51], ["throbbing", 1.9]], null, null, [["music", 55.31], ["synthesizer", 10.25], ["electronic music", 4.63]], null, [["speech", 46.35], ["music", 41.97], ["hum", 1.63]], [["music", 36.7], ["speech", 36.39], ["throbbing", 4.97]], null, [["music", 46.31], ["electronic music", 16.9], ["soundtrack music", 6.25]], [["music", 28.65], ["synthesizer", 12.53], ["hum", 11.86]], [["music", 59.94], ["speech", 20.98], ["boing", 7.31]], [["music", 63.95], ["stomach rumble", 4.65], ["whale vocalization", 4.59]], null, [["speech", 48.4], ["music", 39.93], ["synthesizer", 1.39]], null], "duration": [0.46, 14.48, 10.77, 30.06, 0.18, 3.69, 0.71, 8.66, 17.3, 0.45, 7.65, 5.46, 3.37, 2.97, 0.95, 9.52, 33.21]} \ No newline at end of file diff --git a/annotations_filtered/oiYBUM-EE-w_filtered.json b/annotations_filtered/oiYBUM-EE-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b454e9e94fb34d886f0dae4bd9fdffe5d61f98ce --- /dev/null +++ b/annotations_filtered/oiYBUM-EE-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 31.83], [37.0, 37.37], [48.0, 48.56], [72.0, 71.83], [81.0, 87.29], [88.0, 92.79], [109.0, 123.48], [126.0, 125.81], [128.0, 127.72]], "keep_status": [true, false, false, false, true, true, true, false, false], "silence_prob": [33.55, 0.0, 0.0, 0.0, 30.64, 29.67, 29.96, 0.0, 0.0], "audiomae_on_audioset": [[["music", 30.25], ["synthesizer", 14.86], ["musical instrument", 9.34]], null, null, null, [["speech", 42.98], ["vehicle", 9.4], ["explosion", 9.11]], [["speech", 32.22], ["explosion", 28.23], ["eruption", 7.13]], [["hum", 15.68], ["noise", 15.06], ["music", 14.92]], null, null], "duration": [4.83, 0.37, 0.56, -0.17, 6.29, 4.79, 14.48, -0.19, -0.28]} \ No newline at end of file diff --git a/annotations_filtered/oiikIyodOAk_filtered.json b/annotations_filtered/oiikIyodOAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..113db8a1774e764bccb4417667148cd27bfc8e10 --- /dev/null +++ b/annotations_filtered/oiikIyodOAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [6.0, 6.78], [10.0, 10.32], [11.0, 14.01], [15.0, 15.7], [18.0, 20.55], [22.0, 22.82], [24.0, 30.65], [39.0, 41.5], [42.0, 43.43], [45.0, 46.74], [49.0, 52.22], [54.0, 62.53], [63.0, 68.76], [69.0, 80.13], [81.0, 83.81], [85.0, 86.31], [87.0, 92.52], [99.0, 102.59], [113.0, 114.74], [115.0, 114.88], [118.0, 117.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.7, 0.0, 99.71, 0.0, 76.53, 46.54, 0.0, 0.0, 48.91, 89.36, 99.97, 49.78, 33.45, 0.0, 36.63, 31.74, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 69.62], ["sidetone", 3.25], ["animal", 2.54]], null, null, null, null, [["music", 32.27], ["mains hum", 23.73], ["speech", 15.45]], null, null, [["music", 60.0], ["hum", 4.7], ["theremin", 3.91]], null, null, [["music", 47.95], ["gong", 22.64], ["hum", 7.27]], [["music", 18.16], ["speech", 14.99], ["hum", 13.05]], null, [["speech", 33.57], ["gong", 13.24], ["music", 11.73]], [["speech", 26.65], ["music", 22.35], ["throbbing", 7.12]], null, null, null], "duration": [0.83, 0.78, 0.32, 3.01, 0.7, 2.55, 0.82, 6.65, 2.5, 1.43, 1.74, 3.22, 8.53, 5.76, 11.13, 2.81, 1.31, 5.52, 3.59, 1.74, -0.12, -0.29]} \ No newline at end of file diff --git a/annotations_filtered/ojgy7kyNp5g_filtered.json b/annotations_filtered/ojgy7kyNp5g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..467f160f7cd24f871fcf8fa91bb72a0daa248f99 --- /dev/null +++ b/annotations_filtered/ojgy7kyNp5g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.45], [9.0, 11.04], [16.0, 16.85], [18.0, 18.3], [19.0, 19.35], [20.0, 20.29], [21.0, 22.49], [25.0, 29.66], [30.0, 46.57], [52.0, 55.65], [58.0, 59.37], [61.0, 67.34], [70.0, 71.64], [75.0, 76.89], [79.0, 81.92], [83.0, 84.64], [90.0, 91.03], [95.0, 98.37], [102.0, 103.77], [105.0, 105.68], [107.0, 112.21], [112.0, 118.42], [120.0, 121.37]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [35.96, 48.19, 0.0, 0.0, 0.0, 0.0, 0.0, 64.18, 43.45, 75.23, 0.0, 51.55, 0.0, 0.0, 56.63, 0.0, 0.0, 67.89, 0.0, 0.0, 30.03, 35.96, 0.0], "audiomae_on_audioset": [[["music", 57.35], ["musical instrument", 6.67], ["synthesizer", 6.16]], [["speech", 25.54], ["music", 22.75], ["whale vocalization", 9.84]], null, null, null, null, null, null, [["music", 49.43], ["hum", 11.3], ["musical instrument", 4.96]], null, null, null, null, null, null, null, null, null, null, null, [["animal", 39.36], ["speech", 28.72], ["roar", 16.9]], [["speech", 33.26], ["hum", 13.79], ["mains hum", 8.63]], null], "duration": [6.45, 2.04, 0.85, 0.3, 0.35, 0.29, 1.49, 4.66, 16.57, 3.65, 1.37, 6.34, 1.64, 1.89, 2.92, 1.64, 1.03, 3.37, 1.77, 0.68, 5.21, 6.42, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/ojiHA64n6iw_filtered.json b/annotations_filtered/ojiHA64n6iw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2f33fac25cd1a3a5fcf5b44cde3011b21f40bb3 --- /dev/null +++ b/annotations_filtered/ojiHA64n6iw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.38], [3.0, 3.08], [3.0, 3.97], [17.0, 18.3], [23.0, 23.4], [25.0, 25.07], [33.0, 33.22], [34.0, 35.43], [43.0, 44.14], [46.0, 47.11], [50.0, 50.87], [54.0, 55.43], [56.0, 57.54], [59.0, 60.22], [64.0, 64.83], [68.0, 71.79], [80.0, 81.38], [83.0, 83.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.08, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.74], ["theremin", 19.43], ["didgeridoo", 14.58]], null, null], "duration": [0.38, 0.08, 0.97, 1.3, 0.4, 0.07, 0.22, 1.43, 1.14, 1.11, 0.87, 1.43, 1.54, 1.22, 0.83, 3.79, 1.38, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/ojoC-Kbzpo8_filtered.json b/annotations_filtered/ojoC-Kbzpo8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcb33f494af3af5e3cf55acbbef7646ebaf10242 --- /dev/null +++ b/annotations_filtered/ojoC-Kbzpo8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 24.66], [28.0, 27.94], [28.0, 33.12], [33.0, 33.44], [37.0, 38.28], [44.0, 44.49], [79.0, 80.25], [80.0, 81.65], [122.0, 131.72], [133.0, 140.71], [142.0, 157.96], [159.0, 160.61]], "keep_status": [true, false, true, false, false, false, false, false, true, true, true, false], "silence_prob": [37.46, 0.0, 34.82, 0.0, 0.0, 0.0, 0.0, 0.0, 29.42, 30.46, 28.61, 0.0], "audiomae_on_audioset": [[["music", 25.12], ["didgeridoo", 15.09], ["chorus effect", 5.89]], null, [["chant", 16.53], ["music", 14.88], ["didgeridoo", 12.05]], null, null, null, null, null, [["livestock, farm animals, working animals", 17.91], ["music", 12.03], ["cowbell", 8.22]], [["speech", 12.09], ["whack, thwack", 9.57], ["burst, pop", 8.42]], [["livestock, farm animals, working animals", 18.53], ["cattle, bovinae", 14.13], ["moo", 6.23]], null], "duration": [5.66, -0.06, 5.12, 0.44, 1.28, 0.49, 1.25, 1.65, 9.72, 7.71, 15.96, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/ojydQ3_FDqI_filtered.json b/annotations_filtered/ojydQ3_FDqI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..079845d8e55b21ecc42d025e5dcf768f23611503 --- /dev/null +++ b/annotations_filtered/ojydQ3_FDqI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 26.42], [28.0, 28.39], [30.0, 44.49], [47.0, 47.93], [51.0, 67.42], [69.0, 87.89], [91.0, 103.42], [107.0, 121.15], [123.0, 124.93], [126.0, 130.25]], "keep_status": [true, false, false, false, false, true, false, true, false, false], "silence_prob": [30.92, 0.0, 30.25, 0.0, 50.16, 48.06, 31.51, 34.41, 0.0, 51.94], "audiomae_on_audioset": [[["music", 40.14], ["wind instrument, woodwind instrument", 7.81], ["theremin", 6.82]], null, [["music", 46.21], ["theremin", 35.65], ["musical instrument", 4.84]], null, null, [["music", 22.06], ["theremin", 10.71], ["mains hum", 6.76]], [["music", 51.49], ["theremin", 23.95], ["musical instrument", 10.24]], [["music", 37.27], ["hum", 17.98], ["mains hum", 8.11]], null, null], "duration": [9.42, 0.39, 14.49, 0.93, 16.42, 18.89, 12.42, 14.15, 1.93, 4.25]} \ No newline at end of file diff --git a/annotations_filtered/ok6H1OFTmyA_filtered.json b/annotations_filtered/ok6H1OFTmyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7474fe6e7680c39f0a375ae3e6329f1a98f330c --- /dev/null +++ b/annotations_filtered/ok6H1OFTmyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.97], [3.0, 3.75], [4.0, 5.81], [9.0, 10.76], [12.0, 13.69], [14.0, 17.02], [18.0, 21.63], [22.0, 23.25], [25.0, 26.69], [29.0, 28.76], [30.0, 31.13], [32.0, 33.66], [35.0, 45.33], [46.0, 47.97], [50.0, 49.92], [52.0, 53.0], [54.0, 56.93], [58.0, 60.37], [61.0, 63.42], [64.0, 67.37], [68.0, 71.24], [72.0, 72.82], [74.0, 74.82], [75.0, 76.47], [78.0, 80.01], [80.0, 82.61], [83.0, 84.21], [86.0, 86.73], [88.0, 88.43], [90.0, 90.34], [91.0, 91.91], [94.0, 95.01], [96.0, 110.91], [113.0, 118.64], [120.0, 123.55], [125.0, 125.44], [126.0, 128.28], [129.0, 133.32], [134.0, 135.84], [137.0, 140.17], [142.0, 142.48], [144.0, 149.25], [151.0, 156.37], [157.0, 160.49], [162.0, 167.24], [168.0, 180.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 60.6, 72.75, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0, 90.43, 88.64, 75.88, 99.73, 84.98, 0.0, 0.0, 0.0, 97.43, 54.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 95.64, 93.91, 0.0, 80.29, 78.38, 0.0, 92.15, 0.0, 93.29, 87.92, 90.95, 89.54, 52.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.03, 0.75, 1.81, 1.76, 1.69, 3.02, 3.63, 1.25, 1.69, -0.24, 1.13, 1.66, 10.33, 1.97, -0.08, 1.0, 2.93, 2.37, 2.42, 3.37, 3.24, 0.82, 0.82, 1.47, 2.01, 2.61, 1.21, 0.73, 0.43, 0.34, 0.91, 1.01, 14.91, 5.64, 3.55, 0.44, 2.28, 4.32, 1.84, 3.17, 0.48, 5.25, 5.37, 3.49, 5.24, 12.23]} \ No newline at end of file diff --git a/annotations_filtered/ok_8VGksYow_filtered.json b/annotations_filtered/ok_8VGksYow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1445ad2e6b588979f6cbcc545c9827a8aa350092 --- /dev/null +++ b/annotations_filtered/ok_8VGksYow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.69], [15.0, 17.83], [18.0, 20.46], [22.0, 23.4], [24.0, 30.79], [32.0, 34.2], [35.0, 38.38], [40.0, 50.09], [51.0, 51.95], [55.0, 56.32], [58.0, 59.98], [63.0, 64.22], [68.0, 70.12], [71.0, 73.04], [74.0, 74.93], [75.0, 77.97], [81.0, 81.8], [83.0, 84.23]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 81.53, 32.79, 0.0, 57.01, 96.42, 76.37, 97.33, 0.0, 0.0, 0.0, 0.0, 87.37, 34.12, 0.0, 59.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 35.93], ["hum", 20.45], ["sidetone", 7.9]], null, null, null, null, null, null, null, null, null, null, [["speech", 51.49], ["music", 5.41], ["chirp tone", 2.84]], null, null, null, null], "duration": [-0.31, 2.83, 2.46, 1.4, 6.79, 2.2, 3.38, 10.09, 0.95, 1.32, 1.98, 1.22, 2.12, 2.04, 0.93, 2.97, 0.8, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/olTfms7kJIk_filtered.json b/annotations_filtered/olTfms7kJIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66c7e14153bf120c38051a960d8d81a3be2d85a1 --- /dev/null +++ b/annotations_filtered/olTfms7kJIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.03], [16.0, 18.96], [22.0, 33.61], [34.0, 50.73], [53.0, 61.59], [64.0, 64.69], [65.0, 68.59]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [0.0, 44.96, 52.74, 50.21, 53.97, 0.0, 89.36], "audiomae_on_audioset": [null, [["music", 21.27], ["speech", 12.14], ["wind instrument, woodwind instrument", 9.2]], null, null, null, null, null], "duration": [1.03, 2.96, 11.61, 16.73, 8.59, 0.69, 3.59]} \ No newline at end of file diff --git a/annotations_filtered/olxqe0CQ7W0_filtered.json b/annotations_filtered/olxqe0CQ7W0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f622a4a2e88ff481a9fcbf4f70622ec6d4c0018 --- /dev/null +++ b/annotations_filtered/olxqe0CQ7W0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 18.91], [22.0, 21.79], [24.0, 25.73], [27.0, 30.35], [32.0, 33.27], [35.0, 35.4], [37.0, 37.2], [44.0, 45.4], [48.0, 51.21], [52.0, 53.62], [56.0, 56.46], [58.0, 60.52], [61.0, 62.07], [62.0, 74.78], [76.0, 76.92], [77.0, 77.43], [78.0, 79.79], [81.0, 82.05], [84.0, 85.28], [88.0, 89.5], [91.0, 91.61], [94.0, 95.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.3, 0.0, 0.0, 39.28, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 60.42, 0.0, 47.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 68.58], ["musical instrument", 6.18], ["guitar", 5.32]], null, null, [["knock", 61.16], ["music", 7.16], ["hammer", 7.14]], null, null, null, null, null, null, null, null, null, [["music", 62.19], ["musical instrument", 8.97], ["pizzicato", 2.81]], null, null, null, null, null, null, null, null], "duration": [16.91, -0.21, 1.73, 3.35, 1.27, 0.4, 0.2, 1.4, 3.21, 1.62, 0.46, 2.52, 1.07, 12.78, 0.92, 0.43, 1.79, 1.05, 1.28, 1.5, 0.61, 1.89]} \ No newline at end of file diff --git a/annotations_filtered/omiio7SJIOE_filtered.json b/annotations_filtered/omiio7SJIOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52ad210ff64849fa8e3e0f146816fa356ae2f192 --- /dev/null +++ b/annotations_filtered/omiio7SJIOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 45.0], [47.0, 47.66], [50.0, 52.81], [54.0, 56.67], [57.0, 61.84], [69.0, 70.73], [78.0, 78.06], [79.0, 80.6], [85.0, 85.55], [87.0, 92.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.01, 0.0, 86.82, 96.04, 86.09, 0.0, 0.0, 0.0, 0.0, 52.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [2.0, 0.66, 2.81, 2.67, 4.84, 1.73, 0.06, 1.6, 0.55, 5.75]} \ No newline at end of file diff --git a/annotations_filtered/omy5TVA-fY0_filtered.json b/annotations_filtered/omy5TVA-fY0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c18c2c12b82ca6df2e65843e76ef4f1907358d0f --- /dev/null +++ b/annotations_filtered/omy5TVA-fY0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 29.39], [32.0, 42.96], [45.0, 75.71], [76.0, 109.14], [112.0, 113.41], [114.0, 117.95], [120.0, 127.26], [128.0, 128.26], [129.0, 129.74], [130.0, 131.58], [132.0, 149.13]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [39.07, 41.95, 0.0, 0.0, 0.0, 34.81, 34.78, 0.0, 0.0, 0.0, 30.16], "audiomae_on_audioset": [[["music", 76.35], ["ambient music", 4.0], ["synthesizer", 3.21]], [["music", 30.29], ["mosquito", 11.15], ["fly, housefly", 8.76]], null, null, null, [["music", 15.62], ["explosion", 9.6], ["speech", 9.24]], [["speech", 42.67], ["explosion", 26.49], ["fart", 12.75]], null, null, null, [["music", 57.74], ["throbbing", 8.19], ["cacophony", 8.05]]], "duration": [18.39, 10.96, 30.71, 33.14, 1.41, 3.95, 7.26, 0.26, 0.74, 1.58, 17.13]} \ No newline at end of file diff --git a/annotations_filtered/onK1BeyHSZ4_filtered.json b/annotations_filtered/onK1BeyHSZ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d06f4886156de1f800a8cb6640a77dea411baf3b --- /dev/null +++ b/annotations_filtered/onK1BeyHSZ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.59], [10.0, 26.45], [33.0, 32.8]], "keep_status": [false, true, false], "silence_prob": [0.0, 30.37, 0.0], "audiomae_on_audioset": [null, [["music", 43.6], ["speech", 15.01], ["boing", 5.8]], null], "duration": [1.59, 16.45, -0.2]} \ No newline at end of file diff --git a/annotations_filtered/onNv1u-qdZY_filtered.json b/annotations_filtered/onNv1u-qdZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee84603cfe5e22d90e5bb43ecde041b2dbe72815 --- /dev/null +++ b/annotations_filtered/onNv1u-qdZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 18.4], [23.0, 23.75], [25.0, 24.97], [26.0, 30.33], [30.0, 31.89], [33.0, 34.64], [35.0, 35.43], [40.0, 45.79], [46.0, 48.24], [49.0, 53.4], [57.0, 57.72], [60.0, 62.48], [63.0, 66.61], [75.0, 75.93], [78.0, 84.23], [85.0, 91.15], [93.0, 94.1], [96.0, 143.92], [147.0, 149.54], [152.0, 154.5], [157.0, 158.23], [160.0, 160.08], [161.0, 172.07]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, true, false, false, false], "silence_prob": [29.86, 0.0, 0.0, 37.02, 0.0, 0.0, 0.0, 40.71, 59.15, 75.23, 0.0, 81.35, 32.62, 0.0, 29.28, 30.25, 0.0, 0.0, 35.88, 48.82, 0.0, 0.0, 35.68], "audiomae_on_audioset": [[["music", 37.49], ["didgeridoo", 11.0], ["buzz", 6.55]], null, null, [["mains hum", 20.89], ["sidetone", 19.54], ["hum", 12.91]], null, null, null, [["music", 62.24], ["speech", 14.66], ["didgeridoo", 4.18]], null, null, null, null, [["mosquito", 35.66], ["fly, housefly", 21.93], ["frog", 15.04]], null, [["music", 18.97], ["hum", 16.48], ["speech", 14.19]], [["speech", 20.86], ["fly, housefly", 11.4], ["mains hum", 10.81]], null, null, [["speech", 36.69], ["throbbing", 15.5], ["music", 12.99]], [["music", 18.23], ["coin (dropping)", 16.44], ["hum", 9.52]], null, null, [["hum", 38.45], ["mains hum", 18.41], ["speech", 14.19]]], "duration": [13.4, 0.75, -0.03, 4.33, 1.89, 1.64, 0.43, 5.79, 2.24, 4.4, 0.72, 2.48, 3.61, 0.93, 6.23, 6.15, 1.1, 47.92, 2.54, 2.5, 1.23, 0.08, 11.07]} \ No newline at end of file diff --git a/annotations_filtered/onO71_aItKA_filtered.json b/annotations_filtered/onO71_aItKA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b90978086008c97b04ee3deaea3c8dd4a50d6fa8 --- /dev/null +++ b/annotations_filtered/onO71_aItKA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.56], [8.0, 10.32], [13.0, 13.12], [15.0, 17.58], [18.0, 21.74], [22.0, 24.06], [25.0, 26.35], [27.0, 32.26], [36.0, 38.25], [40.0, 46.62], [47.0, 48.61], [50.0, 49.77], [52.0, 52.76], [54.0, 54.46], [55.0, 54.62], [55.0, 62.68], [64.0, 75.37], [76.0, 76.55], [79.0, 88.28], [89.0, 89.18], [90.0, 96.62], [108.0, 110.51], [112.0, 112.43], [115.0, 121.41], [122.0, 122.93], [124.0, 127.72], [130.0, 130.82], [131.0, 131.94], [138.0, 139.26], [140.0, 145.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 71.57, 0.0, 64.18, 51.12, 48.31, 0.0, 57.32, 75.07, 58.13, 0.0, 0.0, 0.0, 0.0, 0.0, 43.87, 48.74, 0.0, 43.58, 0.0, 32.56, 29.83, 0.0, 28.69, 0.0, 30.14, 0.0, 0.0, 0.0, 35.47], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 40.44], ["sidetone", 26.64], ["throbbing", 5.88]], null, null, null, null, null, null, null, null, null, [["frog", 54.35], ["music", 7.22], ["effects unit", 5.94]], [["hum", 18.88], ["animal", 17.01], ["speech", 10.9]], null, [["speech", 25.79], ["mains hum", 20.16], ["hum", 10.96]], null, [["speech", 65.83], ["didgeridoo", 9.55], ["music", 7.63]], [["speech", 76.81], ["music", 9.3], ["didgeridoo", 2.05]], null, [["gong", 41.24], ["hum", 13.59], ["mains hum", 6.95]], null, [["didgeridoo", 83.92], ["music", 6.06], ["musical instrument", 2.43]], null, null, null, [["music", 44.01], ["speech", 12.05], ["synthesizer", 6.83]]], "duration": [0.56, 2.32, 0.12, 2.58, 3.74, 2.06, 1.35, 5.26, 2.25, 6.62, 1.61, -0.23, 0.76, 0.46, -0.38, 7.68, 11.37, 0.55, 9.28, 0.18, 6.62, 2.51, 0.43, 6.41, 0.93, 3.72, 0.82, 0.94, 1.26, 5.76]} \ No newline at end of file diff --git a/annotations_filtered/onbiOVpX0_w_filtered.json b/annotations_filtered/onbiOVpX0_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f229ace6a933d02517d75f861e547d0f34bce01b --- /dev/null +++ b/annotations_filtered/onbiOVpX0_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 23.9], [28.0, 43.63], [44.0, 45.2], [47.0, 46.85], [48.0, 49.49], [51.0, 51.54], [54.0, 59.12], [62.0, 64.3], [72.0, 72.18], [73.0, 98.58], [99.0, 99.93], [102.0, 102.3], [104.0, 104.48]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 64.52, 0.0, 0.0, 0.0, 0.0, 34.29, 35.33, 0.0, 33.35, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["roaring cats (lions, tigers)", 19.62], ["whale vocalization", 16.99], ["music", 16.7]], [["music", 38.71], ["hum", 14.67], ["mains hum", 14.01]], null, [["music", 49.48], ["throbbing", 17.82], ["hum", 13.2]], null, null, null], "duration": [-0.1, 15.63, 1.2, -0.15, 1.49, 0.54, 5.12, 2.3, 0.18, 25.58, 0.93, 0.3, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/onesjJyXdFQ_filtered.json b/annotations_filtered/onesjJyXdFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbefb6828283a0ded696ce4f001fe0096b272ed9 --- /dev/null +++ b/annotations_filtered/onesjJyXdFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.6], [9.0, 10.34], [12.0, 13.47], [16.0, 18.18], [21.0, 22.54], [24.0, 25.44], [29.0, 29.24], [31.0, 32.02], [35.0, 36.78], [41.0, 40.83], [42.0, 42.77], [45.0, 45.74], [50.0, 50.52], [52.0, 52.89], [56.0, 56.74], [60.0, 62.55], [64.0, 65.16], [69.0, 69.77], [78.0, 78.29], [88.0, 92.31], [93.0, 94.96], [97.0, 98.31], [100.0, 101.44], [102.0, 103.17], [107.0, 110.13], [111.0, 113.39], [119.0, 118.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 92.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.6, 1.34, 1.47, 2.18, 1.54, 1.44, 0.24, 1.02, 1.78, -0.17, 0.77, 0.74, 0.52, 0.89, 0.74, 2.55, 1.16, 0.77, 0.29, 4.31, 1.96, 1.31, 1.44, 1.17, 3.13, 2.39, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/onxbHFyNqGw_filtered.json b/annotations_filtered/onxbHFyNqGw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a5faa9ed21c9c81ed73c40f8015f7de07a6859b --- /dev/null +++ b/annotations_filtered/onxbHFyNqGw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 36.44], [37.0, 38.6], [39.0, 40.14], [41.0, 42.16], [43.0, 53.96], [54.0, 54.03], [55.0, 58.14]], "keep_status": [true, false, false, false, true, false, true], "silence_prob": [33.43, 0.0, 0.0, 0.0, 29.55, 0.0, 30.5], "audiomae_on_audioset": [[["music", 39.29], ["didgeridoo", 16.8], ["theremin", 4.83]], null, null, null, [["speech", 22.87], ["music", 18.72], ["fart", 15.54]], null, [["moo", 27.47], ["cattle, bovinae", 27.14], ["livestock, farm animals, working animals", 11.43]]], "duration": [2.44, 1.6, 1.14, 1.16, 10.96, 0.03, 3.14]} \ No newline at end of file diff --git a/annotations_filtered/onyfp4uSmcY_filtered.json b/annotations_filtered/onyfp4uSmcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3781ffb51b4902128a1850004d356c56aab6e8e --- /dev/null +++ b/annotations_filtered/onyfp4uSmcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.58], [25.0, 26.86], [27.0, 29.37], [31.0, 31.02], [31.0, 32.22], [33.0, 32.71], [34.0, 34.23]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 34.33], ["music", 31.45], ["musical instrument", 6.17]], null, null, null, null], "duration": [0.58, 1.86, 2.37, 0.02, 1.22, -0.29, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/oo5SkNM3c1Y_filtered.json b/annotations_filtered/oo5SkNM3c1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0f5a11302e696669208cde9e7f6d8339fae97e6 --- /dev/null +++ b/annotations_filtered/oo5SkNM3c1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.75], [26.0, 26.92], [30.0, 31.24], [36.0, 39.39], [41.0, 43.39], [45.0, 45.27], [48.0, 49.17], [50.0, 52.54], [53.0, 55.36], [56.0, 56.76], [61.0, 60.93], [64.0, 66.48], [67.0, 67.53], [68.0, 68.96], [69.0, 71.34], [73.0, 74.22], [82.0, 82.92], [84.0, 84.75], [90.0, 105.0], [108.0, 109.38], [111.0, 111.01], [112.0, 112.43], [114.0, 120.5], [126.0, 126.93], [128.0, 129.39], [131.0, 132.11], [144.0, 144.49], [146.0, 147.16], [148.0, 152.76], [156.0, 156.56], [160.0, 160.74], [163.0, 163.58], [167.0, 168.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.76, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 60.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.75, 0.92, 1.24, 3.39, 2.39, 0.27, 1.17, 2.54, 2.36, 0.76, -0.07, 2.48, 0.53, 0.96, 2.34, 1.22, 0.92, 0.75, 15.0, 1.38, 0.01, 0.43, 6.5, 0.93, 1.39, 1.11, 0.49, 1.16, 4.76, 0.56, 0.74, 0.58, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/oo7VlD66ISM_filtered.json b/annotations_filtered/oo7VlD66ISM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c0a290516cf053cd25c6bb73130fbff6b126187 --- /dev/null +++ b/annotations_filtered/oo7VlD66ISM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.49], [9.0, 10.67], [21.0, 21.27], [28.0, 28.41], [33.0, 33.81], [37.0, 37.61], [43.0, 43.19], [82.0, 83.35], [92.0, 92.85]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.49, 1.67, 0.27, 0.41, 0.81, 0.61, 0.19, 1.35, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/ooS5gVdYgRQ_filtered.json b/annotations_filtered/ooS5gVdYgRQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bfb04bf5da2e32ee8d56c90ef0126800e9614b8 --- /dev/null +++ b/annotations_filtered/ooS5gVdYgRQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[64.0, 66.63], [77.0, 78.39], [85.0, 84.79], [88.0, 88.55], [93.0, 93.31]], "keep_status": [true, false, false, false, false], "silence_prob": [29.19, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 37.07], ["explosion", 10.52], ["music", 4.63]], null, null, null, null], "duration": [2.63, 1.39, -0.21, 0.55, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/ooiimi7zkoE_filtered.json b/annotations_filtered/ooiimi7zkoE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bce3dafc13a8c990d6af687966dbb6ec76366e7 --- /dev/null +++ b/annotations_filtered/ooiimi7zkoE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 25.37], [25.0, 25.51], [26.0, 25.56], [26.0, 25.73], [27.0, 33.51], [34.0, 36.31], [39.0, 39.8], [42.0, 46.77], [47.0, 50.41], [52.0, 76.5], [79.0, 112.78], [114.0, 115.8], [121.0, 121.51], [123.0, 126.59], [128.0, 131.58], [133.0, 133.47], [136.0, 136.38], [137.0, 146.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [99.97, 0.0, 0.0, 0.0, 99.95, 99.87, 0.0, 90.25, 99.87, 99.95, 0.0, 0.0, 0.0, 60.7, 37.02, 0.0, 0.0, 32.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.39], ["electronic music", 5.81], ["hum", 5.37]], null, null, [["mains hum", 53.94], ["hum", 24.37], ["electric shaver, electric razor", 4.44]]], "duration": [5.37, 0.51, -0.44, -0.27, 6.51, 2.31, 0.8, 4.77, 3.41, 24.5, 33.78, 1.8, 0.51, 3.59, 3.58, 0.47, 0.38, 9.57]} \ No newline at end of file diff --git a/annotations_filtered/oow41RrqpHE_filtered.json b/annotations_filtered/oow41RrqpHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bfc47ff29e21ac6a0d662269fc94afbc4365cef --- /dev/null +++ b/annotations_filtered/oow41RrqpHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.26], [2.0, 4.23], [5.0, 7.52], [8.0, 12.29], [13.0, 27.63]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 43.1, 89.36, 66.27, 86.09], "audiomae_on_audioset": [null, [["speech", 70.12], ["telephone", 12.2], ["sidetone", 5.26]], null, null, null], "duration": [0.26, 2.23, 2.52, 4.29, 14.63]} \ No newline at end of file diff --git a/annotations_filtered/oowcsynjIwc_filtered.json b/annotations_filtered/oowcsynjIwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09688cb8b6f172cee7bb9c70b64cf8c377ee99ae --- /dev/null +++ b/annotations_filtered/oowcsynjIwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.6], [12.0, 14.35], [16.0, 16.65], [18.0, 21.81], [23.0, 25.07], [27.0, 31.06], [32.0, 34.42], [35.0, 36.04], [40.0, 76.74], [77.0, 114.71], [115.0, 115.37], [116.0, 117.21], [118.0, 119.01], [119.0, 121.02], [122.0, 122.77], [123.0, 123.4], [124.0, 133.35], [143.0, 143.85], [144.0, 146.5], [148.0, 148.85], [150.0, 150.06], [151.0, 151.02], [152.0, 152.17], [153.0, 153.45], [157.0, 159.26], [161.0, 163.24], [165.0, 165.43], [166.0, 166.62], [170.0, 170.23], [172.0, 173.45], [176.0, 177.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [89.36, 93.91, 0.0, 92.8, 90.43, 89.9, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.84, 0.0, 0.0, 30.55, 0.0, 35.4, 0.0, 0.0, 0.0, 0.0, 0.0, 40.81, 41.05, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.52], ["music", 15.17], ["didgeridoo", 9.17]], null, null, [["speech", 70.58], ["radio", 2.44], ["horse", 2.15]], null, [["fly, housefly", 33.27], ["insect", 22.1], ["frog", 12.39]], null, null, null, null, null, [["fly, housefly", 46.88], ["insect", 22.12], ["bee, wasp, etc.", 13.08]], [["fly, housefly", 33.96], ["insect", 14.61], ["bee, wasp, etc.", 14.21]], null, null, null, null, null], "duration": [4.6, 2.35, 0.65, 3.81, 2.07, 4.06, 2.42, 1.04, 36.74, 37.71, 0.37, 1.21, 1.01, 2.02, 0.77, 0.4, 9.35, 0.85, 2.5, 0.85, 0.06, 0.02, 0.17, 0.45, 2.26, 2.24, 0.43, 0.62, 0.23, 1.45, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/oozQe2Bk2cA_filtered.json b/annotations_filtered/oozQe2Bk2cA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/oozQe2Bk2cA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/op6H61wRi-Y_filtered.json b/annotations_filtered/op6H61wRi-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01afa2775f0039d1f4004041b4f346c64ad7aeb0 --- /dev/null +++ b/annotations_filtered/op6H61wRi-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.06], [16.0, 18.4], [19.0, 19.84], [26.0, 26.47], [28.0, 28.68], [32.0, 32.0], [32.0, 32.07], [33.0, 33.32], [34.0, 34.23], [35.0, 43.5], [47.0, 58.85], [69.0, 70.38], [71.0, 75.78], [77.0, 77.67], [80.0, 81.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [42.67, 38.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.48, 37.76, 0.0, 39.67, 0.0, 0.0], "audiomae_on_audioset": [[["sidetone", 33.64], ["speech", 33.59], ["music", 4.82]], [["chirp tone", 44.1], ["sine wave", 21.53], ["speech", 15.35]], null, null, null, null, null, null, null, [["speech", 68.96], ["music", 22.12], ["electric shaver, electric razor", 0.86]], [["music", 54.87], ["speech", 25.55], ["musical instrument", 3.6]], null, [["music", 37.63], ["speech", 21.11], ["didgeridoo", 4.61]], null, null], "duration": [4.06, 2.4, 0.84, 0.47, 0.68, 0.0, 0.07, 0.32, 0.23, 8.5, 11.85, 1.38, 4.78, 0.67, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/opCf3mp24dE_filtered.json b/annotations_filtered/opCf3mp24dE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc3236a775c8eb8c3ee37d077e4b0d934a633a72 --- /dev/null +++ b/annotations_filtered/opCf3mp24dE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.6], [15.0, 16.7], [17.0, 19.52], [20.0, 21.79], [23.0, 23.99], [29.0, 30.13], [32.0, 33.96], [35.0, 36.51], [38.0, 38.06], [39.0, 38.89], [44.0, 44.02], [49.0, 50.36], [53.0, 53.28], [55.0, 56.59], [62.0, 64.4], [66.0, 72.71], [80.0, 81.58], [84.0, 85.35], [86.0, 93.97], [97.0, 97.36], [99.0, 99.18], [100.0, 100.16], [102.0, 102.81], [104.0, 104.95], [110.0, 111.06], [111.0, 112.08], [115.0, 114.99], [119.0, 120.02], [122.0, 124.17], [125.0, 126.08], [129.0, 130.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.41, 69.88, 0.0, 0.0, 39.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.87], ["synthesizer", 8.97], ["speech", 5.85]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.6, 1.7, 2.52, 1.79, 0.99, 1.13, 1.96, 1.51, 0.06, -0.11, 0.02, 1.36, 0.28, 1.59, 2.4, 6.71, 1.58, 1.35, 7.97, 0.36, 0.18, 0.16, 0.81, 0.95, 1.06, 1.08, -0.01, 1.02, 2.17, 1.08, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/opSAGkaqx6Y_filtered.json b/annotations_filtered/opSAGkaqx6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7a5b6d283a203d11d99ca48757c2a8177bd1d2e --- /dev/null +++ b/annotations_filtered/opSAGkaqx6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.8], [22.0, 44.76], [46.0, 74.01], [82.0, 81.85], [87.0, 87.42], [98.0, 98.86], [104.0, 103.81], [105.0, 105.61], [110.0, 110.35], [110.0, 111.5], [119.0, 119.25], [124.0, 124.09], [125.0, 126.52], [128.0, 128.16], [129.0, 130.17], [131.0, 130.98], [135.0, 135.87], [138.0, 138.33], [139.0, 140.22], [147.0, 150.9], [153.0, 153.17], [154.0, 155.17], [165.0, 165.3], [174.0, 173.8], [174.0, 175.17], [180.0, 180.5]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.39, 29.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 49.4], ["sine wave", 7.71], ["singing bowl", 6.0]], [["music", 11.45], ["whack, thwack", 8.12], ["hum", 6.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 66.87], ["synthesizer", 4.21], ["hum", 3.08]], null, null, null, null, null, null], "duration": [1.8, 22.76, 28.01, -0.15, 0.42, 0.86, -0.19, 0.61, 0.35, 1.5, 0.25, 0.09, 1.52, 0.16, 1.17, -0.02, 0.87, 0.33, 1.22, 3.9, 0.17, 1.17, 0.3, -0.2, 1.17, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/opWPxmr2h2s_filtered.json b/annotations_filtered/opWPxmr2h2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e299f34773867ae066cbe53ff0d00a9fefc748a --- /dev/null +++ b/annotations_filtered/opWPxmr2h2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.5], [11.0, 12.34], [18.0, 18.49], [20.0, 26.76], [29.0, 29.49], [30.0, 30.54], [38.0, 37.99], [59.0, 59.12], [75.0, 76.96], [78.0, 80.55], [83.0, 85.06], [87.0, 88.23], [89.0, 89.31], [92.0, 93.45], [94.0, 94.63], [96.0, 95.94], [99.0, 99.35], [100.0, 101.11], [108.0, 108.3], [109.0, 109.58], [110.0, 110.62], [111.0, 111.84], [113.0, 116.07], [118.0, 120.24], [122.0, 123.33], [125.0, 126.91], [132.0, 133.66], [137.0, 139.62], [143.0, 144.68]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.04, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 76.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.29, 76.37, 0.0, 0.0, 0.0, 74.6, 0.0], "audiomae_on_audioset": [null, null, null, [["fart", 20.19], ["groan", 16.38], ["grunt", 10.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.34, 0.49, 6.76, 0.49, 0.54, -0.01, 0.12, 1.96, 2.55, 2.06, 1.23, 0.31, 1.45, 0.63, -0.06, 0.35, 1.11, 0.3, 0.58, 0.62, 0.84, 3.07, 2.24, 1.33, 1.91, 1.66, 2.62, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/opXI29YEI5s_filtered.json b/annotations_filtered/opXI29YEI5s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1985eedc2d051eadc880c3be88a4b65981c0c40 --- /dev/null +++ b/annotations_filtered/opXI29YEI5s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.95], [15.0, 15.43], [29.0, 29.62], [33.0, 34.86], [38.0, 37.89], [38.0, 39.09], [40.0, 41.74], [46.0, 46.5], [51.0, 51.73], [54.0, 54.4], [55.0, 102.79], [115.0, 116.36], [119.0, 118.86], [119.0, 165.21], [166.0, 171.39], [172.0, 173.37], [174.0, 182.97], [187.0, 187.1], [193.0, 195.18], [197.0, 198.53], [207.0, 210.07], [211.0, 212.6], [213.0, 215.16], [216.0, 216.68], [221.0, 221.88], [223.0, 223.42], [225.0, 225.9], [231.0, 232.02], [233.0, 233.78], [235.0, 235.01]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.23, 0.0, 39.66, 0.0, 65.67, 0.0, 55.67, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 39.45], ["music", 22.56], ["hum", 6.17]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["vehicle", 21.74], ["car", 11.24], ["buzz", 7.51]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.95, 0.43, 0.62, 1.86, -0.11, 1.09, 1.74, 0.5, 0.73, 0.4, 47.79, 1.36, -0.14, 46.21, 5.39, 1.37, 8.97, 0.1, 2.18, 1.53, 3.07, 1.6, 2.16, 0.68, 0.88, 0.42, 0.9, 1.02, 0.78, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/opoVbcNO48o_filtered.json b/annotations_filtered/opoVbcNO48o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad13411ae9d7df5a7a2264259b18f5c5f0808c6e --- /dev/null +++ b/annotations_filtered/opoVbcNO48o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 26.64], [30.0, 61.08], [62.0, 77.97], [79.0, 87.45], [96.0, 99.94], [101.0, 103.55], [112.0, 118.25]], "keep_status": [true, false, false, true, false, true, false], "silence_prob": [30.8, 0.0, 29.91, 28.32, 29.32, 29.99, 29.66], "audiomae_on_audioset": [[["music", 42.98], ["shofar", 8.96], ["trombone", 3.02]], null, [["music", 85.76], ["speech", 3.11], ["didgeridoo", 1.24]], [["music", 41.22], ["theremin", 13.92], ["whale vocalization", 11.29]], [["music", 56.88], ["theremin", 15.14], ["didgeridoo", 6.8]], [["music", 39.32], ["speech", 20.52], ["foghorn", 7.2]], [["music", 63.37], ["didgeridoo", 5.22], ["theremin", 4.84]]], "duration": [10.64, 31.08, 15.97, 8.45, 3.94, 2.55, 6.25]} \ No newline at end of file diff --git a/annotations_filtered/opseGWIdLd4_filtered.json b/annotations_filtered/opseGWIdLd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd47c5f722fd6ffb0acba11c84c4eb6f02d52166 --- /dev/null +++ b/annotations_filtered/opseGWIdLd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.94], [13.0, 18.3], [19.0, 162.73]], "keep_status": [false, false, false], "silence_prob": [69.07, 40.17, 0.0], "audiomae_on_audioset": [null, [["music", 55.49], ["theremin", 10.49], ["musical instrument", 6.81]], null], "duration": [2.94, 5.3, 143.73]} \ No newline at end of file diff --git a/annotations_filtered/opt5yQqMIdc_filtered.json b/annotations_filtered/opt5yQqMIdc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ed93a355e22775d8134592747b6112db00f11ca --- /dev/null +++ b/annotations_filtered/opt5yQqMIdc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [15.0, 16.61], [24.0, 24.11], [24.0, 30.28], [35.0, 35.8], [37.0, 39.97], [42.0, 46.94], [58.0, 61.33], [62.0, 62.48], [65.0, 103.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.46, 0.0, 44.87, 48.56, 66.63, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 73.6], ["boing", 7.45], ["speech", 6.74]], null, [["music", 55.47], ["didgeridoo", 10.74], ["speech", 6.27]], [["music", 51.43], ["speech", 24.46], ["musical instrument", 3.16]], null, null, null], "duration": [0.44, 1.61, 0.11, 6.28, 0.8, 2.97, 4.94, 3.33, 0.48, 38.01]} \ No newline at end of file diff --git a/annotations_filtered/optHzRmqdFk_filtered.json b/annotations_filtered/optHzRmqdFk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..587c01fc29b82ea697013602d041d285fb34c017 --- /dev/null +++ b/annotations_filtered/optHzRmqdFk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.83], [12.0, 20.09], [23.0, 24.04], [30.0, 31.7], [33.0, 35.85], [40.0, 41.71], [44.0, 45.32], [47.0, 47.33], [50.0, 55.81], [57.0, 63.42], [65.0, 71.09], [72.0, 74.66], [77.0, 80.77], [81.0, 84.06], [85.0, 88.32], [91.0, 93.63], [95.0, 95.49], [96.0, 98.95], [99.0, 101.95], [103.0, 106.14], [114.0, 116.56], [118.0, 118.89], [119.0, 121.49], [122.0, 123.58], [125.0, 126.98], [129.0, 132.06], [135.0, 135.58], [137.0, 141.49], [142.0, 146.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [61.37, 73.51, 0.0, 0.0, 59.77, 0.0, 0.0, 0.0, 50.31, 62.17, 86.82, 43.35, 87.55, 43.82, 92.15, 91.98, 0.0, 49.18, 45.59, 74.6, 90.08, 0.0, 33.79, 0.0, 0.0, 73.82, 0.0, 40.7, 50.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 63.98], ["hum", 7.98], ["sidetone", 5.47]], null, [["speech", 62.02], ["sidetone", 7.73], ["hum", 5.78]], null, null, null, [["speech", 80.77], ["radio", 5.26], ["sidetone", 4.44]], [["speech", 25.87], ["music", 13.51], ["hum", 3.18]], null, null, null, [["speech", 11.93], ["guitar", 11.79], ["music", 9.99]], null, null, null, null, [["hum", 50.48], ["throbbing", 13.83], ["mains hum", 12.45]], null], "duration": [7.83, 8.09, 1.04, 1.7, 2.85, 1.71, 1.32, 0.33, 5.81, 6.42, 6.09, 2.66, 3.77, 3.06, 3.32, 2.63, 0.49, 2.95, 2.95, 3.14, 2.56, 0.89, 2.49, 1.58, 1.98, 3.06, 0.58, 4.49, 4.62]} \ No newline at end of file diff --git a/annotations_filtered/opyh8AAgisI_filtered.json b/annotations_filtered/opyh8AAgisI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..479b3cccc8e407997a68ce7226232fc23d49d421 --- /dev/null +++ b/annotations_filtered/opyh8AAgisI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.02], [13.0, 16.06], [18.0, 24.81], [28.0, 33.12], [33.0, 35.61], [36.0, 37.29], [38.0, 38.3], [39.0, 48.0], [51.0, 52.49], [53.0, 57.89], [60.0, 62.77], [65.0, 68.94], [72.0, 75.68], [77.0, 77.8], [84.0, 84.1], [88.0, 94.9], [96.0, 97.71], [102.0, 102.74], [104.0, 105.21], [108.0, 112.16], [113.0, 115.97], [116.0, 120.77], [122.0, 126.23], [127.0, 134.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.47, 79.94, 87.0, 94.81, 96.54, 0.0, 0.0, 99.96, 0.0, 98.8, 100.0, 100.0, 100.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 94.66, 92.15, 76.7, 82.25, 87.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.02, 3.06, 6.81, 5.12, 2.61, 1.29, 0.3, 9.0, 1.49, 4.89, 2.77, 3.94, 3.68, 0.8, 0.1, 6.9, 1.71, 0.74, 1.21, 4.16, 2.97, 4.77, 4.23, 7.25]} \ No newline at end of file diff --git a/annotations_filtered/oqAu5fVDwAM_filtered.json b/annotations_filtered/oqAu5fVDwAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8400d9dd21619bd87960da8fb749985168321ba5 --- /dev/null +++ b/annotations_filtered/oqAu5fVDwAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.67], [10.0, 10.67], [11.0, 12.16], [14.0, 14.76], [16.0, 16.6], [17.0, 17.19], [18.0, 21.39], [24.0, 23.6], [24.0, 25.51], [26.0, 28.78], [29.0, 29.93], [31.0, 33.0], [34.0, 34.57], [38.0, 42.08], [46.0, 47.43], [50.0, 52.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [52.74, 0.0, 0.0, 0.0, 0.0, 0.0, 62.58, 0.0, 0.0, 55.39, 0.0, 58.98, 0.0, 32.35, 0.0, 30.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.74], ["speech", 23.24], ["sampler", 3.07]], null, [["speech", 52.9], ["music", 6.14], ["thunk", 4.95]]], "duration": [3.67, 0.67, 1.16, 0.76, 0.6, 0.19, 3.39, -0.4, 1.51, 2.78, 0.93, 2.0, 0.57, 4.08, 1.43, 2.44]} \ No newline at end of file diff --git a/annotations_filtered/oqBWx58n1Yk_filtered.json b/annotations_filtered/oqBWx58n1Yk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82d0e287770a30df12600b0bc9e8d056dfb7119f --- /dev/null +++ b/annotations_filtered/oqBWx58n1Yk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.58], [7.0, 7.01], [10.0, 10.02], [11.0, 11.64], [13.0, 14.2], [16.0, 16.21], [17.0, 18.28], [21.0, 21.78], [22.0, 22.6], [25.0, 26.27], [27.0, 27.45], [28.0, 29.08], [31.0, 41.69], [44.0, 52.84], [53.0, 90.56], [92.0, 101.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.24, 37.49, 0.0, 32.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.37], ["speech", 25.55], ["musical instrument", 3.94]], [["music", 57.56], ["harp", 8.54], ["musical instrument", 3.39]], null, [["music", 42.65], ["gong", 18.58], ["singing bowl", 7.13]]], "duration": [-0.42, 0.01, 0.02, 0.64, 1.2, 0.21, 1.28, 0.78, 0.6, 1.27, 0.45, 1.08, 10.69, 8.84, 37.56, 9.41]} \ No newline at end of file diff --git a/annotations_filtered/oqDlKpTihNo_filtered.json b/annotations_filtered/oqDlKpTihNo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..310fe7c72824f0b138583516d267aca0f8063eea --- /dev/null +++ b/annotations_filtered/oqDlKpTihNo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.3], [7.0, 7.11], [8.0, 9.58], [10.0, 10.44], [12.0, 12.41], [15.0, 16.24], [21.0, 21.54], [23.0, 27.08], [38.0, 45.12], [47.0, 48.52], [49.0, 50.14], [51.0, 52.29], [54.0, 55.63], [57.0, 57.11], [62.0, 62.21], [64.0, 65.23], [71.0, 73.31], [74.0, 75.19], [76.0, 76.82], [77.0, 78.87]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.49, 52.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 54.99], ["tuning fork", 9.52], ["dishes, pots, and pans", 4.0]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 0.11, 1.58, 0.44, 0.41, 1.24, 0.54, 4.08, 7.12, 1.52, 1.14, 1.29, 1.63, 0.11, 0.21, 1.23, 2.31, 1.19, 0.82, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/oqEm8mihoA4_filtered.json b/annotations_filtered/oqEm8mihoA4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..612285292cdf812b4be0373aa21436cfb97216de --- /dev/null +++ b/annotations_filtered/oqEm8mihoA4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [10.0, 11.23], [13.0, 12.93], [32.0, 33.49], [36.0, 36.83], [43.0, 43.93], [44.0, 46.99], [51.0, 54.14], [63.0, 63.29], [74.0, 75.24], [76.0, 77.04], [80.0, 81.78], [82.0, 83.15], [91.0, 91.57], [96.0, 97.09], [106.0, 105.92], [108.0, 109.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 50.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 1.23, -0.07, 1.49, 0.83, 0.93, 2.99, 3.14, 0.29, 1.24, 1.04, 1.78, 1.15, 0.57, 1.09, -0.08, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/oqGij9ylbAk_filtered.json b/annotations_filtered/oqGij9ylbAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ada8b4802b0bdefeabbf14d9a15662732db07b04 --- /dev/null +++ b/annotations_filtered/oqGij9ylbAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.12], [14.0, 24.8], [26.0, 92.2]], "keep_status": [false, true, false], "silence_prob": [0.0, 37.07, 0.0], "audiomae_on_audioset": [null, [["music", 30.01], ["speech", 19.85], ["hum", 9.1]], null], "duration": [0.12, 10.8, 66.2]} \ No newline at end of file diff --git a/annotations_filtered/oqKAuNefcSM_filtered.json b/annotations_filtered/oqKAuNefcSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98f21dd18104c40ca8a6a32bd2f32924cf02e1fb --- /dev/null +++ b/annotations_filtered/oqKAuNefcSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.55], [6.0, 7.6], [8.0, 12.73], [23.0, 23.94], [26.0, 27.3], [29.0, 29.2], [30.0, 31.4], [34.0, 34.65], [38.0, 38.13]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 77.32], ["boing", 3.52], ["frog", 2.95]], null, null, null, null, null, null], "duration": [0.55, 1.6, 4.73, 0.94, 1.3, 0.2, 1.4, 0.65, 0.13]} \ No newline at end of file diff --git a/annotations_filtered/oqQGFh5yiWE_filtered.json b/annotations_filtered/oqQGFh5yiWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6ba41dff5e6421a63c8ecb6671a22e7e7ace73e --- /dev/null +++ b/annotations_filtered/oqQGFh5yiWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.29], [3.0, 3.69], [9.0, 9.49], [12.0, 12.73], [14.0, 15.42], [20.0, 20.44], [24.0, 25.86], [27.0, 32.22], [35.0, 35.58], [36.0, 37.07], [38.0, 43.5], [45.0, 45.71], [48.0, 48.61], [54.0, 54.45], [62.0, 61.86], [70.0, 70.8], [77.0, 77.67], [81.0, 81.68], [82.0, 82.61], [85.0, 85.08], [92.0, 92.25], [97.0, 98.54], [106.0, 107.05], [113.0, 113.12], [116.0, 116.56], [122.0, 122.12], [126.0, 127.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 36.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 32.72], ["moo", 16.01], ["cattle, bovinae", 13.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 0.69, 0.49, 0.73, 1.42, 0.44, 1.86, 5.22, 0.58, 1.07, 5.5, 0.71, 0.61, 0.45, -0.14, 0.8, 0.67, 0.68, 0.61, 0.08, 0.25, 1.54, 1.05, 0.12, 0.56, 0.12, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/oqquLzHmH5k_filtered.json b/annotations_filtered/oqquLzHmH5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f2be9ee6f2ed3dadd73aefd5d6496a7a0ed3cbf --- /dev/null +++ b/annotations_filtered/oqquLzHmH5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.96], [4.0, 5.27], [6.0, 8.97], [11.0, 13.29], [14.0, 19.35], [22.0, 22.37], [23.0, 24.81], [25.0, 27.94], [31.0, 31.14], [37.0, 37.86], [39.0, 39.65], [40.0, 40.86], [43.0, 43.39], [45.0, 45.96], [48.0, 49.15], [54.0, 54.92], [57.0, 59.24], [63.0, 63.81], [70.0, 72.45], [81.0, 83.15], [87.0, 88.26], [90.0, 91.0], [95.0, 96.87], [100.0, 100.23], [102.0, 103.44], [105.0, 106.0], [108.0, 108.11], [110.0, 109.88], [110.0, 111.16], [113.0, 114.15], [115.0, 115.57], [117.0, 118.15], [120.0, 121.93], [128.0, 128.19], [130.0, 132.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 75.72, 99.93, 99.36, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 87.19, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.96, 1.27, 2.97, 2.29, 5.35, 0.37, 1.81, 2.94, 0.14, 0.86, 0.65, 0.86, 0.39, 0.96, 1.15, 0.92, 2.24, 0.81, 2.45, 2.15, 1.26, 1.0, 1.87, 0.23, 1.44, 1.0, 0.11, -0.12, 1.16, 1.15, 0.57, 1.15, 1.93, 0.19, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/oquM3yN0E4A_filtered.json b/annotations_filtered/oquM3yN0E4A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc0702d75ddd0d7ef2a0b1cc25e7bc98198b1cf6 --- /dev/null +++ b/annotations_filtered/oquM3yN0E4A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.85], [6.0, 6.1], [7.0, 8.06], [9.0, 9.51], [14.0, 15.72], [22.0, 23.6], [37.0, 37.42], [44.0, 45.6], [48.0, 48.0]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [60.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [3.85, 0.1, 1.06, 0.51, 1.72, 1.6, 0.42, 1.6, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/oqwzuiSy9y0_filtered.json b/annotations_filtered/oqwzuiSy9y0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf5edf0658fa0970b504b347eb31761705508891 --- /dev/null +++ b/annotations_filtered/oqwzuiSy9y0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.35], [6.0, 8.06], [12.0, 11.77], [15.0, 15.77], [18.0, 18.84], [20.0, 21.51], [26.0, 26.7], [29.0, 28.7], [29.0, 31.6], [34.0, 36.17], [39.0, 38.84], [42.0, 41.82], [43.0, 45.55], [51.0, 53.59], [74.0, 79.15], [86.0, 89.16], [92.0, 92.67], [95.0, 95.05], [101.0, 102.74], [105.0, 105.88], [107.0, 107.33]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 98.99, 0.0, 0.0, 94.52, 98.66, 75.88, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["cattle, bovinae", 22.31], ["moo", 20.29], ["music", 17.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.35, 2.06, -0.23, 0.77, 0.84, 1.51, 0.7, -0.3, 2.6, 2.17, -0.16, -0.18, 2.55, 2.59, 5.15, 3.16, 0.67, 0.05, 1.74, 0.88, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/or6rCLpiS10_filtered.json b/annotations_filtered/or6rCLpiS10_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..600ac9530b46f81ea7935c736c1493d7d8654ce5 --- /dev/null +++ b/annotations_filtered/or6rCLpiS10_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 103.59], [107.0, 122.89]], "keep_status": [false, true], "silence_prob": [0.0, 28.48], "audiomae_on_audioset": [null, [["speech", 54.45], ["music", 6.03], ["explosion", 4.75]]], "duration": [94.59, 15.89]} \ No newline at end of file diff --git a/annotations_filtered/orGDoXo7xKA_filtered.json b/annotations_filtered/orGDoXo7xKA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..568e8e1d4dbb4d0366c91ad50f5ba8915c29980b --- /dev/null +++ b/annotations_filtered/orGDoXo7xKA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.34], [6.0, 9.05], [12.0, 13.58], [14.0, 22.91], [25.0, 25.83], [27.0, 27.6], [29.0, 30.74], [32.0, 33.02], [33.0, 36.98], [38.0, 39.34], [41.0, 42.74], [46.0, 46.74], [47.0, 48.73], [50.0, 55.65], [58.0, 59.83], [63.0, 66.12], [68.0, 68.67], [69.0, 68.71], [69.0, 69.38], [71.0, 70.87], [73.0, 75.66], [78.0, 80.89], [86.0, 86.32], [91.0, 93.6], [94.0, 99.74]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, true, true], "silence_prob": [0.0, 36.67, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 49.73, 0.0, 39.93, 0.0, 0.0, 0.0, 0.0, 39.01, 31.83, 0.0, 33.92, 33.3], "audiomae_on_audioset": [null, [["sine wave", 27.53], ["speech", 20.71], ["sidetone", 18.76]], null, null, null, null, null, null, null, null, null, null, null, [["music", 49.01], ["hum", 13.69], ["throbbing", 10.7]], null, [["speech", 42.21], ["music", 17.92], ["didgeridoo", 4.46]], null, null, null, null, [["mains hum", 24.57], ["sidetone", 20.54], ["hum", 10.61]], [["music", 32.75], ["speech", 18.25], ["theremin", 10.38]], null, [["music", 55.17], ["speech", 6.58], ["theremin", 5.63]], [["music", 29.28], ["foghorn", 11.57], ["theremin", 7.82]]], "duration": [0.34, 3.05, 1.58, 8.91, 0.83, 0.6, 1.74, 1.02, 3.98, 1.34, 1.74, 0.74, 1.73, 5.65, 1.83, 3.12, 0.67, -0.29, 0.38, -0.13, 2.66, 2.89, 0.32, 2.6, 5.74]} \ No newline at end of file diff --git a/annotations_filtered/orgbJEoA7ak_filtered.json b/annotations_filtered/orgbJEoA7ak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..521cffefe5624b93b09a0a676b1b0137f60a6d11 --- /dev/null +++ b/annotations_filtered/orgbJEoA7ak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.38], [11.0, 30.16], [31.0, 43.61], [46.0, 84.92], [86.0, 86.48], [88.0, 96.87], [97.0, 118.02], [119.0, 143.73], [146.0, 148.54], [151.0, 169.3]], "keep_status": [false, true, false, false, false, true, true, true, true, true], "silence_prob": [0.0, 34.91, 33.23, 0.0, 0.0, 32.37, 32.09, 33.83, 38.75, 32.89], "audiomae_on_audioset": [null, [["hum", 27.54], ["throbbing", 14.26], ["speech", 12.48]], [["music", 49.99], ["buzz", 11.69], ["hum", 8.69]], null, null, [["speech", 28.6], ["vehicle", 14.65], ["hum", 9.37]], [["music", 34.96], ["hum", 16.29], ["mains hum", 13.81]], [["music", 28.28], ["whale vocalization", 27.6], ["vehicle", 2.85]], [["music", 42.1], ["theremin", 14.22], ["throbbing", 9.66]], [["music", 35.71], ["speech", 22.82], ["hum", 5.82]]], "duration": [1.38, 19.16, 12.61, 38.92, 0.48, 8.87, 21.02, 24.73, 2.54, 18.3]} \ No newline at end of file diff --git a/annotations_filtered/orhrsjDwamY_filtered.json b/annotations_filtered/orhrsjDwamY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..072f05effc25407f8153949f2fa7c3fda4e703ed --- /dev/null +++ b/annotations_filtered/orhrsjDwamY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 30.25], [33.0, 47.33], [48.0, 50.14], [52.0, 53.18], [55.0, 55.22], [58.0, 58.7], [62.0, 68.35], [69.0, 70.33], [71.0, 72.99], [74.0, 74.95], [76.0, 78.33], [79.0, 82.04], [83.0, 92.48], [93.0, 93.95], [96.0, 116.23], [119.0, 125.36], [127.0, 128.31]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [37.97, 33.97, 91.3, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0, 57.89, 60.42, 36.42, 0.0, 29.55, 29.58, 0.0], "audiomae_on_audioset": [[["music", 56.19], ["thump, thud", 8.19], ["clang", 7.05]], [["hum", 26.98], ["music", 19.86], ["throbbing", 5.98]], null, null, null, null, null, null, null, null, null, null, [["music", 34.76], ["hum", 12.04], ["electronic music", 6.93]], null, [["hum", 43.29], ["mains hum", 18.63], ["throbbing", 11.53]], [["buzz", 30.7], ["music", 19.19], ["hum", 9.56]], null], "duration": [9.25, 14.33, 2.14, 1.18, 0.22, 0.7, 6.35, 1.33, 1.99, 0.95, 2.33, 3.04, 9.48, 0.95, 20.23, 6.36, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/os1gnR5k3S8_filtered.json b/annotations_filtered/os1gnR5k3S8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbfb63060c4a88865aa109f3192e893427cbcdc2 --- /dev/null +++ b/annotations_filtered/os1gnR5k3S8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 6.12], [9.0, 14.32], [15.0, 15.7], [17.0, 17.96], [19.0, 20.26], [22.0, 22.52], [25.0, 25.89], [31.0, 33.29], [39.0, 41.35], [42.0, 47.38], [48.0, 51.6], [57.0, 57.81], [68.0, 68.37], [75.0, 82.61], [83.0, 85.35], [88.0, 88.28], [91.0, 91.44], [102.0, 102.51], [108.0, 109.12], [113.0, 113.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [70.86, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 94.81, 60.42, 0.0, 0.0, 39.83, 60.14, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.0], ["speech", 12.11], ["guitar", 3.77]], null, null, null, null, null, null], "duration": [6.12, 5.32, 0.7, 0.96, 1.26, 0.52, 0.89, 2.29, 2.35, 5.38, 3.6, 0.81, 0.37, 7.61, 2.35, 0.28, 0.44, 0.51, 1.12, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/os1x0te4Waw_filtered.json b/annotations_filtered/os1x0te4Waw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6715e309a819ee16522edf5c35dcae2ee360dc3 --- /dev/null +++ b/annotations_filtered/os1x0te4Waw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.31], [10.0, 13.46], [15.0, 18.28], [24.0, 24.58], [27.0, 28.29], [32.0, 32.76], [39.0, 41.0], [45.0, 45.82], [52.0, 52.81], [55.0, 54.85], [57.0, 58.09], [63.0, 64.13], [66.0, 66.33], [66.0, 67.73], [72.0, 73.63], [75.0, 77.73], [79.0, 80.87], [84.0, 85.89], [89.0, 96.2], [99.0, 99.52], [100.0, 104.18], [108.0, 124.6]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.73, 52.05, 53.28, 0.0, 0.0, 0.0, 58.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 68.28, 0.0, 65.67, 31.73], "audiomae_on_audioset": [[["fly, housefly", 11.35], ["insect", 10.03], ["speech", 9.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 51.42], ["speech", 31.15], ["music", 6.09]]], "duration": [2.31, 3.46, 3.28, 0.58, 1.29, 0.76, 2.0, 0.82, 0.81, -0.15, 1.09, 1.13, 0.33, 1.73, 1.63, 2.73, 1.87, 1.89, 7.2, 0.52, 4.18, 16.6]} \ No newline at end of file diff --git a/annotations_filtered/os7KKfG3QE0_filtered.json b/annotations_filtered/os7KKfG3QE0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dd8205c58bbd059ada1b74784e59556d5ecad2c --- /dev/null +++ b/annotations_filtered/os7KKfG3QE0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.11], [13.0, 13.69], [19.0, 20.16], [21.0, 21.54], [23.0, 23.31], [36.0, 39.51], [41.0, 41.67], [44.0, 44.17], [47.0, 51.58], [52.0, 51.61], [52.0, 51.68], [52.0, 51.71], [52.0, 51.75], [54.0, 54.6], [55.0, 55.49], [58.0, 57.72], [61.0, 61.28], [75.0, 75.19], [79.0, 80.94], [82.0, 89.55], [100.0, 100.55], [101.0, 101.9], [105.0, 106.0], [112.0, 112.68], [116.0, 116.04], [117.0, 118.4], [120.0, 119.62], [127.0, 128.12], [130.0, 130.89], [134.0, 134.42], [136.0, 136.24], [140.0, 140.46], [141.0, 143.36], [144.0, 144.69], [146.0, 146.7], [149.0, 149.03], [151.0, 151.14], [156.0, 156.57], [158.0, 165.86], [168.0, 169.86]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 41.32, 0.0, 0.0, 42.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.22, 0.0, 0.0, 0.0, 0.0, 0.0, 30.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 28.43], ["fart", 9.16], ["speech", 6.45]], null, null, [["hum", 21.3], ["music", 16.12], ["speech", 11.17]], null, null, null, null, null, null, null, null, null, null, [["music", 25.39], ["whale vocalization", 23.4], ["livestock, farm animals, working animals", 16.31]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.96], ["chirp tone", 8.45], ["music", 8.21]], null, null, null, null, null, [["speech", 30.26], ["livestock, farm animals, working animals", 27.53], ["cattle, bovinae", 7.97]], null], "duration": [1.11, 0.69, 1.16, 0.54, 0.31, 3.51, 0.67, 0.17, 4.58, -0.39, -0.32, -0.29, -0.25, 0.6, 0.49, -0.28, 0.28, 0.19, 1.94, 7.55, 0.55, 0.9, 1.0, 0.68, 0.04, 1.4, -0.38, 1.12, 0.89, 0.42, 0.24, 0.46, 2.36, 0.69, 0.7, 0.03, 0.14, 0.57, 7.86, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/osE84bZ1jNc_filtered.json b/annotations_filtered/osE84bZ1jNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cb37968f79266f810fa531a856c4da58fa9c8b6 --- /dev/null +++ b/annotations_filtered/osE84bZ1jNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [4.0, 4.75], [6.0, 10.62], [12.0, 13.09], [14.0, 14.67], [15.0, 16.19], [18.0, 19.97], [21.0, 24.0], [24.0, 27.04], [30.0, 30.89], [31.0, 32.44], [33.0, 34.79], [38.0, 38.3], [39.0, 40.04], [41.0, 45.17], [46.0, 47.78], [48.0, 48.69], [50.0, 81.35], [82.0, 84.32], [85.0, 90.78], [91.0, 94.83], [95.0, 95.66], [97.0, 97.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 84.98, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 34.04, 29.65, 30.45, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.43], ["theremin", 14.51], ["music", 10.76]], [["didgeridoo", 23.65], ["music", 16.8], ["foghorn", 13.28]], [["fart", 55.98], ["music", 8.6], ["speech", 6.21]], null, null], "duration": [0.57, 0.75, 4.62, 1.09, 0.67, 1.19, 1.97, 3.0, 3.04, 0.89, 1.44, 1.79, 0.3, 1.04, 4.17, 1.78, 0.69, 31.35, 2.32, 5.78, 3.83, 0.66, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/osLhRtHZ4Gw_filtered.json b/annotations_filtered/osLhRtHZ4Gw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59a5aca66af652d5656f3a651afa0a0a260d6992 --- /dev/null +++ b/annotations_filtered/osLhRtHZ4Gw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.75], [11.0, 46.85], [49.0, 49.27], [50.0, 49.92], [51.0, 51.81], [53.0, 53.82], [54.0, 55.86], [56.0, 56.05], [56.0, 56.08], [56.0, 56.12], [56.0, 56.15], [57.0, 61.21], [64.0, 66.77], [68.0, 69.85], [70.0, 71.2], [77.0, 77.8], [79.0, 79.15], [80.0, 80.64], [82.0, 82.63], [84.0, 84.11], [89.0, 89.46], [92.0, 92.62], [93.0, 95.39], [96.0, 96.96], [103.0, 113.19], [115.0, 115.26], [117.0, 117.49], [119.0, 120.11], [121.0, 121.9], [123.0, 123.77], [126.0, 126.67], [128.0, 129.81], [134.0, 138.82], [141.0, 141.39], [143.0, 143.45], [145.0, 146.69], [149.0, 154.62], [155.0, 157.06], [158.0, 158.43], [164.0, 164.1], [167.0, 166.99], [167.0, 171.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.74, 31.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.12, 0.0, 30.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.87, 0.0, 0.0, 0.0, 34.07, 33.5, 0.0, 0.0, 0.0, 32.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.63], ["whack, thwack", 16.6], ["breaking", 9.09]], [["mains hum", 38.6], ["hum", 30.73], ["speech", 6.96]], null, null, null, null, null, null, null, null, null, [["rumble", 25.24], ["speech", 22.28], ["music", 5.16]], null, [["music", 35.7], ["speech", 31.53], ["fart", 5.21]], null, null, null, null, null, null, null, [["speech", 23.16], ["hum", 15.17], ["rumble", 14.91]], null, null, null, [["speech", 49.93], ["music", 7.84], ["hum", 5.52]], [["speech", 55.09], ["music", 11.22], ["whale vocalization", 4.76]], null, null, null, [["whack, thwack", 50.43], ["breaking", 14.66], ["thump, thud", 11.34]]], "duration": [0.75, 35.85, 0.27, -0.08, 0.81, 0.82, 1.86, 0.05, 0.08, 0.12, 0.15, 4.21, 2.77, 1.85, 1.2, 0.8, 0.15, 0.64, 0.63, 0.11, 0.46, 0.62, 2.39, 0.96, 10.19, 0.26, 0.49, 1.11, 0.9, 0.77, 0.67, 1.81, 4.82, 0.39, 0.45, 1.69, 5.62, 2.06, 0.43, 0.1, -0.01, 4.44]} \ No newline at end of file diff --git a/annotations_filtered/osfdb5BrLPI_filtered.json b/annotations_filtered/osfdb5BrLPI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6e04a1a1f25d8216ae6a1b3ce0284d9d0958b37 --- /dev/null +++ b/annotations_filtered/osfdb5BrLPI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.94], [4.0, 6.27], [11.0, 11.06], [13.0, 13.54], [16.0, 16.28], [18.0, 18.6], [20.0, 21.46], [22.0, 22.67], [25.0, 25.89], [26.0, 27.77], [29.0, 29.73], [31.0, 31.94], [33.0, 33.62], [36.0, 36.85], [40.0, 40.98], [42.0, 42.79], [44.0, 44.73], [45.0, 47.41], [48.0, 48.12], [49.0, 50.8], [52.0, 53.86], [55.0, 55.93], [58.0, 58.16], [59.0, 59.86], [62.0, 62.88], [68.0, 68.35], [69.0, 69.18], [72.0, 72.39], [74.0, 75.09], [76.0, 77.04], [79.0, 79.71], [83.0, 84.28], [86.0, 87.45], [88.0, 88.32], [90.0, 90.64], [91.0, 91.72], [94.0, 94.41], [95.0, 95.3], [96.0, 96.96], [99.0, 100.08], [100.0, 102.25], [103.0, 104.46], [106.0, 106.07], [107.0, 108.08], [109.0, 110.25], [111.0, 116.41], [118.0, 118.35], [119.0, 119.31], [120.0, 122.62], [123.0, 123.6], [124.0, 125.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 52.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.49, 0.0, 0.0, 0.0, 0.0, 46.61, 0.0, 0.0, 34.47, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 21.78], ["didgeridoo", 8.33], ["radio", 8.06]], null, null, null, null, [["music", 46.64], ["speech", 8.89], ["radio", 7.89]], null, null, [["music", 16.03], ["distortion", 12.93], ["effects unit", 12.56]], null, null], "duration": [-0.06, 2.27, 0.06, 0.54, 0.28, 0.6, 1.46, 0.67, 0.89, 1.77, 0.73, 0.94, 0.62, 0.85, 0.98, 0.79, 0.73, 2.41, 0.12, 1.8, 1.86, 0.93, 0.16, 0.86, 0.88, 0.35, 0.18, 0.39, 1.09, 1.04, 0.71, 1.28, 1.45, 0.32, 0.64, 0.72, 0.41, 0.3, 0.96, 1.08, 2.25, 1.46, 0.07, 1.08, 1.25, 5.41, 0.35, 0.31, 2.62, 0.6, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/otOIqHsnQZY_filtered.json b/annotations_filtered/otOIqHsnQZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4329735b6aa37cf743d6413fb060af8120f57336 --- /dev/null +++ b/annotations_filtered/otOIqHsnQZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.09], [9.0, 9.9], [13.0, 14.23], [25.0, 25.88], [28.0, 28.49], [29.0, 30.13], [36.0, 36.39], [36.0, 38.55], [41.0, 41.52], [43.0, 44.9], [53.0, 54.24], [54.0, 54.73], [61.0, 62.43], [63.0, 64.44], [65.0, 66.46], [67.0, 67.31], [68.0, 68.18], [69.0, 69.03], [69.0, 70.23], [71.0, 70.98], [71.0, 71.64], [72.0, 72.17], [74.0, 74.07], [75.0, 77.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["boing", 49.0], ["speech", 19.38], ["music", 15.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 17.34], ["boing", 12.33], ["smash, crash", 11.55]]], "duration": [1.09, 0.9, 1.23, 0.88, 0.49, 1.13, 0.39, 2.55, 0.52, 1.9, 1.24, 0.73, 1.43, 1.44, 1.46, 0.31, 0.18, 0.03, 1.23, -0.02, 0.64, 0.17, 0.07, 2.67]} \ No newline at end of file diff --git a/annotations_filtered/otQNGe5sWaQ_filtered.json b/annotations_filtered/otQNGe5sWaQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5aa36e0b8e9f014804f6b09c253e452ba04ead3d --- /dev/null +++ b/annotations_filtered/otQNGe5sWaQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.55], [28.0, 37.76], [39.0, 69.62], [70.0, 78.7], [79.0, 84.72], [88.0, 91.29], [97.0, 97.39], [99.0, 99.64], [101.0, 101.24], [103.0, 105.17], [107.0, 107.15], [109.0, 115.43], [118.0, 118.18], [119.0, 121.9], [128.0, 127.94]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, true, false, true, false], "silence_prob": [99.48, 99.73, 0.0, 95.23, 97.43, 33.94, 0.0, 0.0, 0.0, 49.92, 0.0, 33.26, 0.0, 45.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["boing", 21.14], ["moo", 16.82], ["cattle, bovinae", 16.19]], null, null, null, [["speech", 39.28], ["tuning fork", 11.18], ["dial tone", 6.92]], null, [["music", 27.81], ["speech", 14.39], ["explosion", 5.9]], null, [["music", 34.5], ["hum", 14.15], ["mains hum", 4.09]], null], "duration": [3.55, 9.76, 30.62, 8.7, 5.72, 3.29, 0.39, 0.64, 0.24, 2.17, 0.15, 6.43, 0.18, 2.9, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/otQ_oCvSq6E_filtered.json b/annotations_filtered/otQ_oCvSq6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fff0d2798a4bf87ec7da6afce98803684cb98446 --- /dev/null +++ b/annotations_filtered/otQ_oCvSq6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [4.0, 3.91], [5.0, 6.57], [8.0, 9.15], [11.0, 11.85], [12.0, 13.15], [14.0, 15.65], [16.0, 17.39], [22.0, 21.98], [23.0, 24.56], [26.0, 26.23], [27.0, 28.38], [29.0, 29.61], [32.0, 32.95], [34.0, 33.94], [35.0, 36.56], [37.0, 37.76], [38.0, 39.04], [40.0, 40.02], [41.0, 42.47], [46.0, 49.87], [51.0, 52.88], [55.0, 58.77], [62.0, 148.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, -0.09, 1.57, 1.15, 0.85, 1.15, 1.65, 1.39, -0.02, 1.56, 0.23, 1.38, 0.61, 0.95, -0.06, 1.56, 0.76, 1.04, 0.02, 1.47, 3.87, 1.88, 3.77, 86.69]} \ No newline at end of file diff --git a/annotations_filtered/otk_S_5inBM_filtered.json b/annotations_filtered/otk_S_5inBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cb319cf51f3e72904650eeeb126a133699af6c8 --- /dev/null +++ b/annotations_filtered/otk_S_5inBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.0], [1.0, 2.25], [2.0, 18.59], [23.0, 24.04], [24.0, 24.97], [27.0, 27.53], [28.0, 28.83], [30.0, 30.94], [34.0, 36.09], [38.0, 45.25], [49.0, 53.28], [55.0, 55.17], [57.0, 57.69], [58.0, 59.05], [60.0, 61.37], [63.0, 63.91], [65.0, 64.86], [66.0, 67.04], [68.0, 71.81], [72.0, 109.65], [111.0, 111.42], [113.0, 113.48], [116.0, 116.31], [119.0, 120.24], [124.0, 124.95], [134.0, 136.41], [136.0, 136.49], [137.0, 139.02], [141.0, 142.7], [143.0, 147.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 55.46, 0.0, 0.0, 0.0, 0.0, 0.0, 95.78, 42.11, 53.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.16, 0.0, 52.1, 0.0, 62.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["clang", 61.64], ["glass", 8.88], ["music", 7.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.8], ["speech", 20.74], ["hum", 4.45]], null, null, null, null], "duration": [1.0, 1.25, 16.59, 1.04, 0.97, 0.53, 0.83, 0.94, 2.09, 7.25, 4.28, 0.17, 0.69, 1.05, 1.37, 0.91, -0.14, 1.04, 3.81, 37.65, 0.42, 0.48, 0.31, 1.24, 0.95, 2.41, 0.49, 2.02, 1.7, 4.33]} \ No newline at end of file diff --git a/annotations_filtered/ouDfr9Jh0s8_filtered.json b/annotations_filtered/ouDfr9Jh0s8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..236c519399d7c64bf9306e8a2930dfa7013c721e --- /dev/null +++ b/annotations_filtered/ouDfr9Jh0s8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.05], [7.0, 7.15], [9.0, 9.02], [11.0, 29.76], [30.0, 33.05], [33.0, 37.35], [38.0, 38.87], [41.0, 43.93], [44.0, 44.78], [46.0, 48.54], [49.0, 49.13], [54.0, 66.18], [68.0, 72.5], [73.0, 76.87], [78.0, 79.51], [80.0, 80.87], [84.0, 85.18], [87.0, 87.27], [88.0, 88.69], [90.0, 90.36], [92.0, 93.14], [96.0, 96.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.64, 0.0, 0.0, 94.95, 88.46, 85.9, 0.0, 94.66, 0.0, 88.64, 0.0, 40.19, 75.39, 97.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 68.6], ["synthesizer", 10.57], ["echo", 2.53]], null, null, null, null, null, null, null, null, null, null], "duration": [3.05, 0.15, 0.02, 18.76, 3.05, 4.35, 0.87, 2.93, 0.78, 2.54, 0.13, 12.18, 4.5, 3.87, 1.51, 0.87, 1.18, 0.27, 0.69, 0.36, 1.14, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/ouQG7Pcq1S8_filtered.json b/annotations_filtered/ouQG7Pcq1S8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd144b512fd3aebaa0c395888ad788f8774b9dac --- /dev/null +++ b/annotations_filtered/ouQG7Pcq1S8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.53], [18.0, 22.52], [24.0, 25.02], [28.0, 28.27], [31.0, 30.99], [34.0, 34.82], [35.0, 35.09], [35.0, 42.63], [43.0, 46.13], [53.0, 63.27], [65.0, 71.15], [75.0, 76.1], [79.0, 82.04], [83.0, 85.72], [98.0, 111.75], [120.0, 122.25], [123.0, 126.84], [128.0, 128.76], [129.0, 130.69], [134.0, 133.66], [136.0, 136.43], [138.0, 137.89], [142.0, 141.84], [149.0, 149.93], [153.0, 153.37], [154.0, 154.65], [156.0, 156.44]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.7, 32.11, 32.44, 31.55, 0.0, 37.84, 35.77, 77.53, 61.57, 39.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 50.6], ["speech", 19.47], ["boing", 4.24]], null, null, null, null, null, [["music", 52.56], ["speech", 21.93], ["boing", 4.38]], [["music", 43.0], ["bow-wow", 12.37], ["dog", 9.22]], [["boing", 37.38], ["music", 25.73], ["whack, thwack", 24.38]], [["music", 48.03], ["groan", 8.17], ["boing", 4.67]], null, [["speech", 37.89], ["cattle, bovinae", 9.61], ["music", 7.98]], [["hum", 35.24], ["music", 19.38], ["whale vocalization", 8.99]], null, null, [["music", 36.2], ["speech", 32.08], ["hum", 3.3]], null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 4.52, 1.02, 0.27, -0.01, 0.82, 0.09, 7.63, 3.13, 10.27, 6.15, 1.1, 3.04, 2.72, 13.75, 2.25, 3.84, 0.76, 1.69, -0.34, 0.43, -0.11, -0.16, 0.93, 0.37, 0.65, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/ouXz_ETh2eI_filtered.json b/annotations_filtered/ouXz_ETh2eI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffa06d822261bceb285042dae3a35819fe372330 --- /dev/null +++ b/annotations_filtered/ouXz_ETh2eI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.3], [13.0, 13.42], [29.0, 29.52], [30.0, 31.38], [32.0, 32.76], [35.0, 37.74], [39.0, 56.62], [59.0, 80.28], [87.0, 89.26], [91.0, 101.12], [104.0, 104.14], [105.0, 112.28], [117.0, 122.0]], "keep_status": [false, false, false, false, false, false, true, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 77.53, 41.5, 36.66, 38.03, 39.33, 0.0, 100.0, 41.24], "audiomae_on_audioset": [null, null, null, null, null, null, [["sheep", 27.39], ["animal", 25.45], ["wild animals", 13.9]], [["livestock, farm animals, working animals", 38.88], ["cattle, bovinae", 21.76], ["moo", 15.43]], [["speech", 17.61], ["music", 14.13], ["sheep", 4.22]], [["animal", 18.47], ["sheep", 8.26], ["speech", 7.08]], null, null, [["moo", 20.17], ["cattle, bovinae", 14.9], ["livestock, farm animals, working animals", 13.59]]], "duration": [1.3, 0.42, 0.52, 1.38, 0.76, 2.74, 17.62, 21.28, 2.26, 10.12, 0.14, 7.28, 5.0]} \ No newline at end of file diff --git a/annotations_filtered/oub2YWXPV6g_filtered.json b/annotations_filtered/oub2YWXPV6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5074079e99ac313c06dc16423d1839ea24f7ff37 --- /dev/null +++ b/annotations_filtered/oub2YWXPV6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.82], [13.0, 14.28], [15.0, 15.7], [17.0, 27.63], [29.0, 30.08], [34.0, 49.98], [51.0, 53.32], [54.0, 55.26], [56.0, 58.28], [61.0, 65.8], [67.0, 68.4], [74.0, 73.82], [75.0, 76.17], [78.0, 80.06], [81.0, 81.23], [83.0, 86.68], [88.0, 88.65], [92.0, 93.19], [107.0, 108.6], [111.0, 116.75]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.56, 0.0, 67.89, 84.25, 0.0, 93.76, 94.66, 0.0, 0.0, 0.0, 95.51, 0.0, 97.73, 0.0, 0.0, 0.0, 67.25], "audiomae_on_audioset": [null, null, null, [["stomach rumble", 16.45], ["whale vocalization", 15.96], ["speech", 8.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.82, 1.28, 0.7, 10.63, 1.08, 15.98, 2.32, 1.26, 2.28, 4.8, 1.4, -0.18, 1.17, 2.06, 0.23, 3.68, 0.65, 1.19, 1.6, 5.75]} \ No newline at end of file diff --git a/annotations_filtered/ouppQFx3v-I_filtered.json b/annotations_filtered/ouppQFx3v-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..888fe6255d5ac88fdb3ac129f75c190917269e9b --- /dev/null +++ b/annotations_filtered/ouppQFx3v-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [6.0, 7.11], [9.0, 15.43], [20.0, 24.26], [25.0, 27.99], [34.0, 36.46], [38.0, 39.77], [42.0, 42.62], [46.0, 48.9], [52.0, 54.06], [57.0, 58.43], [61.0, 62.75], [65.0, 67.49], [69.0, 70.23], [72.0, 73.62], [78.0, 78.56], [79.0, 81.43], [85.0, 85.8], [90.0, 92.43], [94.0, 94.74], [98.0, 99.79], [102.0, 106.15], [107.0, 107.64], [110.0, 113.29], [116.0, 118.49], [121.0, 121.93], [124.0, 125.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 97.73, 98.93, 99.26, 96.54, 0.0, 0.0, 99.31, 99.52, 0.0, 0.0, 83.7, 0.0, 0.0, 0.0, 82.79, 0.0, 99.73, 0.0, 0.0, 99.76, 0.0, 99.21, 99.36, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 1.11, 6.43, 4.26, 2.99, 2.46, 1.77, 0.62, 2.9, 2.06, 1.43, 1.75, 2.49, 1.23, 1.62, 0.56, 2.43, 0.8, 2.43, 0.74, 1.79, 4.15, 0.64, 3.29, 2.49, 0.93, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/ovFDrgui4a0_filtered.json b/annotations_filtered/ovFDrgui4a0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2683276f5e886941d239d59c4044d7ced50f8fa --- /dev/null +++ b/annotations_filtered/ovFDrgui4a0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 13.1], [15.0, 28.51], [31.0, 34.33], [35.0, 36.26], [38.0, 62.06], [63.0, 76.37]], "keep_status": [true, false, true, false, false, true], "silence_prob": [32.6, 36.15, 36.69, 0.0, 32.25, 30.4], "audiomae_on_audioset": [[["music", 50.39], ["hum", 7.94], ["mains hum", 5.04]], [["music", 61.53], ["hum", 6.76], ["ambient music", 6.27]], [["music", 58.9], ["musical instrument", 4.49], ["guitar", 4.07]], null, [["music", 77.31], ["echo", 4.05], ["livestock, farm animals, working animals", 1.99]], [["bow-wow", 26.12], ["music", 16.69], ["yip", 12.25]]], "duration": [12.1, 13.51, 3.33, 1.26, 24.06, 13.37]} \ No newline at end of file diff --git a/annotations_filtered/ovPXL1WPTMA_filtered.json b/annotations_filtered/ovPXL1WPTMA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebd4a498990976f377c7082fb54221be6e78af84 --- /dev/null +++ b/annotations_filtered/ovPXL1WPTMA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 26.81], [29.0, 34.42], [37.0, 40.83], [41.0, 44.51], [46.0, 56.73], [60.0, 61.57], [63.0, 65.03], [67.0, 75.95], [77.0, 77.57]], "keep_status": [false, false, true, true, false, false, true, true, false], "silence_prob": [50.11, 79.41, 40.82, 49.87, 49.36, 0.0, 34.34, 31.09, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.69], ["speech", 22.9], ["hum", 5.52]], [["music", 27.42], ["hum", 13.34], ["fly, housefly", 8.28]], [["music", 73.85], ["synthesizer", 2.52], ["boing", 1.94]], null, [["mosquito", 25.32], ["music", 16.48], ["fly, housefly", 11.81]], [["fly, housefly", 28.11], ["music", 17.38], ["mosquito", 17.34]], null], "duration": [16.81, 5.42, 3.83, 3.51, 10.73, 1.57, 2.03, 8.95, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/ovQk7fd4_Co_filtered.json b/annotations_filtered/ovQk7fd4_Co_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/ovQk7fd4_Co_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/ovV34LOq9Q8_filtered.json b/annotations_filtered/ovV34LOq9Q8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3dc9a0bb40a2b92b57eb47435a61fdffbb341ed --- /dev/null +++ b/annotations_filtered/ovV34LOq9Q8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.16], [6.0, 8.99], [10.0, 11.26], [13.0, 15.77], [19.0, 20.83], [22.0, 25.79], [27.0, 28.05], [36.0, 36.83], [42.0, 43.04], [47.0, 57.54], [58.0, 58.72], [59.0, 59.78], [62.0, 62.78], [66.0, 67.09], [76.0, 84.75], [85.0, 91.0], [94.0, 94.47], [100.0, 100.97], [102.0, 102.02], [104.0, 103.81], [104.0, 106.0], [107.0, 108.36], [109.0, 109.54]], "keep_status": [false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 32.45, 0.0, 38.7, 0.0, 34.72, 0.0, 0.0, 0.0, 37.71, 0.0, 0.0, 0.0, 0.0, 37.78, 39.18, 0.0, 0.0, 0.0, 0.0, 38.9, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 29.35], ["civil defense siren", 10.71], ["shofar", 5.62]], null, [["music", 47.77], ["synthesizer", 9.68], ["musical instrument", 6.37]], null, [["speech", 18.09], ["music", 15.62], ["buzz", 9.96]], null, null, null, [["music", 69.7], ["didgeridoo", 4.49], ["theremin", 3.57]], null, null, null, null, [["music", 38.28], ["speech", 26.93], ["didgeridoo", 14.26]], [["music", 31.13], ["theremin", 18.04], ["speech", 13.36]], null, null, null, null, [["music", 12.18], ["speech", 11.26], ["didgeridoo", 5.52]], null, null], "duration": [0.16, 2.99, 1.26, 2.77, 1.83, 3.79, 1.05, 0.83, 1.04, 10.54, 0.72, 0.78, 0.78, 1.09, 8.75, 6.0, 0.47, 0.97, 0.02, -0.19, 2.0, 1.36, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/oviA5ncbmc8_filtered.json b/annotations_filtered/oviA5ncbmc8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c10b7a9d0cc36fe192930e66ce7e161e97275393 --- /dev/null +++ b/annotations_filtered/oviA5ncbmc8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.55], [6.0, 7.55], [11.0, 13.53], [20.0, 20.65], [25.0, 33.61], [35.0, 35.38], [38.0, 38.69], [39.0, 44.04], [44.0, 48.56], [51.0, 52.95], [54.0, 61.8], [63.0, 64.74], [67.0, 67.54], [70.0, 77.7], [79.0, 78.71], [91.0, 95.61], [97.0, 97.87], [100.0, 106.19], [108.0, 109.0], [109.0, 117.22], [122.0, 124.7], [132.0, 138.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 98.51, 0.0, 0.0, 90.78, 99.96, 0.0, 85.54, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 99.82, 0.0, 48.1, 99.99, 98.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 81.83], ["sidetone", 5.63], ["hum", 1.92]], null, null], "duration": [1.55, 1.55, 2.53, 0.65, 8.61, 0.38, 0.69, 5.04, 4.56, 1.95, 7.8, 1.74, 0.54, 7.7, -0.29, 4.61, 0.87, 6.19, 1.0, 8.22, 2.7, 6.74]} \ No newline at end of file diff --git a/annotations_filtered/ovxjAnlr7qg_filtered.json b/annotations_filtered/ovxjAnlr7qg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67d253cb77dea62abeee0b3940ae8b45623cffb9 --- /dev/null +++ b/annotations_filtered/ovxjAnlr7qg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.53], [20.0, 20.14], [24.0, 24.49], [40.0, 40.86], [42.0, 42.96], [70.0, 69.79], [77.0, 77.14], [77.0, 82.31], [84.0, 86.04], [89.0, 91.0], [92.0, 97.56], [100.0, 100.03], [101.0, 102.52], [104.0, 105.43], [106.0, 113.0], [121.0, 122.4], [130.0, 135.33], [139.0, 142.47], [144.0, 144.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.64, 53.04, 53.28, 33.53, 0.0, 0.0, 0.0, 40.17, 0.0, 41.3, 50.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 67.81], ["didgeridoo", 8.45], ["guitar", 4.86]], null, null, [["speech", 35.23], ["music", 21.25], ["sidetone", 11.03]], null, null, null, [["music", 64.81], ["musical instrument", 3.06], ["speech", 2.62]], null, [["music", 36.89], ["speech", 12.01], ["didgeridoo", 5.81]], null, null], "duration": [1.53, 0.14, 0.49, 0.86, 0.96, -0.21, 0.14, 5.31, 2.04, 2.0, 5.56, 0.03, 1.52, 1.43, 7.0, 1.4, 5.33, 3.47, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/ovy6F76ip3M_filtered.json b/annotations_filtered/ovy6F76ip3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55ac755d18d6fb69402cdc89e9ab2faa23efa761 --- /dev/null +++ b/annotations_filtered/ovy6F76ip3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.55], [5.0, 11.91], [14.0, 15.03], [16.0, 18.12], [19.0, 21.47], [23.0, 23.23], [24.0, 27.72], [29.0, 30.55], [34.0, 35.31], [37.0, 38.97], [41.0, 41.15], [43.0, 45.06], [48.0, 47.93], [50.0, 54.73], [57.0, 57.1], [64.0, 64.66], [73.0, 73.75], [75.0, 75.3], [76.0, 77.09], [80.0, 91.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 72.75, 0.0, 100.0, 100.0, 0.0, 77.36, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 43.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.42], ["wail, moan", 9.8], ["bleat", 4.91]]], "duration": [0.55, 6.91, 1.03, 2.12, 2.47, 0.23, 3.72, 1.55, 1.31, 1.97, 0.15, 2.06, -0.07, 4.73, 0.1, 0.66, 0.75, 0.3, 1.09, 11.5]} \ No newline at end of file diff --git a/annotations_filtered/ow0vNLhDNzI_filtered.json b/annotations_filtered/ow0vNLhDNzI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b75de2a0154d57f296459633974a15e262745b6 --- /dev/null +++ b/annotations_filtered/ow0vNLhDNzI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 83.81], [85.0, 103.91], [105.0, 104.94], [106.0, 106.84], [108.0, 132.8], [135.0, 137.19], [140.0, 140.95]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [0.0, 29.41, 0.0, 0.0, 29.1, 32.42, 0.0], "audiomae_on_audioset": [null, [["music", 72.04], ["throbbing", 9.8], ["hum", 5.96]], null, null, [["music", 29.97], ["throbbing", 28.13], ["hum", 25.98]], [["hum", 22.61], ["burping, eructation", 16.96], ["music", 16.52]], null], "duration": [62.81, 18.91, -0.06, 0.84, 24.8, 2.19, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/ow3Pf0LSXwc_filtered.json b/annotations_filtered/ow3Pf0LSXwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b98f77933a876bf5af8ed9bc017d117b44b30fb6 --- /dev/null +++ b/annotations_filtered/ow3Pf0LSXwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 24.14], [25.0, 28.17], [30.0, 32.39], [33.0, 33.81], [37.0, 39.24], [48.0, 56.86], [61.0, 71.32], [76.0, 97.58]], "keep_status": [true, true, true, false, false, false, true, false], "silence_prob": [36.11, 38.46, 45.3, 0.0, 38.33, 34.01, 34.07, 32.97], "audiomae_on_audioset": [[["music", 24.86], ["didgeridoo", 11.2], ["hum", 11.01]], [["music", 55.42], ["speech", 6.07], ["theremin", 4.97]], [["music", 55.14], ["synthesizer", 7.36], ["musical instrument", 4.22]], null, [["music", 51.18], ["throbbing", 15.3], ["hum", 7.56]], [["music", 63.76], ["synthesizer", 8.95], ["theremin", 8.21]], [["speech", 45.56], ["hum", 11.89], ["music", 10.98]], [["hum", 45.41], ["mains hum", 42.16], ["music", 5.25]]], "duration": [3.14, 3.17, 2.39, 0.81, 2.24, 8.86, 10.32, 21.58]} \ No newline at end of file diff --git a/annotations_filtered/ow9U0uWCfDY_filtered.json b/annotations_filtered/ow9U0uWCfDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..667c160f10d4ab753ccb886941d5760c4045b51c --- /dev/null +++ b/annotations_filtered/ow9U0uWCfDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 126.79], [127.0, 126.94]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [119.79, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/ox1SVCutwv4_filtered.json b/annotations_filtered/ox1SVCutwv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6e392c242640a7105cba67534cb472860f46c62 --- /dev/null +++ b/annotations_filtered/ox1SVCutwv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.65], [30.0, 30.43], [31.0, 32.66], [34.0, 34.38], [35.0, 37.81], [39.0, 59.61], [65.0, 81.43], [83.0, 85.19], [86.0, 92.5], [93.0, 95.91], [97.0, 101.58], [105.0, 119.52], [123.0, 137.08], [140.0, 146.8], [149.0, 152.59], [157.0, 157.4], [158.0, 161.84], [165.0, 166.01], [168.0, 180.1]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.74, 29.34, 29.82, 35.28, 33.14, 38.08, 34.38, 30.46, 29.86, 35.6, 56.03, 0.0, 37.98, 0.0, 35.51], "audiomae_on_audioset": [null, null, null, null, [["music", 22.96], ["breaking", 10.06], ["whack, thwack", 5.58]], [["speech", 36.64], ["music", 31.98], ["cacophony", 8.8]], [["music", 57.89], ["hum", 10.7], ["throbbing", 10.09]], [["music", 30.53], ["throbbing", 28.35], ["hum", 11.32]], [["music", 68.03], ["electronic music", 7.37], ["synthesizer", 4.54]], [["music", 52.13], ["gong", 15.53], ["hum", 7.83]], [["music", 44.1], ["ambient music", 8.18], ["hum", 6.67]], [["music", 31.68], ["hum", 26.3], ["throbbing", 19.98]], [["music", 36.31], ["throbbing", 27.55], ["hum", 19.02]], [["hum", 39.42], ["mains hum", 34.45], ["speech", 5.09]], null, null, [["hum", 17.5], ["heart sounds, heartbeat", 15.18], ["music", 12.62]], null, [["mains hum", 40.24], ["hum", 39.67], ["throbbing", 5.9]]], "duration": [0.65, 0.43, 1.66, 0.38, 2.81, 20.61, 16.43, 2.19, 6.5, 2.91, 4.58, 14.52, 14.08, 6.8, 3.59, 0.4, 3.84, 1.01, 12.1]} \ No newline at end of file diff --git a/annotations_filtered/oxA2tQ6kfdE_filtered.json b/annotations_filtered/oxA2tQ6kfdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f822489e2a68f28b98d658de7dc90fda91d4f4a --- /dev/null +++ b/annotations_filtered/oxA2tQ6kfdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 25.69], [27.0, 29.64], [30.0, 32.68], [37.0, 38.03], [39.0, 41.42], [42.0, 43.11], [44.0, 45.27], [46.0, 47.16], [48.0, 49.52], [51.0, 53.84], [57.0, 68.72], [70.0, 71.85], [73.0, 76.67], [77.0, 78.81], [80.0, 79.88], [81.0, 87.29], [88.0, 90.78], [92.0, 93.5], [94.0, 94.39], [99.0, 99.84], [100.0, 104.52], [107.0, 107.28], [108.0, 115.25], [116.0, 125.81]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, true, false, true, true], "silence_prob": [49.87, 100.0, 94.07, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 92.48, 45.52, 0.0, 33.15, 0.0, 0.0, 30.2, 30.94, 0.0, 0.0, 0.0, 31.81, 0.0, 34.05, 42.24], "audiomae_on_audioset": [[["noise", 40.68], ["microwave oven", 5.1], ["telephone", 5.1]], null, null, null, null, null, null, null, null, null, [["music", 21.63], ["hum", 16.57], ["speech", 14.34]], null, [["music", 49.32], ["speech", 16.0], ["theremin", 8.05]], null, null, [["speech", 39.96], ["music", 16.7], ["horse", 4.6]], [["music", 28.4], ["speech", 21.04], ["didgeridoo", 11.19]], null, null, null, [["music", 17.9], ["speech", 16.3], ["didgeridoo", 6.64]], null, [["music", 46.67], ["theremin", 12.54], ["musical instrument", 8.42]], [["music", 34.43], ["didgeridoo", 13.48], ["hum", 10.29]]], "duration": [4.69, 2.64, 2.68, 1.03, 2.42, 1.11, 1.27, 1.16, 1.52, 2.84, 11.72, 1.85, 3.67, 1.81, -0.12, 6.29, 2.78, 1.5, 0.39, 0.84, 4.52, 0.28, 7.25, 9.81]} \ No newline at end of file diff --git a/annotations_filtered/oxLuG0BYYwE_filtered.json b/annotations_filtered/oxLuG0BYYwE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68b1ffdfab1a17fb76199cf0e8da5ff431c72986 --- /dev/null +++ b/annotations_filtered/oxLuG0BYYwE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.21], [12.0, 12.53], [13.0, 14.82], [16.0, 16.68], [17.0, 18.1], [19.0, 20.68], [21.0, 21.25], [21.0, 22.13], [24.0, 27.67], [34.0, 35.02], [43.0, 44.32], [46.0, 46.6], [49.0, 49.86], [52.0, 53.96], [54.0, 56.86], [58.0, 59.24], [62.0, 61.94], [65.0, 65.25], [68.0, 68.37], [71.0, 72.18], [75.0, 75.88], [82.0, 83.2], [86.0, 85.99], [91.0, 91.15], [98.0, 98.47], [99.0, 99.76], [106.0, 106.32], [112.0, 112.56], [113.0, 115.35], [119.0, 120.23], [124.0, 124.9], [126.0, 130.22], [131.0, 131.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.25, 0.0, 0.0, 0.0, 0.0, 0.0, 42.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.81, 0.0, 0.0, 35.45, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["fly, housefly", 44.77], ["insect", 36.37], ["bee, wasp, etc.", 15.19]], null, null, null, null, null, [["speech", 41.22], ["music", 12.06], ["sidetone", 5.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.12], ["speech", 9.08], ["cattle, bovinae", 8.52]], null, null, [["music", 43.06], ["speech", 26.14], ["synthesizer", 4.44]], null], "duration": [1.21, 0.53, 1.82, 0.68, 1.1, 1.68, 0.25, 1.13, 3.67, 1.02, 1.32, 0.6, 0.86, 1.96, 2.86, 1.24, -0.06, 0.25, 0.37, 1.18, 0.88, 1.2, -0.01, 0.15, 0.47, 0.76, 0.32, 0.56, 2.35, 1.23, 0.9, 4.22, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/oxjeihyxCnY_filtered.json b/annotations_filtered/oxjeihyxCnY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7214aeee256696613fa379f765cc5a2c7d78bf0c --- /dev/null +++ b/annotations_filtered/oxjeihyxCnY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 18.87], [20.0, 20.95], [22.0, 22.54], [24.0, 24.98], [26.0, 30.81], [32.0, 32.41], [35.0, 35.23], [37.0, 37.71], [39.0, 39.43], [42.0, 42.47], [48.0, 48.37], [49.0, 50.38], [52.0, 52.61], [54.0, 55.19], [59.0, 60.39], [63.0, 63.95], [65.0, 64.96], [66.0, 67.24], [68.0, 68.42], [69.0, 70.9], [76.0, 76.37], [79.0, 81.24], [82.0, 83.19], [119.0, 119.25], [121.0, 122.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.09, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.14, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.87], ["effects unit", 12.84], ["distortion", 5.82]], null, null, null], "duration": [11.87, 0.95, 0.54, 0.98, 4.81, 0.41, 0.23, 0.71, 0.43, 0.47, 0.37, 1.38, 0.61, 1.19, 1.39, 0.95, -0.04, 1.24, 0.42, 1.9, 0.37, 2.24, 1.19, 0.25, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/oxxBXpnn2Jw_filtered.json b/annotations_filtered/oxxBXpnn2Jw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e27017716895413d6665e706b23c2fab2b71087 --- /dev/null +++ b/annotations_filtered/oxxBXpnn2Jw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.21], [33.0, 33.44], [35.0, 43.38], [45.0, 52.51], [58.0, 58.83], [60.0, 64.18], [68.0, 68.52], [74.0, 78.88], [80.0, 87.49], [89.0, 91.25], [94.0, 106.73], [117.0, 117.58], [118.0, 118.17], [126.0, 130.79], [140.0, 143.67], [145.0, 145.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 31.75, 33.04, 0.0, 38.14, 0.0, 38.45, 38.43, 59.59, 33.2, 0.0, 0.0, 32.13, 35.26, 0.0], "audiomae_on_audioset": [null, null, [["music", 74.29], ["drum machine", 12.01], ["speech", 2.72]], [["music", 83.86], ["electronic music", 5.02], ["speech", 1.74]], null, [["music", 43.6], ["speech", 17.92], ["boing", 17.41]], null, [["music", 63.9], ["drum machine", 6.01], ["synthesizer", 5.91]], [["music", 68.31], ["speech", 5.42], ["hum", 4.51]], null, [["music", 72.31], ["electric shaver, electric razor", 4.72], ["speech", 2.65]], null, null, [["music", 74.7], ["drum machine", 6.52], ["sampler", 4.46]], [["speech", 30.84], ["music", 27.25], ["boing", 8.24]], null], "duration": [1.21, 0.44, 8.38, 7.51, 0.83, 4.18, 0.52, 4.88, 7.49, 2.25, 12.73, 0.58, 0.17, 4.79, 3.67, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/oyU6En9HN8E_filtered.json b/annotations_filtered/oyU6En9HN8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4c1de3da89a1736ec43ddf16b4de643ce353cbd --- /dev/null +++ b/annotations_filtered/oyU6En9HN8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [8.0, 20.17], [24.0, 24.21], [25.0, 32.58], [34.0, 36.51], [38.0, 38.97], [40.0, 41.98], [44.0, 57.6], [59.0, 59.71], [64.0, 65.91], [72.0, 75.2], [110.0, 109.83], [117.0, 118.74], [128.0, 128.68], [130.0, 130.89], [134.0, 134.37], [135.0, 146.11], [163.0, 164.05], [165.0, 166.43], [166.0, 166.5], [167.0, 167.46]], "keep_status": [false, true, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.74, 0.0, 39.46, 38.1, 0.0, 0.0, 36.07, 0.0, 0.0, 30.98, 0.0, 0.0, 0.0, 0.0, 0.0, 34.3, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 23.87], ["fly, housefly", 12.18], ["buzz", 9.07]], null, [["fly, housefly", 18.63], ["speech", 18.16], ["bee, wasp, etc.", 8.55]], [["music", 17.77], ["throbbing", 13.98], ["hum", 9.26]], null, null, [["livestock, farm animals, working animals", 12.83], ["clip-clop", 12.46], ["horse", 11.92]], null, null, [["beatboxing", 62.41], ["speech", 22.59], ["music", 5.67]], null, null, null, null, null, [["speech", 81.56], ["sidetone", 4.15], ["radio", 3.99]], null, null, null, null], "duration": [0.51, 12.17, 0.21, 7.58, 2.51, 0.97, 1.98, 13.6, 0.71, 1.91, 3.2, -0.17, 1.74, 0.68, 0.89, 0.37, 11.11, 1.05, 1.43, 0.5, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/oyYuYNnSq9E_filtered.json b/annotations_filtered/oyYuYNnSq9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3600883411daf3fadb771740902d849dd2a6e4f8 --- /dev/null +++ b/annotations_filtered/oyYuYNnSq9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.12], [2.0, 11.16], [19.0, 24.6], [30.0, 30.33], [33.0, 33.62], [37.0, 37.47], [39.0, 40.37], [63.0, 63.58], [64.0, 68.76], [73.0, 73.41], [96.0, 96.63]], "keep_status": [true, true, true, false, false, false, false, false, true, false, false], "silence_prob": [34.67, 31.25, 35.83, 0.0, 0.0, 0.0, 0.0, 0.0, 40.88, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 30.2], ["music", 24.6], ["boing", 7.91]], [["speech", 30.87], ["cattle, bovinae", 6.53], ["moo", 4.3]], [["speech", 21.59], ["livestock, farm animals, working animals", 17.53], ["animal", 10.62]], null, null, null, null, null, [["livestock, farm animals, working animals", 26.38], ["cattle, bovinae", 16.14], ["clip-clop", 13.41]], null, null], "duration": [2.12, 9.16, 5.6, 0.33, 0.62, 0.47, 1.37, 0.58, 4.76, 0.41, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/oyZblWujofQ_filtered.json b/annotations_filtered/oyZblWujofQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b6982326ddfc8ac0828ca77fcb742950348780a --- /dev/null +++ b/annotations_filtered/oyZblWujofQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.84], [8.0, 9.39], [10.0, 10.62], [14.0, 14.34], [16.0, 18.15], [20.0, 20.7], [22.0, 26.81], [27.0, 28.21], [32.0, 60.02], [64.0, 65.4], [67.0, 78.93], [81.0, 81.73], [83.0, 84.94], [85.0, 85.72], [86.0, 86.9]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.63, 0.0, 31.74, 0.0, 30.61, 0.0, 30.17, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["explosion", 27.53], ["music", 17.4], ["burst, pop", 11.81]], null, [["speech", 66.3], ["explosion", 7.82], ["music", 5.03]], null, [["speech", 61.92], ["machine gun", 18.01], ["cacophony", 2.56]], null, [["speech", 26.26], ["machine gun", 9.45], ["explosion", 8.59]], null, null, null, null], "duration": [-0.16, 1.39, 0.62, 0.34, 2.15, 0.7, 4.81, 1.21, 28.02, 1.4, 11.93, 0.73, 1.94, 0.72, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/oyaud2-X1QM_filtered.json b/annotations_filtered/oyaud2-X1QM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a843ba6f141adf4f23fcb0c9c493a8c327ed5bed --- /dev/null +++ b/annotations_filtered/oyaud2-X1QM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.98], [8.0, 11.03], [15.0, 19.6], [26.0, 27.11], [28.0, 30.94], [33.0, 33.27], [34.0, 34.87], [37.0, 37.54], [39.0, 40.56], [42.0, 41.66], [43.0, 43.97], [45.0, 46.63], [49.0, 50.7], [52.0, 56.51], [57.0, 60.49], [61.0, 95.45], [96.0, 98.63], [100.0, 101.56], [106.0, 106.76], [108.0, 109.26], [111.0, 111.72], [113.0, 114.52], [117.0, 122.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 93.76, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 32.92, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.11], ["gunshot, gunfire", 16.27], ["firecracker", 11.1]], null, null, null, null, null, null, null, null], "duration": [3.98, 3.03, 4.6, 1.11, 2.94, 0.27, 0.87, 0.54, 1.56, -0.34, 0.97, 1.63, 1.7, 4.51, 3.49, 34.45, 2.63, 1.56, 0.76, 1.26, 0.72, 1.52, 5.23]} \ No newline at end of file diff --git a/annotations_filtered/oymR3xfYh4c_filtered.json b/annotations_filtered/oymR3xfYh4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc83d9e4bd4a8d0a8080033fa011fce693020c10 --- /dev/null +++ b/annotations_filtered/oymR3xfYh4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 44.19], [45.0, 45.47], [46.0, 64.45], [65.0, 65.94], [67.0, 88.55], [91.0, 91.45], [92.0, 105.95], [107.0, 113.12], [115.0, 136.71], [137.0, 147.7], [148.0, 149.89], [150.0, 151.12], [152.0, 174.33], [175.0, 176.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.97, 0.0, 93.29, 0.0, 87.19, 0.0, 56.7, 73.97, 87.74, 39.82, 0.0, 0.0, 61.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["sidetone", 37.01], ["speech", 25.14], ["hum", 12.93]], null, null, null, null], "duration": [7.19, 0.47, 18.45, 0.94, 21.55, 0.45, 13.95, 6.12, 21.71, 10.7, 1.89, 1.12, 22.33, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/oyqIjdFcJVg_filtered.json b/annotations_filtered/oyqIjdFcJVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5be2ecc7b3e18b2c066b228c4356f2adc429e741 --- /dev/null +++ b/annotations_filtered/oyqIjdFcJVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 23.82], [26.0, 27.68], [45.0, 45.23], [45.0, 45.87], [47.0, 49.25], [50.0, 50.65], [51.0, 55.41], [56.0, 56.24], [58.0, 59.07]], "keep_status": [true, false, false, false, false, false, true, false, false], "silence_prob": [33.13, 0.0, 0.0, 0.0, 31.67, 0.0, 41.5, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 58.12], ["horse", 4.22], ["radio", 3.65]], null, null, null, [["telephone bell ringing", 48.28], ["telephone", 11.52], ["ringtone", 10.43]], null, [["speech", 46.84], ["radio", 14.97], ["sidetone", 6.92]], null, null], "duration": [12.82, 1.68, 0.23, 0.87, 2.25, 0.65, 4.41, 0.24, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/oyuHdD6ORAg_filtered.json b/annotations_filtered/oyuHdD6ORAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0a5d80a3da8366c93ee9d6a559e083123a97cc7 --- /dev/null +++ b/annotations_filtered/oyuHdD6ORAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.2], [9.0, 13.54], [14.0, 97.77]], "keep_status": [false, false, false], "silence_prob": [0.0, 29.07, 0.0], "audiomae_on_audioset": [null, [["music", 50.94], ["speech", 27.67], ["electronic music", 2.72]], null], "duration": [0.2, 4.54, 83.77]} \ No newline at end of file diff --git a/annotations_filtered/oz6wjc6xLFU_filtered.json b/annotations_filtered/oz6wjc6xLFU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d70f6e29ad165658aeedd04b5f598cd0ad92f15f --- /dev/null +++ b/annotations_filtered/oz6wjc6xLFU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.52], [6.0, 10.86], [13.0, 16.66], [20.0, 23.19], [39.0, 39.5], [40.0, 40.81], [44.0, 44.9], [46.0, 46.33], [53.0, 54.09], [56.0, 67.69], [75.0, 76.67], [88.0, 87.83], [104.0, 104.92], [107.0, 107.76], [108.0, 108.41], [111.0, 112.35], [114.0, 114.44], [116.0, 119.2], [123.0, 123.67], [126.0, 127.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 61.57, 61.77, 64.18, 0.0, 0.0, 0.0, 0.0, 0.0, 60.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.24, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["boing", 34.14], ["music", 28.23], ["speech", 6.1]], null, null], "duration": [1.52, 4.86, 3.66, 3.19, 0.5, 0.81, 0.9, 0.33, 1.09, 11.69, 1.67, -0.17, 0.92, 0.76, 0.41, 1.35, 0.44, 3.2, 0.67, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/ozAXbxleK-8_filtered.json b/annotations_filtered/ozAXbxleK-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92b3fa4a9d3a57598dd339a2852343dcc10757ec --- /dev/null +++ b/annotations_filtered/ozAXbxleK-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.47], [5.0, 13.56], [16.0, 16.7], [18.0, 18.4], [32.0, 35.56], [45.0, 45.67], [50.0, 49.89], [53.0, 53.1], [55.0, 57.08]], "keep_status": [false, true, false, false, false, false, false, false, false], "silence_prob": [84.98, 38.31, 0.0, 0.0, 80.82, 0.0, 0.0, 0.0, 53.59], "audiomae_on_audioset": [null, [["arrow", 28.54], ["whack, thwack", 19.13], ["mains hum", 12.44]], null, null, null, null, null, null, null], "duration": [2.47, 8.56, 0.7, 0.4, 3.56, 0.67, -0.11, 0.1, 2.08]} \ No newline at end of file diff --git a/annotations_filtered/ozf32hrXGiY_filtered.json b/annotations_filtered/ozf32hrXGiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be2e2ca117f311811b3b80381ccb3510f28b4ec1 --- /dev/null +++ b/annotations_filtered/ozf32hrXGiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.28], [10.0, 10.27], [14.0, 14.94], [16.0, 16.53], [24.0, 24.21], [25.0, 25.57], [27.0, 27.09], [30.0, 29.91], [35.0, 35.82], [38.0, 38.62], [52.0, 52.24], [64.0, 69.38], [70.0, 70.55], [72.0, 72.2], [74.0, 74.41], [86.0, 86.16], [88.0, 88.35], [91.0, 91.5], [93.0, 93.14], [96.0, 97.17], [98.0, 98.64], [99.0, 99.79], [101.0, 102.09], [106.0, 106.57], [111.0, 113.07], [128.0, 131.89], [135.0, 137.64], [139.0, 139.73], [142.0, 144.0], [147.0, 148.37], [151.0, 152.44], [154.0, 154.31], [156.0, 156.61], [161.0, 161.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 99.95, 99.91, 0.0, 96.77, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.28, 0.27, 0.94, 0.53, 0.21, 0.57, 0.09, -0.09, 0.82, 0.62, 0.24, 5.38, 0.55, 0.2, 0.41, 0.16, 0.35, 0.5, 0.14, 1.17, 0.64, 0.79, 1.09, 0.57, 2.07, 3.89, 2.64, 0.73, 2.0, 1.37, 1.44, 0.31, 0.61, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/ozkF8KRjeO8_filtered.json b/annotations_filtered/ozkF8KRjeO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a03cf282e8614ce338d60638b52bf78b87383fb8 --- /dev/null +++ b/annotations_filtered/ozkF8KRjeO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.51], [7.0, 19.47], [20.0, 28.93], [32.0, 63.07], [64.0, 64.79], [65.0, 65.99], [67.0, 67.88], [70.0, 72.79], [80.0, 97.97], [99.0, 110.96], [111.0, 112.92], [113.0, 116.78], [122.0, 123.31]], "keep_status": [true, true, true, false, false, false, false, true, false, false, false, true, false], "silence_prob": [35.84, 37.15, 33.61, 0.0, 0.0, 0.0, 0.0, 45.4, 31.11, 29.92, 0.0, 32.37, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 27.17], ["livestock, farm animals, working animals", 15.77], ["moo", 13.95]], [["cattle, bovinae", 25.68], ["moo", 19.85], ["livestock, farm animals, working animals", 18.92]], [["speech", 38.7], ["vehicle", 18.85], ["buzz", 7.54]], null, null, null, null, [["fly, housefly", 32.52], ["mosquito", 15.84], ["insect", 6.24]], [["music", 75.07], ["synthesizer", 4.99], ["musical instrument", 3.88]], [["music", 80.11], ["grunt", 2.21], ["synthesizer", 1.42]], null, [["cattle, bovinae", 26.42], ["moo", 22.33], ["livestock, farm animals, working animals", 13.52]], null], "duration": [5.51, 12.47, 8.93, 31.07, 0.79, 0.99, 0.88, 2.79, 17.97, 11.96, 1.92, 3.78, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/ozksR8QLWzM_filtered.json b/annotations_filtered/ozksR8QLWzM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4a9b6d4d83e2698f43ee9c86fc6f86d4bf72600 --- /dev/null +++ b/annotations_filtered/ozksR8QLWzM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 10.03], [11.0, 23.11], [25.0, 24.93], [27.0, 27.63], [34.0, 33.94], [39.0, 45.13], [47.0, 50.95], [52.0, 51.93], [54.0, 55.22], [56.0, 57.89], [59.0, 59.95], [64.0, 68.94], [76.0, 77.58], [81.0, 82.39], [84.0, 88.86], [89.0, 88.99], [89.0, 89.11], [89.0, 98.64], [101.0, 101.07], [114.0, 115.16], [124.0, 127.2]], "keep_status": [false, true, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [31.15, 31.21, 0.0, 0.0, 0.0, 32.3, 34.84, 0.0, 0.0, 0.0, 0.0, 31.11, 0.0, 0.0, 32.28, 0.0, 0.0, 31.24, 0.0, 0.0, 30.22], "audiomae_on_audioset": [[["mains hum", 71.14], ["hum", 21.64], ["speech", 1.36]], [["music", 44.46], ["cacophony", 11.19], ["speech", 7.13]], null, null, null, [["mains hum", 27.61], ["hum", 24.97], ["buzz", 8.96]], [["bee, wasp, etc.", 18.97], ["fly, housefly", 10.61], ["insect", 9.68]], null, null, null, null, [["speech", 55.24], ["vehicle", 20.86], ["car", 4.01]], null, null, [["hum", 35.62], ["mains hum", 13.06], ["music", 10.75]], null, null, [["speech", 21.15], ["mains hum", 13.79], ["hum", 11.18]], null, null, [["speech", 61.73], ["vehicle", 15.97], ["music", 5.54]]], "duration": [9.03, 12.11, -0.07, 0.63, -0.06, 6.13, 3.95, -0.07, 1.22, 1.89, 0.95, 4.94, 1.58, 1.39, 4.86, -0.01, 0.11, 9.64, 0.07, 1.16, 3.2]} \ No newline at end of file diff --git a/annotations_filtered/ozpct8zUA_U_filtered.json b/annotations_filtered/ozpct8zUA_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b5c77655e2ff50d450474c8a4ee18d9d231e1f8 --- /dev/null +++ b/annotations_filtered/ozpct8zUA_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [4.0, 5.34], [9.0, 9.12], [10.0, 11.42], [12.0, 12.12], [15.0, 16.07], [19.0, 22.99], [25.0, 25.69], [27.0, 27.43], [28.0, 28.46], [30.0, 30.35], [33.0, 33.56], [35.0, 37.2], [38.0, 39.23], [43.0, 44.93], [48.0, 54.4], [55.0, 56.52], [57.0, 57.91], [59.0, 59.9], [60.0, 61.18], [63.0, 63.29], [66.0, 67.31], [71.0, 72.35], [74.0, 74.66], [77.0, 77.97], [79.0, 80.92], [83.0, 84.64], [87.0, 90.76], [92.0, 92.3], [93.0, 93.11], [95.0, 95.52], [96.0, 95.89], [100.0, 100.16], [101.0, 101.8], [103.0, 108.36], [109.0, 110.0], [111.0, 110.84], [112.0, 113.86], [116.0, 116.48], [117.0, 117.91], [120.0, 119.89], [120.0, 121.24], [123.0, 126.06], [128.0, 129.02], [130.0, 130.33], [131.0, 132.44], [133.0, 134.01], [135.0, 136.76], [137.0, 138.69], [140.0, 141.27], [144.0, 145.13], [147.0, 148.46], [149.0, 150.13], [153.0, 152.98], [155.0, 156.14], [158.0, 159.29], [160.0, 166.85], [168.0, 169.43], [170.0, 170.63], [172.0, 172.91], [178.0, 179.66], [186.0, 186.41], [188.0, 188.67], [189.0, 196.64], [199.0, 200.08], [201.0, 202.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 1.34, 0.12, 1.42, 0.12, 1.07, 3.99, 0.69, 0.43, 0.46, 0.35, 0.56, 2.2, 1.23, 1.93, 6.4, 1.52, 0.91, 0.9, 1.18, 0.29, 1.31, 1.35, 0.66, 0.97, 1.92, 1.64, 3.76, 0.3, 0.11, 0.52, -0.11, 0.16, 0.8, 5.36, 1.0, -0.16, 1.86, 0.48, 0.91, -0.11, 1.24, 3.06, 1.02, 0.33, 1.44, 1.01, 1.76, 1.69, 1.27, 1.13, 1.46, 1.13, -0.02, 1.14, 1.29, 6.85, 1.43, 0.63, 0.91, 1.66, 0.41, 0.67, 7.64, 1.08, 1.98]} \ No newline at end of file diff --git a/annotations_filtered/p-5nqrOtaug_filtered.json b/annotations_filtered/p-5nqrOtaug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b76c8a57261d305b015058f51f36a045d5c6c8bd --- /dev/null +++ b/annotations_filtered/p-5nqrOtaug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.13], [7.0, 9.88], [16.0, 18.08], [20.0, 21.12], [24.0, 25.91], [27.0, 28.32], [30.0, 30.13], [33.0, 60.32], [61.0, 62.46], [63.0, 65.16], [66.0, 66.58], [67.0, 68.25], [71.0, 74.28], [77.0, 77.01], [79.0, 83.59], [84.0, 83.84], [84.0, 83.93], [85.0, 119.45], [123.0, 131.75]], "keep_status": [false, true, false, false, false, false, false, true, false, true, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 36.95, 69.74, 0.0, 0.0, 0.0, 0.0, 29.89, 0.0, 47.98, 0.0, 0.0, 45.14, 0.0, 30.69, 0.0, 0.0, 0.0, 29.2], "audiomae_on_audioset": [null, [["speech", 28.75], ["music", 24.32], ["mosquito", 7.0]], null, null, null, null, null, [["cattle, bovinae", 21.13], ["livestock, farm animals, working animals", 14.68], ["moo", 12.25]], null, [["music", 36.0], ["speech", 20.83], ["didgeridoo", 9.46]], null, null, [["music", 58.57], ["speech", 5.8], ["musical instrument", 2.61]], null, [["speech", 29.93], ["music", 17.13], ["mosquito", 11.79]], null, null, null, [["speech", 21.85], ["music", 20.82], ["buzz", 6.8]]], "duration": [0.13, 2.88, 2.08, 1.12, 1.91, 1.32, 0.13, 27.32, 1.46, 2.16, 0.58, 1.25, 3.28, 0.01, 4.59, -0.16, -0.07, 34.45, 8.75]} \ No newline at end of file diff --git a/annotations_filtered/p-Kyr2Ibq3c_filtered.json b/annotations_filtered/p-Kyr2Ibq3c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f20c4cf332b3425fac5731e5aa52baa3a82b16ca --- /dev/null +++ b/annotations_filtered/p-Kyr2Ibq3c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.02], [13.0, 14.81], [16.0, 18.55], [19.0, 18.87], [19.0, 21.96], [22.0, 22.0], [25.0, 25.96], [27.0, 32.43], [34.0, 36.04], [43.0, 45.74], [51.0, 51.73], [54.0, 55.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 58.3, 0.0, 56.78, 0.0, 0.0, 62.58, 50.02, 31.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 72.35], ["radio", 4.81], ["dial tone", 3.82]], null, null], "duration": [1.02, 1.81, 2.55, -0.13, 2.96, 0.0, 0.96, 5.43, 2.04, 2.74, 0.73, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/p-YvF5eXwYM_filtered.json b/annotations_filtered/p-YvF5eXwYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58e8413da0b84880a21c30b19b646c36d15a1f61 --- /dev/null +++ b/annotations_filtered/p-YvF5eXwYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.23], [7.0, 7.5], [10.0, 9.71], [10.0, 14.17], [18.0, 18.23], [20.0, 22.03], [33.0, 33.78], [39.0, 39.46], [48.0, 47.92], [49.0, 50.18], [53.0, 54.13], [57.0, 59.29], [59.0, 60.83], [64.0, 64.5], [70.0, 73.6], [78.0, 80.23], [83.0, 84.67], [91.0, 91.71], [107.0, 109.19]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, true, false, false, true, true, false, false, true], "silence_prob": [36.43, 0.0, 0.0, 34.09, 0.0, 31.64, 0.0, 0.0, 0.0, 0.0, 0.0, 43.71, 0.0, 0.0, 36.67, 36.31, 0.0, 0.0, 35.58], "audiomae_on_audioset": [[["baby laughter", 38.08], ["laughter", 10.99], ["speech", 7.09]], null, null, [["speech", 26.89], ["whack, thwack", 13.91], ["rowboat, canoe, kayak", 11.14]], null, [["speech", 61.51], ["radio", 6.27], ["noise", 2.32]], null, null, null, null, null, [["music", 32.9], ["hum", 4.11], ["gong", 3.79]], null, null, [["music", 60.14], ["musical instrument", 4.84], ["speech", 4.18]], [["music", 37.91], ["theremin", 12.89], ["synthesizer", 6.02]], null, null, [["music", 32.19], ["speech", 19.29], ["hum", 8.96]]], "duration": [2.23, 0.5, -0.29, 4.17, 0.23, 2.03, 0.78, 0.46, -0.08, 1.18, 1.13, 2.29, 1.83, 0.5, 3.6, 2.23, 1.67, 0.71, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/p-echNQGbug_filtered.json b/annotations_filtered/p-echNQGbug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd22a358bae43172f13d633d8f245f608f90de6b --- /dev/null +++ b/annotations_filtered/p-echNQGbug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 29.13], [33.0, 37.23], [38.0, 37.74], [38.0, 37.77], [38.0, 37.88], [39.0, 49.59], [54.0, 74.76], [76.0, 76.65], [96.0, 96.97], [100.0, 101.07], [103.0, 104.3], [106.0, 107.2]], "keep_status": [true, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [31.44, 31.81, 0.0, 0.0, 0.0, 31.21, 30.38, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 17.97], ["music", 15.82], ["vehicle", 8.71]], [["music", 50.45], ["speech", 19.41], ["whack, thwack", 4.61]], null, null, null, [["speech", 33.93], ["music", 31.6], ["outside, rural or natural", 3.85]], [["music", 44.84], ["livestock, farm animals, working animals", 5.23], ["speech", 4.15]], null, null, null, null, null], "duration": [26.13, 4.23, -0.26, -0.23, -0.12, 10.59, 20.76, 0.65, 0.97, 1.07, 1.3, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/p-mlLMZXqg4_filtered.json b/annotations_filtered/p-mlLMZXqg4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..132f4c59ba523b3fdabd66507aeb24221d615e2b --- /dev/null +++ b/annotations_filtered/p-mlLMZXqg4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 95.94], [104.0, 104.65]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [54.94, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/p-tvo3Hz3nw_filtered.json b/annotations_filtered/p-tvo3Hz3nw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..589e01587e61758681f521ffb746d5f4a62ac3ff --- /dev/null +++ b/annotations_filtered/p-tvo3Hz3nw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 23.41], [32.0, 37.2], [40.0, 45.2], [46.0, 47.76], [50.0, 78.51], [82.0, 82.16], [88.0, 91.74], [93.0, 94.76]], "keep_status": [true, false, true, false, false, false, true, false], "silence_prob": [29.81, 68.28, 33.77, 0.0, 34.57, 0.0, 44.52, 0.0], "audiomae_on_audioset": [[["music", 32.78], ["smash, crash", 15.04], ["whack, thwack", 10.45]], null, [["cattle, bovinae", 15.95], ["livestock, farm animals, working animals", 15.44], ["animal", 7.41]], null, [["hum", 39.33], ["throbbing", 30.2], ["music", 8.32]], null, [["music", 50.14], ["synthesizer", 6.97], ["electronic music", 5.66]], null], "duration": [15.41, 5.2, 5.2, 1.76, 28.51, 0.16, 3.74, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/p0-xbD-mRLs_filtered.json b/annotations_filtered/p0-xbD-mRLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..349a6a8787c74d47cc22dad13234d33d06220dc4 --- /dev/null +++ b/annotations_filtered/p0-xbD-mRLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.14], [8.0, 10.37], [12.0, 15.3], [19.0, 19.6], [24.0, 24.68], [26.0, 30.28], [33.0, 40.54], [42.0, 42.65], [44.0, 44.63], [50.0, 50.84], [55.0, 55.14], [57.0, 57.97], [59.0, 59.43], [61.0, 61.48], [63.0, 63.37], [67.0, 67.42], [70.0, 70.82], [72.0, 77.35], [81.0, 81.16], [87.0, 87.78], [92.0, 94.27], [100.0, 101.71], [110.0, 111.6]], "keep_status": [true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [40.9, 98.44, 49.18, 0.0, 0.0, 42.13, 90.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.38, 0.0, 0.0, 47.86, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 23.34], ["music", 13.38], ["noise", 12.25]], null, [["cattle, bovinae", 19.36], ["moo", 16.1], ["speech", 13.97]], null, null, [["speech", 53.96], ["noise", 11.85], ["radio", 3.74]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 65.01], ["hum", 3.41], ["throbbing", 2.87]], null, null, [["gurgling", 9.52], ["stomach rumble", 8.09], ["patter", 7.93]], null, null], "duration": [3.14, 2.37, 3.3, 0.6, 0.68, 4.28, 7.54, 0.65, 0.63, 0.84, 0.14, 0.97, 0.43, 0.48, 0.37, 0.42, 0.82, 5.35, 0.16, 0.78, 2.27, 1.71, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/p03u3v6GF-Y_filtered.json b/annotations_filtered/p03u3v6GF-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca84335babd313913e683bc73fdcf67d9d613732 --- /dev/null +++ b/annotations_filtered/p03u3v6GF-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.98], [10.0, 16.77], [24.0, 28.29], [33.0, 49.18], [56.0, 59.19], [61.0, 79.86], [80.0, 86.02], [93.0, 104.89], [107.0, 116.48], [116.0, 116.51], [117.0, 116.95], [117.0, 127.45], [132.0, 134.0], [137.0, 144.9]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 35.37, 33.3, 32.09, 32.48, 32.47, 32.79, 33.18, 32.09, 0.0, 0.0, 32.66, 36.58, 33.67], "audiomae_on_audioset": [null, [["music", 39.71], ["gong", 31.89], ["musical instrument", 4.81]], [["music", 51.32], ["synthesizer", 10.24], ["musical instrument", 7.9]], [["music", 73.5], ["musical instrument", 7.21], ["echo", 2.73]], [["music", 86.89], ["musical instrument", 2.2], ["echo", 0.83]], [["music", 67.37], ["musical instrument", 7.94], ["trombone", 3.97]], [["music", 81.0], ["musical instrument", 4.96], ["theremin", 4.79]], [["music", 57.08], ["musical instrument", 12.27], ["brass instrument", 9.72]], [["music", 61.37], ["synthesizer", 7.88], ["musical instrument", 7.47]], null, null, [["music", 38.25], ["trombone", 27.28], ["brass instrument", 19.96]], [["music", 48.37], ["theremin", 25.41], ["effects unit", 7.41]], [["gong", 38.01], ["music", 16.39], ["synthesizer", 6.7]]], "duration": [0.98, 6.77, 4.29, 16.18, 3.19, 18.86, 6.02, 11.89, 9.48, 0.51, -0.05, 10.45, 2.0, 7.9]} \ No newline at end of file diff --git a/annotations_filtered/p07sXB8H3zQ_filtered.json b/annotations_filtered/p07sXB8H3zQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb5488ec9b043fdea4b14663d67551a5b27b39e8 --- /dev/null +++ b/annotations_filtered/p07sXB8H3zQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.32], [10.0, 10.2], [12.0, 12.38], [20.0, 24.24], [26.0, 28.7], [31.0, 32.22], [33.0, 34.3], [36.0, 36.36], [38.0, 38.4], [42.0, 42.67], [44.0, 47.53], [58.0, 58.75], [63.0, 67.85], [69.0, 71.61], [76.0, 81.84], [87.0, 89.5]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.27, 31.62, 0.0, 0.0, 0.0, 0.0, 0.0, 36.16, 0.0, 31.41, 32.33, 31.53, 32.68], "audiomae_on_audioset": [null, null, null, [["music", 42.07], ["hum", 20.02], ["electronic music", 6.1]], [["music", 29.26], ["speech", 28.91], ["hum", 6.75]], null, null, null, null, null, [["music", 50.98], ["didgeridoo", 12.18], ["speech", 6.88]], null, [["speech", 47.1], ["whale vocalization", 22.78], ["music", 7.82]], [["speech", 69.45], ["chuckle, chortle", 4.39], ["snicker", 3.75]], [["music", 45.07], ["throbbing", 5.08], ["electronic music", 4.54]], [["music", 63.52], ["didgeridoo", 4.33], ["hum", 4.32]]], "duration": [0.32, 0.2, 0.38, 4.24, 2.7, 1.22, 1.3, 0.36, 0.4, 0.67, 3.53, 0.75, 4.85, 2.61, 5.84, 2.5]} \ No newline at end of file diff --git a/annotations_filtered/p0BpMFTYFpU_filtered.json b/annotations_filtered/p0BpMFTYFpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee6ffe2a43fb5916c4787e73bafd40c970734b53 --- /dev/null +++ b/annotations_filtered/p0BpMFTYFpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 32.48], [34.0, 34.89], [37.0, 37.34], [40.0, 39.82], [46.0, 48.54], [64.0, 67.76], [69.0, 71.49], [72.0, 82.97], [85.0, 84.94], [88.0, 88.79], [94.0, 96.74], [100.0, 100.9], [104.0, 103.99], [113.0, 112.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [70.58, 0.0, 0.0, 0.0, 44.87, 99.93, 93.76, 84.25, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 43.0], ["a capella", 22.94], ["yodeling", 8.42]], null, null, null, null, null, null, null, null, null], "duration": [12.48, 0.89, 0.34, -0.18, 2.54, 3.76, 2.49, 10.97, -0.06, 0.79, 2.74, 0.9, -0.01, -0.17]} \ No newline at end of file diff --git a/annotations_filtered/p0CKoz0u6Eo_filtered.json b/annotations_filtered/p0CKoz0u6Eo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..591356675863f0c5afb742176a06ef6307606aac --- /dev/null +++ b/annotations_filtered/p0CKoz0u6Eo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.27], [17.0, 32.14], [36.0, 37.1], [39.0, 42.13], [42.0, 48.71], [49.0, 51.92], [52.0, 55.68], [59.0, 59.56], [60.0, 60.66], [62.0, 63.21], [66.0, 66.24], [83.0, 83.03], [89.0, 89.97], [92.0, 92.43], [94.0, 94.46], [96.0, 96.9], [98.0, 100.16], [103.0, 103.99], [106.0, 107.6], [108.0, 110.4]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 40.92, 0.0, 33.84, 33.42, 41.56, 39.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.57, 0.0, 0.0, 60.05], "audiomae_on_audioset": [null, [["effects unit", 21.98], ["echo", 12.84], ["distortion", 6.59]], null, [["speech", 32.44], ["whimper", 5.4], ["music", 4.95]], [["music", 34.69], ["didgeridoo", 33.3], ["speech", 7.22]], [["sidetone", 30.96], ["music", 26.59], ["speech", 12.56]], [["music", 78.95], ["musical instrument", 6.23], ["synthesizer", 3.31]], null, null, null, null, null, null, null, null, null, [["speech", 19.86], ["animal", 7.92], ["livestock, farm animals, working animals", 5.43]], null, null, null], "duration": [0.27, 15.14, 1.1, 3.13, 6.71, 2.92, 3.68, 0.56, 0.66, 1.21, 0.24, 0.03, 0.97, 0.43, 0.46, 0.9, 2.16, 0.99, 1.6, 2.4]} \ No newline at end of file diff --git a/annotations_filtered/p0CQcDumPh8_filtered.json b/annotations_filtered/p0CQcDumPh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e037535174280424fca31be0e77fa93b3ba0ec2 --- /dev/null +++ b/annotations_filtered/p0CQcDumPh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 36.88], [40.0, 44.71], [47.0, 73.77], [76.0, 76.22], [79.0, 81.4], [85.0, 87.69], [94.0, 95.12], [96.0, 96.13], [97.0, 98.51], [104.0, 104.38], [107.0, 107.1], [108.0, 109.34], [111.0, 111.64], [113.0, 113.41], [116.0, 117.69], [118.0, 119.04], [121.0, 121.81], [125.0, 125.66], [129.0, 130.22], [133.0, 135.16], [141.0, 140.78], [144.0, 144.21], [146.0, 146.91], [148.0, 149.25], [150.0, 151.75], [154.0, 154.58], [157.0, 156.91], [159.0, 161.87]], "keep_status": [true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.0, 31.22, 30.12, 0.0, 37.25, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.26], "audiomae_on_audioset": [[["music", 36.16], ["animal", 8.22], ["drum machine", 4.08]], [["music", 53.03], ["speech", 8.84], ["cattle, bovinae", 4.63]], [["music", 64.0], ["cattle, bovinae", 12.75], ["moo", 5.61]], null, [["speech", 24.59], ["telephone", 19.23], ["insect", 6.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.88, 4.71, 26.77, 0.22, 2.4, 2.69, 1.12, 0.13, 1.51, 0.38, 0.1, 1.34, 0.64, 0.41, 1.69, 1.04, 0.81, 0.66, 1.22, 2.16, -0.22, 0.21, 0.91, 1.25, 1.75, 0.58, -0.09, 2.87]} \ No newline at end of file diff --git a/annotations_filtered/p0Ov897MYiw_filtered.json b/annotations_filtered/p0Ov897MYiw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f9eeafd103139fad2f4b7196a579602a16ac517 --- /dev/null +++ b/annotations_filtered/p0Ov897MYiw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.54], [7.0, 27.26], [35.0, 37.62], [38.0, 38.33], [38.0, 45.54], [46.0, 46.74], [49.0, 49.96], [56.0, 64.5], [66.0, 95.57], [96.0, 99.54], [101.0, 110.93], [111.0, 111.45], [111.0, 120.48], [120.0, 120.51]], "keep_status": [false, false, true, false, true, false, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 47.82, 31.21, 0.0, 33.27, 0.0, 0.0, 29.68, 30.22, 32.39, 30.14, 0.0, 33.02, 0.0], "audiomae_on_audioset": [null, [["hum", 41.15], ["mains hum", 24.43], ["music", 5.06]], [["music", 40.45], ["musical instrument", 6.78], ["effects unit", 5.31]], null, [["music", 51.88], ["synthesizer", 11.15], ["effects unit", 5.72]], null, null, [["music", 51.26], ["trombone", 9.45], ["musical instrument", 7.9]], [["music", 57.81], ["vehicle", 10.84], ["car", 6.89]], [["music", 19.44], ["hum", 13.92], ["mains hum", 12.03]], [["music", 68.76], ["vehicle", 3.83], ["electronic music", 2.69]], null, [["music", 36.45], ["theremin", 9.01], ["didgeridoo", 8.22]], null], "duration": [0.54, 20.26, 2.62, 0.33, 7.54, 0.74, 0.96, 8.5, 29.57, 3.54, 9.93, 0.45, 9.48, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/p0cf4-1zuOk_filtered.json b/annotations_filtered/p0cf4-1zuOk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5832947a174760cf9107c1d52c7b0622564de283 --- /dev/null +++ b/annotations_filtered/p0cf4-1zuOk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 56.84], [58.0, 58.94], [60.0, 60.29], [63.0, 67.64], [71.0, 73.75], [74.0, 75.29], [75.0, 94.66], [96.0, 111.55], [112.0, 113.43], [114.0, 118.12], [123.0, 124.55]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.63, 30.86, 0.0, 29.94, 31.01, 0.0, 89.9, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 41.8], ["hum", 18.67], ["throbbing", 17.25]], [["music", 79.32], ["meow", 3.86], ["throbbing", 2.88]], null, [["music", 52.54], ["hum", 6.89], ["throbbing", 5.97]], [["music", 40.5], ["didgeridoo", 8.63], ["synthesizer", 5.59]], null, null, null], "duration": [-0.16, 0.94, 0.29, 4.64, 2.75, 1.29, 19.66, 15.55, 1.43, 4.12, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/p0vZhGqM_Rs_filtered.json b/annotations_filtered/p0vZhGqM_Rs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9271600cb44b2ad54d2fa4cbdeae1ed5662341f0 --- /dev/null +++ b/annotations_filtered/p0vZhGqM_Rs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[55.0, 55.41], [56.0, 56.03], [56.0, 69.09], [74.0, 77.31], [80.0, 81.36], [83.0, 84.57], [88.0, 90.37], [93.0, 94.31], [98.0, 100.6], [101.0, 102.2], [106.0, 107.45], [109.0, 111.25], [115.0, 116.11], [119.0, 118.99], [119.0, 119.38], [123.0, 125.95], [136.0, 137.69], [138.0, 142.69], [144.0, 144.93], [146.0, 152.24], [154.0, 153.93], [156.0, 156.83]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.56, 48.39, 0.0, 0.0, 49.73, 0.0, 56.55, 0.0, 0.0, 57.97, 0.0, 0.0, 0.0, 53.72, 0.0, 59.51, 0.0, 55.39, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sonar", 40.19], ["music", 25.05], ["hum", 4.94]], [["music", 15.25], ["sonar", 11.46], ["hum", 6.78]], null, null, [["music", 29.18], ["whale vocalization", 9.69], ["hum", 9.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, 0.03, 13.09, 3.31, 1.36, 1.57, 2.37, 1.31, 2.6, 1.2, 1.45, 2.25, 1.11, -0.01, 0.38, 2.95, 1.69, 4.69, 0.93, 6.24, -0.07, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/p12YiRom_Kw_filtered.json b/annotations_filtered/p12YiRom_Kw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d0defa1489826ca09146943cbff2bb91cf4d945 --- /dev/null +++ b/annotations_filtered/p12YiRom_Kw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.0], [12.0, 12.77], [13.0, 14.54], [19.0, 19.09], [21.0, 22.69], [24.0, 25.79]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.0, 0.77, 1.54, 0.09, 1.69, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/p1e3NC3IIF8_filtered.json b/annotations_filtered/p1e3NC3IIF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a39ccdfa7c83be52a14075a2162ccd5e4a7b112 --- /dev/null +++ b/annotations_filtered/p1e3NC3IIF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.72], [20.0, 24.29], [34.0, 35.48], [37.0, 38.64], [42.0, 43.85], [46.0, 46.77], [50.0, 49.92], [54.0, 53.86], [58.0, 60.02], [61.0, 62.83], [65.0, 65.42], [71.0, 71.04], [72.0, 83.44], [86.0, 86.07], [88.0, 96.84], [97.0, 97.93], [100.0, 104.63], [108.0, 107.79], [121.0, 130.79], [133.0, 132.9], [141.0, 141.3], [141.0, 141.74], [145.0, 144.64], [145.0, 146.16], [148.0, 148.42], [151.0, 155.12], [157.0, 157.6], [161.0, 162.04], [165.0, 166.13], [167.0, 167.44], [171.0, 173.69], [175.0, 178.85], [179.0, 182.24]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 41.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.95, 0.0, 0.0, 0.0, 32.77, 0.0, 38.12, 0.0, 62.27, 0.0, 45.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.7, 0.0, 0.0, 0.0, 0.0, 55.18, 45.14, 44.55], "audiomae_on_audioset": [null, [["music", 45.14], ["didgeridoo", 5.98], ["hum", 5.25]], null, null, null, null, null, null, [["music", 57.82], ["throbbing", 7.95], ["hum", 7.05]], null, null, null, [["music", 40.52], ["hum", 17.17], ["mains hum", 10.43]], null, [["speech", 59.92], ["hum", 16.89], ["mains hum", 4.44]], null, null, null, [["music", 49.61], ["hum", 5.65], ["fly, housefly", 4.28]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.46], ["speech", 17.1], ["synthesizer", 3.62]], [["music", 52.37], ["speech", 13.02], ["hum", 7.9]]], "duration": [-0.28, 4.29, 1.48, 1.64, 1.85, 0.77, -0.08, -0.14, 2.02, 1.83, 0.42, 0.04, 11.44, 0.07, 8.84, 0.93, 4.63, -0.21, 9.79, -0.1, 0.3, 0.74, -0.36, 1.16, 0.42, 4.12, 0.6, 1.04, 1.13, 0.44, 2.69, 3.85, 3.24]} \ No newline at end of file diff --git a/annotations_filtered/p1lnXM7l2_g_filtered.json b/annotations_filtered/p1lnXM7l2_g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfef0d4267660f4bc8c5a58faf7640207ed1658e --- /dev/null +++ b/annotations_filtered/p1lnXM7l2_g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.26], [9.0, 10.98], [12.0, 15.53], [17.0, 22.64], [24.0, 24.48], [24.0, 33.69], [38.0, 38.94], [40.0, 40.02], [47.0, 48.56], [59.0, 60.61], [63.0, 66.95], [68.0, 68.81], [71.0, 71.36], [75.0, 76.06], [84.0, 85.67], [88.0, 92.96], [94.0, 94.29], [96.0, 96.3]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 34.63, 32.31, 0.0, 31.8, 0.0, 0.0, 0.0, 0.0, 31.11, 0.0, 0.0, 0.0, 0.0, 33.85, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 19.62], ["gong", 17.68], ["mains hum", 13.38]], [["music", 35.49], ["speech", 11.21], ["mains hum", 7.84]], null, [["music", 72.96], ["musical instrument", 9.85], ["synthesizer", 3.35]], null, null, null, null, [["didgeridoo", 35.07], ["music", 28.72], ["speech", 15.77]], null, null, null, null, [["didgeridoo", 33.69], ["music", 10.45], ["fart", 5.94]], null, null], "duration": [1.26, 1.98, 3.53, 5.64, 0.48, 9.69, 0.94, 0.02, 1.56, 1.61, 3.95, 0.81, 0.36, 1.06, 1.67, 4.96, 0.29, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/p29GuFPbzsg_filtered.json b/annotations_filtered/p29GuFPbzsg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..daf3ac37b59ba266c37c2c15d0cc3a1d25d00fdd --- /dev/null +++ b/annotations_filtered/p29GuFPbzsg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.7], [24.0, 27.5], [29.0, 29.86], [31.0, 32.02], [39.0, 40.1], [42.0, 42.01], [43.0, 43.26], [45.0, 45.42], [54.0, 59.24], [69.0, 69.67], [78.0, 78.49], [85.0, 85.63], [95.0, 96.53], [98.0, 99.94], [105.0, 114.24], [124.0, 125.63], [142.0, 142.8], [144.0, 145.17], [145.0, 145.67], [146.0, 147.04], [148.0, 148.64], [149.0, 149.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.66, 0.0, 0.0, 0.0, 0.0, 0.0, 40.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.8], ["bell", 15.05], ["church bell", 10.64]], null, null, null, null, null, null, null], "duration": [0.7, 3.5, 0.86, 1.02, 1.1, 0.01, 0.26, 0.42, 5.24, 0.67, 0.49, 0.63, 1.53, 1.94, 9.24, 1.63, 0.8, 1.17, 0.67, 1.04, 0.64, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/p2CR0S7DHyQ_filtered.json b/annotations_filtered/p2CR0S7DHyQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..232dd42dd278be5801d3180b3a8d6a22197374dc --- /dev/null +++ b/annotations_filtered/p2CR0S7DHyQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.52], [7.0, 7.86], [9.0, 10.25], [11.0, 11.52], [13.0, 13.63], [14.0, 15.26], [17.0, 17.88], [18.0, 26.89], [27.0, 31.82], [34.0, 36.54], [37.0, 51.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.62, 74.44, 93.91, 81.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.86, 1.25, 0.52, 0.63, 1.26, 0.88, 8.89, 4.82, 2.54, 14.02]} \ No newline at end of file diff --git a/annotations_filtered/p2Md_248enw_filtered.json b/annotations_filtered/p2Md_248enw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e82b0b44ed826346cfbab58992e6a36bec50a424 --- /dev/null +++ b/annotations_filtered/p2Md_248enw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.19], [6.0, 5.88], [6.0, 6.98], [7.0, 7.82], [8.0, 7.96], [8.0, 9.19], [11.0, 15.63], [21.0, 21.17], [26.0, 26.11], [28.0, 29.73], [30.0, 30.69], [32.0, 32.19], [33.0, 34.13], [34.0, 34.43], [37.0, 36.91], [39.0, 42.74], [49.0, 49.11], [50.0, 52.19], [53.0, 53.18], [60.0, 60.94], [65.0, 65.91], [67.0, 67.69], [68.0, 69.99], [81.0, 81.36], [83.0, 83.49], [84.0, 84.47], [86.0, 86.54], [93.0, 94.93], [95.0, 95.47], [98.0, 98.56], [101.0, 101.17], [103.0, 105.76], [107.0, 107.43], [122.0, 122.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 39.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 61.79], ["sidetone", 17.04], ["radio", 5.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.19, -0.12, 0.98, 0.82, -0.04, 1.19, 4.63, 0.17, 0.11, 1.73, 0.69, 0.19, 1.13, 0.43, -0.09, 3.74, 0.11, 2.19, 0.18, 0.94, 0.91, 0.69, 1.99, 0.36, 0.49, 0.47, 0.54, 1.93, 0.47, 0.56, 0.17, 2.76, 0.43, 0.08]} \ No newline at end of file diff --git a/annotations_filtered/p2QiCFAQ-qQ_filtered.json b/annotations_filtered/p2QiCFAQ-qQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0527a23576cedb7ade8d11b3093d821beb445105 --- /dev/null +++ b/annotations_filtered/p2QiCFAQ-qQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.9], [17.0, 18.62], [19.0, 20.51], [23.0, 23.25], [24.0, 24.31], [28.0, 28.46], [33.0, 34.67], [43.0, 43.09], [44.0, 44.32], [45.0, 47.34], [48.0, 48.56], [51.0, 51.34], [55.0, 54.94], [56.0, 57.01], [62.0, 62.07], [65.0, 67.54], [68.0, 69.28], [71.0, 71.78], [76.0, 77.48], [79.0, 81.04], [82.0, 99.0], [99.0, 100.72], [103.0, 103.33], [105.0, 108.46], [116.0, 116.29], [117.0, 117.68], [118.0, 119.55], [120.0, 120.66], [126.0, 125.88], [129.0, 130.35], [134.0, 134.27], [135.0, 135.55], [137.0, 140.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 99.65, 31.16, 0.0, 0.0, 54.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.45], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 49.43], ["speech", 19.26], ["music", 16.98]], null, null, null, null, null, null, null, null, null, null, null, [["music", 71.56], ["breaking", 19.63], ["smash, crash", 2.26]]], "duration": [3.9, 1.62, 1.51, 0.25, 0.31, 0.46, 1.67, 0.09, 0.32, 2.34, 0.56, 0.34, -0.06, 1.01, 0.07, 2.54, 1.28, 0.78, 1.48, 2.04, 17.0, 1.72, 0.33, 3.46, 0.29, 0.68, 1.55, 0.66, -0.12, 1.35, 0.27, 0.55, 3.37]} \ No newline at end of file diff --git a/annotations_filtered/p2fHtpp_umI_filtered.json b/annotations_filtered/p2fHtpp_umI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f383a87cdc1d44cbf442505759fcb4b0f08fd11 --- /dev/null +++ b/annotations_filtered/p2fHtpp_umI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.29], [4.0, 4.41], [13.0, 13.14], [15.0, 14.98], [16.0, 16.55], [18.0, 18.0], [19.0, 19.63], [23.0, 23.95], [27.0, 27.75], [29.0, 29.27], [32.0, 34.65], [47.0, 47.21], [61.0, 60.72], [64.0, 64.59], [67.0, 68.5], [70.0, 70.55], [72.0, 72.91], [75.0, 75.22], [77.0, 78.16], [80.0, 81.13], [85.0, 85.72], [86.0, 87.62], [89.0, 89.97], [91.0, 91.64], [92.0, 93.02], [94.0, 95.49], [96.0, 98.42], [99.0, 100.35], [101.0, 101.71], [105.0, 104.92], [106.0, 106.32], [107.0, 108.09], [110.0, 110.76], [112.0, 112.87], [115.0, 115.84], [117.0, 117.26], [118.0, 118.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 0.41, 0.14, -0.02, 0.55, 0.0, 0.63, 0.95, 0.75, 0.27, 2.65, 0.21, -0.28, 0.59, 1.5, 0.55, 0.91, 0.22, 1.16, 1.13, 0.72, 1.62, 0.97, 0.64, 1.02, 1.49, 2.42, 1.35, 0.71, -0.08, 0.32, 1.09, 0.76, 0.87, 0.84, 0.26, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/p2zDdb_MqmI_filtered.json b/annotations_filtered/p2zDdb_MqmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33a957da0615285a633790464f59a7e96a6cead1 --- /dev/null +++ b/annotations_filtered/p2zDdb_MqmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.8], [24.0, 24.8], [25.0, 35.01], [35.0, 36.24], [41.0, 42.74], [43.0, 45.22], [50.0, 52.62], [56.0, 61.72], [67.0, 70.7], [81.0, 81.38], [83.0, 93.55], [95.0, 96.5], [99.0, 106.69], [109.0, 109.85], [112.0, 112.51], [117.0, 117.61], [118.0, 117.71], [118.0, 120.02], [121.0, 125.9], [132.0, 143.75], [144.0, 144.75], [147.0, 146.74], [148.0, 150.16], [151.0, 153.79], [158.0, 159.66], [161.0, 161.67], [162.0, 174.65], [176.0, 190.31], [192.0, 193.62]], "keep_status": [true, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, true, true, true, false, false, false, true, false, false, true, true, false], "silence_prob": [34.12, 0.0, 30.33, 0.0, 0.0, 32.69, 31.17, 30.57, 33.24, 0.0, 31.54, 0.0, 30.97, 0.0, 0.0, 0.0, 0.0, 38.94, 36.85, 30.78, 0.0, 0.0, 50.16, 34.43, 0.0, 0.0, 33.12, 30.76, 0.0], "audiomae_on_audioset": [[["music", 28.58], ["speech", 24.64], ["quack", 5.52]], null, [["music", 43.78], ["speech", 29.45], ["vehicle", 3.38]], null, null, [["music", 44.0], ["speech", 26.21], ["trombone", 4.16]], [["music", 49.03], ["speech", 13.7], ["cattle, bovinae", 6.99]], [["music", 60.28], ["throbbing", 4.01], ["cattle, bovinae", 3.42]], [["music", 17.66], ["throbbing", 10.4], ["honk", 7.18]], null, [["livestock, farm animals, working animals", 38.02], ["moo", 23.55], ["cattle, bovinae", 20.52]], null, [["music", 52.15], ["speech", 14.0], ["throbbing", 4.83]], null, null, null, null, [["noise", 14.7], ["livestock, farm animals, working animals", 9.37], ["cattle, bovinae", 9.3]], [["fart", 25.32], ["speech", 24.22], ["noise", 15.26]], [["smash, crash", 22.94], ["livestock, farm animals, working animals", 17.59], ["music", 16.04]], null, null, null, [["music", 17.52], ["fly, housefly", 10.57], ["didgeridoo", 9.2]], null, null, [["music", 37.48], ["throbbing", 12.59], ["hum", 11.83]], [["vehicle", 30.73], ["car", 16.06], ["race car, auto racing", 10.09]], null], "duration": [3.8, 0.8, 10.01, 1.24, 1.74, 2.22, 2.62, 5.72, 3.7, 0.38, 10.55, 1.5, 7.69, 0.85, 0.51, 0.61, -0.29, 2.02, 4.9, 11.75, 0.75, -0.26, 2.16, 2.79, 1.66, 0.67, 12.65, 14.31, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/p32OEIazBew_filtered.json b/annotations_filtered/p32OEIazBew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60fde73d6b19dc09e9506632381697d06b36a9bc --- /dev/null +++ b/annotations_filtered/p32OEIazBew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.8], [13.0, 20.78], [24.0, 27.63], [28.0, 33.51], [34.0, 39.23], [41.0, 41.45], [43.0, 44.69], [47.0, 57.65], [59.0, 59.81], [63.0, 63.8], [66.0, 67.59], [70.0, 80.72], [84.0, 83.78], [84.0, 91.03], [91.0, 92.99], [93.0, 93.02], [94.0, 100.9], [110.0, 122.37], [123.0, 140.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [37.38, 34.58, 39.43, 37.75, 32.52, 0.0, 0.0, 33.99, 0.0, 0.0, 0.0, 32.92, 0.0, 32.22, 0.0, 0.0, 31.63, 33.58, 38.79], "audiomae_on_audioset": [[["music", 89.32], ["lullaby", 1.99], ["humming", 1.02]], [["music", 79.8], ["lullaby", 2.64], ["musical instrument", 2.05]], [["music", 44.2], ["harp", 21.08], ["pizzicato", 9.13]], [["music", 69.75], ["lullaby", 4.01], ["singing", 2.98]], [["music", 78.64], ["lullaby", 11.38], ["singing", 0.78]], null, null, [["music", 84.46], ["lullaby", 1.81], ["singing", 1.51]], null, null, null, [["music", 85.34], ["singing", 1.62], ["harp", 1.34]], null, [["music", 83.43], ["humming", 2.92], ["lullaby", 2.61]], null, null, [["music", 89.61], ["synthetic singing", 2.75], ["lullaby", 2.41]], [["music", 84.11], ["chorus effect", 3.42], ["singing", 1.29]], [["music", 52.51], ["singing bowl", 6.8], ["synthesizer", 3.19]]], "duration": [5.8, 7.78, 3.63, 5.51, 5.23, 0.45, 1.69, 10.65, 0.81, 0.8, 1.59, 10.72, -0.22, 7.03, 1.99, 0.02, 6.9, 12.37, 17.95]} \ No newline at end of file diff --git a/annotations_filtered/p39lIRTEPY4_filtered.json b/annotations_filtered/p39lIRTEPY4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5379449ce1e19047e240fec7efd11dc85c634a4f --- /dev/null +++ b/annotations_filtered/p39lIRTEPY4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 46.09], [48.0, 93.45], [95.0, 101.28], [102.0, 131.95]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 92.15, 29.06], "audiomae_on_audioset": [null, null, null, [["music", 21.68], ["breaking", 14.75], ["rumble", 8.77]]], "duration": [42.09, 45.45, 6.28, 29.95]} \ No newline at end of file diff --git a/annotations_filtered/p3ZnaRMhD_A_filtered.json b/annotations_filtered/p3ZnaRMhD_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d69566bb8932521c09c51f098c5ce9bd1c3eeb33 --- /dev/null +++ b/annotations_filtered/p3ZnaRMhD_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.39], [8.0, 9.91], [14.0, 16.43], [19.0, 20.04], [22.0, 24.14], [27.0, 33.12], [35.0, 37.35], [40.0, 41.0], [43.0, 44.61], [47.0, 50.13], [51.0, 52.47], [55.0, 56.39], [59.0, 61.28], [63.0, 64.74], [70.0, 70.28], [75.0, 75.78], [85.0, 86.43], [88.0, 90.36], [96.0, 96.77], [98.0, 99.3], [104.0, 104.38], [113.0, 114.4], [115.0, 115.99], [117.0, 119.16], [121.0, 126.57], [128.0, 129.79], [131.0, 133.1], [135.0, 135.75], [139.0, 139.16], [140.0, 140.76], [144.0, 158.36], [161.0, 162.85], [163.0, 168.37], [169.0, 170.11], [171.0, 171.63], [175.0, 176.59], [178.0, 178.63], [180.0, 182.21], [184.0, 185.03], [189.0, 190.17], [193.0, 199.22], [200.0, 201.19], [203.0, 203.82], [210.0, 212.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.97, 0.0, 97.54, 99.98, 57.32, 0.0, 0.0, 100.0, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 43.9, 0.0, 0.0, 0.0, 96.17, 0.0, 53.47, 0.0, 0.0, 0.0, 0.0, 90.78, 0.0, 0.0, 66.27, 0.0, 0.0, 97.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["stomach rumble", 41.72], ["sidetone", 7.25], ["effects unit", 6.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 1.91, 2.43, 1.04, 2.14, 6.12, 2.35, 1.0, 1.61, 3.13, 1.47, 1.39, 2.28, 1.74, 0.28, 0.78, 1.43, 2.36, 0.77, 1.3, 0.38, 1.4, 0.99, 2.16, 5.57, 1.79, 2.1, 0.75, 0.16, 0.76, 14.36, 1.85, 5.37, 1.11, 0.63, 1.59, 0.63, 2.21, 1.03, 1.17, 6.22, 1.19, 0.82, 2.58]} \ No newline at end of file diff --git a/annotations_filtered/p3zb4fwFd3E_filtered.json b/annotations_filtered/p3zb4fwFd3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..634ecce56d77c807e4ba1193f4513e06a564c984 --- /dev/null +++ b/annotations_filtered/p3zb4fwFd3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 119.35], [120.0, 123.33], [124.0, 140.37], [142.0, 161.59], [167.0, 169.94], [172.0, 187.49], [189.0, 190.54]], "keep_status": [false, true, false, false, true, true, false], "silence_prob": [0.0, 39.35, 29.93, 30.66, 33.68, 31.39, 0.0], "audiomae_on_audioset": [null, [["music", 29.36], ["hum", 18.6], ["throbbing", 10.84]], [["hum", 42.93], ["music", 25.55], ["throbbing", 9.96]], [["music", 46.18], ["throbbing", 25.98], ["hum", 7.97]], [["music", 28.64], ["frog", 11.05], ["croak", 6.6]], [["gong", 32.68], ["music", 24.65], ["hum", 11.76]], null], "duration": [53.35, 3.33, 16.37, 19.59, 2.94, 15.49, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/p43EnAUd3-w_filtered.json b/annotations_filtered/p43EnAUd3-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..997bab723ef344f2358e5a7759b9cfc6975005ee --- /dev/null +++ b/annotations_filtered/p43EnAUd3-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.46], [21.0, 27.03], [27.0, 28.22], [30.0, 35.48], [36.0, 42.9], [44.0, 45.37], [46.0, 46.84], [49.0, 49.11], [50.0, 51.68]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 77.87, 0.0, 100.0, 31.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 19.24], ["music", 11.62], ["carnatic music", 7.52]], null, null, null, null], "duration": [1.46, 6.03, 1.22, 5.48, 6.9, 1.37, 0.84, 0.11, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/p4HqnBtsz1I_filtered.json b/annotations_filtered/p4HqnBtsz1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..215954be729f5debad13ceb620844eac15024c86 --- /dev/null +++ b/annotations_filtered/p4HqnBtsz1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.54], [4.0, 5.39], [6.0, 6.72], [10.0, 10.12], [12.0, 12.29], [13.0, 13.91], [15.0, 15.45], [16.0, 21.15], [25.0, 29.46], [31.0, 38.25], [41.0, 44.15], [48.0, 53.65], [56.0, 56.61], [58.0, 58.63], [59.0, 59.68], [60.0, 61.15], [62.0, 62.97], [65.0, 65.84], [68.0, 68.99], [70.0, 70.26], [72.0, 73.38], [74.0, 75.83], [78.0, 81.24], [89.0, 90.07], [95.0, 97.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.33, 61.97, 47.46, 55.67, 76.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 99.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 57.81], ["ambient music", 19.46], ["singing bowl", 6.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.54, 1.39, 0.72, 0.12, 0.29, 0.91, 0.45, 5.15, 4.46, 7.25, 3.15, 5.65, 0.61, 0.63, 0.68, 1.15, 0.97, 0.84, 0.99, 0.26, 1.38, 1.83, 3.24, 1.07, 2.53]} \ No newline at end of file diff --git a/annotations_filtered/p4IUUBVAUJA_filtered.json b/annotations_filtered/p4IUUBVAUJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a1a62fb7c98bd365f06820665838ef40871b340 --- /dev/null +++ b/annotations_filtered/p4IUUBVAUJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 32.24], [37.0, 44.49], [48.0, 57.94], [60.0, 64.66], [67.0, 76.94]], "keep_status": [false, false, true, true, true], "silence_prob": [88.64, 99.26, 28.84, 30.65, 29.98], "audiomae_on_audioset": [null, null, [["speech", 29.97], ["rumble", 10.94], ["hum", 10.39]], [["hum", 21.23], ["throbbing", 16.42], ["music", 10.35]], [["music", 47.11], ["speech", 11.98], ["throbbing", 4.93]]], "duration": [3.24, 7.49, 9.94, 4.66, 9.94]} \ No newline at end of file diff --git a/annotations_filtered/p4JPMo4bMa4_filtered.json b/annotations_filtered/p4JPMo4bMa4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e253eea408e1f16c667b08b262bab6bd82b72a7 --- /dev/null +++ b/annotations_filtered/p4JPMo4bMa4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 17.81], [20.0, 24.0]], "keep_status": [false, true], "silence_prob": [31.43, 31.19], "audiomae_on_audioset": [[["buzz", 71.35], ["music", 14.51], ["hum", 2.71]], [["whale vocalization", 32.81], ["music", 15.69], ["moo", 6.1]]], "duration": [12.81, 4.0]} \ No newline at end of file diff --git a/annotations_filtered/p4Pq9aZVV9Y_filtered.json b/annotations_filtered/p4Pq9aZVV9Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1eb5a13c232c250578bd9489575798190b820a76 --- /dev/null +++ b/annotations_filtered/p4Pq9aZVV9Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.99], [16.0, 17.1], [19.0, 20.66], [27.0, 28.43], [31.0, 35.38], [37.0, 39.18], [42.0, 43.5], [44.0, 44.96], [47.0, 48.47], [50.0, 58.65], [59.0, 58.73], [59.0, 67.15], [69.0, 69.82], [76.0, 82.46], [85.0, 95.23], [102.0, 101.9], [105.0, 105.48], [127.0, 129.64]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.48, 49.68, 0.0, 0.0, 0.0, 45.21, 0.0, 33.15, 0.0, 32.96, 30.17, 0.0, 0.0, 63.74], "audiomae_on_audioset": [null, null, null, null, [["speech", 49.63], ["music", 21.75], ["boing", 3.19]], [["speech", 46.61], ["fireworks", 9.12], ["music", 3.79]], null, null, null, [["speech", 35.42], ["music", 24.87], ["fart", 6.25]], null, [["music", 53.48], ["throbbing", 9.33], ["hum", 6.51]], null, [["music", 60.65], ["speech", 16.76], ["skateboard", 2.5]], [["music", 52.56], ["hum", 9.94], ["throbbing", 3.75]], null, null, null], "duration": [-0.01, 1.1, 1.66, 1.43, 4.38, 2.18, 1.5, 0.96, 1.47, 8.65, -0.27, 8.15, 0.82, 6.46, 10.23, -0.1, 0.48, 2.64]} \ No newline at end of file diff --git a/annotations_filtered/p4SqclCqxuU_filtered.json b/annotations_filtered/p4SqclCqxuU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85e22e26d357aa955070ebc359a05c4a445fbdc5 --- /dev/null +++ b/annotations_filtered/p4SqclCqxuU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.87], [18.0, 18.08], [24.0, 26.27], [26.0, 29.57], [35.0, 35.4], [54.0, 55.51], [56.0, 56.44], [57.0, 60.78]], "keep_status": [true, false, true, false, false, false, false, false], "silence_prob": [42.28, 0.0, 37.92, 50.06, 0.0, 0.0, 0.0, 56.7], "audiomae_on_audioset": [[["speech", 23.79], ["burping, eructation", 18.49], ["whale vocalization", 8.52]], null, [["speech", 38.67], ["scratch", 10.67], ["quack", 3.94]], null, null, null, null, null], "duration": [3.87, 0.08, 2.27, 3.57, 0.4, 1.51, 0.44, 3.78]} \ No newline at end of file diff --git a/annotations_filtered/p4TZcBFacUg_filtered.json b/annotations_filtered/p4TZcBFacUg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51abd11f9bd5cb67211fd2b614389ebf81366b71 --- /dev/null +++ b/annotations_filtered/p4TZcBFacUg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[86.0, 116.28], [119.0, 122.84], [124.0, 124.56], [126.0, 125.9], [128.0, 142.53], [146.0, 156.44], [158.0, 165.42], [170.0, 176.3], [177.0, 182.76], [184.0, 192.65], [196.0, 197.8]], "keep_status": [false, true, false, false, true, true, true, true, true, true, false], "silence_prob": [0.0, 43.82, 0.0, 0.0, 38.19, 36.61, 38.42, 37.42, 40.14, 36.56, 0.0], "audiomae_on_audioset": [null, [["mains hum", 29.53], ["hum", 18.16], ["music", 10.43]], null, null, [["buzz", 32.62], ["music", 11.27], ["electric shaver, electric razor", 6.78]], [["noise", 16.2], ["vehicle", 13.45], ["cacophony", 11.02]], [["mains hum", 11.21], ["vehicle", 10.33], ["speech", 8.58]], [["vehicle", 30.27], ["buzz", 16.08], ["motorcycle", 9.24]], [["speech", 60.38], ["explosion", 3.99], ["buzz", 2.79]], [["hum", 35.37], ["mains hum", 19.31], ["vehicle", 8.16]], null], "duration": [30.28, 3.84, 0.56, -0.1, 14.53, 10.44, 7.42, 6.3, 5.76, 8.65, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/p4yCboEAjLk_filtered.json b/annotations_filtered/p4yCboEAjLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0ca168d98bcebe7d1e9a4ad3f290d281798b7f4 --- /dev/null +++ b/annotations_filtered/p4yCboEAjLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 46.23], [48.0, 51.9], [53.0, 53.7], [55.0, 56.34], [58.0, 57.77], [59.0, 70.5], [71.0, 72.15], [75.0, 76.47], [77.0, 77.57], [83.0, 86.75], [89.0, 91.5], [103.0, 108.94], [130.0, 134.47], [137.0, 154.06]], "keep_status": [true, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [39.46, 37.25, 0.0, 0.0, 0.0, 41.95, 0.0, 0.0, 0.0, 42.04, 41.52, 35.41, 56.93, 35.03], "audiomae_on_audioset": [[["speech", 27.31], ["thunk", 14.38], ["music", 14.29]], [["music", 22.45], ["hum", 14.61], ["electric shaver, electric razor", 10.77]], null, null, null, [["throbbing", 31.57], ["hum", 21.15], ["music", 17.66]], null, null, null, [["music", 49.65], ["throbbing", 6.3], ["speech", 5.36]], [["music", 57.79], ["synthesizer", 9.43], ["sampler", 4.37]], [["music", 73.45], ["throbbing", 3.45], ["musical instrument", 2.07]], null, [["throbbing", 32.32], ["music", 25.49], ["hum", 24.99]]], "duration": [20.23, 3.9, 0.7, 1.34, -0.23, 11.5, 1.15, 1.47, 0.57, 3.75, 2.5, 5.94, 4.47, 17.06]} \ No newline at end of file diff --git a/annotations_filtered/p4ylvDhfiQw_filtered.json b/annotations_filtered/p4ylvDhfiQw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45035655a5c69681b7c604a3c8ca9baf3ea96e28 --- /dev/null +++ b/annotations_filtered/p4ylvDhfiQw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.93], [23.0, 23.14], [26.0, 27.11], [28.0, 34.53], [35.0, 35.45], [37.0, 43.63], [45.0, 45.3], [48.0, 54.18], [69.0, 86.02], [86.0, 87.25], [98.0, 107.4], [110.0, 114.05], [115.0, 115.77], [122.0, 122.3], [128.0, 129.49], [132.0, 133.83], [142.0, 147.36], [150.0, 153.81], [156.0, 164.91], [170.0, 172.34], [176.0, 175.96]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 28.72, 0.0, 28.32, 0.0, 28.21, 28.41, 0.0, 28.57, 28.59, 0.0, 0.0, 0.0, 0.0, 28.62, 28.7, 28.45, 28.71, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 43.92], ["speech", 26.49], ["throbbing", 8.54]], null, [["throbbing", 30.41], ["music", 22.07], ["hum", 10.49]], null, [["whale vocalization", 19.28], ["animal", 15.63], ["music", 6.28]], [["music", 80.89], ["skateboard", 1.63], ["livestock, farm animals, working animals", 1.28]], null, [["music", 57.99], ["speech", 13.42], ["cacophony", 3.1]], [["music", 73.86], ["speech", 6.95], ["didgeridoo", 3.75]], null, null, null, null, [["music", 44.53], ["speech", 27.21], ["throbbing", 3.51]], [["music", 33.02], ["motorcycle", 10.88], ["livestock, farm animals, working animals", 10.07]], [["music", 55.17], ["vehicle", 8.08], ["speech", 7.71]], [["music", 24.01], ["cacophony", 12.09], ["vehicle", 8.08]], null], "duration": [1.93, 0.14, 1.11, 6.53, 0.45, 6.63, 0.3, 6.18, 17.02, 1.25, 9.4, 4.05, 0.77, 0.3, 1.49, 1.83, 5.36, 3.81, 8.91, 2.34, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/p5BfdwK92UI_filtered.json b/annotations_filtered/p5BfdwK92UI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71773c08102e49e591ec4fbf701f6dd201ffa657 --- /dev/null +++ b/annotations_filtered/p5BfdwK92UI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.91], [19.0, 19.57], [21.0, 21.0], [23.0, 22.79], [28.0, 29.07], [32.0, 33.54], [34.0, 35.85], [37.0, 37.89], [39.0, 49.82], [52.0, 52.91], [64.0, 71.09], [73.0, 75.29], [81.0, 82.26], [83.0, 83.35], [84.0, 84.6], [86.0, 88.75], [94.0, 97.34], [100.0, 103.99], [109.0, 115.94], [116.0, 128.71], [134.0, 134.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [82.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.71, 0.0, 42.28, 65.32, 0.0, 0.0, 0.0, 56.48, 34.22, 30.19, 29.6, 31.32, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 54.41], ["speech", 34.92], ["electronic music", 0.53]], null, [["cattle, bovinae", 23.91], ["animal", 17.97], ["moo", 14.15]], null, null, null, null, null, [["music", 51.95], ["throbbing", 5.75], ["sidetone", 3.06]], [["music", 78.05], ["boing", 2.56], ["musical instrument", 2.22]], [["music", 58.78], ["speech", 6.55], ["boing", 6.4]], [["speech", 55.12], ["music", 25.59], ["hum", 1.95]], null], "duration": [2.91, 0.57, 0.0, -0.21, 1.07, 1.54, 1.85, 0.89, 10.82, 0.91, 7.09, 2.29, 1.26, 0.35, 0.6, 2.75, 3.34, 3.99, 6.94, 12.71, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/p5lEvn7ejJI_filtered.json b/annotations_filtered/p5lEvn7ejJI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b480d223322604e62121cbdfdf7cefd39b38d7d --- /dev/null +++ b/annotations_filtered/p5lEvn7ejJI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 40.91], [42.0, 43.39], [45.0, 44.86], [47.0, 50.33], [58.0, 57.7], [60.0, 67.51], [69.0, 69.85], [74.0, 80.57], [81.0, 81.58], [82.0, 82.73], [92.0, 97.75], [100.0, 105.24], [107.0, 110.27], [112.0, 112.58], [114.0, 115.52], [123.0, 128.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.89, 0.0, 0.0, 99.91, 0.0, 53.34, 0.0, 77.53, 0.0, 0.0, 63.1, 55.18, 51.28, 0.0, 0.0, 99.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [24.91, 1.39, -0.14, 3.33, -0.3, 7.51, 0.85, 6.57, 0.58, 0.73, 5.75, 5.24, 3.27, 0.58, 1.52, 5.51]} \ No newline at end of file diff --git a/annotations_filtered/p6HbXVaNFfc_filtered.json b/annotations_filtered/p6HbXVaNFfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59288c0ded8dd75e61db2b30e42d26cb50e664c7 --- /dev/null +++ b/annotations_filtered/p6HbXVaNFfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.91], [4.0, 4.45], [8.0, 15.3], [16.0, 20.83], [26.0, 48.56], [58.0, 64.99], [65.0, 65.45], [66.0, 65.89], [67.0, 68.39], [69.0, 72.54], [73.0, 96.18], [97.0, 99.18], [101.0, 101.24], [107.0, 115.52], [116.0, 153.55], [157.0, 166.01], [166.0, 190.59], [194.0, 213.49], [216.0, 216.36], [217.0, 217.65], [219.0, 219.01]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 56.1, 34.72, 33.85, 0.0, 0.0, 0.0, 34.42, 34.64, 38.2, 0.0, 35.59, 0.0, 34.69, 35.28, 36.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 82.92], ["funk", 2.55], ["house music", 2.25]], [["music", 76.0], ["funk", 2.89], ["disco", 1.33]], null, null, null, [["music", 60.92], ["synthesizer", 2.13], ["sampler", 2.02]], [["music", 80.49], ["house music", 1.51], ["singing", 1.31]], [["music", 74.26], ["musical instrument", 5.06], ["synthesizer", 2.9]], null, [["music", 81.22], ["funk", 2.83], ["disco", 1.31]], null, [["music", 80.37], ["singing", 1.33], ["middle eastern music", 1.13]], [["music", 78.31], ["house music", 1.59], ["disco", 1.53]], [["music", 62.88], ["clarinet", 2.66], ["musical instrument", 2.42]], null, null, null], "duration": [0.91, 0.45, 7.3, 4.83, 22.56, 6.99, 0.45, -0.11, 1.39, 3.54, 23.18, 2.18, 0.24, 8.52, 37.55, 9.01, 24.59, 19.49, 0.36, 0.65, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/p6IvB-2jYtY_filtered.json b/annotations_filtered/p6IvB-2jYtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c97401118d8f65f57bb758c5f29d623fbeb6b0e --- /dev/null +++ b/annotations_filtered/p6IvB-2jYtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.37], [7.0, 7.59], [11.0, 12.07], [14.0, 16.23], [21.0, 22.23], [23.0, 23.13], [26.0, 28.12], [31.0, 33.24], [35.0, 35.65], [37.0, 42.36], [43.0, 44.59], [46.0, 51.12], [52.0, 57.67], [59.0, 59.44], [61.0, 61.82], [65.0, 67.96], [70.0, 71.39], [74.0, 75.29], [76.0, 77.85], [81.0, 82.95], [87.0, 88.03], [95.0, 96.42], [97.0, 98.41], [100.0, 100.77], [103.0, 107.79], [109.0, 110.73], [112.0, 113.31], [114.0, 114.98], [116.0, 118.91], [120.0, 120.72], [123.0, 123.31], [130.0, 129.71]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 36.09, 85.35, 0.0, 36.2, 0.0, 34.47, 38.6, 0.0, 0.0, 38.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.83, 0.0, 0.0, 0.0, 67.13, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["chant", 12.84], ["mantra", 10.6], ["synthetic singing", 9.61]], null, null, [["theremin", 54.16], ["music", 27.61], ["musical instrument", 2.9]], null, [["theremin", 60.24], ["music", 27.31], ["musical instrument", 2.16]], [["theremin", 90.01], ["music", 3.32], ["wind instrument, woodwind instrument", 1.32]], null, null, [["theremin", 56.1], ["music", 34.57], ["musical instrument", 1.82]], null, null, null, null, null, null, null, null, [["music", 41.91], ["theremin", 29.55], ["synthesizer", 2.44]], null, null, null, null, null, null, null], "duration": [1.37, 0.59, 1.07, 2.23, 1.23, 0.13, 2.12, 2.24, 0.65, 5.36, 1.59, 5.12, 5.67, 0.44, 0.82, 2.96, 1.39, 1.29, 1.85, 1.95, 1.03, 1.42, 1.41, 0.77, 4.79, 1.73, 1.31, 0.98, 2.91, 0.72, 0.31, -0.29]} \ No newline at end of file diff --git a/annotations_filtered/p6LXVK9rPbw_filtered.json b/annotations_filtered/p6LXVK9rPbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ce33cef85f69e5dd0f6dd7524acdb27736d316a --- /dev/null +++ b/annotations_filtered/p6LXVK9rPbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 23.36], [25.0, 28.76], [30.0, 38.08], [39.0, 40.95], [41.0, 44.54], [46.0, 51.61], [53.0, 56.54], [58.0, 61.45], [63.0, 69.79]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [97.33, 97.33, 99.62, 0.0, 93.6, 93.29, 97.11, 99.05, 99.21], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [7.36, 3.76, 8.08, 1.95, 3.54, 5.61, 3.54, 3.45, 6.79]} \ No newline at end of file diff --git a/annotations_filtered/p6oIR31ZgyA_filtered.json b/annotations_filtered/p6oIR31ZgyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0eb5eef54a8a6206c83d983193ed24d3e3c545d0 --- /dev/null +++ b/annotations_filtered/p6oIR31ZgyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 38.08], [39.0, 41.93], [43.0, 45.1], [47.0, 49.08], [51.0, 55.49], [60.0, 65.2], [69.0, 68.84], [72.0, 72.35], [77.0, 80.4], [81.0, 93.21], [95.0, 95.99], [97.0, 98.54], [101.0, 136.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 73.82, 88.1, 89.72, 79.59, 98.86, 0.0, 0.0, 93.13, 58.55, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [34.08, 2.93, 2.1, 2.08, 4.49, 5.2, -0.16, 0.35, 3.4, 12.21, 0.99, 1.54, 35.39]} \ No newline at end of file diff --git a/annotations_filtered/p70o9g5gcdY_filtered.json b/annotations_filtered/p70o9g5gcdY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3377d3aeac1e352fc52675a288f1cfcbd1860ce2 --- /dev/null +++ b/annotations_filtered/p70o9g5gcdY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.61], [12.0, 13.12], [13.0, 13.2], [14.0, 17.04], [17.0, 17.42], [45.0, 45.3], [51.0, 51.7], [53.0, 60.27], [65.0, 78.92], [83.0, 83.39], [85.0, 91.77], [100.0, 100.09], [100.0, 103.2], [105.0, 114.37], [115.0, 122.39]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.3, 0.0, 0.0, 0.0, 31.96, 30.58, 0.0, 31.39, 0.0, 31.45, 30.7, 30.96], "audiomae_on_audioset": [null, null, null, [["music", 86.12], ["musical instrument", 4.0], ["synthesizer", 2.06]], null, null, null, [["music", 73.91], ["boing", 2.98], ["speech", 2.79]], [["music", 64.99], ["sampler", 2.74], ["male singing", 2.18]], null, [["music", 73.16], ["electronic music", 3.04], ["throbbing", 2.67]], null, [["music", 63.07], ["drum machine", 4.14], ["house music", 3.36]], [["music", 84.27], ["funk", 2.69], ["disco", 1.72]], [["music", 66.56], ["funk", 13.79], ["disco", 4.0]]], "duration": [0.61, 1.12, 0.2, 3.04, 0.42, 0.3, 0.7, 7.27, 13.92, 0.39, 6.77, 0.09, 3.2, 9.37, 7.39]} \ No newline at end of file diff --git a/annotations_filtered/p7bpv3zs8Dk_filtered.json b/annotations_filtered/p7bpv3zs8Dk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e9569a355ea5bbcfb71d15bbb64964621786d1f --- /dev/null +++ b/annotations_filtered/p7bpv3zs8Dk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.04], [6.0, 6.22], [10.0, 15.18], [38.0, 53.59], [58.0, 58.45], [59.0, 62.28], [63.0, 62.72], [64.0, 70.38], [72.0, 72.4], [84.0, 84.42], [86.0, 86.39], [92.0, 104.01], [106.0, 110.44], [111.0, 111.5], [112.0, 112.95], [115.0, 115.91], [116.0, 116.48], [117.0, 117.0], [119.0, 119.92], [121.0, 121.36], [123.0, 123.26], [126.0, 127.26], [128.0, 131.23], [135.0, 135.04], [137.0, 137.49], [139.0, 140.05], [141.0, 141.76], [142.0, 143.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.56, 0.0, 51.28, 45.14, 0.0, 62.27, 0.0, 97.11, 0.0, 0.0, 0.0, 65.2, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 41.99], ["moo", 29.47], ["livestock, farm animals, working animals", 15.05]], null, null, [["speech", 64.7], ["groan", 8.08], ["animal", 3.11]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.04, 0.22, 5.18, 15.59, 0.45, 3.28, -0.28, 6.38, 0.4, 0.42, 0.39, 12.01, 4.44, 0.5, 0.95, 0.91, 0.48, 0.0, 0.92, 0.36, 0.26, 1.26, 3.23, 0.04, 0.49, 1.05, 0.76, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/p7cYf7GaXgY_filtered.json b/annotations_filtered/p7cYf7GaXgY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7771a5b574c37e2ea5f29c3be6d2f15f174b1974 --- /dev/null +++ b/annotations_filtered/p7cYf7GaXgY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.31], [16.0, 17.49], [19.0, 27.09], [31.0, 43.77], [45.0, 47.63], [49.0, 55.73], [56.0, 61.94], [62.0, 75.79], [76.0, 77.33], [77.0, 83.42]], "keep_status": [false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 36.71, 64.75, 59.96, 40.73, 38.67, 36.85, 0.0, 37.04], "audiomae_on_audioset": [null, null, [["bouncing", 26.57], ["door", 13.9], ["speech", 8.9]], null, null, [["music", 35.73], ["hum", 9.15], ["theremin", 8.84]], [["music", 57.25], ["theremin", 15.5], ["singing bowl", 6.72]], [["music", 59.06], ["didgeridoo", 6.86], ["theremin", 6.68]], null, [["hum", 29.19], ["speech", 22.77], ["mains hum", 22.25]]], "duration": [0.31, 1.49, 8.09, 12.77, 2.63, 6.73, 5.94, 13.79, 1.33, 6.42]} \ No newline at end of file diff --git a/annotations_filtered/p7rtU_AM1bE_filtered.json b/annotations_filtered/p7rtU_AM1bE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a21c7a4d2cce6c9aef94e4e0c668c841859309e --- /dev/null +++ b/annotations_filtered/p7rtU_AM1bE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 94.98]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [31.98]} \ No newline at end of file diff --git a/annotations_filtered/p7zF3vZL-4s_filtered.json b/annotations_filtered/p7zF3vZL-4s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54a3658df064e4945ef300a829a2d9528a3f0d99 --- /dev/null +++ b/annotations_filtered/p7zF3vZL-4s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 75.78], [77.0, 87.05]], "keep_status": [false, true], "silence_prob": [39.37, 37.85], "audiomae_on_audioset": [[["fly, housefly", 35.57], ["insect", 21.03], ["bee, wasp, etc.", 15.75]], [["fly, housefly", 27.73], ["insect", 14.96], ["speech", 14.9]]], "duration": [29.78, 10.05]} \ No newline at end of file diff --git a/annotations_filtered/p84uEGZqFlk_filtered.json b/annotations_filtered/p84uEGZqFlk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab13d1bbdfd44f34270598a855bbc001df8feaa3 --- /dev/null +++ b/annotations_filtered/p84uEGZqFlk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.39], [11.0, 11.26], [12.0, 34.06], [41.0, 41.72], [42.0, 45.0], [50.0, 57.74], [61.0, 61.32], [62.0, 82.61], [87.0, 112.8], [118.0, 123.79], [124.0, 130.5], [135.0, 137.79], [138.0, 151.07], [158.0, 158.14]], "keep_status": [false, false, false, false, false, false, false, true, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 34.4, 0.0, 46.12, 32.56, 0.0, 34.79, 36.18, 38.35, 37.56, 36.11, 31.92, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.8], ["speech", 23.74], ["timpani", 1.46]], null, [["music", 40.93], ["speech", 33.45], ["gong", 5.64]], [["music", 53.91], ["throbbing", 9.88], ["speech", 8.74]], null, [["music", 43.77], ["speech", 9.3], ["musical instrument", 4.71]], [["music", 48.41], ["speech", 15.45], ["outside, rural or natural", 2.82]], [["music", 29.1], ["didgeridoo", 19.0], ["speech", 7.36]], [["music", 65.84], ["foghorn", 11.88], ["brass instrument", 3.59]], [["music", 33.71], ["cattle, bovinae", 13.72], ["moo", 13.11]], [["music", 33.28], ["speech", 24.45], ["outside, rural or natural", 2.68]], null], "duration": [0.39, 0.26, 22.06, 0.72, 3.0, 7.74, 0.32, 20.61, 25.8, 5.79, 6.5, 2.79, 13.07, 0.14]} \ No newline at end of file diff --git a/annotations_filtered/p890hIa1w9k_filtered.json b/annotations_filtered/p890hIa1w9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..414ccbb58489b72efb018623611b8fd0afc3cab2 --- /dev/null +++ b/annotations_filtered/p890hIa1w9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.93], [5.0, 5.51], [7.0, 9.44], [10.0, 11.18], [12.0, 13.42], [14.0, 16.28], [22.0, 22.06], [26.0, 26.05], [29.0, 29.34], [34.0, 34.32], [35.0, 36.73], [39.0, 40.2], [46.0, 46.58], [48.0, 48.96], [52.0, 52.07], [56.0, 56.42], [61.0, 61.48], [64.0, 67.2], [70.0, 73.4], [75.0, 77.5], [78.0, 79.32], [81.0, 85.65], [86.0, 88.08], [89.0, 91.3], [94.0, 98.17], [100.0, 101.22], [103.0, 104.95], [107.0, 110.27], [111.0, 111.0], [120.0, 123.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 74.6, 0.0, 0.0, 57.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.18, 94.52, 42.84, 0.0, 99.68, 86.45, 74.76, 51.82, 0.0, 0.0, 38.9, 0.0, 36.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.89], ["music", 20.75], ["synthesizer", 3.03]], null, [["speech", 49.79], ["sidetone", 33.9], ["whale vocalization", 2.69]], null, null, null, null, null, null, null, [["hum", 16.53], ["throbbing", 10.87], ["mains hum", 9.73]], null, [["fly, housefly", 56.37], ["insect", 18.02], ["bee, wasp, etc.", 12.56]]], "duration": [0.93, 0.51, 2.44, 1.18, 1.42, 2.28, 0.06, 0.05, 0.34, 0.32, 1.73, 1.2, 0.58, 0.96, 0.07, 0.42, 0.48, 3.2, 3.4, 2.5, 1.32, 4.65, 2.08, 2.3, 4.17, 1.22, 1.95, 3.27, 0.0, 3.52]} \ No newline at end of file diff --git a/annotations_filtered/p8CPTHEAfJc_filtered.json b/annotations_filtered/p8CPTHEAfJc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32ce5ad4ffd67ea6e5512faadc5f83174fb4cb69 --- /dev/null +++ b/annotations_filtered/p8CPTHEAfJc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.09], [0.0, 0.16], [3.0, 2.98], [8.0, 11.82], [13.0, 14.05], [43.0, 44.37], [52.0, 52.35], [54.0, 54.5], [56.0, 56.08], [57.0, 58.14], [65.0, 65.67], [66.0, 67.22], [68.0, 69.57], [72.0, 74.46], [75.0, 76.28], [84.0, 84.35], [85.0, 85.41], [89.0, 90.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.97, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 79.19], ["radio", 8.52], ["electric shaver, electric razor", 2.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.09, 0.16, -0.02, 3.82, 1.05, 1.37, 0.35, 0.5, 0.08, 1.14, 0.67, 1.22, 1.57, 2.46, 1.28, 0.35, 0.41, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/p8J-YmVs1j0_filtered.json b/annotations_filtered/p8J-YmVs1j0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9110512de4436a707647e4e85dc33cdb09bf887 --- /dev/null +++ b/annotations_filtered/p8J-YmVs1j0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.87], [24.0, 24.63], [26.0, 29.03], [36.0, 36.02], [37.0, 38.53], [40.0, 40.71], [42.0, 43.5], [47.0, 49.67], [54.0, 57.47], [64.0, 66.02], [69.0, 71.52], [72.0, 73.9], [74.0, 78.95], [80.0, 85.23], [87.0, 89.19], [91.0, 103.27], [109.0, 110.42], [112.0, 123.35], [125.0, 125.0], [126.0, 127.48], [128.0, 130.01], [132.0, 137.89], [143.0, 143.09], [144.0, 145.99], [149.0, 153.67], [161.0, 164.52], [165.0, 164.61], [170.0, 173.8]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, true, true, false, false], "silence_prob": [38.86, 0.0, 83.34, 0.0, 0.0, 0.0, 0.0, 95.51, 73.82, 91.3, 88.64, 0.0, 64.97, 75.07, 83.7, 30.49, 0.0, 31.04, 0.0, 0.0, 33.18, 41.56, 0.0, 0.0, 40.09, 32.6, 0.0, 33.6], "audiomae_on_audioset": [[["noise", 15.51], ["music", 12.41], ["zipper (clothing)", 8.23]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 66.49], ["groan", 5.36], ["grunt", 4.05]], null, [["music", 27.62], ["whack, thwack", 12.71], ["animal", 5.57]], null, null, [["music", 25.78], ["speech", 10.38], ["didgeridoo", 9.32]], [["heart sounds, heartbeat", 26.58], ["throbbing", 7.71], ["dog", 7.53]], null, null, [["music", 24.25], ["hum", 12.52], ["fart", 9.19]], [["music", 21.29], ["cattle, bovinae", 8.88], ["moo", 7.46]], null, [["livestock, farm animals, working animals", 50.01], ["cattle, bovinae", 19.11], ["moo", 16.53]]], "duration": [4.87, 0.63, 3.03, 0.02, 1.53, 0.71, 1.5, 2.67, 3.47, 2.02, 2.52, 1.9, 4.95, 5.23, 2.19, 12.27, 1.42, 11.35, 0.0, 1.48, 2.01, 5.89, 0.09, 1.99, 4.67, 3.52, -0.39, 3.8]} \ No newline at end of file diff --git a/annotations_filtered/p8L6CtsqDE4_filtered.json b/annotations_filtered/p8L6CtsqDE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2494125cd4bbd39619bc09842dc128099e4aae16 --- /dev/null +++ b/annotations_filtered/p8L6CtsqDE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [5.0, 5.86], [11.0, 11.4], [21.0, 23.33], [28.0, 28.43], [32.0, 32.31], [33.0, 33.72], [36.0, 38.23], [40.0, 41.66], [42.0, 43.38], [45.0, 51.0], [51.0, 51.46], [53.0, 55.05], [57.0, 57.43], [59.0, 59.88], [64.0, 64.81], [73.0, 73.74], [79.0, 80.52], [81.0, 81.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 71.14, 0.0, 0.0, 36.52, 0.0, 42.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["insect", 26.04], ["hammer", 12.18], ["cricket", 6.99]], null, [["speech", 32.04], ["wood", 16.53], ["glass", 4.75]], null, null, null, null, null, null], "duration": [0.47, 0.86, 0.4, 2.33, 0.43, 0.31, 0.72, 2.23, 1.66, 1.38, 6.0, 0.46, 2.05, 0.43, 0.88, 0.81, 0.74, 1.52, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/p8fPj1-nKw0_filtered.json b/annotations_filtered/p8fPj1-nKw0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9067283c5e600db22048a05b58eb18ae78353a1f --- /dev/null +++ b/annotations_filtered/p8fPj1-nKw0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.96], [7.0, 14.99]], "keep_status": [true, true], "silence_prob": [44.34, 36.2], "audiomae_on_audioset": [[["music", 32.25], ["theremin", 8.44], ["car", 5.57]], [["speech", 28.36], ["hum", 15.08], ["mains hum", 13.55]]], "duration": [2.96, 7.99]} \ No newline at end of file diff --git a/annotations_filtered/p8t_xV4Lf0A_filtered.json b/annotations_filtered/p8t_xV4Lf0A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed543afd1b8bb90763db9baf1c03b7698b977601 --- /dev/null +++ b/annotations_filtered/p8t_xV4Lf0A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.61], [21.0, 21.74], [32.0, 32.17], [34.0, 36.53], [40.0, 40.34], [45.0, 45.89], [47.0, 47.31], [51.0, 51.54], [57.0, 59.43], [62.0, 61.82], [63.0, 65.91], [67.0, 68.93], [71.0, 72.81], [77.0, 79.24], [80.0, 80.77], [82.0, 82.31], [83.0, 83.13]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.75, 0.0, 0.0, 0.0, 0.0, 54.9, 0.0, 42.02, 0.0, 0.0, 39.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 32.85], ["synthesizer", 8.25], ["speech", 5.92]], null, null, null, null, null, null, [["telephone dialing, dtmf", 11.03], ["music", 9.87], ["car", 8.71]], null, null, [["music", 53.19], ["rattle (instrument)", 9.51], ["speech", 3.5]], null, null, null], "duration": [0.61, 0.74, 0.17, 2.53, 0.34, 0.89, 0.31, 0.54, 2.43, -0.18, 2.91, 1.93, 1.81, 2.24, 0.77, 0.31, 0.13]} \ No newline at end of file diff --git a/annotations_filtered/p8wvEC_cBU4_filtered.json b/annotations_filtered/p8wvEC_cBU4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26c4e263c90f4464f2db5b035cacac72e7c784da --- /dev/null +++ b/annotations_filtered/p8wvEC_cBU4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.34], [9.0, 9.53], [14.0, 16.36], [21.0, 21.91], [31.0, 31.43], [38.0, 38.77], [44.0, 44.49], [45.0, 45.91], [47.0, 47.26], [50.0, 50.97], [56.0, 59.66], [64.0, 64.18], [71.0, 71.14], [74.0, 76.79], [78.0, 79.57], [83.0, 83.59], [85.0, 87.34], [90.0, 94.41], [96.0, 101.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [51.71, 0.0, 66.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.36, 0.0, 0.0, 59.51, 0.0, 0.0, 50.56, 48.35, 42.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 62.45], ["livestock, farm animals, working animals", 7.76], ["music", 3.06]], null, null, null, null, null, null, [["speech", 27.04], ["music", 24.85], ["hum", 17.58]], [["music", 38.72], ["speech", 22.44], ["throbbing", 10.2]]], "duration": [4.34, 0.53, 2.36, 0.91, 0.43, 0.77, 0.49, 0.91, 0.26, 0.97, 3.66, 0.18, 0.14, 2.79, 1.57, 0.59, 2.34, 4.41, 5.14]} \ No newline at end of file diff --git a/annotations_filtered/p92CKGAeQUY_filtered.json b/annotations_filtered/p92CKGAeQUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a4648d899dd661d5e64d285692fdfbe443b8eec --- /dev/null +++ b/annotations_filtered/p92CKGAeQUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.89], [8.0, 9.58], [12.0, 17.07], [20.0, 21.29], [22.0, 23.6], [24.0, 42.77], [47.0, 47.38], [49.0, 50.26], [51.0, 52.27], [54.0, 54.48], [63.0, 62.72], [65.0, 65.79], [72.0, 72.81], [77.0, 78.16], [81.0, 81.5], [83.0, 84.32], [86.0, 86.86], [92.0, 96.3], [96.0, 98.42], [99.0, 99.89], [101.0, 101.56], [103.0, 104.52], [105.0, 105.17], [108.0, 109.0], [112.0, 112.13], [112.0, 113.41], [114.0, 114.66], [117.0, 117.58], [119.0, 119.18], [123.0, 123.47], [129.0, 134.65], [137.0, 137.52], [139.0, 140.44], [143.0, 143.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 83.34, 0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.61, 37.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 23.46], ["didgeridoo", 7.83], ["speech", 7.26]], [["speech", 18.52], ["music", 12.82], ["fly, housefly", 9.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 1.58, 5.07, 1.29, 1.6, 18.77, 0.38, 1.26, 1.27, 0.48, -0.28, 0.79, 0.81, 1.16, 0.5, 1.32, 0.86, 4.3, 2.42, 0.89, 0.56, 1.52, 0.17, 1.0, 0.13, 1.41, 0.66, 0.58, 0.18, 0.47, 5.65, 0.52, 1.44, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/p9Bo67_slJY_filtered.json b/annotations_filtered/p9Bo67_slJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c74cdb62cbdcb564874c746b2f8d708d0a07bce0 --- /dev/null +++ b/annotations_filtered/p9Bo67_slJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.11], [5.0, 6.56], [8.0, 10.49], [12.0, 12.77], [18.0, 18.06], [23.0, 25.88], [29.0, 29.78], [31.0, 38.94], [39.0, 39.68], [40.0, 40.58], [43.0, 43.33], [46.0, 56.05], [57.0, 58.11], [60.0, 61.21], [63.0, 64.12], [69.0, 69.3], [71.0, 71.68], [72.0, 73.47], [76.0, 76.37], [78.0, 79.62], [85.0, 86.48], [88.0, 88.2], [89.0, 92.64], [94.0, 96.23], [97.0, 98.09], [99.0, 106.0], [107.0, 108.58], [109.0, 111.01], [112.0, 117.41], [119.0, 123.92], [126.0, 126.62]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, true, true, false], "silence_prob": [44.99, 0.0, 44.2, 0.0, 0.0, 44.43, 0.0, 34.93, 0.0, 0.0, 0.0, 32.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.18, 38.8, 0.0, 34.82, 0.0, 38.79, 41.28, 36.69, 0.0], "audiomae_on_audioset": [[["speech", 38.1], ["music", 16.66], ["synthesizer", 3.9]], null, [["music", 26.85], ["throbbing", 8.03], ["fly, housefly", 6.64]], null, null, [["music", 43.36], ["throbbing", 16.65], ["hum", 13.07]], null, [["hum", 38.84], ["music", 21.38], ["mains hum", 16.53]], null, null, null, [["hum", 47.53], ["music", 20.21], ["mains hum", 19.13]], null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 27.19], ["speech", 8.76], ["hum", 7.52]], [["sidetone", 26.74], ["speech", 26.38], ["hum", 7.14]], null, [["hum", 55.43], ["mains hum", 16.67], ["music", 7.49]], null, [["hum", 36.98], ["mains hum", 9.43], ["throbbing", 7.14]], [["hum", 29.42], ["mains hum", 29.39], ["throbbing", 6.66]], [["rumble", 16.29], ["music", 13.75], ["hum", 8.32]], null], "duration": [2.11, 1.56, 2.49, 0.77, 0.06, 2.88, 0.78, 7.94, 0.68, 0.58, 0.33, 10.05, 1.11, 1.21, 1.12, 0.3, 0.68, 1.47, 0.37, 1.62, 1.48, 0.2, 3.64, 2.23, 1.09, 7.0, 1.58, 2.01, 5.41, 4.92, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/p9W9PhaNGOY_filtered.json b/annotations_filtered/p9W9PhaNGOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0361e228b76b8585c7ee6effc90647de671e33e6 --- /dev/null +++ b/annotations_filtered/p9W9PhaNGOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 38.45], [39.0, 56.56], [62.0, 85.8], [86.0, 92.18], [93.0, 95.35]], "keep_status": [false, true, true, false, false], "silence_prob": [0.0, 29.58, 29.77, 34.13, 41.76], "audiomae_on_audioset": [null, [["music", 48.96], ["sidetone", 7.96], ["synthesizer", 5.89]], [["music", 27.01], ["livestock, farm animals, working animals", 8.2], ["speech", 7.31]], [["didgeridoo", 39.07], ["music", 24.53], ["speech", 15.12]], [["music", 64.56], ["didgeridoo", 7.74], ["musical instrument", 4.81]]], "duration": [1.45, 17.56, 23.8, 6.18, 2.35]} \ No newline at end of file diff --git a/annotations_filtered/p9XIPtizl3s_filtered.json b/annotations_filtered/p9XIPtizl3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08d2eca572dbda61923191b3ae94b623532daff9 --- /dev/null +++ b/annotations_filtered/p9XIPtizl3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.4], [15.0, 40.12], [40.0, 40.15], [40.0, 40.19], [40.0, 40.22], [40.0, 40.26], [41.0, 40.63], [41.0, 40.66], [41.0, 40.69], [41.0, 40.76], [41.0, 52.74], [60.0, 67.39], [68.0, 68.76], [69.0, 85.89], [86.0, 86.48], [87.0, 88.13], [93.0, 93.45], [94.0, 107.94], [108.0, 144.29], [145.0, 145.66]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, true, false, false], "silence_prob": [29.45, 29.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.86, 29.54, 0.0, 28.93, 0.0, 0.0, 0.0, 33.88, 0.0, 0.0], "audiomae_on_audioset": [[["clang", 42.27], ["ding", 16.65], ["music", 7.37]], [["whack, thwack", 66.13], ["music", 10.49], ["fly, housefly", 2.05]], null, null, null, null, null, null, null, null, [["clang", 22.89], ["music", 16.53], ["speech", 8.81]], [["whack, thwack", 24.42], ["clang", 23.73], ["ding", 10.2]], null, [["music", 30.68], ["whack, thwack", 18.87], ["boing", 9.19]], null, null, null, [["hum", 21.62], ["music", 15.92], ["throbbing", 13.07]], null, null], "duration": [7.4, 25.12, 0.15, 0.19, 0.22, 0.26, -0.37, -0.34, -0.31, -0.24, 11.74, 7.39, 0.76, 16.89, 0.48, 1.13, 0.45, 13.94, 36.29, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/p9shpHAh8uc_filtered.json b/annotations_filtered/p9shpHAh8uc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de1f4c8e0436ce57b498109560b1269e36cfc194 --- /dev/null +++ b/annotations_filtered/p9shpHAh8uc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[101.0, 102.84], [104.0, 109.68], [115.0, 119.7], [122.0, 122.49], [124.0, 125.46], [127.0, 128.11]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 37.89, 60.14, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 30.8], ["theremin", 10.24], ["gunshot, gunfire", 5.9]], null, null, null, null], "duration": [1.84, 5.68, 4.7, 0.49, 1.46, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/pAZOyJPs5bo_filtered.json b/annotations_filtered/pAZOyJPs5bo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f88c9e868cb3acc00922e5fcbcdd1cc6d0fd2599 --- /dev/null +++ b/annotations_filtered/pAZOyJPs5bo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.16], [33.0, 33.44], [36.0, 45.71], [49.0, 50.5], [52.0, 62.14], [65.0, 69.42], [74.0, 74.43]], "keep_status": [false, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 37.69, 0.0, 29.29, 31.41, 0.0], "audiomae_on_audioset": [null, null, [["thunk", 38.67], ["music", 21.61], ["breaking", 7.29]], null, [["speech", 34.55], ["music", 23.58], ["machine gun", 10.95]], [["music", 33.33], ["hum", 18.77], ["throbbing", 7.59]], null], "duration": [0.16, 0.44, 9.71, 1.5, 10.14, 4.42, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/pAs8uvKNkcU_filtered.json b/annotations_filtered/pAs8uvKNkcU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32c9493c8e44b0bc2ae6b7081352fd6e43354515 --- /dev/null +++ b/annotations_filtered/pAs8uvKNkcU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.95], [12.0, 12.45], [13.0, 13.56], [15.0, 17.42], [18.0, 19.58], [21.0, 24.71], [28.0, 28.59], [32.0, 32.43], [33.0, 33.67], [36.0, 36.26], [38.0, 38.7], [42.0, 41.86], [43.0, 44.47], [48.0, 50.06], [50.0, 52.08], [54.0, 54.75], [58.0, 61.45], [62.0, 62.67], [63.0, 64.0], [67.0, 71.02], [71.0, 73.18], [75.0, 75.0], [76.0, 76.45], [79.0, 82.09], [83.0, 84.47], [91.0, 93.63], [94.0, 95.13], [96.0, 95.94], [98.0, 98.47], [100.0, 101.83], [102.0, 103.27], [105.0, 106.07], [107.0, 109.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [89.19, 0.0, 0.0, 100.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 54.3, 0.0, 100.0, 0.0, 0.0, 100.0, 62.47, 0.0, 0.0, 99.85, 0.0, 63.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.05], ["dial tone", 9.87], ["sidetone", 6.61]]], "duration": [3.95, 0.45, 0.56, 2.42, 1.58, 3.71, 0.59, 0.43, 0.67, 0.26, 0.7, -0.14, 1.47, 2.06, 2.08, 0.75, 3.45, 0.67, 1.0, 4.02, 2.18, 0.0, 0.45, 3.09, 1.47, 2.63, 1.13, -0.06, 0.47, 1.83, 1.27, 1.07, 2.41]} \ No newline at end of file diff --git a/annotations_filtered/pAwdeWy9yYM_filtered.json b/annotations_filtered/pAwdeWy9yYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..744fff4d3298f9a39852a8bd85338d2cf7e70d80 --- /dev/null +++ b/annotations_filtered/pAwdeWy9yYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 40.0], [44.0, 44.85], [53.0, 53.23], [56.0, 57.25], [58.0, 70.73], [84.0, 84.47], [86.0, 85.78], [89.0, 92.21], [94.0, 94.26], [94.0, 112.19], [113.0, 114.49], [116.0, 116.58], [117.0, 122.84], [126.0, 128.29], [129.0, 139.16], [141.0, 141.0], [144.0, 150.04], [156.0, 160.27], [173.0, 182.31], [187.0, 193.7]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, true, true, true], "silence_prob": [30.78, 0.0, 0.0, 0.0, 33.26, 0.0, 0.0, 36.66, 0.0, 29.74, 0.0, 0.0, 30.29, 52.16, 51.02, 0.0, 31.24, 30.99, 30.22, 31.63], "audiomae_on_audioset": [[["music", 67.47], ["throbbing", 4.9], ["synthesizer", 2.9]], null, null, null, [["hum", 26.1], ["music", 20.48], ["throbbing", 14.45]], null, null, [["music", 23.92], ["boing", 17.96], ["throbbing", 15.12]], null, [["boing", 37.93], ["music", 28.94], ["speech", 15.68]], null, null, [["livestock, farm animals, working animals", 25.37], ["music", 17.95], ["speech", 8.72]], null, null, null, [["cattle, bovinae", 28.04], ["music", 27.56], ["moo", 16.91]], [["music", 30.13], ["fart", 23.84], ["speech", 13.64]], [["throbbing", 36.52], ["music", 17.28], ["hum", 11.95]], [["speech", 27.0], ["throbbing", 24.94], ["hum", 17.46]]], "duration": [26.0, 0.85, 0.23, 1.25, 12.73, 0.47, -0.22, 3.21, 0.26, 18.19, 1.49, 0.58, 5.84, 2.29, 10.16, 0.0, 6.04, 4.27, 9.31, 6.7]} \ No newline at end of file diff --git a/annotations_filtered/pAwoA-XPzsQ_filtered.json b/annotations_filtered/pAwoA-XPzsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de7c8bdd3a03cc4bde96104c00250ba45cce0e84 --- /dev/null +++ b/annotations_filtered/pAwoA-XPzsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[102.0, 102.02], [102.0, 115.42], [117.0, 124.43], [126.0, 127.01], [132.0, 133.15]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 30.71, 31.12, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 42.41], ["speech", 30.18], ["throbbing", 7.07]], [["music", 48.36], ["throbbing", 19.44], ["hum", 7.54]], null, null], "duration": [0.02, 13.42, 7.43, 1.01, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/pB-bN-RkJLM_filtered.json b/annotations_filtered/pB-bN-RkJLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed965ff6a82e8d2f3cdd7fd1652f0f5dafd9198c --- /dev/null +++ b/annotations_filtered/pB-bN-RkJLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.54], [10.0, 34.4], [36.0, 36.17], [37.0, 40.61], [42.0, 42.85], [46.0, 48.76], [52.0, 52.89], [56.0, 58.11], [64.0, 63.91], [67.0, 67.05], [70.0, 77.43], [79.0, 80.18]], "keep_status": [false, true, false, false, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 33.2, 0.0, 29.7, 0.0, 31.92, 0.0, 39.01, 0.0, 0.0, 36.13, 0.0], "audiomae_on_audioset": [null, [["insect", 18.14], ["fly, housefly", 10.8], ["whack, thwack", 9.79]], null, [["speech", 61.8], ["livestock, farm animals, working animals", 5.22], ["cattle, bovinae", 4.07]], null, [["speech", 28.23], ["sheep", 15.19], ["whale vocalization", 13.93]], null, [["cattle, bovinae", 40.19], ["moo", 29.27], ["livestock, farm animals, working animals", 18.79]], null, null, [["whale vocalization", 9.38], ["whack, thwack", 7.71], ["fart", 6.99]], null], "duration": [0.54, 24.4, 0.17, 3.61, 0.85, 2.76, 0.89, 2.11, -0.09, 0.05, 7.43, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/pBNKarJukms_filtered.json b/annotations_filtered/pBNKarJukms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41518330a24ff11b65cc14ba82858817e8ae7c51 --- /dev/null +++ b/annotations_filtered/pBNKarJukms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.73], [37.0, 37.56], [39.0, 42.67], [44.0, 44.68]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 40.5, 0.0], "audiomae_on_audioset": [null, null, [["music", 44.07], ["throbbing", 24.29], ["hum", 5.95]], null], "duration": [0.73, 0.56, 3.67, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/pBd7XYjjvRw_filtered.json b/annotations_filtered/pBd7XYjjvRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdd077ebe54dfedc29f6718d1129f8777c77d4b9 --- /dev/null +++ b/annotations_filtered/pBd7XYjjvRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [6.0, 12.46], [16.0, 23.58], [24.0, 25.08], [27.0, 27.72], [28.0, 49.11], [50.0, 51.04], [54.0, 55.07], [57.0, 56.94], [59.0, 60.2], [61.0, 62.31], [64.0, 64.42], [65.0, 66.38], [68.0, 69.35], [75.0, 76.25], [81.0, 80.87], [83.0, 82.66], [85.0, 85.4], [91.0, 91.71], [94.0, 95.1], [97.0, 98.41], [103.0, 103.82], [105.0, 105.73], [109.0, 109.36], [112.0, 112.99], [119.0, 119.5], [122.0, 122.62], [124.0, 124.95], [126.0, 126.79], [135.0, 136.0], [137.0, 137.32], [142.0, 143.09], [148.0, 147.85], [152.0, 152.15], [156.0, 157.33], [160.0, 160.24], [162.0, 163.65], [165.0, 166.56], [168.0, 169.3], [171.0, 172.32], [173.0, 174.02]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.17, 72.9, 0.0, 0.0, 45.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["chink, clink", 20.83], ["glass", 13.96], ["tuning fork", 6.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 6.46, 7.58, 1.08, 0.72, 21.11, 1.04, 1.07, -0.06, 1.2, 1.31, 0.42, 1.38, 1.35, 1.25, -0.13, -0.34, 0.4, 0.71, 1.1, 1.41, 0.82, 0.73, 0.36, 0.99, 0.5, 0.62, 0.95, 0.79, 1.0, 0.32, 1.09, -0.15, 0.15, 1.33, 0.24, 1.65, 1.56, 1.3, 1.32, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/pBq_lpX9LTw_filtered.json b/annotations_filtered/pBq_lpX9LTw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8565b59e2c15b50a8c02ce25956c54ed8279ddbf --- /dev/null +++ b/annotations_filtered/pBq_lpX9LTw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 17.27], [20.0, 26.86], [28.0, 33.32], [35.0, 49.98], [73.0, 73.57], [77.0, 84.45], [94.0, 94.31], [95.0, 95.84], [96.0, 99.27], [99.0, 99.33], [100.0, 99.79]], "keep_status": [true, true, true, true, false, true, false, false, false, false, false], "silence_prob": [31.21, 30.72, 29.38, 30.67, 0.0, 30.09, 0.0, 0.0, 74.6, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 22.48], ["insect", 14.45], ["grunt", 9.23]], [["cacophony", 13.67], ["music", 13.25], ["noise", 11.6]], [["music", 26.27], ["livestock, farm animals, working animals", 5.49], ["sound effect", 4.89]], [["music", 11.65], ["speech", 9.29], ["thump, thud", 7.38]], null, [["music", 51.63], ["hum", 5.68], ["sound effect", 4.51]], null, null, null, null, null], "duration": [7.27, 6.86, 5.32, 14.98, 0.57, 7.45, 0.31, 0.84, 3.27, 0.33, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/pCFld9GCy_Q_filtered.json b/annotations_filtered/pCFld9GCy_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49d3cba47abcadbe8b742813bd39b18aa6ddab62 --- /dev/null +++ b/annotations_filtered/pCFld9GCy_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.93], [28.0, 28.39], [32.0, 31.62], [34.0, 58.68], [60.0, 61.03], [65.0, 75.57], [76.0, 76.76], [80.0, 80.4], [103.0, 103.72], [109.0, 109.58], [110.0, 120.99], [122.0, 122.88], [125.0, 129.22], [130.0, 133.3], [137.0, 137.71], [139.0, 142.21], [143.0, 144.56], [148.0, 149.47], [151.0, 151.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 92.97, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 77.7, 0.0, 94.95, 92.48, 0.0, 97.54, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 66.85], ["sidetone", 10.35], ["music", 3.55]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.93, 0.39, -0.38, 24.68, 1.03, 10.57, 0.76, 0.4, 0.72, 0.58, 10.99, 0.88, 4.22, 3.3, 0.71, 3.21, 1.56, 1.47, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/pCHHv7ojfiw_filtered.json b/annotations_filtered/pCHHv7ojfiw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10c275c9104e2d50067245fed2f65902407dcdfc --- /dev/null +++ b/annotations_filtered/pCHHv7ojfiw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 26.42], [28.0, 44.9], [46.0, 57.52], [59.0, 59.66], [63.0, 63.22], [68.0, 91.39], [95.0, 113.63], [117.0, 131.58]], "keep_status": [false, true, true, false, false, true, true, true], "silence_prob": [61.87, 30.19, 31.35, 0.0, 0.0, 33.17, 30.91, 29.62], "audiomae_on_audioset": [null, [["speech", 30.13], ["music", 22.43], ["vehicle", 7.52]], [["music", 40.2], ["speech", 14.07], ["foghorn", 11.61]], null, null, [["speech", 32.46], ["music", 22.05], ["foghorn", 8.42]], [["music", 28.54], ["explosion", 23.25], ["speech", 15.64]], [["explosion", 36.23], ["hum", 8.97], ["eruption", 7.84]]], "duration": [7.42, 16.9, 11.52, 0.66, 0.22, 23.39, 18.63, 14.58]} \ No newline at end of file diff --git a/annotations_filtered/pCQ0k_WvwvQ_filtered.json b/annotations_filtered/pCQ0k_WvwvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36568642e20a7c90ac5a93e0eec0be7603aa757a --- /dev/null +++ b/annotations_filtered/pCQ0k_WvwvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.11], [23.0, 25.74], [38.0, 44.29], [45.0, 55.83], [58.0, 68.15], [71.0, 89.51], [94.0, 95.98], [104.0, 110.27]], "keep_status": [false, false, false, true, true, false, false, false], "silence_prob": [0.0, 72.9, 31.29, 31.72, 32.52, 32.04, 0.0, 33.0], "audiomae_on_audioset": [null, null, [["music", 80.85], ["singing", 1.44], ["vocal music", 1.21]], [["music", 62.22], ["funny music", 3.9], ["speech", 3.56]], [["music", 57.45], ["speech", 6.03], ["boing", 4.54]], [["music", 56.95], ["a capella", 25.42], ["vocal music", 7.36]], null, [["music", 69.8], ["busy signal", 9.94], ["boing", 5.21]]], "duration": [0.11, 2.74, 6.29, 10.83, 10.15, 18.51, 1.98, 6.27]} \ No newline at end of file diff --git a/annotations_filtered/pCQuhXDlfL8_filtered.json b/annotations_filtered/pCQuhXDlfL8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a02701bde8a5d6cabb5530944e8b403e13887b0e --- /dev/null +++ b/annotations_filtered/pCQuhXDlfL8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.83], [3.0, 4.43], [6.0, 12.11], [12.0, 14.03], [16.0, 17.42], [18.0, 18.98], [20.0, 21.0], [21.0, 21.32], [22.0, 29.86], [31.0, 32.46], [33.0, 34.64], [35.0, 57.4], [63.0, 64.72], [65.0, 66.72], [67.0, 67.93], [68.0, 70.12], [71.0, 71.19], [72.0, 72.01], [73.0, 73.43], [74.0, 74.31], [75.0, 75.54], [76.0, 76.64], [77.0, 77.73], [78.0, 78.14], [80.0, 80.11], [81.0, 81.13], [82.0, 82.41], [83.0, 83.89], [85.0, 84.79], [85.0, 85.94], [87.0, 87.89], [88.0, 89.16], [90.0, 90.95], [91.0, 92.1], [92.0, 93.02], [93.0, 94.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0, 32.56, 0.0, 0.0, 0.0, 43.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.6], ["eruption", 14.51], ["animal", 7.08]], null, null, null, [["speech", 25.73], ["animal", 10.64], ["oink", 5.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 1.43, 6.11, 2.03, 1.42, 0.98, 1.0, 0.32, 7.86, 1.46, 1.64, 22.4, 1.72, 1.72, 0.93, 2.12, 0.19, 0.01, 0.43, 0.31, 0.54, 0.64, 0.73, 0.14, 0.11, 0.13, 0.41, 0.89, -0.21, 0.94, 0.89, 1.16, 0.95, 1.1, 1.02, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/pCiwEO_6xS0_filtered.json b/annotations_filtered/pCiwEO_6xS0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc6584c687bba305d43476a23982b22029145e62 --- /dev/null +++ b/annotations_filtered/pCiwEO_6xS0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 34.23], [36.0, 40.51], [41.0, 41.88], [43.0, 47.61], [49.0, 49.42], [51.0, 52.62], [54.0, 54.24], [56.0, 56.93], [60.0, 64.34], [66.0, 68.28], [70.0, 84.13], [85.0, 86.07], [87.0, 93.88], [94.0, 94.32], [99.0, 99.28], [100.0, 100.9], [110.0, 111.11], [112.0, 113.75], [115.0, 117.12], [118.0, 119.08], [122.0, 122.61], [125.0, 125.15]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.82, 50.71, 0.0, 46.97, 0.0, 0.0, 0.0, 0.0, 49.09, 63.74, 46.86, 0.0, 44.84, 0.0, 0.0, 0.0, 0.0, 0.0, 59.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 67.82], ["piano", 7.42], ["keyboard (musical)", 4.58]], null, null, [["music", 46.12], ["guitar", 12.33], ["plucked string instrument", 9.5]], null, null, null, null, [["music", 45.72], ["cello", 5.88], ["foghorn", 5.2]], null, [["music", 67.88], ["musical instrument", 4.63], ["keyboard (musical)", 3.48]], null, [["music", 61.19], ["musical instrument", 6.78], ["harp", 4.46]], null, null, null, null, null, null, null, null, null], "duration": [25.23, 4.51, 0.88, 4.61, 0.42, 1.62, 0.24, 0.93, 4.34, 2.28, 14.13, 1.07, 6.88, 0.32, 0.28, 0.9, 1.11, 1.75, 2.12, 1.08, 0.61, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/pDCzYY0bjbc_filtered.json b/annotations_filtered/pDCzYY0bjbc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbf97ca3cb6ddd08649a2b37bf6aebd517d8f3ff --- /dev/null +++ b/annotations_filtered/pDCzYY0bjbc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.39], [13.0, 13.56], [19.0, 20.17], [36.0, 37.34], [40.0, 40.04], [45.0, 52.42], [54.0, 70.71], [76.0, 115.11], [119.0, 125.69], [129.0, 129.49], [130.0, 130.72], [132.0, 133.71], [141.0, 142.82], [144.0, 152.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.09, 0.0, 0.0, 0.0, 0.0, 31.87, 30.21, 0.0, 30.27, 0.0, 0.0, 0.0, 0.0, 28.6], "audiomae_on_audioset": [[["music", 49.13], ["speech", 28.08], ["didgeridoo", 2.84]], null, null, null, null, [["music", 44.51], ["speech", 27.09], ["hum", 6.07]], [["speech", 41.7], ["music", 34.68], ["whack, thwack", 4.39]], null, [["music", 71.45], ["throbbing", 10.04], ["hum", 3.79]], null, null, null, null, [["music", 70.97], ["synthesizer", 4.41], ["cacophony", 4.36]]], "duration": [4.39, 0.56, 1.17, 1.34, 0.04, 7.42, 16.71, 39.11, 6.69, 0.49, 0.72, 1.71, 1.82, 8.29]} \ No newline at end of file diff --git a/annotations_filtered/pDEJr2Sqhxc_filtered.json b/annotations_filtered/pDEJr2Sqhxc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa86cd96a62722769657923ce9d58ad4a8c7b742 --- /dev/null +++ b/annotations_filtered/pDEJr2Sqhxc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.72], [16.0, 16.98], [32.0, 32.37], [34.0, 36.63], [38.0, 38.52], [40.0, 41.32], [42.0, 43.56], [45.0, 45.77], [47.0, 47.38], [49.0, 50.23], [51.0, 51.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 0.98, 0.37, 2.63, 0.52, 1.32, 1.56, 0.77, 0.38, 1.23, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/pDWR5RkWRTY_filtered.json b/annotations_filtered/pDWR5RkWRTY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f22418cdb6e5c76266fed2193cfb0013947034b1 --- /dev/null +++ b/annotations_filtered/pDWR5RkWRTY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.02], [5.0, 7.43], [8.0, 8.29], [13.0, 13.49], [14.0, 32.7], [34.0, 34.28], [38.0, 47.11], [47.0, 47.83], [54.0, 56.42], [60.0, 70.8], [74.0, 78.85], [80.0, 82.12], [87.0, 89.36]], "keep_status": [false, false, false, false, true, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 68.8, 0.0, 0.0, 32.23, 0.0, 47.9, 0.0, 48.1, 33.73, 35.98, 93.91, 91.3], "audiomae_on_audioset": [null, null, null, null, [["music", 39.87], ["whale vocalization", 19.42], ["echo", 5.26]], null, [["music", 59.14], ["buzz", 12.81], ["theremin", 6.73]], null, [["music", 25.59], ["didgeridoo", 8.79], ["speech", 6.71]], [["speech", 51.24], ["music", 7.78], ["buzz", 6.95]], [["whale vocalization", 45.13], ["noise", 30.96], ["music", 8.93]], null, null], "duration": [1.02, 2.43, 0.29, 0.49, 18.7, 0.28, 9.11, 0.83, 2.42, 10.8, 4.85, 2.12, 2.36]} \ No newline at end of file diff --git a/annotations_filtered/pDcPRvZ9sDU_filtered.json b/annotations_filtered/pDcPRvZ9sDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..315fd98eec904ef2af24b9b63a135d8313d96c8d --- /dev/null +++ b/annotations_filtered/pDcPRvZ9sDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.86], [8.0, 30.72], [37.0, 39.68], [41.0, 41.25], [47.0, 47.43], [48.0, 49.64], [50.0, 51.19], [52.0, 52.79], [55.0, 56.71], [57.0, 58.11], [61.0, 62.38], [63.0, 63.24], [64.0, 64.22], [67.0, 69.15], [70.0, 71.05], [73.0, 73.45], [74.0, 75.73], [78.0, 79.35], [81.0, 82.22], [89.0, 95.66], [96.0, 95.77], [96.0, 104.57], [105.0, 107.25], [109.0, 110.64], [111.0, 112.63], [115.0, 118.02], [121.0, 123.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 87.55, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 0.0, 99.76, 99.16, 0.0, 0.0, 96.54, 88.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 22.72, 2.68, 0.25, 0.43, 1.64, 1.19, 0.79, 1.71, 1.11, 1.38, 0.24, 0.22, 2.15, 1.05, 0.45, 1.73, 1.35, 1.22, 6.66, -0.23, 8.57, 2.25, 1.64, 1.63, 3.02, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/pDj1GM3RRWs_filtered.json b/annotations_filtered/pDj1GM3RRWs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8884596a16091834fbb841aead45ab8e7f62e066 --- /dev/null +++ b/annotations_filtered/pDj1GM3RRWs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.39], [4.0, 4.24], [6.0, 6.18], [10.0, 10.2], [12.0, 12.34], [19.0, 20.65], [29.0, 30.55], [31.0, 31.21], [32.0, 33.71], [34.0, 36.8], [38.0, 39.46], [64.0, 70.43], [71.0, 72.15], [76.0, 77.16], [81.0, 81.97], [87.0, 91.93], [94.0, 100.45], [104.0, 108.3], [110.0, 110.37], [111.0, 112.68], [113.0, 121.17], [122.0, 140.0], [141.0, 146.45], [147.0, 149.71], [151.0, 158.28], [159.0, 165.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.32, 0.0, 98.36, 0.0, 0.0, 0.0, 99.96, 92.31, 89.9, 0.0, 0.0, 65.79, 63.21, 58.05, 57.81, 61.67, 45.65], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.26], ["speech", 26.51], ["ambient music", 3.54]]], "duration": [0.39, 0.24, 0.18, 0.2, 0.34, 1.65, 1.55, 0.21, 1.71, 2.8, 1.46, 6.43, 1.15, 1.16, 0.97, 4.93, 6.45, 4.3, 0.37, 1.68, 8.17, 18.0, 5.45, 2.71, 7.28, 6.72]} \ No newline at end of file diff --git a/annotations_filtered/pDjY4qorZrg_filtered.json b/annotations_filtered/pDjY4qorZrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1bcc473f31d3304e6eca0c882b4a72d410e0f48 --- /dev/null +++ b/annotations_filtered/pDjY4qorZrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 30.89], [33.0, 46.58], [48.0, 48.24], [49.0, 49.84], [52.0, 54.94], [56.0, 64.03], [65.0, 66.82], [69.0, 69.06], [71.0, 71.69], [74.0, 74.65], [82.0, 82.46], [84.0, 85.5], [91.0, 93.16], [94.0, 93.77], [96.0, 97.38], [106.0, 106.91], [112.0, 113.0], [121.0, 121.44], [125.0, 125.1], [136.0, 137.05], [140.0, 141.2], [157.0, 157.3], [157.0, 157.67], [161.0, 161.33], [165.0, 165.15], [166.0, 166.7], [169.0, 170.6], [175.0, 175.91], [177.0, 177.45], [179.0, 192.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [34.02, 30.9, 0.0, 0.0, 32.71, 31.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.05], "audiomae_on_audioset": [[["music", 44.74], ["theremin", 23.97], ["hum", 13.1]], [["music", 46.25], ["speech", 30.53], ["fly, housefly", 2.83]], null, null, [["whale vocalization", 41.86], ["music", 28.5], ["cattle, bovinae", 2.36]], [["speech", 63.9], ["cattle, bovinae", 3.53], ["explosion", 3.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.3], ["music", 11.06], ["vehicle", 4.72]]], "duration": [20.89, 13.58, 0.24, 0.84, 2.94, 8.03, 1.82, 0.06, 0.69, 0.65, 0.46, 1.5, 2.16, -0.23, 1.38, 0.91, 1.0, 0.44, 0.1, 1.05, 1.2, 0.3, 0.67, 0.33, 0.15, 0.7, 1.6, 0.91, 0.45, 13.11]} \ No newline at end of file diff --git a/annotations_filtered/pDnPZ0Ccdus_filtered.json b/annotations_filtered/pDnPZ0Ccdus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b5e1fd77036121168419568666bf33c5f3c97aa --- /dev/null +++ b/annotations_filtered/pDnPZ0Ccdus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 28.29], [32.0, 38.15], [45.0, 46.87], [51.0, 51.54], [55.0, 68.69], [72.0, 73.31], [78.0, 79.19], [84.0, 84.0], [94.0, 94.24], [102.0, 135.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.95, 42.62, 0.0, 0.0, 31.98, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 74.23], ["theremin", 3.38], ["musical instrument", 2.92]], [["speech", 62.64], ["grunt", 8.46], ["burping, eructation", 6.67]], null, null, [["music", 70.86], ["brass instrument", 7.05], ["trombone", 5.09]], null, null, null, null, null], "duration": [7.29, 6.15, 1.87, 0.54, 13.69, 1.31, 1.19, 0.0, 0.24, 33.77]} \ No newline at end of file diff --git a/annotations_filtered/pDy41hvdq4s_filtered.json b/annotations_filtered/pDy41hvdq4s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c24a7f241622cba619903a0e3878e977984ca601 --- /dev/null +++ b/annotations_filtered/pDy41hvdq4s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.08], [10.0, 16.28], [17.0, 20.75], [22.0, 22.65], [23.0, 24.19], [26.0, 48.34], [52.0, 53.16], [55.0, 55.92], [66.0, 67.73], [69.0, 68.67], [69.0, 72.42], [74.0, 75.68], [76.0, 78.19], [79.0, 90.31], [106.0, 106.44], [109.0, 112.45], [121.0, 136.09], [137.0, 138.84], [139.0, 141.39], [142.0, 142.32], [143.0, 143.87], [145.0, 146.35], [148.0, 148.44], [150.0, 151.06], [153.0, 153.5], [155.0, 155.92], [171.0, 171.71]], "keep_status": [false, false, true, false, false, true, false, false, false, false, true, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.13, 29.91, 0.0, 0.0, 32.46, 0.0, 0.0, 0.0, 0.0, 39.54, 0.0, 61.97, 34.71, 0.0, 32.65, 33.4, 0.0, 48.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 46.75], ["theremin", 35.09], ["musical instrument", 6.58]], [["trombone", 30.57], ["music", 24.5], ["brass instrument", 7.64]], null, null, [["music", 44.08], ["vehicle", 5.02], ["cattle, bovinae", 4.73]], null, null, null, null, [["whale vocalization", 31.04], ["speech", 13.97], ["music", 12.44]], null, null, [["music", 34.42], ["speech", 31.67], ["outside, rural or natural", 3.89]], null, [["music", 41.47], ["theremin", 25.06], ["speech", 11.01]], [["speech", 43.23], ["mains hum", 17.0], ["hum", 7.02]], null, [["speech", 57.59], ["fart", 6.67], ["fly, housefly", 5.56]], null, null, null, null, null, null, null, null], "duration": [1.08, 6.28, 3.75, 0.65, 1.19, 22.34, 1.16, 0.92, 1.73, -0.33, 3.42, 1.68, 2.19, 11.31, 0.44, 3.45, 15.09, 1.84, 2.39, 0.32, 0.87, 1.35, 0.44, 1.06, 0.5, 0.92, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/pE0vTejjWuk_filtered.json b/annotations_filtered/pE0vTejjWuk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5adeedd3667b9acef5847cd959fb05a196de9ee5 --- /dev/null +++ b/annotations_filtered/pE0vTejjWuk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.68], [3.0, 2.89], [5.0, 5.36], [7.0, 9.12], [10.0, 26.2], [28.0, 28.61], [30.0, 30.18], [31.0, 31.41], [33.0, 42.03], [44.0, 44.63], [45.0, 45.76], [47.0, 47.71], [50.0, 50.57], [55.0, 55.54], [58.0, 58.82], [60.0, 60.64], [63.0, 63.46], [66.0, 68.01], [70.0, 69.96], [71.0, 71.64], [73.0, 73.72], [75.0, 76.89], [78.0, 79.15], [80.0, 81.38], [84.0, 84.05], [87.0, 88.11], [90.0, 90.39], [92.0, 92.13], [97.0, 97.23], [98.0, 98.76], [100.0, 101.63]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.35, 35.58, 0.0, 0.0, 0.0, 54.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["liquid", 11.82], ["mains hum", 10.66], ["whale vocalization", 9.59]], [["horse", 44.74], ["clip-clop", 25.97], ["hum", 8.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, -0.11, 0.36, 2.12, 16.2, 0.61, 0.18, 0.41, 9.03, 0.63, 0.76, 0.71, 0.57, 0.54, 0.82, 0.64, 0.46, 2.01, -0.04, 0.64, 0.72, 1.89, 1.15, 1.38, 0.05, 1.11, 0.39, 0.13, 0.23, 0.76, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/pE5pl9UG93I_filtered.json b/annotations_filtered/pE5pl9UG93I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a658778d44faf4d490e6854429f330c3f4ab593a --- /dev/null +++ b/annotations_filtered/pE5pl9UG93I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.75], [20.0, 20.7], [22.0, 22.18], [24.0, 24.88], [26.0, 28.22], [30.0, 30.33], [34.0, 35.31], [37.0, 37.32], [38.0, 40.09], [42.0, 42.58], [46.0, 46.77], [48.0, 48.42], [50.0, 50.77], [54.0, 54.84], [55.0, 55.7], [56.0, 56.98], [58.0, 57.94], [61.0, 61.3], [64.0, 64.94], [66.0, 66.11], [69.0, 68.94], [81.0, 82.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.87, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 83.42], ["sidetone", 3.62], ["didgeridoo", 2.22]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.75, 0.7, 0.18, 0.88, 2.22, 0.33, 1.31, 0.32, 2.09, 0.58, 0.77, 0.42, 0.77, 0.84, 0.7, 0.98, -0.06, 0.3, 0.94, 0.11, -0.06, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/pEa07GOtQs4_filtered.json b/annotations_filtered/pEa07GOtQs4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff3b41b531c185dabcb6e418089d1877207bfa29 --- /dev/null +++ b/annotations_filtered/pEa07GOtQs4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.91], [10.0, 10.34], [15.0, 15.21], [21.0, 22.82], [28.0, 28.92], [31.0, 33.39], [36.0, 36.83], [38.0, 38.85], [39.0, 39.93], [40.0, 40.41], [42.0, 42.52], [45.0, 44.79], [46.0, 48.56], [55.0, 56.25], [57.0, 58.45], [62.0, 61.75], [66.0, 67.68], [69.0, 69.4], [73.0, 73.5], [75.0, 76.06], [81.0, 81.6], [87.0, 89.07], [90.0, 91.37], [97.0, 98.83], [104.0, 107.84], [109.0, 109.41], [111.0, 111.89], [114.0, 114.74], [116.0, 118.5], [120.0, 120.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 91.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 95.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.09, 0.34, 0.21, 1.82, 0.92, 2.39, 0.83, 0.85, 0.93, 0.41, 0.52, -0.21, 2.56, 1.25, 1.45, -0.25, 1.68, 0.4, 0.5, 1.06, 0.6, 2.07, 1.37, 1.83, 3.84, 0.41, 0.89, 0.74, 2.5, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/pF67F-hlVaA_filtered.json b/annotations_filtered/pF67F-hlVaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e13ff46481cb730e182e820cbd28c13d0a105a7f --- /dev/null +++ b/annotations_filtered/pF67F-hlVaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.1], [16.0, 16.63], [23.0, 23.5], [25.0, 25.12], [26.0, 56.27], [60.0, 60.42], [62.0, 64.03], [64.0, 64.66], [65.0, 66.26], [67.0, 74.78], [78.0, 78.44], [81.0, 81.28]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 0.0, 0.0, 33.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 38.21], ["music", 25.96], ["whack, thwack", 4.81]], null, null], "duration": [0.1, 0.63, 0.5, 0.12, 30.27, 0.42, 2.03, 0.66, 1.26, 7.78, 0.44, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/pFXW-7VNngk_filtered.json b/annotations_filtered/pFXW-7VNngk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a46f94d309971d513bc31f179cfbf77b8415b636 --- /dev/null +++ b/annotations_filtered/pFXW-7VNngk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.29], [13.0, 20.87], [25.0, 29.79], [30.0, 44.36], [54.0, 55.11], [72.0, 73.45], [74.0, 74.65], [77.0, 77.18], [79.0, 79.15], [87.0, 91.61], [98.0, 98.74], [101.0, 101.7], [109.0, 109.81], [113.0, 119.31], [120.0, 119.79], [120.0, 120.26], [129.0, 131.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 33.34, 32.96, 30.9, 0.0, 0.0, 0.0, 0.0, 0.0, 31.18, 0.0, 0.0, 0.0, 47.46, 0.0, 0.0, 40.64], "audiomae_on_audioset": [null, [["music", 70.82], ["theremin", 5.15], ["electronic music", 4.52]], [["music", 67.05], ["electronic music", 7.26], ["speech", 6.21]], [["music", 56.68], ["police car (siren)", 9.74], ["siren", 8.19]], null, null, null, null, null, [["music", 55.14], ["hum", 15.7], ["throbbing", 7.29]], null, null, null, [["music", 32.77], ["hum", 26.36], ["mains hum", 17.6]], null, null, [["hum", 40.82], ["mains hum", 19.77], ["music", 9.1]]], "duration": [0.29, 7.87, 4.79, 14.36, 1.11, 1.45, 0.65, 0.18, 0.15, 4.61, 0.74, 0.7, 0.81, 6.31, -0.21, 0.26, 2.9]} \ No newline at end of file diff --git a/annotations_filtered/pFm8RKAyU_Q_filtered.json b/annotations_filtered/pFm8RKAyU_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2900ed8c8bda3c255e9ac3c150e30a1faf68bb3 --- /dev/null +++ b/annotations_filtered/pFm8RKAyU_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [6.0, 7.1], [10.0, 10.13], [11.0, 12.04], [13.0, 13.73], [20.0, 22.69], [24.0, 25.1], [27.0, 29.52], [31.0, 37.47], [40.0, 40.12], [46.0, 46.14], [47.0, 48.47], [50.0, 50.72], [54.0, 54.45], [56.0, 65.58], [66.0, 66.55], [67.0, 67.63], [69.0, 129.29], [129.0, 174.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.2, 0.0, 44.15, 37.59, 0.0, 0.0, 0.0, 0.0, 0.0, 31.77, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 80.83], ["musical instrument", 3.79], ["timpani", 2.02]], null, [["music", 71.16], ["speech", 5.39], ["musical instrument", 4.01]], [["music", 65.21], ["didgeridoo", 6.7], ["theremin", 5.49]], null, null, null, null, null, [["music", 58.26], ["theremin", 13.85], ["synthesizer", 6.81]], null, null, null, null], "duration": [0.36, 1.1, 0.13, 1.04, 0.73, 2.69, 1.1, 2.52, 6.47, 0.12, 0.14, 1.47, 0.72, 0.45, 9.58, 0.55, 0.63, 60.29, 45.77]} \ No newline at end of file diff --git a/annotations_filtered/pGZtlbYLpck_filtered.json b/annotations_filtered/pGZtlbYLpck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e03feb76d15e8cf4fc080efe15f8b48fc59bf5ed --- /dev/null +++ b/annotations_filtered/pGZtlbYLpck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.63], [18.0, 19.9], [23.0, 24.44], [27.0, 37.12], [37.0, 50.6], [59.0, 104.09], [107.0, 110.12], [111.0, 111.92], [116.0, 122.3], [129.0, 136.39], [143.0, 149.99], [153.0, 160.86], [165.0, 173.58], [175.0, 176.77]], "keep_status": [true, false, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [40.24, 0.0, 0.0, 29.92, 29.15, 0.0, 33.1, 0.0, 29.4, 29.31, 29.05, 29.4, 29.25, 0.0], "audiomae_on_audioset": [[["music", 26.54], ["creak", 7.58], ["fart", 6.45]], null, null, [["speech", 16.41], ["siren", 9.36], ["vehicle", 8.93]], [["music", 37.05], ["didgeridoo", 6.7], ["speech", 5.68]], null, [["music", 65.09], ["musical instrument", 4.27], ["synthesizer", 3.81]], null, [["music", 38.86], ["quack", 13.03], ["groan", 5.16]], [["music", 48.75], ["boing", 15.89], ["livestock, farm animals, working animals", 8.37]], [["music", 47.52], ["speech", 27.16], ["explosion", 3.54]], [["music", 80.98], ["smash, crash", 2.05], ["throbbing", 1.66]], [["music", 43.31], ["speech", 31.54], ["smash, crash", 4.77]], null], "duration": [2.63, 1.9, 1.44, 10.12, 13.6, 45.09, 3.12, 0.92, 6.3, 7.39, 6.99, 7.86, 8.58, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/pGhBFh0cXRU_filtered.json b/annotations_filtered/pGhBFh0cXRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b5c70190757f8e83c28bc17176b6f6131261294 --- /dev/null +++ b/annotations_filtered/pGhBFh0cXRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.13], [7.0, 8.09], [9.0, 19.65], [25.0, 25.83], [26.0, 32.36], [33.0, 39.93], [44.0, 43.98], [46.0, 49.98], [51.0, 53.84], [55.0, 56.35], [63.0, 63.81], [66.0, 66.75], [68.0, 69.4], [71.0, 70.85], [73.0, 74.68], [81.0, 85.48], [94.0, 110.51], [112.0, 112.78], [114.0, 124.55], [126.0, 128.61]], "keep_status": [false, false, true, false, true, true, false, true, false, false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 32.39, 0.0, 29.61, 38.42, 0.0, 48.52, 65.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.6, 28.76, 0.0, 57.09, 39.74], "audiomae_on_audioset": [null, null, [["synthesizer", 19.85], ["music", 13.23], ["smash, crash", 8.42]], null, [["theremin", 42.08], ["music", 14.96], ["didgeridoo", 6.65]], [["music", 37.91], ["synthesizer", 16.92], ["throbbing", 9.9]], null, [["music", 27.4], ["hum", 24.39], ["didgeridoo", 14.15]], null, null, null, null, null, null, null, [["music", 32.21], ["sound effect", 6.35], ["rumble", 4.57]], [["music", 12.8], ["vehicle", 12.16], ["car", 7.64]], null, null, [["music", 55.6], ["musical instrument", 7.44], ["noise", 4.93]]], "duration": [0.13, 1.09, 10.65, 0.83, 6.36, 6.93, -0.02, 3.98, 2.84, 1.35, 0.81, 0.75, 1.4, -0.15, 1.68, 4.48, 16.51, 0.78, 10.55, 2.61]} \ No newline at end of file diff --git a/annotations_filtered/pGxyOeypYFs_filtered.json b/annotations_filtered/pGxyOeypYFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bbc5e0975372d249af359d25ac90c391025fdb3 --- /dev/null +++ b/annotations_filtered/pGxyOeypYFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 49.91], [51.0, 74.33], [79.0, 114.72]], "keep_status": [false, false, false], "silence_prob": [0.0, 85.9, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.91, 23.33, 35.72]} \ No newline at end of file diff --git a/annotations_filtered/pHB8Z35H29k_filtered.json b/annotations_filtered/pHB8Z35H29k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..771496b8a1ef2d13136573f05c3d7ba27fea5848 --- /dev/null +++ b/annotations_filtered/pHB8Z35H29k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.17], [12.0, 11.82], [15.0, 20.51], [40.0, 43.43], [44.0, 45.28], [46.0, 49.27], [68.0, 73.3], [74.0, 74.24], [83.0, 83.1], [84.0, 84.84], [86.0, 89.73], [91.0, 91.71], [101.0, 101.55], [104.0, 104.73], [109.0, 111.65], [114.0, 119.2], [120.0, 123.7], [127.0, 126.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 86.45, 70.44, 0.0, 77.53, 92.8, 0.0, 0.0, 0.0, 98.73, 0.0, 0.0, 0.0, 54.76, 93.29, 75.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.17, -0.18, 5.51, 3.43, 1.28, 3.27, 5.3, 0.24, 0.1, 0.84, 3.73, 0.71, 0.55, 0.73, 2.65, 5.2, 3.7, -0.07]} \ No newline at end of file diff --git a/annotations_filtered/pHBKmT6eNGw_filtered.json b/annotations_filtered/pHBKmT6eNGw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3828ce7561c154ec87e32cc3d18c772818393eb --- /dev/null +++ b/annotations_filtered/pHBKmT6eNGw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.19], [14.0, 14.66], [16.0, 17.17], [20.0, 23.36], [26.0, 26.23], [28.0, 28.68], [30.0, 32.76], [35.0, 38.18], [39.0, 44.63], [48.0, 52.47], [60.0, 60.22], [60.0, 64.49], [66.0, 65.72], [66.0, 65.82], [67.0, 67.64], [70.0, 69.87], [71.0, 71.39], [72.0, 72.59], [74.0, 74.16], [75.0, 75.56], [78.0, 78.14], [80.0, 81.26], [82.0, 82.98], [88.0, 88.43], [89.0, 89.26], [90.0, 91.37], [92.0, 92.65], [95.0, 95.15], [98.0, 99.42], [103.0, 103.65], [112.0, 112.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 68.93, 0.0, 0.0, 97.64, 89.9, 99.68, 83.34, 0.0, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.19, 0.66, 1.17, 3.36, 0.23, 0.68, 2.76, 3.18, 5.63, 4.47, 0.22, 4.49, -0.28, -0.18, 0.64, -0.13, 0.39, 0.59, 0.16, 0.56, 0.14, 1.26, 0.98, 0.43, 0.26, 1.37, 0.65, 0.15, 1.42, 0.65, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/pHXL7yantDY_filtered.json b/annotations_filtered/pHXL7yantDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac2eb5e2da935c76087e81e74e005ce4b99daa01 --- /dev/null +++ b/annotations_filtered/pHXL7yantDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.62], [8.0, 9.69], [12.0, 12.19], [12.0, 16.88], [22.0, 23.65], [26.0, 30.59], [35.0, 36.22], [37.0, 37.71], [38.0, 39.02], [39.0, 43.14], [44.0, 44.81], [45.0, 45.5], [47.0, 49.35], [51.0, 51.04], [55.0, 60.91], [64.0, 63.85], [65.0, 65.65], [71.0, 72.0], [74.0, 80.5], [81.0, 82.12], [84.0, 84.35], [84.0, 87.25], [88.0, 88.62], [91.0, 93.7], [95.0, 95.27], [98.0, 100.63], [101.0, 100.67], [104.0, 106.57], [108.0, 108.14], [111.0, 126.33], [127.0, 127.63], [132.0, 132.54], [133.0, 137.32], [140.0, 140.76], [143.0, 144.21], [147.0, 149.89], [150.0, 150.77], [153.0, 157.33], [160.0, 160.44], [163.0, 163.8], [167.0, 181.6], [184.0, 185.14], [187.0, 190.02], [193.0, 194.98], [196.0, 196.57], [202.0, 203.15], [206.0, 206.78], [209.0, 209.63], [212.0, 217.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 64.52, 0.0, 60.51, 0.0, 0.0, 0.0, 75.72, 0.0, 0.0, 66.03, 0.0, 32.16, 0.0, 0.0, 0.0, 30.94, 0.0, 0.0, 31.67, 0.0, 31.37, 0.0, 31.72, 0.0, 29.51, 0.0, 31.8, 0.0, 0.0, 30.52, 0.0, 0.0, 30.3, 0.0, 31.82, 0.0, 0.0, 32.46, 0.0, 30.83, 0.0, 0.0, 0.0, 0.0, 0.0, 31.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.26], ["throbbing", 5.93], ["hum", 4.32]], null, null, null, [["music", 71.36], ["reggae", 4.28], ["boing", 3.52]], null, null, [["music", 59.86], ["boing", 15.32], ["didgeridoo", 2.35]], null, [["music", 63.37], ["drum machine", 3.55], ["sampler", 3.16]], null, [["music", 47.92], ["boing", 5.76], ["mosquito", 4.14]], null, [["music", 45.08], ["musical instrument", 3.7], ["livestock, farm animals, working animals", 2.65]], null, [["music", 87.34], ["musical instrument", 2.74], ["piano", 0.68]], null, null, [["music", 55.44], ["boing", 20.2], ["speech", 4.27]], null, null, [["music", 51.1], ["dubstep", 15.24], ["cacophony", 4.46]], null, [["music", 64.43], ["musical instrument", 2.42], ["video game music", 1.56]], null, null, [["music", 82.7], ["sampler", 1.88], ["didgeridoo", 1.67]], null, [["music", 70.71], ["drum machine", 3.63], ["singing", 2.43]], null, null, null, null, null, [["music", 51.96], ["speech", 9.4], ["boing", 5.77]]], "duration": [1.62, 1.69, 0.19, 4.88, 1.65, 4.59, 1.22, 0.71, 1.02, 4.14, 0.81, 0.5, 2.35, 0.04, 5.91, -0.15, 0.65, 1.0, 6.5, 1.12, 0.35, 3.25, 0.62, 2.7, 0.27, 2.63, -0.33, 2.57, 0.14, 15.33, 0.63, 0.54, 4.32, 0.76, 1.21, 2.89, 0.77, 4.33, 0.44, 0.8, 14.6, 1.14, 3.02, 1.98, 0.57, 1.15, 0.78, 0.63, 5.04]} \ No newline at end of file diff --git a/annotations_filtered/pHrp2OM19t4_filtered.json b/annotations_filtered/pHrp2OM19t4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d55fb35c8f8a5cfff6bde8d4084602f61cbb7f75 --- /dev/null +++ b/annotations_filtered/pHrp2OM19t4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 24.14], [25.0, 48.1], [50.0, 53.62], [54.0, 67.47], [69.0, 73.57], [76.0, 86.7], [101.0, 103.25], [104.0, 103.99], [104.0, 105.19], [110.0, 109.76], [118.0, 125.78], [133.0, 132.78], [140.0, 140.93], [144.0, 144.0], [146.0, 149.35], [150.0, 150.97], [151.0, 152.14], [164.0, 178.95], [179.0, 179.04]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [28.82, 29.0, 31.57, 29.39, 29.72, 30.31, 31.71, 0.0, 0.0, 0.0, 29.18, 0.0, 0.0, 0.0, 31.91, 0.0, 0.0, 29.0, 0.0], "audiomae_on_audioset": [[["mosquito", 17.66], ["music", 12.98], ["speech", 12.86]], [["music", 55.11], ["speech", 14.74], ["tabla", 2.61]], [["hum", 42.69], ["throbbing", 32.95], ["mains hum", 15.19]], [["music", 70.11], ["speech", 6.19], ["cacophony", 2.42]], [["fly, housefly", 21.7], ["cattle, bovinae", 16.86], ["moo", 15.33]], [["music", 61.14], ["buzz", 6.08], ["throbbing", 5.2]], [["music", 59.79], ["speech", 20.22], ["musical instrument", 1.13]], null, null, null, [["music", 52.94], ["animal", 18.96], ["dog", 7.7]], null, null, null, [["music", 55.67], ["musical instrument", 10.96], ["plucked string instrument", 9.42]], null, null, [["fly, housefly", 39.11], ["insect", 18.21], ["mosquito", 16.0]], null], "duration": [6.14, 23.1, 3.62, 13.47, 4.57, 10.7, 2.25, -0.01, 1.19, -0.24, 7.78, -0.22, 0.93, 0.0, 3.35, 0.97, 1.14, 14.95, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/pHu6mCqzpyw_filtered.json b/annotations_filtered/pHu6mCqzpyw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e79b05c3f6dafcf13445cc25256186f8aacfc67 --- /dev/null +++ b/annotations_filtered/pHu6mCqzpyw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.81], [5.0, 5.49], [7.0, 8.31], [10.0, 11.3], [12.0, 15.55], [17.0, 16.83], [20.0, 20.68], [21.0, 22.98], [23.0, 31.95], [34.0, 33.96], [37.0, 42.16], [44.0, 43.66], [46.0, 46.75], [47.0, 48.57], [49.0, 50.8], [52.0, 54.23], [56.0, 57.91], [58.0, 58.36], [59.0, 59.48], [64.0, 67.96], [72.0, 110.91], [113.0, 113.73], [116.0, 116.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 59.96, 0.0, 0.0, 0.0, 99.36, 0.0, 69.07, 0.0, 0.0, 0.0, 0.0, 80.64, 0.0, 0.0, 0.0, 99.44, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.49, 1.31, 1.3, 3.55, -0.17, 0.68, 1.98, 8.95, -0.04, 5.16, -0.34, 0.75, 1.57, 1.8, 2.23, 1.91, 0.36, 0.48, 3.96, 38.91, 0.73, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/pHvNvYijtBU_filtered.json b/annotations_filtered/pHvNvYijtBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5545182da6ca85de4d9727c84a62f9ca5fdaaf2 --- /dev/null +++ b/annotations_filtered/pHvNvYijtBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.33], [13.0, 14.1], [17.0, 17.85], [21.0, 22.38], [24.0, 25.54], [37.0, 39.41], [52.0, 59.59], [71.0, 72.03], [93.0, 93.12], [96.0, 96.42], [101.0, 101.07]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 52.39, 31.21, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 18.27], ["buzz", 10.63], ["whir", 8.86]], null, null, null, null], "duration": [0.33, 1.1, 0.85, 1.38, 1.54, 2.41, 7.59, 1.03, 0.12, 0.42, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/pHxvNgorTQA_filtered.json b/annotations_filtered/pHxvNgorTQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db2a447a7a1b9be8d864c158c5a422d6ba6924b5 --- /dev/null +++ b/annotations_filtered/pHxvNgorTQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 48.95], [50.0, 63.56], [64.0, 70.87], [71.0, 76.62], [77.0, 105.93], [106.0, 111.38]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 63.1, 55.74, 52.45, 31.06, 30.2], "audiomae_on_audioset": [null, null, null, null, [["music", 73.04], ["ambient music", 4.07], ["theremin", 3.77]], [["music", 57.23], ["synthesizer", 9.46], ["musical instrument", 5.9]]], "duration": [1.95, 13.56, 6.87, 5.62, 28.93, 5.38]} \ No newline at end of file diff --git a/annotations_filtered/pIPr7nbUCAw_filtered.json b/annotations_filtered/pIPr7nbUCAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..531e8277492ceb59500442bda6e8f173e3651ad7 --- /dev/null +++ b/annotations_filtered/pIPr7nbUCAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.99], [8.0, 8.65], [10.0, 11.35], [13.0, 20.76], [22.0, 24.44], [26.0, 36.63], [38.0, 56.86], [58.0, 61.79], [62.0, 77.13], [79.0, 79.52], [80.0, 82.46]], "keep_status": [false, false, false, true, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 44.12, 44.23, 30.44, 29.35, 34.55, 29.61, 0.0, 60.42], "audiomae_on_audioset": [null, null, null, [["vehicle", 16.96], ["hum", 15.82], ["mains hum", 13.04]], [["mains hum", 33.19], ["hum", 19.59], ["speech", 10.28]], [["music", 33.69], ["musical instrument", 5.93], ["vehicle", 5.4]], [["music", 29.82], ["speech", 19.51], ["trombone", 5.38]], [["music", 73.07], ["musical instrument", 6.85], ["guitar", 5.71]], [["music", 62.13], ["whack, thwack", 5.5], ["fart", 3.7]], null, null], "duration": [-0.01, 0.65, 1.35, 7.76, 2.44, 10.63, 18.86, 3.79, 15.13, 0.52, 2.46]} \ No newline at end of file diff --git a/annotations_filtered/pIWh28WPyxQ_filtered.json b/annotations_filtered/pIWh28WPyxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bd6e74b958dc70d8ab8d92c5bd33e3b8fb6655b --- /dev/null +++ b/annotations_filtered/pIWh28WPyxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 40.61], [42.0, 45.47], [47.0, 47.36], [48.0, 49.77], [62.0, 63.88], [67.0, 68.94], [75.0, 76.08], [82.0, 83.07], [84.0, 87.72], [89.0, 102.25], [104.0, 103.67], [104.0, 110.57], [117.0, 119.42], [123.0, 125.41], [128.0, 130.67]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [30.77, 35.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 61.67, 0.0, 51.07, 40.77, 31.6, 35.36], "audiomae_on_audioset": [[["vehicle", 35.29], ["motorcycle", 16.46], ["race car, auto racing", 12.65]], [["whale vocalization", 33.19], ["music", 16.19], ["speech", 5.02]], null, null, null, null, null, null, null, null, null, null, [["music", 48.75], ["speech", 16.41], ["theremin", 4.21]], [["music", 25.21], ["speech", 15.19], ["sound effect", 6.32]], [["music", 42.97], ["musical instrument", 10.83], ["synthesizer", 8.67]]], "duration": [21.61, 3.47, 0.36, 1.77, 1.88, 1.94, 1.08, 1.07, 3.72, 13.25, -0.33, 6.57, 2.42, 2.41, 2.67]} \ No newline at end of file diff --git a/annotations_filtered/pIvTIG3tWok_filtered.json b/annotations_filtered/pIvTIG3tWok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8262cd52f429ac5b6c76bef0c5bb06c392dd7b9 --- /dev/null +++ b/annotations_filtered/pIvTIG3tWok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.9], [6.0, 6.59], [7.0, 8.26], [9.0, 9.63], [10.0, 11.11], [12.0, 13.27], [14.0, 15.09], [32.0, 33.64], [35.0, 35.8], [37.0, 38.7], [39.0, 40.39], [47.0, 48.07], [49.0, 57.6], [68.0, 94.02], [97.0, 97.07], [102.0, 104.18], [113.0, 114.24], [117.0, 119.18], [123.0, 124.55], [128.0, 130.03], [146.0, 145.94], [151.0, 187.51], [196.0, 197.78], [201.0, 201.5], [215.0, 217.73], [228.0, 229.27], [232.0, 232.38], [232.0, 245.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [80.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 35.94, 0.0, 37.66, 0.0, 34.75, 0.0, 35.02, 0.0, 0.0, 0.0, 0.0, 35.62, 0.0, 0.0, 35.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 82.39], ["speech", 2.58], ["electronic music", 2.09]], null, [["music", 54.89], ["didgeridoo", 7.33], ["sampler", 4.98]], null, [["music", 75.98], ["didgeridoo", 3.54], ["throbbing", 2.58]], null, [["music", 30.43], ["theremin", 11.32], ["synthesizer", 8.84]], null, null, null, null, [["music", 63.21], ["musical instrument", 4.81], ["didgeridoo", 4.63]], null, null, [["music", 83.27], ["reggae", 1.45], ["electronic music", 1.41]]], "duration": [4.9, 0.59, 1.26, 0.63, 1.11, 1.27, 1.09, 1.64, 0.8, 1.7, 1.39, 1.07, 8.6, 26.02, 0.07, 2.18, 1.24, 2.18, 1.55, 2.03, -0.06, 36.51, 1.78, 0.5, 2.73, 1.27, 0.38, 13.4]} \ No newline at end of file diff --git a/annotations_filtered/pJCgeOAKXyg_filtered.json b/annotations_filtered/pJCgeOAKXyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45aa14da90142558c3a4cee60ec883dc6f326f92 --- /dev/null +++ b/annotations_filtered/pJCgeOAKXyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.06], [34.0, 34.18], [37.0, 36.9], [59.0, 59.95], [61.0, 68.69], [70.0, 78.22], [81.0, 120.75], [122.0, 128.31], [129.0, 138.91], [141.0, 202.2], [203.0, 208.79], [210.0, 225.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.91, 32.32, 0.0, 29.47, 28.43, 0.0, 28.36, 28.54], "audiomae_on_audioset": [null, null, null, null, [["music", 62.39], ["speech", 7.38], ["electronic music", 5.42]], [["music", 55.74], ["ambient music", 11.78], ["electronic music", 5.87]], null, [["hum", 29.94], ["music", 25.5], ["throbbing", 25.47]], [["throbbing", 27.08], ["music", 25.37], ["hum", 18.22]], null, [["livestock, farm animals, working animals", 40.85], ["cattle, bovinae", 14.4], ["moo", 10.05]], [["music", 73.75], ["speech", 3.46], ["hum", 3.17]]], "duration": [0.06, 0.18, -0.1, 0.95, 7.69, 8.22, 39.75, 6.31, 9.91, 61.2, 5.79, 15.61]} \ No newline at end of file diff --git a/annotations_filtered/pJFZLCoqB9w_filtered.json b/annotations_filtered/pJFZLCoqB9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b59d40e8f1584535fdf4faf44f7dac041b2d4164 --- /dev/null +++ b/annotations_filtered/pJFZLCoqB9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.66], [8.0, 11.8], [12.0, 13.42], [14.0, 19.97], [21.0, 21.93], [23.0, 39.14], [40.0, 40.24], [46.0, 52.03], [53.0, 53.76], [58.0, 59.04], [61.0, 61.06], [65.0, 65.03], [67.0, 67.59], [68.0, 69.69], [71.0, 71.56], [73.0, 74.98], [78.0, 79.84], [81.0, 82.95], [84.0, 84.55], [87.0, 88.45], [89.0, 90.63], [96.0, 97.23], [98.0, 98.58], [101.0, 102.36], [104.0, 104.33], [108.0, 108.89], [110.0, 112.67], [114.0, 115.79], [124.0, 128.14]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 99.71, 0.0, 95.64, 0.0, 64.75, 0.0, 40.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 41.12], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 39.13], ["stomach rumble", 14.0], ["sidetone", 11.49]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.18], ["hum", 6.98], ["throbbing", 6.91]]], "duration": [0.66, 3.8, 1.42, 5.97, 0.93, 16.14, 0.24, 6.03, 0.76, 1.04, 0.06, 0.03, 0.59, 1.69, 0.56, 1.98, 1.84, 1.95, 0.55, 1.45, 1.63, 1.23, 0.58, 1.36, 0.33, 0.89, 2.67, 1.79, 4.14]} \ No newline at end of file diff --git a/annotations_filtered/pJIGy4zHo6E_filtered.json b/annotations_filtered/pJIGy4zHo6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dbcec2dda3092a2b38bc7e6897c737a8d549233 --- /dev/null +++ b/annotations_filtered/pJIGy4zHo6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.65], [5.0, 6.45], [8.0, 8.19], [9.0, 9.64], [10.0, 16.87], [18.0, 58.08], [59.0, 78.81], [81.0, 86.34], [87.0, 88.42], [90.0, 97.95], [102.0, 112.11], [118.0, 121.46]], "keep_status": [false, false, false, false, true, false, false, true, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.53, 0.0, 33.75, 31.18, 0.0, 31.36, 32.16, 30.79], "audiomae_on_audioset": [null, null, null, null, [["music", 53.1], ["livestock, farm animals, working animals", 9.72], ["groan", 4.72]], null, [["hum", 45.66], ["throbbing", 16.02], ["music", 11.37]], [["animal", 16.98], ["bow-wow", 12.81], ["canidae, dogs, wolves", 11.01]], null, [["music", 58.3], ["animal", 5.57], ["theremin", 5.24]], [["vehicle", 34.78], ["car", 6.62], ["music", 6.5]], [["music", 48.68], ["musical instrument", 5.12], ["brass instrument", 4.27]]], "duration": [1.65, 1.45, 0.19, 0.64, 6.87, 40.08, 19.81, 5.34, 1.42, 7.95, 10.11, 3.46]} \ No newline at end of file diff --git a/annotations_filtered/pJImKCcPIsU_filtered.json b/annotations_filtered/pJImKCcPIsU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..474b39c1c796901f04c5d8498f5f4e2741746ebf --- /dev/null +++ b/annotations_filtered/pJImKCcPIsU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.62], [8.0, 10.64], [12.0, 12.68], [13.0, 14.91], [16.0, 16.55], [17.0, 19.89], [29.0, 29.71], [37.0, 38.53], [42.0, 42.69], [44.0, 45.55], [46.0, 49.25], [50.0, 53.72], [57.0, 57.43], [67.0, 67.2], [70.0, 72.79], [75.0, 76.54], [77.0, 78.33], [83.0, 83.98], [84.0, 84.75], [87.0, 87.4], [89.0, 91.15], [93.0, 94.15], [98.0, 99.35], [107.0, 116.21], [117.0, 117.96], [121.0, 120.99], [124.0, 124.51], [125.0, 126.99], [129.0, 129.25], [131.0, 130.89], [139.0, 139.43], [146.0, 147.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.52, 99.62, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 77.36, 72.16, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 38.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.32], ["hum", 15.61], ["sidetone", 6.13]], null, null, null, null, null, null, null, null], "duration": [4.62, 2.64, 0.68, 1.91, 0.55, 2.89, 0.71, 1.53, 0.69, 1.55, 3.25, 3.72, 0.43, 0.2, 2.79, 1.54, 1.33, 0.98, 0.75, 0.4, 2.15, 1.15, 1.35, 9.21, 0.96, -0.01, 0.51, 1.99, 0.25, -0.11, 0.43, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/pJJjycrT0RA_filtered.json b/annotations_filtered/pJJjycrT0RA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fa4a329e2a378b24cab01580c00f46584eb3f54 --- /dev/null +++ b/annotations_filtered/pJJjycrT0RA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.5], [15.0, 15.67], [18.0, 19.5], [20.0, 20.24], [22.0, 22.33], [24.0, 24.41], [26.0, 26.28], [32.0, 33.56], [36.0, 37.74], [40.0, 40.26], [43.0, 42.99], [45.0, 46.16], [48.0, 49.01], [54.0, 54.53], [55.0, 58.33], [61.0, 60.79], [62.0, 62.73], [65.0, 65.47], [66.0, 66.75], [70.0, 70.23], [73.0, 76.54], [87.0, 89.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.39, 0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 61.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.5, 0.67, 1.5, 0.24, 0.33, 0.41, 0.28, 1.56, 1.74, 0.26, -0.01, 1.16, 1.01, 0.53, 3.33, -0.21, 0.73, 0.47, 0.75, 0.23, 3.54, 2.23]} \ No newline at end of file diff --git a/annotations_filtered/pK35em6gl0Q_filtered.json b/annotations_filtered/pK35em6gl0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bb3134234458efb339168e07ed5369477b79986 --- /dev/null +++ b/annotations_filtered/pK35em6gl0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.91], [16.0, 16.36], [17.0, 23.45], [24.0, 27.06], [28.0, 29.93], [32.0, 32.49], [33.0, 34.13], [35.0, 38.16], [39.0, 39.87], [41.0, 41.72], [43.0, 45.06], [48.0, 49.62], [51.0, 52.15], [53.0, 54.04], [54.0, 55.17], [56.0, 57.47], [58.0, 66.51], [67.0, 76.11], [77.0, 78.53], [80.0, 82.17], [83.0, 93.21], [94.0, 96.18], [100.0, 102.56], [104.0, 105.19], [106.0, 116.36], [117.0, 116.95], [117.0, 118.18], [119.0, 121.69], [125.0, 127.58], [129.0, 129.34], [130.0, 131.09], [133.0, 133.42], [134.0, 135.6], [138.0, 139.24], [140.0, 141.15], [142.0, 143.46], [147.0, 147.36], [148.0, 149.93], [150.0, 157.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [66.88, 0.0, 82.43, 95.09, 0.0, 0.0, 0.0, 55.46, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 0.0, 0.0, 36.97, 31.68, 0.0, 99.1, 58.55, 99.31, 99.52, 0.0, 99.4, 0.0, 0.0, 52.33, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 23.58], ["mains hum", 22.12], ["speech", 20.66]], [["speech", 38.66], ["mains hum", 13.45], ["music", 10.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.91, 0.36, 6.45, 3.06, 1.93, 0.49, 1.13, 3.16, 0.87, 0.72, 2.06, 1.62, 1.15, 1.04, 1.17, 1.47, 8.51, 9.11, 1.53, 2.17, 10.21, 2.18, 2.56, 1.19, 10.36, -0.05, 1.18, 2.69, 2.58, 0.34, 1.09, 0.42, 1.6, 1.24, 1.15, 1.46, 0.36, 1.93, 7.27]} \ No newline at end of file diff --git a/annotations_filtered/pKHAhc31MOI_filtered.json b/annotations_filtered/pKHAhc31MOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e04f55bf2db9224512124d2da284420220424db1 --- /dev/null +++ b/annotations_filtered/pKHAhc31MOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.02], [3.0, 12.02], [13.0, 13.83], [17.0, 19.26], [32.0, 34.91], [37.0, 38.62], [52.0, 52.76], [56.0, 56.74], [61.0, 62.28], [76.0, 76.81], [78.0, 78.65], [85.0, 98.58], [99.0, 104.73], [107.0, 108.11], [110.0, 111.79], [115.0, 115.5], [116.0, 116.73], [119.0, 121.58], [133.0, 134.33], [143.0, 148.71], [151.0, 152.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.44, 0.0, 99.56, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 99.62, 0.0, 0.0, 0.0, 0.0, 99.8, 0.0, 99.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 9.02, 0.83, 2.26, 2.91, 1.62, 0.76, 0.74, 1.28, 0.81, 0.65, 13.58, 5.73, 1.11, 1.79, 0.5, 0.73, 2.58, 1.33, 5.71, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/pKJOqt7BtB8_filtered.json b/annotations_filtered/pKJOqt7BtB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c92c33799ee5a2607cf48cc08de114d4c9d4f7cc --- /dev/null +++ b/annotations_filtered/pKJOqt7BtB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.6], [11.0, 12.68], [17.0, 18.3], [29.0, 29.07], [37.0, 37.34], [40.0, 40.93], [45.0, 45.86], [50.0, 51.71], [52.0, 54.09], [55.0, 56.19], [57.0, 61.1], [64.0, 81.3], [84.0, 87.79], [90.0, 92.06], [96.0, 96.4], [99.0, 100.43], [108.0, 108.94], [111.0, 112.55], [116.0, 116.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.38, 0.0, 55.39, 40.09, 94.37, 97.11, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["theremin", 41.96], ["music", 36.25], ["musical instrument", 3.73]], null, null, null, null, null, null, null], "duration": [1.6, 1.68, 1.3, 0.07, 0.34, 0.93, 0.86, 1.71, 2.09, 1.19, 4.1, 17.3, 3.79, 2.06, 0.4, 1.43, 0.94, 1.55, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/pKN_6Javjnc_filtered.json b/annotations_filtered/pKN_6Javjnc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c43ef892d1bed99a1dd24467429c4af21afc5f90 --- /dev/null +++ b/annotations_filtered/pKN_6Javjnc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.65], [6.0, 8.77], [9.0, 16.78], [18.0, 19.45], [22.0, 22.25], [23.0, 25.41], [26.0, 28.02], [29.0, 30.11], [31.0, 31.7], [32.0, 32.8], [34.0, 35.7], [36.0, 37.1], [39.0, 39.19], [41.0, 41.27], [43.0, 43.97], [46.0, 45.91], [48.0, 49.45], [51.0, 52.24], [53.0, 53.57], [56.0, 57.74], [59.0, 59.21], [60.0, 60.47], [63.0, 63.63], [65.0, 65.43], [66.0, 68.13], [70.0, 70.46], [72.0, 73.08], [75.0, 78.6], [79.0, 81.73], [82.0, 86.09], [86.0, 89.78], [91.0, 94.61], [96.0, 99.87], [101.0, 101.93], [102.0, 108.97], [110.0, 110.32], [111.0, 111.79], [113.0, 122.66], [124.0, 125.63], [127.0, 127.48], [128.0, 129.47], [131.0, 130.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 56.33, 0.0, 0.0, 50.46, 65.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.54, 0.0, 0.0, 96.17, 81.0, 99.78, 95.37, 100.0, 100.0, 0.0, 98.36, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.65, 2.77, 7.78, 1.45, 0.25, 2.41, 2.02, 1.11, 0.7, 0.8, 1.7, 1.1, 0.19, 0.27, 0.97, -0.09, 1.45, 1.24, 0.57, 1.74, 0.21, 0.47, 0.63, 0.43, 2.13, 0.46, 1.08, 3.6, 2.73, 4.09, 3.78, 3.61, 3.87, 0.93, 6.97, 0.32, 0.79, 9.66, 1.63, 0.48, 1.47, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/pKNsKKRGrzs_filtered.json b/annotations_filtered/pKNsKKRGrzs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f082c9294d871075cffa4544f898b1c8e4806eb2 --- /dev/null +++ b/annotations_filtered/pKNsKKRGrzs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.69], [19.0, 20.11], [22.0, 38.87], [40.0, 40.83], [42.0, 42.63], [44.0, 45.1], [47.0, 48.19], [50.0, 51.56], [53.0, 54.11], [56.0, 56.71], [58.0, 58.33], [59.0, 60.2], [62.0, 64.61], [65.0, 66.45], [67.0, 68.71], [70.0, 80.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [59.42, 0.0, 33.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.81, 0.0, 0.0, 31.86], "audiomae_on_audioset": [null, null, [["music", 69.47], ["musical instrument", 4.45], ["applause", 3.8]], null, null, null, null, null, null, null, null, null, [["music", 49.11], ["sidetone", 14.59], ["theremin", 8.68]], null, null, [["music", 49.9], ["applause", 6.42], ["electronic music", 4.31]]], "duration": [9.69, 1.11, 16.87, 0.83, 0.63, 1.1, 1.19, 1.56, 1.11, 0.71, 0.33, 1.2, 2.61, 1.45, 1.71, 10.94]} \ No newline at end of file diff --git a/annotations_filtered/pKdszbbvQGc_filtered.json b/annotations_filtered/pKdszbbvQGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee4c6de34d0393c8fd02c9476f934349bd53847d --- /dev/null +++ b/annotations_filtered/pKdszbbvQGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.32], [6.0, 7.13], [9.0, 9.86], [13.0, 14.84], [16.0, 16.41], [17.0, 18.52], [20.0, 21.27], [32.0, 32.68], [35.0, 35.51], [43.0, 43.9], [49.0, 55.83], [59.0, 59.97], [84.0, 85.11], [87.0, 88.01], [102.0, 103.5], [107.0, 107.97], [110.0, 110.32], [132.0, 133.34], [136.0, 136.16], [144.0, 144.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 70.81], ["musical instrument", 1.93], ["reggae", 1.88]], null, null, null, null, null, null, null, null, null], "duration": [0.32, 1.13, 0.86, 1.84, 0.41, 1.52, 1.27, 0.68, 0.51, 0.9, 6.83, 0.97, 1.11, 1.01, 1.5, 0.97, 0.32, 1.34, 0.16, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/pKjMt3cBv6g_filtered.json b/annotations_filtered/pKjMt3cBv6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d86bf00e180c27aa8eb1dd9ef79a56d64d3b2385 --- /dev/null +++ b/annotations_filtered/pKjMt3cBv6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 20.8], [26.0, 45.64], [46.0, 47.97], [49.0, 52.46], [53.0, 54.94], [56.0, 58.24], [59.0, 59.83], [61.0, 63.32], [64.0, 64.98], [66.0, 66.04], [67.0, 67.69], [69.0, 71.98]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.3, 35.08, 0.0, 55.25, 0.0, 58.81, 0.0, 65.79, 0.0, 0.0, 0.0, 77.03], "audiomae_on_audioset": [[["speech", 57.03], ["music", 6.89], ["sidetone", 5.92]], [["music", 69.06], ["didgeridoo", 11.65], ["musical instrument", 6.44]], null, null, null, null, null, null, null, null, null, null], "duration": [17.8, 19.64, 1.97, 3.46, 1.94, 2.24, 0.83, 2.32, 0.98, 0.04, 0.69, 2.98]} \ No newline at end of file diff --git a/annotations_filtered/pKsa_9TFG48_filtered.json b/annotations_filtered/pKsa_9TFG48_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e213ab32dda989b7fc0436d181748d3ba5149d20 --- /dev/null +++ b/annotations_filtered/pKsa_9TFG48_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 17.91], [22.0, 22.64], [26.0, 27.08]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [-0.09, 0.64, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/pLC_hRDO7Hk_filtered.json b/annotations_filtered/pLC_hRDO7Hk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18ee65a7757f51669044c36bcc457ff48b1f8185 --- /dev/null +++ b/annotations_filtered/pLC_hRDO7Hk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.32], [22.0, 22.42], [29.0, 30.25], [31.0, 32.27], [35.0, 35.92], [42.0, 42.33], [47.0, 47.17], [50.0, 50.21], [60.0, 61.43], [62.0, 63.19], [64.0, 64.96], [68.0, 68.22], [78.0, 78.41], [81.0, 82.9], [85.0, 85.21], [86.0, 87.02], [92.0, 92.18], [96.0, 98.81], [103.0, 102.95], [109.0, 109.7], [115.0, 116.01], [122.0, 124.01], [127.0, 126.82], [128.0, 130.6], [133.0, 133.3], [134.0, 134.06], [137.0, 137.59], [142.0, 142.8], [152.0, 152.1], [152.0, 152.15], [152.0, 152.31], [152.0, 153.62], [161.0, 160.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.97, 0.0, 0.0, 0.0, 83.34, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.62], ["carnatic music", 4.58], ["tabla", 4.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 0.42, 1.25, 1.27, 0.92, 0.33, 0.17, 0.21, 1.43, 1.19, 0.96, 0.22, 0.41, 1.9, 0.21, 1.02, 0.18, 2.81, -0.05, 0.7, 1.01, 2.01, -0.18, 2.6, 0.3, 0.06, 0.59, 0.8, 0.1, 0.15, 0.31, 1.62, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/pLKZ0Adi70c_filtered.json b/annotations_filtered/pLKZ0Adi70c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac793054bcc2b1404e45a1365dd92bedc2d83116 --- /dev/null +++ b/annotations_filtered/pLKZ0Adi70c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.81], [18.0, 21.22], [25.0, 25.59], [28.0, 29.37], [30.0, 30.89], [37.0, 37.69], [39.0, 50.73]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [0.0, 29.93, 0.0, 0.0, 0.0, 0.0, 32.38], "audiomae_on_audioset": [null, [["explosion", 31.13], ["eruption", 17.61], ["speech", 9.7]], null, null, null, null, [["music", 59.04], ["didgeridoo", 11.53], ["synthesizer", 3.23]]], "duration": [1.81, 3.22, 0.59, 1.37, 0.89, 0.69, 11.73]} \ No newline at end of file diff --git a/annotations_filtered/pLRk4xG-JCI_filtered.json b/annotations_filtered/pLRk4xG-JCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20eded957824b0ddfe916d938b0125314d54a710 --- /dev/null +++ b/annotations_filtered/pLRk4xG-JCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 66.68]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [56.68]} \ No newline at end of file diff --git a/annotations_filtered/pLlcwabi5AQ_filtered.json b/annotations_filtered/pLlcwabi5AQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63e945bb6a6623e70b8e104e2e3dd87845defc6f --- /dev/null +++ b/annotations_filtered/pLlcwabi5AQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.5], [11.0, 11.75], [39.0, 39.24], [48.0, 47.73], [68.0, 68.86], [70.0, 70.7], [84.0, 85.01], [98.0, 98.64], [132.0, 132.63], [136.0, 137.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.75, 0.24, -0.27, 0.86, 0.7, 1.01, 0.64, 0.63, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/pLm07s8fnzM_filtered.json b/annotations_filtered/pLm07s8fnzM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e929c47a3e7e80e60bb98c9dee107a24d0c2315 --- /dev/null +++ b/annotations_filtered/pLm07s8fnzM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.84], [18.0, 18.2], [56.0, 59.14], [95.0, 95.07], [98.0, 97.92]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.41, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["yodeling", 50.99], ["music", 35.89], ["synthetic singing", 2.89]], null, null], "duration": [0.84, 0.2, 3.14, 0.07, -0.08]} \ No newline at end of file diff --git a/annotations_filtered/pLooDtjrhv8_filtered.json b/annotations_filtered/pLooDtjrhv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11f6f54ec00547c95340d4c92940c6d4a5b73cd9 --- /dev/null +++ b/annotations_filtered/pLooDtjrhv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.59], [5.0, 7.64], [13.0, 12.75], [17.0, 17.51], [19.0, 20.16], [24.0, 25.07], [26.0, 26.06], [27.0, 31.75], [33.0, 33.56], [34.0, 34.3], [35.0, 35.73], [45.0, 45.25], [50.0, 51.12], [60.0, 60.35], [63.0, 63.15], [78.0, 78.51], [84.0, 84.57], [87.0, 87.44], [87.0, 87.51], [100.0, 99.99], [101.0, 104.82], [108.0, 116.46], [119.0, 130.84], [142.0, 146.45], [146.0, 147.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 55.74, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.71, 28.81, 28.85, 28.88, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 21.25], ["cattle, bovinae", 19.15], ["music", 18.41]], [["music", 51.19], ["electronic music", 12.07], ["speech", 10.91]], [["speech", 48.65], ["music", 21.75], ["electronic music", 8.09]], [["speech", 22.39], ["cattle, bovinae", 21.75], ["moo", 12.78]], null], "duration": [-0.41, 2.64, -0.25, 0.51, 1.16, 1.07, 0.06, 4.75, 0.56, 0.3, 0.73, 0.25, 1.12, 0.35, 0.15, 0.51, 0.57, 0.44, 0.51, -0.01, 3.82, 8.46, 11.84, 4.45, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/pLqoZtmyxxk_filtered.json b/annotations_filtered/pLqoZtmyxxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad42a0b9068ed39f41eac6030d53cce4274710f8 --- /dev/null +++ b/annotations_filtered/pLqoZtmyxxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 11.25], [13.0, 14.52], [21.0, 24.97], [26.0, 27.03], [29.0, 36.54], [40.0, 42.09], [47.0, 47.43], [48.0, 47.9], [48.0, 47.98], [48.0, 53.08], [55.0, 58.35], [61.0, 74.82], [76.0, 80.76], [86.0, 87.0], [89.0, 124.93], [127.0, 127.87]], "keep_status": [true, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false], "silence_prob": [36.05, 0.0, 67.63, 0.0, 37.73, 54.43, 0.0, 0.0, 0.0, 33.63, 40.28, 38.9, 35.82, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 20.59], ["animal", 14.0], ["livestock, farm animals, working animals", 9.72]], null, null, null, [["music", 58.58], ["synthesizer", 7.48], ["speech", 4.71]], null, null, null, null, [["speech", 26.8], ["music", 22.17], ["cattle, bovinae", 5.0]], [["speech", 25.14], ["music", 19.2], ["radio", 7.16]], [["speech", 34.35], ["music", 31.84], ["radio", 3.98]], [["livestock, farm animals, working animals", 19.33], ["cattle, bovinae", 19.3], ["moo", 18.03]], null, null, null], "duration": [10.25, 1.52, 3.97, 1.03, 7.54, 2.09, 0.43, -0.1, -0.02, 5.08, 3.35, 13.82, 4.76, 1.0, 35.93, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/pLra48c-SuA_filtered.json b/annotations_filtered/pLra48c-SuA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9aa77b8523c6b5f2247fb11de364e5f81c88d3ce --- /dev/null +++ b/annotations_filtered/pLra48c-SuA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 49.33], [52.0, 52.83], [54.0, 57.94], [66.0, 66.55], [68.0, 76.89], [79.0, 78.95], [81.0, 89.8]], "keep_status": [false, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 41.28, 0.0, 34.58, 0.0, 31.7], "audiomae_on_audioset": [null, null, [["music", 40.33], ["ambient music", 15.48], ["gong", 11.91]], null, [["rumble", 30.04], ["music", 14.13], ["hum", 12.27]], null, [["music", 30.99], ["hum", 20.05], ["mains hum", 11.59]]], "duration": [40.33, 0.83, 3.94, 0.55, 8.89, -0.05, 8.8]} \ No newline at end of file diff --git a/annotations_filtered/pM87ObBNOk4_filtered.json b/annotations_filtered/pM87ObBNOk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..622886fa5781820012a7f0783e13b4334f24a7d1 --- /dev/null +++ b/annotations_filtered/pM87ObBNOk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 67.98], [71.0, 70.95], [75.0, 75.24], [88.0, 88.48], [91.0, 95.86], [96.0, 97.02]], "keep_status": [false, false, false, false, true, false], "silence_prob": [40.04, 0.0, 0.0, 0.0, 37.02, 0.0], "audiomae_on_audioset": [[["speech", 55.52], ["sidetone", 10.56], ["whip", 5.76]], null, null, null, [["frog", 17.07], ["fart", 15.19], ["grunt", 8.85]], null], "duration": [17.98, -0.05, 0.24, 0.48, 4.86, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/pMPJV8sYt7k_filtered.json b/annotations_filtered/pMPJV8sYt7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20e058089e1ca3b66ee22f9d947ef069dbe09822 --- /dev/null +++ b/annotations_filtered/pMPJV8sYt7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.11], [5.0, 6.29], [7.0, 8.11], [10.0, 11.47], [18.0, 19.33], [22.0, 24.44], [29.0, 33.64], [36.0, 38.4], [41.0, 41.22], [42.0, 42.33], [44.0, 44.51], [45.0, 45.62], [46.0, 46.68], [48.0, 50.89], [55.0, 59.34], [64.0, 66.01], [69.0, 72.45], [74.0, 79.86], [82.0, 92.1], [96.0, 103.84], [110.0, 114.88], [115.0, 116.28], [118.0, 119.64], [121.0, 121.98], [123.0, 122.82], [123.0, 124.34], [127.0, 127.68], [129.0, 129.76], [131.0, 138.38], [141.0, 142.18], [143.0, 149.99], [153.0, 180.17]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 82.07, 35.65, 40.84, 0.0, 0.0, 0.0, 0.0, 0.0, 47.74, 40.21, 35.81, 32.37, 32.1, 32.93, 32.31, 34.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.7, 0.0, 54.83, 31.33], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 69.49], ["didgeridoo", 8.17], ["speech", 3.6]], [["music", 59.31], ["mantra", 4.89], ["singing bowl", 2.45]], null, null, null, null, null, [["music", 36.91], ["marimba, xylophone", 5.92], ["glockenspiel", 5.38]], [["music", 49.07], ["musical instrument", 5.41], ["guitar", 4.29]], [["didgeridoo", 48.94], ["music", 29.82], ["musical instrument", 6.48]], [["music", 40.48], ["didgeridoo", 31.89], ["theremin", 6.59]], [["music", 53.61], ["musical instrument", 7.58], ["carnatic music", 7.32]], [["music", 67.2], ["didgeridoo", 26.93], ["speech", 1.16]], [["music", 62.25], ["didgeridoo", 33.74], ["musical instrument", 0.56]], [["music", 80.18], ["didgeridoo", 7.36], ["singing", 1.51]], null, null, null, null, null, null, null, null, null, null, [["music", 91.59], ["didgeridoo", 3.63], ["musical instrument", 0.52]]], "duration": [0.11, 1.29, 1.11, 1.47, 1.33, 2.44, 4.64, 2.4, 0.22, 0.33, 0.51, 0.62, 0.68, 2.89, 4.34, 2.01, 3.45, 5.86, 10.1, 7.84, 4.88, 1.28, 1.64, 0.98, -0.18, 1.34, 0.68, 0.76, 7.38, 1.18, 6.99, 27.17]} \ No newline at end of file diff --git a/annotations_filtered/pMQxW1t8guI_filtered.json b/annotations_filtered/pMQxW1t8guI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b9b22907b7b218c326fd04f9b1d83c8e000a480 --- /dev/null +++ b/annotations_filtered/pMQxW1t8guI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [4.0, 7.89], [9.0, 9.88], [10.0, 16.21], [17.0, 19.65], [21.0, 27.01], [28.0, 28.78], [31.0, 38.7], [42.0, 43.71], [45.0, 45.23], [46.0, 47.14], [48.0, 50.77], [55.0, 91.59], [93.0, 123.21], [124.0, 135.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 93.6, 0.0, 99.56, 99.99, 99.36, 0.0, 99.96, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 33.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.34], ["mains hum", 13.09], ["speech", 11.69]]], "duration": [0.34, 3.89, 0.88, 6.21, 2.65, 6.01, 0.78, 7.7, 1.71, 0.23, 1.14, 2.77, 36.59, 30.21, 11.43]} \ No newline at end of file diff --git a/annotations_filtered/pMTlNUKE7yg_filtered.json b/annotations_filtered/pMTlNUKE7yg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..853e0a8d67a43877e13931b0be0c4ce19d6e0476 --- /dev/null +++ b/annotations_filtered/pMTlNUKE7yg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.38], [9.0, 9.53], [11.0, 11.16], [12.0, 48.34], [50.0, 51.95], [55.0, 58.46], [60.0, 59.71], [64.0, 64.69], [67.0, 75.02], [88.0, 89.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.07, 0.0, 0.0, 34.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 80.59], ["throbbing", 3.88], ["didgeridoo", 2.18]], null, null, [["music", 48.1], ["speech", 17.45], ["throbbing", 5.31]], null], "duration": [0.38, 0.53, 0.16, 36.34, 1.95, 3.46, -0.29, 0.69, 8.02, 1.97]} \ No newline at end of file diff --git a/annotations_filtered/pMoxr-jgd58_filtered.json b/annotations_filtered/pMoxr-jgd58_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4178e978318a2ff2eed10c5781ed2cf0e8c2e5c0 --- /dev/null +++ b/annotations_filtered/pMoxr-jgd58_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.64], [12.0, 13.1], [14.0, 15.21], [17.0, 16.93], [18.0, 18.62], [19.0, 33.83], [34.0, 35.97], [37.0, 38.58], [41.0, 42.62], [44.0, 44.17], [53.0, 54.09], [55.0, 57.69], [58.0, 60.98], [63.0, 66.5], [77.0, 78.09], [80.0, 81.08], [83.0, 84.0], [85.0, 85.94], [88.0, 99.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0, 0.0, 0.0, 0.0, 0.0, 78.89, 57.09, 38.6, 0.0, 0.0, 0.0, 0.0, 32.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.85], ["didgeridoo", 14.41], ["mains hum", 5.29]], null, null, null, null, [["music", 33.1], ["speech", 25.86], ["hum", 8.35]]], "duration": [0.64, 1.1, 1.21, -0.07, 0.62, 14.83, 1.97, 1.58, 1.62, 0.17, 1.09, 2.69, 2.98, 3.5, 1.09, 1.08, 1.0, 0.94, 11.42]} \ No newline at end of file diff --git a/annotations_filtered/pMrk3l8El24_filtered.json b/annotations_filtered/pMrk3l8El24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6190e0e5c1a31ddfd47a8b806cd2a6b05ca7ccf --- /dev/null +++ b/annotations_filtered/pMrk3l8El24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.1], [9.0, 11.28], [23.0, 38.03], [39.0, 51.7], [52.0, 53.64], [57.0, 57.59], [62.0, 65.43], [67.0, 74.12], [77.0, 77.82], [79.0, 79.66], [81.0, 81.33], [83.0, 84.55], [96.0, 96.33], [98.0, 99.82], [104.0, 104.08], [107.0, 109.54], [112.0, 114.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.97, 40.66, 57.48, 0.0, 0.0, 52.98, 94.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 79.41], "audiomae_on_audioset": [null, [["speech", 50.9], ["music", 17.85], ["boing", 3.71]], [["speech", 35.71], ["whack, thwack", 30.01], ["breaking", 9.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.1, 2.28, 15.03, 12.7, 1.64, 0.59, 3.43, 7.12, 0.82, 0.66, 0.33, 1.55, 0.33, 1.82, 0.08, 2.54, 2.07]} \ No newline at end of file diff --git a/annotations_filtered/pMx5aSV7qFg_filtered.json b/annotations_filtered/pMx5aSV7qFg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2bd6424ec7dea026578746f21556234c84badde --- /dev/null +++ b/annotations_filtered/pMx5aSV7qFg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.97], [7.0, 10.27], [11.0, 14.44], [15.0, 17.98], [18.0, 21.02], [23.0, 30.37], [32.0, 33.99], [36.0, 40.29], [41.0, 65.26], [70.0, 76.05], [76.0, 77.87], [80.0, 79.56], [80.0, 96.16], [100.0, 110.3], [112.0, 112.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.42, 92.48, 91.64, 94.81, 93.91, 0.0, 91.98, 37.52, 33.58, 0.0, 0.0, 35.24, 33.8, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 58.83], ["throbbing", 16.19], ["mains hum", 15.43]], [["music", 32.15], ["hum", 21.67], ["speech", 17.32]], null, null, [["speech", 39.58], ["music", 23.44], ["sidetone", 14.41]], [["music", 55.8], ["speech", 11.51], ["cacophony", 6.49]], null], "duration": [1.97, 3.27, 3.44, 2.98, 3.02, 7.37, 1.99, 4.29, 24.26, 6.05, 1.87, -0.44, 16.16, 10.3, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/pN5RlyFWJBA_filtered.json b/annotations_filtered/pN5RlyFWJBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abd30550909167e3b065ed0882654637b6f333da --- /dev/null +++ b/annotations_filtered/pN5RlyFWJBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 38.28], [42.0, 42.3], [45.0, 45.3], [49.0, 49.67], [51.0, 52.34], [56.0, 72.71], [77.0, 78.48], [80.0, 83.47], [88.0, 131.63]], "keep_status": [true, false, false, false, false, true, false, false, false], "silence_prob": [32.38, 0.0, 0.0, 0.0, 0.0, 34.26, 0.0, 34.0, 0.0], "audiomae_on_audioset": [[["music", 19.69], ["didgeridoo", 11.66], ["fly, housefly", 11.16]], null, null, null, null, [["insect", 29.22], ["fly, housefly", 19.71], ["music", 12.12]], null, [["music", 69.0], ["throbbing", 4.79], ["electronic music", 3.45]], null], "duration": [15.28, 0.3, 0.3, 0.67, 1.34, 16.71, 1.48, 3.47, 43.63]} \ No newline at end of file diff --git a/annotations_filtered/pN7yX45G6WA_filtered.json b/annotations_filtered/pN7yX45G6WA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c6286e2e50261e0e04a2c0d204701202eaf9b67 --- /dev/null +++ b/annotations_filtered/pN7yX45G6WA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.94], [7.0, 6.99], [7.0, 12.29], [13.0, 18.47], [25.0, 25.02], [26.0, 26.0], [27.0, 27.26], [29.0, 29.52], [34.0, 36.02], [38.0, 38.79], [40.0, 40.69], [42.0, 57.6], [70.0, 74.46], [75.0, 84.08], [85.0, 91.03], [92.0, 92.99], [94.0, 94.39], [98.0, 98.93], [101.0, 103.32], [105.0, 107.32], [109.0, 108.67], [110.0, 110.47], [116.0, 117.36], [119.0, 120.11], [124.0, 124.31], [127.0, 128.14], [130.0, 129.86], [130.0, 131.79], [136.0, 142.16], [147.0, 148.47]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.56, 36.6, 0.0, 0.0, 0.0, 0.0, 49.92, 0.0, 0.0, 31.97, 31.72, 39.58, 46.86, 0.0, 0.0, 0.0, 52.39, 64.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.31, 0.0], "audiomae_on_audioset": [null, null, [["music", 39.13], ["speech", 20.89], ["theremin", 4.37]], [["music", 73.09], ["didgeridoo", 11.36], ["musical instrument", 6.09]], null, null, null, null, [["speech", 12.38], ["creak", 11.77], ["fly, housefly", 11.75]], null, null, [["music", 71.99], ["didgeridoo", 10.0], ["speech", 3.62]], [["music", 50.36], ["boing", 29.89], ["speech", 2.44]], [["didgeridoo", 69.47], ["music", 9.56], ["speech", 6.69]], [["didgeridoo", 27.37], ["music", 17.37], ["radio", 6.91]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 52.17], ["didgeridoo", 11.49], ["theremin", 7.61]], null], "duration": [0.94, -0.01, 5.29, 5.47, 0.02, 0.0, 0.26, 0.52, 2.02, 0.79, 0.69, 15.6, 4.46, 9.08, 6.03, 0.99, 0.39, 0.93, 2.32, 2.32, -0.33, 0.47, 1.36, 1.11, 0.31, 1.14, -0.14, 1.79, 6.16, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/pNJRoSfVZxo_filtered.json b/annotations_filtered/pNJRoSfVZxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e3a58ac401502b8a65b07896988a707070eac79 --- /dev/null +++ b/annotations_filtered/pNJRoSfVZxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.83], [22.0, 39.28], [40.0, 45.25], [46.0, 46.43], [47.0, 47.28], [48.0, 57.25], [58.0, 59.12]], "keep_status": [false, false, true, false, false, true, false], "silence_prob": [0.0, 30.58, 30.6, 0.0, 0.0, 30.24, 0.0], "audiomae_on_audioset": [null, [["brass instrument", 32.15], ["trombone", 31.84], ["music", 15.84]], [["speech", 15.05], ["vehicle", 11.98], ["music", 10.29]], null, null, [["fly, housefly", 10.61], ["hum", 10.1], ["mains hum", 7.94]], null], "duration": [0.83, 17.28, 5.25, 0.43, 0.28, 9.25, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/pOPWdQO9bK4_filtered.json b/annotations_filtered/pOPWdQO9bK4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b213e7d9e530015712cfb98d8b9555aea2e0cfa --- /dev/null +++ b/annotations_filtered/pOPWdQO9bK4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.03], [11.0, 13.09], [16.0, 16.5], [22.0, 25.56], [29.0, 29.74], [31.0, 33.32], [38.0, 38.69], [43.0, 43.12], [46.0, 49.35], [51.0, 51.0], [52.0, 52.27], [54.0, 54.55], [55.0, 55.05], [59.0, 59.34], [61.0, 62.7]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.81, 0.0, 31.11, 0.0, 30.63, 0.0, 0.0, 36.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 79.29], ["boing", 9.94], ["radio", 3.05]], null, [["speech", 21.4], ["didgeridoo", 13.26], ["music", 7.18]], null, [["speech", 25.75], ["field recording", 21.39], ["fart", 13.77]], null, null, [["speech", 56.17], ["didgeridoo", 16.72], ["music", 3.69]], null, null, null, null, null, null], "duration": [0.03, 2.09, 0.5, 3.56, 0.74, 2.32, 0.69, 0.12, 3.35, 0.0, 0.27, 0.55, 0.05, 0.34, 1.7]} \ No newline at end of file diff --git a/annotations_filtered/pOQv_Ng3CaU_filtered.json b/annotations_filtered/pOQv_Ng3CaU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbd6c4658dc6aaac7e2d4c79ba44013004fab5c6 --- /dev/null +++ b/annotations_filtered/pOQv_Ng3CaU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 26.15], [28.0, 46.55], [48.0, 53.87], [54.0, 80.28], [83.0, 92.99], [94.0, 94.46], [98.0, 97.65], [100.0, 100.03], [101.0, 101.83], [103.0, 112.13], [113.0, 114.32], [117.0, 118.72], [119.0, 130.6], [132.0, 132.78], [136.0, 138.92], [140.0, 140.56], [141.0, 143.01], [143.0, 143.94], [146.0, 146.48], [148.0, 149.88], [152.0, 156.61], [158.0, 171.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [39.67, 33.27, 39.98, 32.21, 55.46, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 88.1, 0.0, 74.13, 0.0, 36.91, 0.0, 0.0, 0.0, 79.24, 69.74], "audiomae_on_audioset": [[["music", 78.02], ["singing", 3.6], ["classical music", 2.72]], [["theremin", 56.93], ["music", 37.44], ["musical instrument", 1.27]], [["music", 56.44], ["theremin", 33.92], ["musical instrument", 2.69]], [["music", 55.96], ["theremin", 35.5], ["keyboard (musical)", 1.31]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.85], ["speech", 10.51], ["didgeridoo", 4.87]], null, null, null, null, null], "duration": [12.15, 18.55, 5.87, 26.28, 9.99, 0.46, -0.35, 0.03, 0.83, 9.13, 1.32, 1.72, 11.6, 0.78, 2.92, 0.56, 2.01, 0.94, 0.48, 1.88, 4.61, 13.48]} \ No newline at end of file diff --git a/annotations_filtered/pOgf3IaWlgU_filtered.json b/annotations_filtered/pOgf3IaWlgU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..290fd34a2083c15c2b0ce64a7a6dadc3c604a250 --- /dev/null +++ b/annotations_filtered/pOgf3IaWlgU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.1], [5.0, 6.56], [18.0, 19.75], [21.0, 22.47], [25.0, 27.85], [32.0, 33.29], [38.0, 40.0], [41.0, 43.77], [47.0, 48.59], [50.0, 53.81], [55.0, 55.92], [58.0, 58.29], [60.0, 60.79], [66.0, 71.22], [77.0, 76.86], [78.0, 78.8], [84.0, 87.61], [89.0, 90.21], [93.0, 93.8], [97.0, 113.61], [115.0, 116.61], [119.0, 120.78], [121.0, 122.74], [124.0, 124.6], [126.0, 126.87], [128.0, 129.86], [134.0, 135.62], [137.0, 139.43], [140.0, 141.25], [143.0, 146.74], [149.0, 150.35], [152.0, 153.76], [157.0, 160.69], [163.0, 164.42], [166.0, 168.4], [169.0, 173.28], [174.0, 181.41], [182.0, 185.11], [186.0, 186.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 41.56, 0.0, 100.0, 93.6, 0.0, 90.78, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 100.0, 0.0, 0.0, 70.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.98, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 98.44, 95.09, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 67.15], ["speech", 17.44], ["hum", 4.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.1, 1.56, 1.75, 1.47, 2.85, 1.29, 2.0, 2.77, 1.59, 3.81, 0.92, 0.29, 0.79, 5.22, -0.14, 0.8, 3.61, 1.21, 0.8, 16.61, 1.61, 1.78, 1.74, 0.6, 0.87, 1.86, 1.62, 2.43, 1.25, 3.74, 1.35, 1.76, 3.69, 1.42, 2.4, 4.28, 7.41, 3.11, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/pPCq9SIyHqE_filtered.json b/annotations_filtered/pPCq9SIyHqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..966d56714e89d1943afc2ad355936b41b94426ea --- /dev/null +++ b/annotations_filtered/pPCq9SIyHqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.99], [6.0, 6.98], [8.0, 8.51], [11.0, 17.05], [21.0, 21.73], [24.0, 30.89], [34.0, 35.72], [37.0, 50.53], [53.0, 68.27], [71.0, 103.86], [104.0, 106.03], [107.0, 113.04], [113.0, 113.86], [116.0, 119.97], [121.0, 121.31], [122.0, 123.21], [126.0, 132.04], [133.0, 136.8], [142.0, 142.21]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 34.49, 0.0, 30.23, 0.0, 30.89, 34.16, 0.0, 32.22, 32.4, 0.0, 30.78, 0.0, 0.0, 32.25, 32.58, 0.0], "audiomae_on_audioset": [null, null, null, [["throbbing", 27.37], ["music", 27.01], ["hum", 22.3]], null, [["car", 37.44], ["vehicle", 20.77], ["hum", 7.95]], null, [["music", 79.3], ["hum", 3.51], ["throbbing", 3.39]], [["speech", 45.15], ["music", 23.19], ["door", 6.09]], null, [["music", 44.87], ["speech", 21.65], ["hum", 7.08]], [["music", 43.9], ["animal", 7.15], ["dog", 6.74]], null, [["speech", 27.1], ["music", 25.39], ["gunshot, gunfire", 10.73]], null, null, [["hum", 28.63], ["throbbing", 25.55], ["music", 24.48]], [["speech", 31.33], ["music", 12.52], ["hum", 11.75]], null], "duration": [0.99, 0.98, 0.51, 6.05, 0.73, 6.89, 1.72, 13.53, 15.27, 32.86, 2.03, 6.04, 0.86, 3.97, 0.31, 1.21, 6.04, 3.8, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/pPDz5TWc0Zw_filtered.json b/annotations_filtered/pPDz5TWc0Zw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c387df99a22ece9cb0bd8862bea8c7ac5ec454a8 --- /dev/null +++ b/annotations_filtered/pPDz5TWc0Zw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.51], [6.0, 7.62], [9.0, 12.61], [13.0, 18.74], [20.0, 21.69], [23.0, 60.69], [61.0, 60.72], [61.0, 60.96], [62.0, 63.75], [65.0, 66.19], [67.0, 69.15], [70.0, 74.04], [75.0, 76.87], [79.0, 81.67], [83.0, 84.47], [86.0, 86.54], [87.0, 100.43], [101.0, 103.91], [107.0, 115.79], [117.0, 119.55], [120.0, 123.03], [123.0, 124.58]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.0, 0.0, 48.06, 37.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 99.65, 0.0, 100.0, 0.0, 0.0, 99.93, 99.96, 99.94, 98.59, 97.11, 0.0], "audiomae_on_audioset": [[["music", 29.44], ["effects unit", 24.39], ["distortion", 12.77]], null, [["music", 50.12], ["didgeridoo", 15.28], ["synthesizer", 4.5]], [["livestock, farm animals, working animals", 40.1], ["cattle, bovinae", 35.2], ["moo", 21.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.51, 1.62, 3.61, 5.74, 1.69, 37.69, -0.28, -0.04, 1.75, 1.19, 2.15, 4.04, 1.87, 2.67, 1.47, 0.54, 13.43, 2.91, 8.79, 2.55, 3.03, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/pPZ7eetT6oI_filtered.json b/annotations_filtered/pPZ7eetT6oI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/pPZ7eetT6oI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/pPZMrs3QGug_filtered.json b/annotations_filtered/pPZMrs3QGug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7400f5568a0257ec73d7cb7a024b0f87eb8f5a0 --- /dev/null +++ b/annotations_filtered/pPZMrs3QGug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.61], [10.0, 9.88], [11.0, 12.24], [16.0, 19.16], [30.0, 33.78], [36.0, 36.15], [40.0, 40.63], [42.0, 44.09], [46.0, 45.84], [48.0, 48.73], [50.0, 50.67], [54.0, 54.97], [60.0, 66.65], [69.0, 69.48], [73.0, 75.41], [78.0, 79.24], [80.0, 81.94], [82.0, 84.38], [85.0, 87.15], [88.0, 113.31], [115.0, 115.92]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 38.52, 98.1, 0.0, 0.0, 33.11, 0.0, 0.0, 0.0, 0.0, 42.53, 0.0, 63.96, 0.0, 0.0, 44.49, 47.31, 32.9, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 27.72], ["fart", 17.64], ["sidetone", 16.13]], null, null, null, [["burping, eructation", 78.06], ["speech", 14.2], ["male speech, man speaking", 2.64]], null, null, null, null, [["hum", 25.85], ["mains hum", 19.28], ["sine wave", 18.66]], null, null, null, null, [["speech", 51.32], ["sidetone", 33.15], ["sine wave", 3.28]], [["sine wave", 50.85], ["chirp tone", 33.31], ["hum", 4.87]], [["speech", 49.76], ["thunk", 7.86], ["sidetone", 6.4]], null], "duration": [0.61, -0.12, 1.24, 3.16, 3.78, 0.15, 0.63, 2.09, -0.16, 0.73, 0.67, 0.97, 6.65, 0.48, 2.41, 1.24, 1.94, 2.38, 2.15, 25.31, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/pPcxCk8YBVs_filtered.json b/annotations_filtered/pPcxCk8YBVs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b3212c005dd0feacd1b57a400afcb769ad2663d --- /dev/null +++ b/annotations_filtered/pPcxCk8YBVs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.3], [27.0, 27.18], [29.0, 29.35], [30.0, 37.86], [40.0, 40.15], [42.0, 43.04], [44.0, 63.96], [65.0, 65.5], [68.0, 69.6], [72.0, 77.31], [82.0, 87.42], [90.0, 91.13], [93.0, 108.8], [111.0, 126.37], [129.0, 144.78], [145.0, 146.28], [148.0, 148.17], [150.0, 150.01], [151.0, 151.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.71, 0.0, 0.0, 30.6, 0.0, 0.0, 30.41, 32.54, 0.0, 29.29, 29.05, 33.48, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 41.59], ["speech", 20.68], ["hum", 9.75]], null, null, [["mains hum", 39.19], ["hum", 19.46], ["music", 12.59]], null, null, [["throbbing", 28.13], ["music", 27.19], ["hum", 21.72]], [["rumble", 28.22], ["hum", 18.38], ["mains hum", 17.07]], null, [["music", 34.86], ["mains hum", 24.31], ["hum", 22.1]], [["music", 77.47], ["whip", 3.09], ["outside, rural or natural", 2.2]], [["music", 66.19], ["scary music", 8.09], ["ambient music", 4.11]], null, null, null, null], "duration": [1.3, 0.18, 0.35, 7.86, 0.15, 1.04, 19.96, 0.5, 1.6, 5.31, 5.42, 1.13, 15.8, 15.37, 15.78, 1.28, 0.17, 0.01, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/pPjYhPGkhGA_filtered.json b/annotations_filtered/pPjYhPGkhGA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a27a14bc8edc8c3b6bf16fd3cf9270ec4d670a0f --- /dev/null +++ b/annotations_filtered/pPjYhPGkhGA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.27], [12.0, 14.17], [17.0, 19.8], [22.0, 23.57], [25.0, 26.99], [28.0, 30.6], [32.0, 44.88], [49.0, 53.57], [54.0, 58.08], [59.0, 60.13], [61.0, 63.59]], "keep_status": [false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [35.69, 43.82, 51.99, 0.0, 0.0, 36.2, 43.82, 33.6, 33.01, 0.0, 33.9], "audiomae_on_audioset": [[["noise", 50.79], ["hum", 17.65], ["white noise", 7.83]], [["speech", 35.04], ["sine wave", 24.89], ["sidetone", 22.83]], null, null, null, [["speech", 70.65], ["sidetone", 6.62], ["hum", 1.84]], [["hum", 22.89], ["music", 21.77], ["mains hum", 12.37]], [["music", 50.41], ["ambient music", 11.16], ["synthesizer", 5.99]], [["music", 70.07], ["ambient music", 5.16], ["synthesizer", 2.4]], null, [["hum", 22.54], ["music", 21.21], ["mains hum", 12.62]]], "duration": [5.27, 2.17, 2.8, 1.57, 1.99, 2.6, 12.88, 4.57, 4.08, 1.13, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/pPuAKVnqJdk_filtered.json b/annotations_filtered/pPuAKVnqJdk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b47c5b6187311f3a1a4c56d1cd67856ce536f5aa --- /dev/null +++ b/annotations_filtered/pPuAKVnqJdk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.97], [7.0, 25.74], [26.0, 69.4]], "keep_status": [false, false, false], "silence_prob": [0.0, 38.0, 0.0], "audiomae_on_audioset": [null, [["music", 37.59], ["speech", 32.07], ["hum", 12.99]], null], "duration": [0.97, 18.74, 43.4]} \ No newline at end of file diff --git a/annotations_filtered/pQ68ImO9dBU_filtered.json b/annotations_filtered/pQ68ImO9dBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..589789f53e46a631e1f69fc92ae5a94e93875ee0 --- /dev/null +++ b/annotations_filtered/pQ68ImO9dBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [7.0, 8.41], [9.0, 10.89], [14.0, 19.63], [20.0, 21.29], [22.0, 23.4], [26.0, 28.32], [30.0, 31.06], [32.0, 34.87], [37.0, 44.41], [45.0, 48.32], [51.0, 52.0], [56.0, 57.4], [59.0, 59.1], [61.0, 62.95], [64.0, 64.42], [67.0, 67.14], [68.0, 69.9], [71.0, 77.75], [79.0, 82.38], [83.0, 85.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 1.41, 1.89, 5.63, 1.29, 1.4, 2.32, 1.06, 2.87, 7.41, 3.32, 1.0, 1.4, 0.1, 1.95, 0.42, 0.14, 1.9, 6.75, 3.38, 2.58]} \ No newline at end of file diff --git a/annotations_filtered/pQT-QFy5Nig_filtered.json b/annotations_filtered/pQT-QFy5Nig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d3862651dcb47cbbafb7128359ca1d1c04b2d17 --- /dev/null +++ b/annotations_filtered/pQT-QFy5Nig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 66.65], [114.0, 115.91], [157.0, 190.48], [207.0, 210.95], [215.0, 216.65], [217.0, 216.72], [217.0, 216.89], [219.0, 220.01], [224.0, 228.55]], "keep_status": [false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.66, 0.0, 0.0, 0.0, 0.0, 31.4], "audiomae_on_audioset": [null, null, null, [["music", 52.53], ["quack", 6.32], ["burst, pop", 3.06]], null, null, null, null, [["music", 46.03], ["speech", 23.76], ["sidetone", 11.33]]], "duration": [0.65, 1.91, 33.48, 3.95, 1.65, -0.28, -0.11, 1.01, 4.55]} \ No newline at end of file diff --git a/annotations_filtered/pQeZSHyCe4Q_filtered.json b/annotations_filtered/pQeZSHyCe4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3afb5687ffd4aaae966417ebd891a4a635d2eab1 --- /dev/null +++ b/annotations_filtered/pQeZSHyCe4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 40.44], [44.0, 45.59], [50.0, 64.54], [68.0, 69.16], [69.0, 85.78], [87.0, 89.78]], "keep_status": [false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 34.03, 0.0, 29.23, 36.52], "audiomae_on_audioset": [null, null, [["whack, thwack", 25.46], ["hum", 24.0], ["music", 11.71]], null, [["music", 29.79], ["speech", 28.73], ["mains hum", 19.11]], [["music", 29.75], ["hum", 13.13], ["mains hum", 12.89]]], "duration": [31.44, 1.59, 14.54, 1.16, 16.78, 2.78]} \ No newline at end of file diff --git a/annotations_filtered/pQv0ZtpRdNk_filtered.json b/annotations_filtered/pQv0ZtpRdNk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..131420d278c9167687bc5e7c378ce4ce06f489f9 --- /dev/null +++ b/annotations_filtered/pQv0ZtpRdNk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [4.0, 6.15], [7.0, 9.53], [15.0, 20.11], [24.0, 24.51], [32.0, 32.76], [35.0, 39.24], [41.0, 44.02], [46.0, 47.48], [49.0, 52.02], [55.0, 55.46], [59.0, 59.95], [62.0, 62.92], [63.0, 63.1], [64.0, 65.18], [67.0, 68.4], [69.0, 71.46], [72.0, 75.19], [77.0, 79.39], [82.0, 82.7], [87.0, 87.78], [92.0, 93.5], [98.0, 102.96], [108.0, 116.43], [120.0, 120.02], [124.0, 129.12], [132.0, 132.48], [134.0, 135.38], [136.0, 136.76], [138.0, 139.67], [143.0, 143.16], [145.0, 145.99], [148.0, 149.54]], "keep_status": [false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 78.89, 68.67, 51.12, 0.0, 0.0, 32.62, 32.4, 0.0, 41.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 55.96, 52.16, 0.0, 0.0, 0.0, 42.69, 40.07, 0.0, 36.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["crowd", 26.19], ["cheering", 9.75], ["vehicle", 8.61]], [["vehicle", 22.58], ["car", 5.8], ["motorcycle", 5.25]], null, [["speech", 45.3], ["music", 21.73], ["busy signal", 2.81]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.08], ["singing bowl", 15.16], ["theremin", 10.77]], [["music", 46.14], ["ambient music", 12.3], ["synthesizer", 5.73]], null, [["music", 41.32], ["whale vocalization", 20.14], ["theremin", 16.36]], null, null, null, null, null, null, null], "duration": [0.72, 2.15, 2.53, 5.11, 0.51, 0.76, 4.24, 3.02, 1.48, 3.02, 0.46, 0.95, 0.92, 0.1, 1.18, 1.4, 2.46, 3.19, 2.39, 0.7, 0.78, 1.5, 4.96, 8.43, 0.02, 5.12, 0.48, 1.38, 0.76, 1.67, 0.16, 0.99, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/pR8Lt5DyU88_filtered.json b/annotations_filtered/pR8Lt5DyU88_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd2417176084f3ac38ae1fc80f3411fba130c716 --- /dev/null +++ b/annotations_filtered/pR8Lt5DyU88_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.51], [24.0, 24.6], [35.0, 35.36], [47.0, 49.91], [58.0, 58.21], [65.0, 70.73], [90.0, 92.8], [114.0, 114.57], [122.0, 123.42], [127.0, 127.18], [129.0, 130.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 48.95, 0.0, 56.18, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 62.42], ["synthesizer", 7.26], ["musical instrument", 2.53]], null, null, null, null, null, null, null], "duration": [0.51, 0.6, 0.36, 2.91, 0.21, 5.73, 2.8, 0.57, 1.42, 0.18, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/pRyH7gS__WI_filtered.json b/annotations_filtered/pRyH7gS__WI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef47d4f55ec739b0e08f618dd97725f8b0571646 --- /dev/null +++ b/annotations_filtered/pRyH7gS__WI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 97.58], [103.0, 124.85], [127.0, 164.2], [167.0, 186.27], [187.0, 188.57], [190.0, 193.8], [194.0, 195.44]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 34.85, 0.0, 31.48, 0.0, 95.91, 0.0], "audiomae_on_audioset": [null, [["hum", 48.23], ["mains hum", 34.57], ["music", 8.04]], null, [["hum", 54.64], ["mains hum", 17.02], ["throbbing", 11.37]], null, null, null], "duration": [51.58, 21.85, 37.2, 19.27, 1.57, 3.8, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/pS-KE1LXpXU_filtered.json b/annotations_filtered/pS-KE1LXpXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f3a098c0f488cb57e6aac32cfc8112084800b65 --- /dev/null +++ b/annotations_filtered/pS-KE1LXpXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.37], [3.0, 4.53], [5.0, 6.13], [9.0, 12.18], [14.0, 14.88], [23.0, 23.52], [25.0, 25.34], [29.0, 29.56], [30.0, 32.22], [35.0, 36.69], [42.0, 42.67], [45.0, 53.0], [54.0, 54.84], [56.0, 57.28], [61.0, 61.16], [66.0, 66.85], [68.0, 68.44], [70.0, 70.34], [71.0, 71.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 41.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 87.59], ["speech", 8.8], ["telephone", 0.72]], null, null, null, null, null, null, null], "duration": [1.37, 1.53, 1.13, 3.18, 0.88, 0.52, 0.34, 0.56, 2.22, 1.69, 0.67, 8.0, 0.84, 1.28, 0.16, 0.85, 0.44, 0.34, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/pSzusQmqyxE_filtered.json b/annotations_filtered/pSzusQmqyxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1558df9ccfaf9475f10db8c83e6bebba031a93fa --- /dev/null +++ b/annotations_filtered/pSzusQmqyxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 25.27], [27.0, 27.63], [28.0, 28.75]], "keep_status": [false, false, false], "silence_prob": [75.55, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [16.27, 0.63, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/pT9GPloXjA8_filtered.json b/annotations_filtered/pT9GPloXjA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f7e7b819721c0343a495a66f9c8b5d9c9a9dc40 --- /dev/null +++ b/annotations_filtered/pT9GPloXjA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [2.0, 1.83], [4.0, 13.8], [16.0, 16.55], [20.0, 20.65], [21.0, 21.84], [23.0, 24.17], [27.0, 27.46], [28.0, 30.0], [31.0, 32.43], [34.0, 35.11], [36.0, 39.65], [42.0, 43.38], [49.0, 49.64], [52.0, 51.71], [52.0, 54.04], [55.0, 56.1], [61.0, 61.28], [66.0, 66.68], [67.0, 75.59], [78.0, 78.11], [79.0, 79.78], [83.0, 84.11], [84.0, 84.86], [85.0, 87.54], [94.0, 94.88], [100.0, 100.45], [109.0, 111.59], [117.0, 118.2], [127.0, 127.62], [139.0, 139.77], [156.0, 171.22], [172.0, 173.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 45.95, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 0.0, 0.0, 52.05, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 40.75, 0.0, 0.0, 0.0, 0.0, 41.91, 0.0, 0.0, 40.36, 0.0, 0.0, 0.0, 39.07, 0.0], "audiomae_on_audioset": [null, null, [["speech", 62.95], ["sidetone", 16.3], ["noise", 3.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 79.75], ["sidetone", 10.63], ["male speech, man speaking", 1.32]], null, null, null, null, [["speech", 74.31], ["speech synthesizer", 7.24], ["sidetone", 6.19]], null, null, [["speech", 65.06], ["music", 12.29], ["inside, small room", 3.01]], null, null, null, [["heart sounds, heartbeat", 21.45], ["speech", 17.29], ["hum", 17.01]], null], "duration": [0.35, -0.17, 9.8, 0.55, 0.65, 0.84, 1.17, 0.46, 2.0, 1.43, 1.11, 3.65, 1.38, 0.64, -0.29, 2.04, 1.1, 0.28, 0.68, 8.59, 0.11, 0.78, 1.11, 0.86, 2.54, 0.88, 0.45, 2.59, 1.2, 0.62, 0.77, 15.22, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/pTCTgL7_9gY_filtered.json b/annotations_filtered/pTCTgL7_9gY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7514f2809ad05e855a4514457b57da6ef45b313 --- /dev/null +++ b/annotations_filtered/pTCTgL7_9gY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.68], [14.0, 16.97], [18.0, 19.67], [23.0, 24.88], [28.0, 30.2], [32.0, 32.68], [36.0, 37.69], [40.0, 40.61], [41.0, 43.51], [47.0, 48.2], [53.0, 56.59], [57.0, 58.31], [60.0, 60.78], [62.0, 63.68], [65.0, 66.29], [67.0, 68.49], [73.0, 73.01], [74.0, 76.32], [77.0, 77.36], [80.0, 81.08], [81.0, 83.81], [85.0, 86.63], [89.0, 90.48], [99.0, 100.77], [101.0, 103.06], [106.0, 107.76], [112.0, 113.24], [118.0, 121.29], [123.0, 125.79], [127.0, 129.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 98.73, 0.0, 0.0, 99.97, 99.99, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.68, 2.97, 1.67, 1.88, 2.2, 0.68, 1.69, 0.61, 2.51, 1.2, 3.59, 1.31, 0.78, 1.68, 1.29, 1.49, 0.01, 2.32, 0.36, 1.08, 2.81, 1.63, 1.48, 1.77, 2.06, 1.76, 1.24, 3.29, 2.79, 2.51]} \ No newline at end of file diff --git a/annotations_filtered/pTptxpcYySI_filtered.json b/annotations_filtered/pTptxpcYySI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6876fa24dadcd9f5e542ce71b34c2f63bb487920 --- /dev/null +++ b/annotations_filtered/pTptxpcYySI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.41], [7.0, 8.67], [18.0, 18.49], [19.0, 20.68], [22.0, 22.11], [24.0, 25.3], [28.0, 28.16], [30.0, 30.92], [34.0, 36.61], [38.0, 41.94], [44.0, 44.9], [49.0, 49.77], [53.0, 57.47], [60.0, 64.45], [67.0, 67.24], [68.0, 68.69], [73.0, 73.43], [77.0, 78.93], [81.0, 81.46], [85.0, 87.71], [90.0, 90.86], [94.0, 100.84], [106.0, 115.86], [117.0, 121.56], [125.0, 126.37], [129.0, 131.19], [139.0, 142.4], [146.0, 148.05], [150.0, 153.89], [156.0, 157.17], [159.0, 162.33], [163.0, 167.51]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, true, true, false, false, false, false, false, true, false, true, true, false, false, true, true, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.04, 31.99, 0.0, 0.0, 35.06, 31.27, 0.0, 0.0, 0.0, 0.0, 0.0, 39.58, 0.0, 39.27, 35.35, 37.27, 0.0, 36.6, 39.57, 40.64, 35.79, 0.0, 30.1, 34.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 8.82], ["synthesizer", 6.36], ["hum", 6.1]], [["music", 38.78], ["hum", 15.4], ["musical instrument", 13.54]], null, null, [["hum", 33.54], ["throbbing", 22.8], ["music", 13.54]], [["music", 52.44], ["hum", 8.04], ["throbbing", 5.43]], null, null, null, null, null, [["hum", 31.11], ["throbbing", 15.79], ["music", 14.11]], null, [["music", 19.38], ["hum", 18.24], ["synthesizer", 17.28]], [["music", 39.77], ["hum", 11.09], ["throbbing", 9.22]], [["throbbing", 37.94], ["hum", 31.66], ["whale vocalization", 5.35]], null, [["hum", 32.83], ["throbbing", 14.14], ["rumble", 6.86]], [["speech", 18.06], ["music", 10.77], ["hum", 10.49]], [["hum", 44.9], ["throbbing", 27.89], ["mains hum", 14.21]], [["whale vocalization", 20.05], ["mains hum", 13.98], ["hum", 12.45]], null, [["eruption", 28.03], ["hum", 24.19], ["explosion", 9.37]], [["hum", 52.81], ["throbbing", 18.06], ["mains hum", 11.93]]], "duration": [0.41, 1.67, 0.49, 1.68, 0.11, 1.3, 0.16, 0.92, 2.61, 3.94, 0.9, 0.77, 4.47, 4.45, 0.24, 0.69, 0.43, 1.93, 0.46, 2.71, 0.86, 6.84, 9.86, 4.56, 1.37, 2.19, 3.4, 2.05, 3.89, 1.17, 3.33, 4.51]} \ No newline at end of file diff --git a/annotations_filtered/pTvbSVyWP9I_filtered.json b/annotations_filtered/pTvbSVyWP9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db28a7c87543f379a9d425e38094f27725428a50 --- /dev/null +++ b/annotations_filtered/pTvbSVyWP9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 48.54], [51.0, 80.57], [82.0, 88.13], [96.0, 114.96], [115.0, 115.05]], "keep_status": [true, false, true, true, false], "silence_prob": [33.28, 37.32, 40.14, 32.32, 0.0], "audiomae_on_audioset": [[["music", 25.45], ["hum", 18.05], ["throbbing", 11.54]], [["music", 51.88], ["throbbing", 24.78], ["hum", 9.93]], [["music", 29.12], ["hum", 27.86], ["mains hum", 8.43]], [["music", 38.17], ["speech", 6.66], ["whack, thwack", 6.28]], null], "duration": [24.54, 29.57, 6.13, 18.96, 0.05]} \ No newline at end of file diff --git a/annotations_filtered/pU3klLr1CPA_filtered.json b/annotations_filtered/pU3klLr1CPA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb8ffc2a9e6fb28ffedf5b53784c424a36127f59 --- /dev/null +++ b/annotations_filtered/pU3klLr1CPA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.96], [22.0, 41.32], [43.0, 45.84], [53.0, 55.86], [63.0, 66.51], [67.0, 69.2], [70.0, 75.46], [76.0, 79.98], [80.0, 83.62], [84.0, 87.86], [88.0, 91.0], [91.0, 95.94], [99.0, 111.01], [111.0, 114.96], [115.0, 133.91], [134.0, 137.37], [139.0, 160.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.21, 99.91, 99.99, 99.99, 99.99, 99.05, 100.0, 100.0, 70.02, 100.0, 86.82, 77.53, 99.96, 66.39, 81.53, 99.93, 73.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.96, 19.32, 2.84, 2.86, 3.51, 2.2, 5.46, 3.98, 3.62, 3.86, 3.0, 4.94, 12.01, 3.96, 18.91, 3.37, 21.19]} \ No newline at end of file diff --git a/annotations_filtered/pUPliO3qy04_filtered.json b/annotations_filtered/pUPliO3qy04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac3fe63dc4b00e1bfcd7c2da578c3b9c32ee4040 --- /dev/null +++ b/annotations_filtered/pUPliO3qy04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.42], [12.0, 14.62], [16.0, 18.57], [20.0, 23.62], [25.0, 28.36], [29.0, 31.72], [32.0, 33.88], [35.0, 36.88], [39.0, 45.52], [48.0, 53.25], [54.0, 65.58], [67.0, 67.64], [69.0, 70.73], [72.0, 76.52], [77.0, 79.0], [80.0, 83.08], [83.0, 88.82], [90.0, 95.91], [97.0, 99.32], [101.0, 101.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 61.27, 64.41, 65.91, 76.04, 75.39, 0.0, 0.0, 77.2, 72.75, 61.47, 0.0, 0.0, 45.24, 53.4, 74.29, 46.26, 73.36, 56.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.67], ["didgeridoo", 5.6], ["singing bowl", 4.97]], null, null, [["music", 44.5], ["theremin", 24.05], ["speech", 8.78]], null, null, null], "duration": [0.42, 2.62, 2.57, 3.62, 3.36, 2.72, 1.88, 1.88, 6.52, 5.25, 11.58, 0.64, 1.73, 4.52, 2.0, 3.08, 5.82, 5.91, 2.32, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/pUmu0VJuwOA_filtered.json b/annotations_filtered/pUmu0VJuwOA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2df7e248f1e53d00f41243fec9ffa19b2ff01345 --- /dev/null +++ b/annotations_filtered/pUmu0VJuwOA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.37], [4.0, 4.7], [5.0, 7.69], [10.0, 12.41], [13.0, 13.42], [15.0, 16.23], [17.0, 17.88], [34.0, 35.16], [37.0, 37.2], [40.0, 40.36], [50.0, 51.04], [55.0, 55.24], [55.0, 56.24], [58.0, 58.92], [60.0, 60.69], [63.0, 66.61], [68.0, 68.3], [69.0, 70.04], [83.0, 85.68], [86.0, 88.53], [89.0, 91.37], [94.0, 96.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 44.96, 50.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.01, 0.0, 0.0, 56.18, 51.18, 29.71, 40.19], "audiomae_on_audioset": [null, null, [["speech", 60.76], ["clang", 5.29], ["telephone", 4.3]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.38], ["radio", 10.17], ["music", 8.98]], null, null, null, null, [["music", 41.77], ["explosion", 14.0], ["speech", 10.95]], [["noise", 53.79], ["radio", 12.57], ["sidetone", 7.12]]], "duration": [1.37, 0.7, 2.69, 2.41, 0.42, 1.23, 0.88, 1.16, 0.2, 0.36, 1.04, 0.24, 1.24, 0.92, 0.69, 3.61, 0.3, 1.04, 2.68, 2.53, 2.37, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/pUtdFHAAGhE_filtered.json b/annotations_filtered/pUtdFHAAGhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bbdc322bd6580f8c7609cb1a1f16149e9a30c69 --- /dev/null +++ b/annotations_filtered/pUtdFHAAGhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [7.0, 8.14], [20.0, 21.3], [25.0, 26.99], [30.0, 30.96], [33.0, 33.94], [49.0, 50.92], [53.0, 53.42], [54.0, 54.87], [67.0, 67.78], [71.0, 71.66], [73.0, 73.58], [75.0, 75.56], [91.0, 92.26], [95.0, 95.55], [100.0, 99.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 1.14, 1.3, 1.99, 0.96, 0.94, 1.92, 0.42, 0.87, 0.78, 0.66, 0.58, 0.56, 1.26, 0.55, -0.38]} \ No newline at end of file diff --git a/annotations_filtered/pV2y0et0TT4_filtered.json b/annotations_filtered/pV2y0et0TT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e012f2673913cc66ad82858e6a1d3292e7dff874 --- /dev/null +++ b/annotations_filtered/pV2y0et0TT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 26.77], [30.0, 31.18], [31.0, 32.05], [37.0, 43.75], [56.0, 65.1], [66.0, 77.3], [79.0, 79.62], [81.0, 94.86], [97.0, 121.42]], "keep_status": [false, false, false, false, false, true, false, false, true], "silence_prob": [51.5, 0.0, 0.0, 60.6, 30.81, 32.46, 0.0, 30.68, 32.21], "audiomae_on_audioset": [null, null, null, null, [["music", 41.53], ["theremin", 29.99], ["synthesizer", 5.18]], [["music", 49.43], ["musical instrument", 12.0], ["brass instrument", 5.92]], null, [["music", 58.56], ["musical instrument", 9.84], ["brass instrument", 7.08]], [["music", 44.19], ["brass instrument", 14.43], ["musical instrument", 9.55]]], "duration": [10.77, 1.18, 1.05, 6.75, 9.1, 11.3, 0.62, 13.86, 24.42]} \ No newline at end of file diff --git a/annotations_filtered/pVB70-zPv5E_filtered.json b/annotations_filtered/pVB70-zPv5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f00903343030f6dcd2e57f8a9918802bfb170fac --- /dev/null +++ b/annotations_filtered/pVB70-zPv5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 81.11], [84.0, 89.51], [90.0, 91.37]], "keep_status": [false, true, false], "silence_prob": [0.0, 35.77, 0.0], "audiomae_on_audioset": [null, [["music", 34.98], ["hum", 15.21], ["mains hum", 12.45]], null], "duration": [0.11, 5.51, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/pVfx0OQcmBk_filtered.json b/annotations_filtered/pVfx0OQcmBk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1288fc531ea49790a202c6fc5f2501c58a1961f5 --- /dev/null +++ b/annotations_filtered/pVfx0OQcmBk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.74], [4.0, 10.3], [11.0, 20.61], [24.0, 63.54]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 31.45, 32.31, 0.0], "audiomae_on_audioset": [null, [["music", 71.68], ["scary music", 8.62], ["animal", 3.42]], [["music", 40.34], ["hum", 23.91], ["mains hum", 9.4]], null], "duration": [-0.26, 6.3, 9.61, 39.54]} \ No newline at end of file diff --git a/annotations_filtered/pVjh7-4ux7g_filtered.json b/annotations_filtered/pVjh7-4ux7g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09d9acdd00ee4cdbe46ce59d1fbb50a0e456987f --- /dev/null +++ b/annotations_filtered/pVjh7-4ux7g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.63], [8.0, 10.0], [10.0, 14.08], [16.0, 22.42], [23.0, 23.31], [24.0, 26.92], [28.0, 29.49], [31.0, 32.36], [34.0, 38.43], [41.0, 45.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.07, 32.2, 30.83, 36.59, 0.0, 56.55, 0.0, 0.0, 66.15, 72.46], "audiomae_on_audioset": [null, [["sidetone", 55.41], ["hum", 11.14], ["mains hum", 9.22]], [["speech", 95.48], ["speech synthesizer", 1.29], ["music", 0.45]], [["speech", 55.62], ["sidetone", 23.93], ["radio", 6.39]], null, null, null, null, null, null], "duration": [4.63, 2.0, 4.08, 6.42, 0.31, 2.92, 1.49, 1.36, 4.43, 4.77]} \ No newline at end of file diff --git a/annotations_filtered/pVqOcGEbZvo_filtered.json b/annotations_filtered/pVqOcGEbZvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e9d7b896aeb7b626b2ed2a040b4250ad974c535 --- /dev/null +++ b/annotations_filtered/pVqOcGEbZvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[94.0, 98.61], [99.0, 98.68], [99.0, 100.03], [101.0, 102.44]], "keep_status": [true, false, false, false], "silence_prob": [31.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 33.02], ["animal", 6.97], ["beatboxing", 3.47]], null, null, null], "duration": [4.61, -0.32, 1.03, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/pVssi5x6rxI_filtered.json b/annotations_filtered/pVssi5x6rxI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b875db1d2196ecb2839081c94cf10df60b052db4 --- /dev/null +++ b/annotations_filtered/pVssi5x6rxI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.0], [29.0, 29.0], [30.0, 30.77], [43.0, 42.87], [45.0, 48.46], [54.0, 55.14], [56.0, 56.4], [60.0, 60.49], [77.0, 77.5], [79.0, 79.49], [80.0, 80.4], [93.0, 92.92], [107.0, 107.47], [114.0, 116.33], [117.0, 117.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 0.0, 0.77, -0.13, 3.46, 1.14, 0.4, 0.49, 0.5, 0.49, 0.4, -0.08, 0.47, 2.33, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/pW-ZHlM3RxI_filtered.json b/annotations_filtered/pW-ZHlM3RxI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15bf869a748cc422d44bbca1c1b66ccfdf53e438 --- /dev/null +++ b/annotations_filtered/pW-ZHlM3RxI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.0], [6.0, 8.51], [9.0, 12.36], [14.0, 15.52], [18.0, 18.45], [19.0, 19.9], [20.0, 22.17], [23.0, 25.39], [29.0, 30.28], [36.0, 36.29], [51.0, 51.44], [66.0, 66.83], [79.0, 83.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 72.6, 100.0, 0.0, 0.0, 0.0, 99.78, 97.83, 0.0, 0.0, 0.0, 0.0, 99.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 2.51, 3.36, 1.52, 0.45, 0.9, 2.17, 2.39, 1.28, 0.29, 0.44, 0.83, 4.71]} \ No newline at end of file diff --git a/annotations_filtered/pWGGQmeKdkk_filtered.json b/annotations_filtered/pWGGQmeKdkk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..813b0e718db78d8a2e74981a72e477619ed090b3 --- /dev/null +++ b/annotations_filtered/pWGGQmeKdkk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.33], [8.0, 8.95], [10.0, 10.77], [11.0, 11.87], [13.0, 13.17], [13.0, 13.69], [16.0, 16.46], [18.0, 19.6], [22.0, 22.5], [23.0, 25.51], [27.0, 26.92], [31.0, 31.67], [33.0, 39.02], [40.0, 46.58], [47.0, 47.55], [50.0, 50.94], [52.0, 52.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.89, 0.0, 0.0, 42.72, 37.62, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 37.23], ["insect", 14.94], ["mains hum", 9.38]], [["speech", 72.24], ["hum", 7.02], ["mains hum", 4.15]], null, null, null], "duration": [0.33, 0.95, 0.77, 0.87, 0.17, 0.69, 0.46, 1.6, 0.5, 2.51, -0.08, 0.67, 6.02, 6.58, 0.55, 0.94, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/pWPn-C5l3Sk_filtered.json b/annotations_filtered/pWPn-C5l3Sk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c266b2c928ea1ccf0634a6dece57476c5545fc0 --- /dev/null +++ b/annotations_filtered/pWPn-C5l3Sk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [5.0, 6.47], [10.0, 13.05], [15.0, 14.94], [15.0, 15.13], [16.0, 17.66], [18.0, 19.5], [20.0, 23.57], [28.0, 28.0], [30.0, 29.74], [31.0, 51.44], [52.0, 52.49], [53.0, 53.59], [54.0, 54.87], [60.0, 60.47], [61.0, 67.9], [69.0, 71.37], [75.0, 79.3], [85.0, 85.13], [87.0, 87.25], [89.0, 91.05], [94.0, 96.28], [103.0, 105.02], [107.0, 107.32], [110.0, 110.15], [115.0, 115.26], [116.0, 116.7], [117.0, 117.46], [120.0, 126.13], [127.0, 127.23], [129.0, 132.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, true, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0, 33.76, 0.0, 0.0, 0.0, 0.0, 35.5, 41.18, 38.87, 0.0, 0.0, 39.66, 42.35, 42.46, 0.0, 0.0, 0.0, 0.0, 0.0, 47.05, 0.0, 34.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 51.67], ["trombone", 12.31], ["brass instrument", 10.28]], null, null, null, null, [["speech", 63.59], ["sidetone", 9.15], ["radio", 8.32]], [["speech", 30.4], ["music", 9.36], ["crowd", 7.02]], [["speech", 60.85], ["sidetone", 4.16], ["frog", 3.89]], null, null, [["speech", 36.1], ["crowd", 4.81], ["outside, urban or manmade", 3.94]], [["speech", 33.56], ["crowd", 5.39], ["cheering", 5.33]], [["speech", 26.99], ["crowd", 19.87], ["cheering", 9.22]], null, null, null, null, null, [["speech", 47.88], ["crowd", 7.36], ["sidetone", 6.16]], null, [["music", 23.4], ["didgeridoo", 15.82], ["theremin", 5.55]]], "duration": [0.94, 1.47, 3.05, -0.06, 0.13, 1.66, 1.5, 3.57, 0.0, -0.26, 20.44, 0.49, 0.59, 0.87, 0.47, 6.9, 2.37, 4.3, 0.13, 0.25, 2.05, 2.28, 2.02, 0.32, 0.15, 0.26, 0.7, 0.46, 6.13, 0.23, 3.19]} \ No newline at end of file diff --git a/annotations_filtered/pWRCxdh4PTM_filtered.json b/annotations_filtered/pWRCxdh4PTM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..787e5c4c6fcd26c780c00492888a521d5288bb2b --- /dev/null +++ b/annotations_filtered/pWRCxdh4PTM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.71], [21.0, 21.0], [21.0, 21.24], [21.0, 21.56], [22.0, 21.61], [22.0, 22.67], [23.0, 23.6], [33.0, 33.47], [34.0, 35.83], [39.0, 40.09], [50.0, 53.16], [54.0, 54.19], [56.0, 56.46], [62.0, 62.67], [69.0, 69.08], [101.0, 101.87], [103.0, 108.73], [111.0, 113.17], [115.0, 115.74], [117.0, 118.83], [119.0, 125.49], [126.0, 127.33], [128.0, 128.93], [129.0, 136.29], [137.0, 143.11], [144.0, 145.54], [147.0, 151.06], [152.0, 153.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 98.51, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.71, 0.0, 0.24, 0.56, -0.39, 0.67, 0.6, 0.47, 1.83, 1.09, 3.16, 0.19, 0.46, 0.67, 0.08, 0.87, 5.73, 2.17, 0.74, 1.83, 6.49, 1.33, 0.93, 7.29, 6.11, 1.54, 4.06, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/pWYPN21XIEU_filtered.json b/annotations_filtered/pWYPN21XIEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32130516efc55e952dd3fc690c1d9ce6458c1627 --- /dev/null +++ b/annotations_filtered/pWYPN21XIEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [5.0, 6.44], [9.0, 11.7], [13.0, 14.22], [19.0, 20.41], [22.0, 34.96], [36.0, 39.95], [41.0, 55.75], [59.0, 78.36], [81.0, 83.25], [88.0, 88.3], [90.0, 90.04], [92.0, 92.5]], "keep_status": [false, false, true, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 32.85, 0.0, 0.0, 31.91, 31.13, 32.84, 31.35, 31.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cheering", 34.4], ["crowd", 15.24], ["speech", 10.45]], null, null, [["music", 50.65], ["theremin", 24.41], ["synthesizer", 2.58]], [["music", 48.86], ["theremin", 8.35], ["foghorn", 6.18]], [["music", 82.87], ["musical instrument", 3.08], ["orchestra", 2.18]], [["music", 38.56], ["speech", 8.68], ["moo", 7.71]], [["speech", 35.55], ["music", 14.73], ["outside, urban or manmade", 7.65]], null, null, null], "duration": [1.0, 1.44, 2.7, 1.22, 1.41, 12.96, 3.95, 14.75, 19.36, 2.25, 0.3, 0.04, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/pWfB7jrCgxk_filtered.json b/annotations_filtered/pWfB7jrCgxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97890979693ff59be2324382df70fc83d7e489a8 --- /dev/null +++ b/annotations_filtered/pWfB7jrCgxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.25], [12.0, 13.26], [26.0, 26.72], [29.0, 31.16], [31.0, 32.14], [33.0, 35.14], [35.0, 36.46], [40.0, 40.36], [51.0, 53.03], [54.0, 58.5], [66.0, 65.77], [79.0, 79.25], [84.0, 84.2], [85.0, 85.56], [86.0, 87.86], [95.0, 96.74], [99.0, 100.14], [104.0, 104.06], [106.0, 106.61], [113.0, 112.87], [116.0, 119.1], [120.0, 124.5], [126.0, 127.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.54, 0.0, 0.0, 63.42, 0.0, 53.34, 0.0, 0.0, 48.27, 45.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 80.82, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 50.7], ["speech", 19.2], ["musical instrument", 4.28]], [["throbbing", 39.99], ["hum", 26.19], ["music", 19.32]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.25, 1.26, 0.72, 2.16, 1.14, 2.14, 1.46, 0.36, 2.03, 4.5, -0.23, 0.25, 0.2, 0.56, 1.86, 1.74, 1.14, 0.06, 0.61, -0.13, 3.1, 4.5, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/pWt-GnERki0_filtered.json b/annotations_filtered/pWt-GnERki0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45ab38a33a014b0e94484c45e66b9b5fb908e38b --- /dev/null +++ b/annotations_filtered/pWt-GnERki0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [7.0, 8.16], [12.0, 12.21], [13.0, 13.44], [16.0, 16.98], [22.0, 22.77], [31.0, 31.68], [61.0, 61.01]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.74, 1.16, 0.21, 0.44, 0.98, 0.77, 0.68, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/pX0LbjUM5Uo_filtered.json b/annotations_filtered/pX0LbjUM5Uo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be016059bc8ab06513b36a6a8454f3d6689449aa --- /dev/null +++ b/annotations_filtered/pX0LbjUM5Uo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.44], [6.0, 6.91], [9.0, 10.88], [12.0, 12.95]], "keep_status": [true, false, false, false], "silence_prob": [46.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 15.02], ["music", 11.59], ["buzz", 6.14]], null, null, null], "duration": [3.44, 0.91, 1.88, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/pX71mALOPKs_filtered.json b/annotations_filtered/pX71mALOPKs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15577b2cf61edc3b1ee2a262c0f964db20804089 --- /dev/null +++ b/annotations_filtered/pX71mALOPKs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 20.97], [22.0, 23.41], [26.0, 32.21], [33.0, 39.87], [48.0, 51.24], [52.0, 101.65], [102.0, 120.46], [122.0, 138.4], [145.0, 149.18]], "keep_status": [false, false, true, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 32.52, 33.44, 31.12, 0.0, 31.88, 31.99, 31.9], "audiomae_on_audioset": [null, null, [["music", 14.34], ["vehicle", 9.99], ["sheep", 6.54]], [["music", 41.55], ["trombone", 28.9], ["musical instrument", 7.91]], [["music", 40.9], ["trombone", 18.85], ["cacophony", 3.61]], null, [["music", 54.49], ["trombone", 16.25], ["brass instrument", 10.72]], [["music", 41.87], ["speech", 11.94], ["trombone", 8.31]], [["music", 52.65], ["brass instrument", 7.6], ["trombone", 7.51]]], "duration": [-0.03, 1.41, 6.21, 6.87, 3.24, 49.65, 18.46, 16.4, 4.18]} \ No newline at end of file diff --git a/annotations_filtered/pXGsio9H1xs_filtered.json b/annotations_filtered/pXGsio9H1xs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d05fe9f07e36ecba51d8ff2421131e479b33b43 --- /dev/null +++ b/annotations_filtered/pXGsio9H1xs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [5.0, 8.02], [10.0, 10.61], [14.0, 20.44], [22.0, 23.6], [25.0, 27.94], [29.0, 29.98], [31.0, 33.15], [35.0, 43.11], [44.0, 48.42], [51.0, 60.05], [61.0, 62.77], [65.0, 72.35], [73.0, 78.21], [79.0, 85.33], [86.0, 88.23], [90.0, 92.45], [93.0, 94.17], [95.0, 98.76], [100.0, 102.27], [110.0, 111.64], [117.0, 120.02], [120.0, 121.74], [122.0, 122.94], [127.0, 133.02], [134.0, 135.73], [136.0, 137.44], [138.0, 139.94], [141.0, 145.81], [146.0, 152.63], [157.0, 157.38], [162.0, 163.16], [164.0, 164.62], [167.0, 168.35], [177.0, 184.74], [186.0, 192.25], [193.0, 197.13], [197.0, 203.93], [207.0, 207.22]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.43, 0.0, 48.95, 0.0, 99.91, 0.0, 99.98, 90.78, 99.85, 99.93, 0.0, 81.35, 99.62, 95.09, 98.27, 98.8, 0.0, 99.1, 96.04, 0.0, 99.96, 0.0, 0.0, 70.16, 0.0, 0.0, 0.0, 87.37, 96.89, 0.0, 0.0, 0.0, 0.0, 99.94, 67.25, 89.9, 51.71, 0.0], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 59.88], ["cat", 3.87], ["noise", 3.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 3.02, 0.61, 6.44, 1.6, 2.94, 0.98, 2.15, 8.11, 4.42, 9.05, 1.77, 7.35, 5.21, 6.33, 2.23, 2.45, 1.17, 3.76, 2.27, 1.64, 3.02, 1.74, 0.94, 6.02, 1.73, 1.44, 1.94, 4.81, 6.63, 0.38, 1.16, 0.62, 1.35, 7.74, 6.25, 4.13, 6.93, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/pXe74ckEnME_filtered.json b/annotations_filtered/pXe74ckEnME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e3ba7a426ea923b078f0a74fb75b20c628150b3 --- /dev/null +++ b/annotations_filtered/pXe74ckEnME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.72], [9.0, 9.88], [11.0, 11.16], [12.0, 15.36], [18.0, 19.95], [22.0, 22.42], [24.0, 27.43], [39.0, 39.02], [43.0, 43.9], [45.0, 44.9], [46.0, 47.39], [48.0, 48.14], [51.0, 52.3], [53.0, 54.03], [54.0, 57.96], [59.0, 59.93], [64.0, 65.52], [67.0, 67.17], [80.0, 81.33], [83.0, 91.76], [92.0, 92.69], [97.0, 99.22], [104.0, 104.5], [105.0, 105.43], [108.0, 107.97], [109.0, 111.47], [116.0, 116.63], [117.0, 123.3], [124.0, 124.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 99.99, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.72, 0.88, 0.16, 3.36, 1.95, 0.42, 3.43, 0.02, 0.9, -0.1, 1.39, 0.14, 1.3, 1.03, 3.96, 0.93, 1.52, 0.17, 1.33, 8.76, 0.69, 2.22, 0.5, 0.43, -0.03, 2.47, 0.63, 6.3, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/pXrMAjB8ka0_filtered.json b/annotations_filtered/pXrMAjB8ka0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36e2ed567f6469a2ce9a0f66965f9517368b63ab --- /dev/null +++ b/annotations_filtered/pXrMAjB8ka0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.25], [12.0, 13.09], [14.0, 13.95], [26.0, 27.53], [30.0, 30.45], [32.0, 32.14], [33.0, 34.55], [37.0, 41.37], [43.0, 45.13], [46.0, 47.39], [49.0, 49.08], [50.0, 50.26], [53.0, 52.71], [55.0, 56.89], [57.0, 58.4], [59.0, 80.62], [83.0, 83.83], [87.0, 91.25], [94.0, 94.19], [95.0, 95.69], [96.0, 97.31], [100.0, 100.62], [102.0, 103.54], [105.0, 105.73], [107.0, 107.6], [109.0, 109.07], [110.0, 110.93], [112.0, 112.7], [113.0, 120.09], [121.0, 121.96], [123.0, 125.54], [127.0, 127.82], [129.0, 129.47], [130.0, 140.63], [142.0, 145.77], [148.0, 148.0], [149.0, 149.05], [150.0, 150.82], [152.0, 152.61], [153.0, 153.77], [154.0, 154.43], [155.0, 156.05], [157.0, 157.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [32.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.15, 36.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.23, 0.0, 32.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.25, 0.0, 30.92, 0.0, 0.0, 32.02, 30.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 45.36], ["mains hum", 40.15], ["throbbing", 7.12]], null, null, null, null, null, null, [["mains hum", 34.72], ["hum", 34.46], ["buzz", 12.45]], [["mains hum", 40.67], ["hum", 31.23], ["music", 9.08]], null, null, null, null, null, null, [["hum", 54.12], ["mains hum", 27.75], ["music", 9.73]], null, [["hum", 48.86], ["mains hum", 35.52], ["throbbing", 3.94]], null, null, null, null, null, null, null, null, null, null, [["hum", 36.37], ["throbbing", 15.49], ["mains hum", 6.84]], null, [["livestock, farm animals, working animals", 20.84], ["cattle, bovinae", 17.69], ["moo", 16.55]], null, null, [["hum", 28.28], ["buzz", 10.6], ["cattle, bovinae", 8.75]], [["whale vocalization", 36.52], ["livestock, farm animals, working animals", 20.02], ["cattle, bovinae", 7.19]], null, null, null, null, null, null, null, null], "duration": [2.25, 1.09, -0.05, 1.53, 0.45, 0.14, 1.55, 4.37, 2.13, 1.39, 0.08, 0.26, -0.29, 1.89, 1.4, 21.62, 0.83, 4.25, 0.19, 0.69, 1.31, 0.62, 1.54, 0.73, 0.6, 0.07, 0.93, 0.7, 7.09, 0.96, 2.54, 0.82, 0.47, 10.63, 3.77, 0.0, 0.05, 0.82, 0.61, 0.77, 0.43, 1.05, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/pYBS9Sp0xU8_filtered.json b/annotations_filtered/pYBS9Sp0xU8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4846fdf732608ec70254fe0652aefcd07e38c734 --- /dev/null +++ b/annotations_filtered/pYBS9Sp0xU8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [18.0, 18.62], [20.0, 21.93], [23.0, 26.23], [27.0, 28.0], [31.0, 31.55], [33.0, 36.15], [37.0, 41.08], [42.0, 44.32], [46.0, 55.88], [59.0, 59.85], [64.0, 64.59], [68.0, 92.06], [98.0, 103.3], [107.0, 109.29], [111.0, 111.69], [113.0, 113.9], [116.0, 117.05], [118.0, 122.3], [123.0, 126.96], [128.0, 128.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 99.94, 99.26, 98.59, 66.03, 0.0, 0.0, 72.16, 71.0, 89.9, 0.0, 0.0, 0.0, 34.03, 44.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.46], ["hum", 9.92], ["throbbing", 6.07]], [["speech", 56.79], ["inside, small room", 6.85], ["hum", 4.47]], null], "duration": [0.89, 0.62, 1.93, 3.23, 1.0, 0.55, 3.15, 4.08, 2.32, 9.88, 0.85, 0.59, 24.06, 5.3, 2.29, 0.69, 0.9, 1.05, 4.3, 3.96, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/pYBo5eS5pW8_filtered.json b/annotations_filtered/pYBo5eS5pW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d702a7b358b21f55fe6a05c9323a908c2fb905c --- /dev/null +++ b/annotations_filtered/pYBo5eS5pW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.88], [15.0, 14.96], [16.0, 17.49], [23.0, 24.78], [33.0, 33.34], [35.0, 35.11], [37.0, 36.83], [38.0, 38.87], [45.0, 45.6], [62.0, 62.55], [67.0, 69.72], [72.0, 73.62], [74.0, 75.66], [76.0, 77.55], [78.0, 80.22], [83.0, 83.46], [85.0, 85.58], [92.0, 92.3], [93.0, 96.42], [99.0, 98.86], [99.0, 99.13], [100.0, 101.63], [103.0, 103.22], [105.0, 105.11], [108.0, 108.6], [111.0, 111.05], [122.0, 122.34], [129.0, 129.52], [138.0, 138.52], [140.0, 141.25], [145.0, 145.4], [156.0, 156.63], [158.0, 157.82], [158.0, 159.11], [172.0, 171.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.46, 0.0, 0.0, 0.0, 37.98, 0.0, 0.0, 0.0, 35.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 70.7], ["electronic music", 3.04], ["musical instrument", 2.96]], null, null, null, [["speech", 35.5], ["music", 23.12], ["sidetone", 14.15]], null, null, null, [["music", 68.87], ["musical instrument", 5.04], ["plop", 4.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, -0.04, 1.49, 1.78, 0.34, 0.11, -0.17, 0.87, 0.6, 0.55, 2.72, 1.62, 1.66, 1.55, 2.22, 0.46, 0.58, 0.3, 3.42, -0.14, 0.13, 1.63, 0.22, 0.11, 0.6, 0.05, 0.34, 0.52, 0.52, 1.25, 0.4, 0.63, -0.18, 1.11, -0.14]} \ No newline at end of file diff --git a/annotations_filtered/pYI0bXZVZek_filtered.json b/annotations_filtered/pYI0bXZVZek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efdb958b08797e09b29e5c66f10c6831b7f6ad8b --- /dev/null +++ b/annotations_filtered/pYI0bXZVZek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.05], [10.0, 14.79], [19.0, 21.1], [26.0, 26.59], [28.0, 29.93], [30.0, 30.75], [45.0, 45.87], [46.0, 47.56], [50.0, 50.97], [56.0, 56.86], [60.0, 59.98], [67.0, 69.43], [71.0, 73.67], [75.0, 75.22], [78.0, 78.49], [80.0, 81.78], [83.0, 82.71], [89.0, 88.67], [92.0, 92.94], [95.0, 96.08], [101.0, 102.51], [104.0, 105.95], [107.0, 108.55], [111.0, 115.48], [116.0, 123.35], [125.0, 125.95]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 61.87, 49.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.58, 65.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.04, 51.66, 0.0], "audiomae_on_audioset": [null, null, [["music", 29.89], ["musical instrument", 8.11], ["hum", 7.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.02], ["speech", 24.16], ["guitar", 6.7]], null, null], "duration": [0.05, 4.79, 2.1, 0.59, 1.93, 0.75, 0.87, 1.56, 0.97, 0.86, -0.02, 2.43, 2.67, 0.22, 0.49, 1.78, -0.29, -0.33, 0.94, 1.08, 1.51, 1.95, 1.55, 4.48, 7.35, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/pYXkfLVbLIQ_filtered.json b/annotations_filtered/pYXkfLVbLIQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b75fc1cfa6f30187b2d7d6c3fb9821a1324a1140 --- /dev/null +++ b/annotations_filtered/pYXkfLVbLIQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.75], [9.0, 11.96], [29.0, 36.75], [40.0, 46.21], [49.0, 57.67], [67.0, 91.59], [92.0, 93.61], [102.0, 128.97]], "keep_status": [false, true, true, false, true, false, false, false], "silence_prob": [0.0, 35.37, 30.4, 33.14, 30.68, 30.81, 0.0, 30.48], "audiomae_on_audioset": [null, [["basketball bounce", 36.09], ["hum", 12.57], ["throbbing", 9.45]], [["music", 41.57], ["speech", 14.01], ["didgeridoo", 12.66]], [["music", 44.71], ["speech", 22.19], ["throbbing", 7.66]], [["music", 46.98], ["speech", 17.03], ["buzz", 4.1]], [["music", 53.95], ["speech", 20.57], ["throbbing", 4.53]], null, [["speech", 77.84], ["music", 5.87], ["boing", 2.54]]], "duration": [-0.25, 2.96, 7.75, 6.21, 8.67, 24.59, 1.61, 26.97]} \ No newline at end of file diff --git a/annotations_filtered/pYaJ7p8RrzM_filtered.json b/annotations_filtered/pYaJ7p8RrzM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bad8770626021647a503137a7b3522b9a3eafed --- /dev/null +++ b/annotations_filtered/pYaJ7p8RrzM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 25.41], [26.0, 26.91], [30.0, 43.88], [45.0, 46.08], [47.0, 47.98], [54.0, 54.77], [56.0, 57.43], [58.0, 60.29], [64.0, 65.16], [66.0, 67.96], [70.0, 70.21], [81.0, 82.0]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [33.97, 0.0, 36.9, 0.0, 0.0, 0.0, 0.0, 50.31, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 52.73], ["music", 6.08], ["mains hum", 4.14]], null, [["hum", 24.79], ["music", 14.05], ["throbbing", 9.36]], null, null, null, null, null, null, null, null, null], "duration": [4.41, 0.91, 13.88, 1.08, 0.98, 0.77, 1.43, 2.29, 1.16, 1.96, 0.21, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/pYhlVR9GzjA_filtered.json b/annotations_filtered/pYhlVR9GzjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7832c553f27894ded5a9753a483f6a74e35b787a --- /dev/null +++ b/annotations_filtered/pYhlVR9GzjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.92], [10.0, 11.13], [13.0, 13.93], [14.0, 15.06], [16.0, 19.09], [19.0, 19.68], [22.0, 65.72], [70.0, 72.57], [75.0, 78.49], [81.0, 82.83], [83.0, 83.91], [87.0, 87.18], [92.0, 92.97], [93.0, 93.04], [93.0, 93.18], [93.0, 93.23], [93.0, 93.72], [95.0, 94.74], [95.0, 97.66], [99.0, 99.44], [106.0, 106.84], [109.0, 109.88], [112.0, 112.41], [114.0, 114.81], [117.0, 118.17], [123.0, 123.23], [127.0, 127.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.95, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.92, 1.13, 0.93, 1.06, 3.09, 0.68, 43.72, 2.57, 3.49, 1.83, 0.91, 0.18, 0.97, 0.04, 0.18, 0.23, 0.72, -0.26, 2.66, 0.44, 0.84, 0.88, 0.41, 0.81, 1.17, 0.23, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/pYmo3PXF_T4_filtered.json b/annotations_filtered/pYmo3PXF_T4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b44d778dd7e5d8123adfc4321c5400a0db7af46 --- /dev/null +++ b/annotations_filtered/pYmo3PXF_T4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.21], [34.0, 34.69], [35.0, 37.47], [40.0, 40.27], [43.0, 50.79], [53.0, 55.88], [58.0, 62.21], [63.0, 80.77], [84.0, 87.35], [89.0, 96.75], [98.0, 101.26], [102.0, 106.78], [108.0, 109.41], [110.0, 138.96], [140.0, 145.47], [147.0, 147.61], [149.0, 149.23]], "keep_status": [false, false, true, false, false, false, false, false, true, true, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 40.43, 0.0, 28.87, 73.67, 31.13, 29.22, 32.42, 33.99, 35.13, 43.66, 0.0, 37.8, 49.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["beatboxing", 33.07], ["throbbing", 9.93], ["music", 8.86]], null, [["fly, housefly", 42.65], ["insect", 41.32], ["mosquito", 9.54]], null, [["speech", 79.84], ["music", 6.14], ["whack, thwack", 1.31]], [["speech", 35.4], ["music", 29.76], ["cattle, bovinae", 8.29]], [["music", 46.61], ["speech", 10.56], ["echo", 5.06]], [["speech", 38.54], ["chirp tone", 6.45], ["sine wave", 5.88]], [["speech", 70.78], ["sidetone", 4.87], ["groan", 2.76]], [["speech", 25.29], ["burping, eructation", 15.85], ["cough", 13.96]], null, [["speech", 42.48], ["frog", 11.8], ["croak", 4.86]], [["music", 21.34], ["singing bowl", 20.47], ["animal", 4.88]], null, null], "duration": [0.21, 0.69, 2.47, 0.27, 7.79, 2.88, 4.21, 17.77, 3.35, 7.75, 3.26, 4.78, 1.41, 28.96, 5.47, 0.61, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/pYwgIQaq9qY_filtered.json b/annotations_filtered/pYwgIQaq9qY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5041dd5e9d7ca2202be044d9dd6dc96aad2093f9 --- /dev/null +++ b/annotations_filtered/pYwgIQaq9qY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.17], [8.0, 8.09], [11.0, 12.28], [13.0, 13.04], [15.0, 17.93], [20.0, 23.18], [24.0, 24.34], [25.0, 26.16], [28.0, 28.22], [30.0, 31.7], [37.0, 37.76], [41.0, 41.45], [48.0, 48.52], [53.0, 53.3], [60.0, 60.67], [63.0, 63.9], [66.0, 66.5], [67.0, 67.64], [71.0, 71.19], [73.0, 73.84], [74.0, 75.98], [78.0, 77.82], [81.0, 81.06], [87.0, 88.05]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.07, 33.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 67.02], ["speech", 5.72], ["musical instrument", 5.08]], [["chirp tone", 34.47], ["sine wave", 15.92], ["busy signal", 14.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.17, 0.09, 1.28, 0.04, 2.93, 3.18, 0.34, 1.16, 0.22, 1.7, 0.76, 0.45, 0.52, 0.3, 0.67, 0.9, 0.5, 0.64, 0.19, 0.84, 1.98, -0.18, 0.06, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/pZJ7QK2d5-A_filtered.json b/annotations_filtered/pZJ7QK2d5-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c13fd0f8f1ec9d260ef4b26f63fe4eb3b9ca890f --- /dev/null +++ b/annotations_filtered/pZJ7QK2d5-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 33.35], [35.0, 36.31], [37.0, 58.43], [62.0, 63.0], [64.0, 64.18], [74.0, 75.02], [78.0, 78.73], [80.0, 80.59], [95.0, 95.34], [97.0, 99.27], [100.0, 101.07], [102.0, 103.52], [119.0, 120.11], [128.0, 128.49], [130.0, 130.59], [133.0, 132.93], [135.0, 135.43], [149.0, 149.81], [153.0, 153.08], [154.0, 154.41], [155.0, 155.24]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.84, 0.0, 30.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.15], ["theremin", 12.41], ["didgeridoo", 11.24]], null, [["music", 35.59], ["speech", 13.39], ["cattle, bovinae", 5.95]], null, null, null, null, null, null, [["fly, housefly", 31.59], ["insect", 18.67], ["mosquito", 11.46]], null, null, null, null, null, null, null, null, null, null, null], "duration": [20.35, 1.31, 21.43, 1.0, 0.18, 1.02, 0.73, 0.59, 0.34, 2.27, 1.07, 1.52, 1.11, 0.49, 0.59, -0.07, 0.43, 0.81, 0.08, 0.41, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/pZNQ-Jo7nsI_filtered.json b/annotations_filtered/pZNQ-Jo7nsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e65b6f99e1b9f12577b39da7163646b7d5a2b9a --- /dev/null +++ b/annotations_filtered/pZNQ-Jo7nsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.29], [7.0, 7.25], [16.0, 16.24], [17.0, 18.6], [27.0, 28.02], [32.0, 33.32], [41.0, 41.72]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.29, 0.25, 0.24, 1.6, 1.02, 1.32, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/pZRDwBXv7T0_filtered.json b/annotations_filtered/pZRDwBXv7T0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f04692566660a4b0ebc16883d0df86b291c3de2 --- /dev/null +++ b/annotations_filtered/pZRDwBXv7T0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[162.0, 164.54], [168.0, 168.12], [170.0, 173.87]], "keep_status": [false, false, false], "silence_prob": [35.38, 0.0, 32.29], "audiomae_on_audioset": [[["music", 75.71], ["throbbing", 9.36], ["electronic music", 3.31]], null, [["throbbing", 63.53], ["music", 12.93], ["hum", 10.19]]], "duration": [2.54, 0.12, 3.87]} \ No newline at end of file diff --git a/annotations_filtered/pZXuol2q1Yg_filtered.json b/annotations_filtered/pZXuol2q1Yg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..369b1a0e8c483f700f6d6b4259887d3d5260769a --- /dev/null +++ b/annotations_filtered/pZXuol2q1Yg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.18], [16.0, 17.71], [21.0, 23.11], [26.0, 27.58], [34.0, 35.92], [41.0, 42.55], [48.0, 49.89]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.18, 1.71, 2.11, 1.58, 1.92, 1.55, 1.89]} \ No newline at end of file diff --git a/annotations_filtered/pZZ60jrw6cg_filtered.json b/annotations_filtered/pZZ60jrw6cg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..460a4705a2c310b305592f2c331fa8911e864942 --- /dev/null +++ b/annotations_filtered/pZZ60jrw6cg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[52.0, 58.73], [60.0, 101.76], [105.0, 155.71]], "keep_status": [true, false, false], "silence_prob": [31.09, 0.0, 0.0], "audiomae_on_audioset": [[["vehicle", 13.54], ["hum", 13.15], ["car", 7.95]], null, null], "duration": [6.73, 41.76, 50.71]} \ No newline at end of file diff --git a/annotations_filtered/pZfva5xDNLU_filtered.json b/annotations_filtered/pZfva5xDNLU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..662be3a044cca758aac42281d770684f59fac432 --- /dev/null +++ b/annotations_filtered/pZfva5xDNLU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 43.93], [44.0, 82.59]], "keep_status": [true, false], "silence_prob": [36.35, 0.0], "audiomae_on_audioset": [[["music", 20.39], ["gunshot, gunfire", 14.32], ["speech", 10.49]], null], "duration": [14.93, 38.59]} \ No newline at end of file diff --git a/annotations_filtered/p_-Zm_G8cBI_filtered.json b/annotations_filtered/p_-Zm_G8cBI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ee380d4527480358a329bf855a39d5c97c6bb4a --- /dev/null +++ b/annotations_filtered/p_-Zm_G8cBI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.84], [14.0, 23.46], [25.0, 26.52], [38.0, 42.28], [54.0, 54.23], [58.0, 59.05], [62.0, 68.4], [69.0, 69.72], [70.0, 71.46], [73.0, 73.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 88.1, 0.0, 0.0, 52.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 9.46, 1.52, 4.28, 0.23, 1.05, 6.4, 0.72, 1.46, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/p_UeWtpIW08_filtered.json b/annotations_filtered/p_UeWtpIW08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..933545e34fefa0d3e5ad2ed10c225fc7a0d7d9b9 --- /dev/null +++ b/annotations_filtered/p_UeWtpIW08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.19], [15.0, 70.21], [72.0, 72.15], [77.0, 77.67], [87.0, 89.06], [93.0, 95.62], [96.0, 120.07]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [33.82, 0.0, 0.0, 0.0, 73.67, 96.54, 100.0], "audiomae_on_audioset": [[["music", 76.1], ["boing", 6.41], ["speech", 3.12]], null, null, null, null, null, null], "duration": [5.19, 55.21, 0.15, 0.67, 2.06, 2.62, 24.07]} \ No newline at end of file diff --git a/annotations_filtered/p_ixTZLD7k0_filtered.json b/annotations_filtered/p_ixTZLD7k0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3635cd27ddbc41a20af248f9996f3cf988c563c --- /dev/null +++ b/annotations_filtered/p_ixTZLD7k0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.12], [27.0, 28.58], [30.0, 31.8], [49.0, 50.38], [52.0, 52.46], [77.0, 78.39], [81.0, 81.95], [84.0, 84.15], [118.0, 118.45], [124.0, 124.78], [147.0, 148.42], [155.0, 155.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 1.58, 1.8, 1.38, 0.46, 1.39, 0.95, 0.15, 0.45, 0.78, 1.42, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/p_jspptikh8_filtered.json b/annotations_filtered/p_jspptikh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..936ab9038983272754b34a10c89bc3eb1850a670 --- /dev/null +++ b/annotations_filtered/p_jspptikh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.45], [6.0, 7.05], [9.0, 11.43], [14.0, 14.88], [20.0, 21.44], [24.0, 24.16], [25.0, 25.93], [26.0, 27.33], [29.0, 29.2], [30.0, 30.25], [37.0, 37.72], [41.0, 42.04], [46.0, 45.89], [49.0, 50.33], [51.0, 51.16], [54.0, 54.16], [55.0, 57.92], [58.0, 59.41], [61.0, 61.47], [64.0, 77.41], [80.0, 81.7], [83.0, 84.0], [85.0, 86.1], [89.0, 88.72], [91.0, 91.47], [93.0, 93.77], [95.0, 95.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.73, 0.0, 0.0, 33.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["insect", 24.2], ["fly, housefly", 18.0], ["telephone dialing, dtmf", 10.74]], null, null, null, null, null, null, null], "duration": [0.45, 1.05, 2.43, 0.88, 1.44, 0.16, 0.93, 1.33, 0.2, 0.25, 0.72, 1.04, -0.11, 1.33, 0.16, 0.16, 2.92, 1.41, 0.47, 13.41, 1.7, 1.0, 1.1, -0.28, 0.47, 0.77, 0.37]} \ No newline at end of file diff --git a/annotations_filtered/p_wCMFyHeUE_filtered.json b/annotations_filtered/p_wCMFyHeUE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60cb5be6d3c077d53409bb18ddbe77fc78b55c71 --- /dev/null +++ b/annotations_filtered/p_wCMFyHeUE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 19.75], [21.0, 23.68], [25.0, 27.65], [29.0, 44.04], [46.0, 98.46], [99.0, 99.94]], "keep_status": [false, true, true, false, false, false], "silence_prob": [50.56, 45.62, 46.4, 30.83, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 36.2], ["hum", 10.69], ["throbbing", 10.34]], [["music", 25.79], ["hum", 17.72], ["throbbing", 11.24]], [["speech", 27.83], ["buzz", 25.42], ["mains hum", 17.99]], null, null], "duration": [3.75, 2.68, 2.65, 15.04, 52.46, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/pa-oUPTr9LI_filtered.json b/annotations_filtered/pa-oUPTr9LI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9808f637e1cc1c3f24a9970f39083e886618235b --- /dev/null +++ b/annotations_filtered/pa-oUPTr9LI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.9], [15.0, 16.01], [22.0, 22.89], [23.0, 24.76], [27.0, 28.19], [30.0, 31.31], [34.0, 34.62], [36.0, 37.3], [38.0, 39.14], [42.0, 43.51], [44.0, 45.72], [50.0, 49.99], [51.0, 51.36], [53.0, 54.41], [57.0, 59.07], [60.0, 61.7], [65.0, 65.65], [68.0, 68.37], [87.0, 98.66], [100.0, 102.0], [104.0, 104.6]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [30.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.09, 0.0, 0.0, 0.0, 37.77, 37.49, 0.0], "audiomae_on_audioset": [[["music", 26.6], ["sidetone", 21.0], ["throbbing", 12.99]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.47], ["speech", 13.48], ["throbbing", 7.64]], null, null, null, [["speech", 39.83], ["music", 30.84], ["electronic music", 2.46]], [["sidetone", 15.4], ["music", 13.37], ["throbbing", 12.36]], null], "duration": [3.9, 1.01, 0.89, 1.76, 1.19, 1.31, 0.62, 1.3, 1.14, 1.51, 1.72, -0.01, 0.36, 1.41, 2.07, 1.7, 0.65, 0.37, 11.66, 2.0, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/paCyf1IAKug_filtered.json b/annotations_filtered/paCyf1IAKug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e321533de6e5b3ae753f4deb2d9428ba8c4684b --- /dev/null +++ b/annotations_filtered/paCyf1IAKug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.97], [3.0, 4.18], [5.0, 5.81], [7.0, 10.94], [12.0, 12.7], [15.0, 15.58], [20.0, 21.36], [21.0, 21.39], [22.0, 23.4], [26.0, 26.77], [29.0, 41.76], [46.0, 46.95], [47.0, 51.92], [52.0, 65.65], [67.0, 67.24], [69.0, 87.3], [87.0, 116.13], [118.0, 118.89], [122.0, 144.9], [147.0, 147.24], [156.0, 156.61], [160.0, 161.03], [163.0, 163.05]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, true, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.34, 0.0, 38.47, 33.61, 0.0, 38.42, 34.55, 0.0, 33.56, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 25.99], ["grunt", 10.24], ["noise", 4.56]], null, null, null, null, null, null, [["speech", 36.88], ["music", 18.15], ["theremin", 9.75]], null, [["speech", 28.03], ["music", 16.2], ["whale vocalization", 9.74]], [["speech", 31.84], ["music", 18.55], ["buzz", 8.72]], null, [["music", 63.87], ["musical instrument", 3.87], ["hum", 2.81]], [["music", 48.14], ["speech", 14.51], ["didgeridoo", 10.9]], null, [["music", 48.12], ["didgeridoo", 9.05], ["throbbing", 5.58]], null, null, null, null], "duration": [0.97, 1.18, 0.81, 3.94, 0.7, 0.58, 1.36, 0.39, 1.4, 0.77, 12.76, 0.95, 4.92, 13.65, 0.24, 18.3, 29.13, 0.89, 22.9, 0.24, 0.61, 1.03, 0.05]} \ No newline at end of file diff --git a/annotations_filtered/paNPEeQVCTc_filtered.json b/annotations_filtered/paNPEeQVCTc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e388e8e9901f7ff5b3dc0f5bdeb8de3e17b5cad --- /dev/null +++ b/annotations_filtered/paNPEeQVCTc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.31], [8.0, 9.15], [12.0, 14.25], [16.0, 25.51], [27.0, 29.44]], "keep_status": [false, false, false, false, true], "silence_prob": [44.09, 0.0, 78.72, 69.61, 39.57], "audiomae_on_audioset": [[["hum", 31.34], ["mains hum", 28.55], ["speech", 13.82]], null, null, null, [["sine wave", 15.32], ["music", 9.75], ["whale vocalization", 8.04]]], "duration": [2.31, 1.15, 2.25, 9.51, 2.44]} \ No newline at end of file diff --git a/annotations_filtered/paPWv3HjXAI_filtered.json b/annotations_filtered/paPWv3HjXAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6540765abafdcb80d7b36fda498d50a50f170216 --- /dev/null +++ b/annotations_filtered/paPWv3HjXAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 22.44], [25.0, 58.09]], "keep_status": [false, false], "silence_prob": [42.13, 0.0], "audiomae_on_audioset": [[["music", 61.85], ["ambient music", 19.43], ["synthesizer", 6.21]], null], "duration": [12.44, 33.09]} \ No newline at end of file diff --git a/annotations_filtered/padXZANlFwE_filtered.json b/annotations_filtered/padXZANlFwE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e5ba05e3cb7d4b29f9d37f027d570f9e79cca0b --- /dev/null +++ b/annotations_filtered/padXZANlFwE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.84], [8.0, 9.37], [11.0, 12.31], [13.0, 17.44], [20.0, 21.02], [24.0, 24.11], [26.0, 27.92], [29.0, 30.35], [34.0, 34.59], [37.0, 49.99], [52.0, 75.79], [77.0, 85.65], [88.0, 127.43]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [68.02, 0.0, 0.0, 50.86, 0.0, 0.0, 0.0, 0.0, 0.0, 28.52, 30.1, 65.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 36.17], ["animal", 18.93], ["wild animals", 9.95]], [["music", 73.02], ["throbbing", 4.32], ["hum", 3.31]], null, null], "duration": [2.84, 1.37, 1.31, 4.44, 1.02, 0.11, 1.92, 1.35, 0.59, 12.99, 23.79, 8.65, 39.43]} \ No newline at end of file diff --git a/annotations_filtered/pb8pWn_yyF4_filtered.json b/annotations_filtered/pb8pWn_yyF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a19ab59ccaa9394cda773a04fa30e5954a42695b --- /dev/null +++ b/annotations_filtered/pb8pWn_yyF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 64.1], [64.0, 66.87], [68.0, 77.08], [82.0, 82.73], [83.0, 84.62], [85.0, 87.56], [88.0, 99.3], [100.0, 102.42], [104.0, 104.46], [105.0, 104.57], [105.0, 105.48], [106.0, 108.33], [108.0, 108.48], [108.0, 117.68], [118.0, 117.76], [120.0, 119.75], [120.0, 121.41], [122.0, 122.23], [125.0, 132.7], [146.0, 147.83]], "keep_status": [true, false, false, false, false, true, true, false, false, false, false, true, false, true, false, false, false, false, true, false], "silence_prob": [39.22, 39.91, 41.12, 0.0, 0.0, 40.62, 42.13, 33.89, 0.0, 0.0, 0.0, 32.77, 0.0, 33.26, 0.0, 0.0, 0.0, 0.0, 31.55, 0.0], "audiomae_on_audioset": [[["music", 47.54], ["pizzicato", 5.28], ["musical instrument", 4.55]], [["music", 55.98], ["musical instrument", 14.94], ["guitar", 9.85]], [["music", 64.3], ["guitar", 8.27], ["musical instrument", 7.9]], null, null, [["music", 56.84], ["musical instrument", 5.63], ["didgeridoo", 4.98]], [["music", 42.4], ["guitar", 8.24], ["musical instrument", 7.78]], [["music", 68.13], ["guitar", 5.71], ["musical instrument", 3.37]], null, null, null, [["speech", 44.08], ["music", 14.47], ["fart", 8.63]], null, [["speech", 46.49], ["fart", 18.86], ["fly, housefly", 4.03]], null, null, null, null, [["speech", 61.33], ["explosion", 4.72], ["burst, pop", 2.17]], null], "duration": [25.1, 2.87, 9.08, 0.73, 1.62, 2.56, 11.3, 2.42, 0.46, -0.43, 0.48, 2.33, 0.48, 9.68, -0.24, -0.25, 1.41, 0.23, 7.7, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/pbI6qTih2TI_filtered.json b/annotations_filtered/pbI6qTih2TI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2a0e18a41f9e0f1a4dbc7c4f2d83d523feb6d0d --- /dev/null +++ b/annotations_filtered/pbI6qTih2TI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.03], [3.0, 3.67], [10.0, 20.66], [22.0, 22.72], [24.0, 26.28], [27.0, 43.02], [44.0, 44.34], [45.0, 46.43], [47.0, 47.95], [53.0, 54.4], [55.0, 57.27], [59.0, 61.96], [68.0, 69.45], [79.0, 80.1]], "keep_status": [false, false, true, false, false, true, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 31.62, 0.0, 78.21, 33.55, 0.0, 0.0, 0.0, 0.0, 47.74, 38.36, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 53.76], ["buzz", 3.68], ["fart", 2.96]], null, null, [["animal", 18.0], ["crow", 8.62], ["knock", 7.31]], null, null, null, null, [["fly, housefly", 10.19], ["cat", 9.27], ["domestic animals, pets", 6.59]], [["whale vocalization", 17.58], ["fly, housefly", 16.1], ["mosquito", 13.66]], null, null], "duration": [0.03, 0.67, 10.66, 0.72, 2.28, 16.02, 0.34, 1.43, 0.95, 1.4, 2.27, 2.96, 1.45, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/pbfBzWJVbX4_filtered.json b/annotations_filtered/pbfBzWJVbX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60793f508facfd242c845f04a379b13982f488ac --- /dev/null +++ b/annotations_filtered/pbfBzWJVbX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 3.18], [6.0, 6.76], [30.0, 30.48], [38.0, 38.18], [41.0, 41.57], [43.0, 43.23], [46.0, 46.31], [49.0, 49.37], [53.0, 57.18], [80.0, 80.32], [99.0, 99.71], [123.0, 124.16], [126.0, 126.74], [132.0, 132.66]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.04, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 62.19], ["synthesizer", 4.47], ["theremin", 2.63]], null, null, null, null, null, null, null, [["music", 71.29], ["musical instrument", 5.03], ["brass instrument", 3.08]], null, null, null, null, null], "duration": [3.18, 0.76, 0.48, 0.18, 0.57, 0.23, 0.31, 0.37, 4.18, 0.32, 0.71, 1.16, 0.74, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/pbmU2wMnuI4_filtered.json b/annotations_filtered/pbmU2wMnuI4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1080e18f08612d76fb216817b3d07a7486fe5c21 --- /dev/null +++ b/annotations_filtered/pbmU2wMnuI4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.0], [8.0, 9.22], [23.0, 23.35], [24.0, 24.14], [25.0, 25.46], [27.0, 29.15], [33.0, 34.7], [37.0, 37.35], [62.0, 73.18], [73.0, 73.21], [74.0, 79.95], [87.0, 88.16], [93.0, 99.3], [108.0, 109.22], [114.0, 119.67], [120.0, 121.17], [123.0, 132.6], [136.0, 136.39], [137.0, 137.88], [140.0, 140.53], [143.0, 144.29], [148.0, 148.95]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.66, 0.0, 0.0, 30.97, 0.0, 30.3, 0.0, 31.55, 0.0, 51.07, 0.0, 40.52, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 19.95], ["speech", 12.51], ["thunk", 7.03]], null, null, [["speech", 60.64], ["music", 17.78], ["telephone bell ringing", 4.73]], null, [["speech", 30.26], ["music", 27.97], ["hum", 6.77]], null, [["foghorn", 59.61], ["music", 12.86], ["throbbing", 8.28]], null, null, null, [["music", 63.2], ["hum", 6.45], ["scary music", 6.33]], null, null, null, null, null], "duration": [0.0, 1.22, 0.35, 0.14, 0.46, 2.15, 1.7, 0.35, 11.18, 0.21, 5.95, 1.16, 6.3, 1.22, 5.67, 1.17, 9.6, 0.39, 0.88, 0.53, 1.29, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/pbv02n_zKvo_filtered.json b/annotations_filtered/pbv02n_zKvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f300f8c83b413c4f2787c3fab32d8e4737020cb --- /dev/null +++ b/annotations_filtered/pbv02n_zKvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.37], [9.0, 9.81], [20.0, 20.78], [26.0, 26.5], [30.0, 31.09], [32.0, 32.26], [34.0, 44.83], [48.0, 48.03], [54.0, 54.53], [55.0, 59.27], [62.0, 65.87], [83.0, 83.62], [96.0, 95.94], [97.0, 97.61], [100.0, 101.21], [101.0, 102.15], [106.0, 106.66], [116.0, 116.33], [124.0, 125.71], [127.0, 127.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 97.83, 67.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.37, 0.81, 0.78, 0.5, 1.09, 0.26, 10.83, 0.03, 0.53, 4.27, 3.87, 0.62, -0.06, 0.61, 1.21, 1.15, 0.66, 0.33, 1.71, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/pbzjsBcOuB8_filtered.json b/annotations_filtered/pbzjsBcOuB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61991739bfd044f703ff105ce65ba68e9d9cc41c --- /dev/null +++ b/annotations_filtered/pbzjsBcOuB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.64], [14.0, 15.99], [20.0, 22.01], [24.0, 23.79], [27.0, 32.04], [33.0, 44.24], [46.0, 48.73], [52.0, 55.46], [59.0, 60.74], [65.0, 78.51], [81.0, 116.46], [118.0, 119.64], [120.0, 121.12], [123.0, 129.52], [130.0, 132.7], [133.0, 136.83], [138.0, 141.51], [143.0, 151.6], [155.0, 161.52], [162.0, 170.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [58.89, 0.0, 63.31, 0.0, 52.74, 40.73, 52.39, 76.7, 0.0, 43.33, 0.0, 0.0, 0.0, 38.88, 60.6, 70.3, 78.38, 34.12, 31.45, 36.25], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 35.45], ["speech", 27.64], ["mains hum", 16.85]], null, null, null, [["whale vocalization", 49.45], ["speech", 18.25], ["rumble", 7.44]], null, null, null, [["hum", 44.62], ["mains hum", 17.68], ["throbbing", 9.33]], null, null, null, [["hum", 22.17], ["speech", 18.46], ["whack, thwack", 7.81]], [["speech", 42.01], ["hum", 13.87], ["mains hum", 10.53]], [["speech", 29.84], ["clip-clop", 15.52], ["animal", 12.84]]], "duration": [6.64, 1.99, 2.01, -0.21, 5.04, 11.24, 2.73, 3.46, 1.74, 13.51, 35.46, 1.64, 1.12, 6.52, 2.7, 3.83, 3.51, 8.6, 6.52, 8.55]} \ No newline at end of file diff --git a/annotations_filtered/pcV9ceH4UvE_filtered.json b/annotations_filtered/pcV9ceH4UvE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4f4e4010afad341c78547a4071d9613341af8f8 --- /dev/null +++ b/annotations_filtered/pcV9ceH4UvE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 13.09], [14.0, 41.86], [43.0, 69.87], [72.0, 79.27], [80.0, 81.45], [83.0, 83.98], [87.0, 88.53], [90.0, 91.64], [95.0, 95.67], [98.0, 98.37], [100.0, 99.96], [101.0, 102.24], [105.0, 105.04], [106.0, 106.1], [108.0, 110.44], [111.0, 111.35], [113.0, 114.42], [116.0, 122.69], [124.0, 124.38], [126.0, 126.81], [129.0, 130.28], [132.0, 132.83], [136.0, 136.98], [140.0, 141.4], [142.0, 146.96], [147.0, 164.64], [168.0, 169.47], [171.0, 173.87]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.53, 30.47, 30.32, 32.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.84, 0.0, 0.0, 38.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.56, 31.48, 0.0, 40.16], "audiomae_on_audioset": [[["music", 80.13], ["throbbing", 4.0], ["breaking", 3.67]], [["music", 60.92], ["throbbing", 11.61], ["hum", 6.58]], [["music", 34.13], ["throbbing", 9.58], ["hum", 8.55]], [["music", 22.31], ["noise", 19.0], ["speech", 14.38]], null, null, null, null, null, null, null, null, null, null, [["music", 22.5], ["speech", 12.28], ["whack, thwack", 6.52]], null, null, [["music", 60.59], ["throbbing", 8.78], ["hum", 2.05]], null, null, null, null, null, null, [["music", 48.05], ["hum", 22.56], ["throbbing", 9.38]], [["music", 38.07], ["speech", 29.19], ["explosion", 7.25]], null, [["music", 63.66], ["throbbing", 6.28], ["hum", 2.95]]], "duration": [12.09, 27.86, 26.87, 7.27, 1.45, 0.98, 1.53, 1.64, 0.67, 0.37, -0.04, 1.24, 0.04, 0.1, 2.44, 0.35, 1.42, 6.69, 0.38, 0.81, 1.28, 0.83, 0.98, 1.4, 4.96, 17.64, 1.47, 2.87]} \ No newline at end of file diff --git a/annotations_filtered/pcj4boVT4fc_filtered.json b/annotations_filtered/pcj4boVT4fc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe13ba598f5b44092bf959d24808851e3945a6e8 --- /dev/null +++ b/annotations_filtered/pcj4boVT4fc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 37.47], [60.0, 59.97], [63.0, 68.25], [68.0, 68.71], [69.0, 69.63], [70.0, 71.34], [77.0, 77.25], [79.0, 99.05], [99.0, 99.08], [99.0, 99.12]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.37, 0.0, 0.0, 0.0, 0.0, 34.48, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.38], ["double bass", 10.94], ["bowed string instrument", 8.81]], null, null, null, null, [["music", 43.96], ["brass instrument", 18.79], ["trombone", 7.58]], null, null], "duration": [0.47, -0.03, 5.25, 0.71, 0.63, 1.34, 0.25, 20.05, 0.08, 0.12]} \ No newline at end of file diff --git a/annotations_filtered/pcqaeLRop58_filtered.json b/annotations_filtered/pcqaeLRop58_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b260143d0ce6701842e20e1dc152479e4c51291 --- /dev/null +++ b/annotations_filtered/pcqaeLRop58_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.76], [26.0, 26.4], [29.0, 30.86], [35.0, 36.61], [38.0, 38.58], [41.0, 41.96], [51.0, 52.08], [56.0, 56.46], [60.0, 60.0], [71.0, 76.18], [82.0, 89.92], [90.0, 95.0], [100.0, 113.39], [115.0, 124.82], [125.0, 131.28], [132.0, 133.22], [151.0, 154.01], [158.0, 158.77], [159.0, 175.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.76, 30.39, 30.88, 30.52, 30.25, 31.08, 0.0, 31.91, 0.0, 30.08], "audiomae_on_audioset": [[["music", 48.25], ["throbbing", 25.11], ["hum", 8.42]], null, null, null, null, null, null, null, null, [["speech", 44.82], ["thunk", 19.85], ["whack, thwack", 5.42]], [["music", 36.56], ["speech", 23.41], ["boing", 12.83]], [["music", 58.19], ["speech", 8.35], ["boing", 4.75]], [["music", 83.49], ["didgeridoo", 2.17], ["electronic music", 1.94]], [["music", 81.8], ["speech", 2.15], ["didgeridoo", 1.77]], [["music", 72.79], ["speech", 2.84], ["musical instrument", 2.52]], null, [["music", 77.98], ["musical instrument", 5.29], ["guitar", 4.44]], null, [["music", 76.64], ["speech", 6.65], ["didgeridoo", 2.25]]], "duration": [6.76, 0.4, 1.86, 1.61, 0.58, 0.96, 1.08, 0.46, 0.0, 5.18, 7.92, 5.0, 13.39, 9.82, 6.28, 1.22, 3.01, 0.77, 16.56]} \ No newline at end of file diff --git a/annotations_filtered/pcyg0H7EU3c_filtered.json b/annotations_filtered/pcyg0H7EU3c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..446507ea877547c4d6d4e07e39ecc35a01ba05fd --- /dev/null +++ b/annotations_filtered/pcyg0H7EU3c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.46], [24.0, 24.11], [25.0, 26.28], [39.0, 39.51], [54.0, 57.54], [58.0, 59.37], [61.0, 61.33], [64.0, 66.82], [70.0, 70.17], [76.0, 76.35], [77.0, 77.67], [83.0, 83.3], [90.0, 89.83], [91.0, 91.77], [95.0, 98.73]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.66, 0.0, 0.0, 52.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.7], "audiomae_on_audioset": [null, null, null, null, [["fart", 21.18], ["livestock, farm animals, working animals", 20.72], ["cattle, bovinae", 17.37]], null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 0.11, 1.28, 0.51, 3.54, 1.37, 0.33, 2.82, 0.17, 0.35, 0.67, 0.3, -0.17, 0.77, 3.73]} \ No newline at end of file diff --git a/annotations_filtered/pdE83FX-Mto_filtered.json b/annotations_filtered/pdE83FX-Mto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b32b0e4977f489e0b719b80a0b9f99cafb376243 --- /dev/null +++ b/annotations_filtered/pdE83FX-Mto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.23], [23.0, 23.73], [26.0, 26.13], [27.0, 30.38], [32.0, 33.52], [42.0, 42.43], [43.0, 45.52], [47.0, 48.63], [49.0, 52.61], [56.0, 56.13], [61.0, 62.95], [69.0, 69.96], [72.0, 87.59], [91.0, 95.62]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 35.72, 0.0, 0.0, 40.68, 0.0, 32.46, 0.0, 0.0, 0.0, 35.35, 30.94], "audiomae_on_audioset": [null, null, null, [["speech", 59.22], ["hum", 11.81], ["applause", 6.68]], null, null, [["speech", 27.75], ["cattle, bovinae", 13.92], ["boing", 13.46]], null, [["whale vocalization", 56.19], ["animal", 7.34], ["frog", 5.24]], null, null, null, [["fly, housefly", 18.72], ["insect", 12.05], ["motorboat, speedboat", 10.16]], [["water", 64.56], ["toilet flush", 7.74], ["gurgling", 3.33]]], "duration": [1.23, 0.73, 0.13, 3.38, 1.52, 0.43, 2.52, 1.63, 3.61, 0.13, 1.95, 0.96, 15.59, 4.62]} \ No newline at end of file diff --git a/annotations_filtered/pdYYAu24yVQ_filtered.json b/annotations_filtered/pdYYAu24yVQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d76b8a8db25c5e0ca2c9b09a08974e45872552e8 --- /dev/null +++ b/annotations_filtered/pdYYAu24yVQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 78.26]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [61.26]} \ No newline at end of file diff --git a/annotations_filtered/pdmo-_KXg0Y_filtered.json b/annotations_filtered/pdmo-_KXg0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b460e0b67003588e052d3d6834a6c9754a88c1c3 --- /dev/null +++ b/annotations_filtered/pdmo-_KXg0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 39.48], [41.0, 42.45], [52.0, 52.39], [63.0, 63.73], [64.0, 66.26], [68.0, 74.46], [75.0, 77.97], [85.0, 85.13], [87.0, 87.59], [104.0, 106.51], [111.0, 112.8], [117.0, 126.0], [132.0, 131.8]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.78, 70.72, 35.44, 0.0, 0.0, 30.24, 0.0, 29.76, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 26.83], ["speech", 22.54], ["mains hum", 10.62]], null, [["music", 29.53], ["speech", 24.45], ["musical instrument", 2.91]], null, null, [["speech", 46.64], ["music", 26.06], ["grunt", 5.63]], null, [["speech", 68.75], ["outside, rural or natural", 4.45], ["music", 4.08]], null], "duration": [1.48, 1.45, 0.39, 0.73, 2.26, 6.46, 2.97, 0.13, 0.59, 2.51, 1.8, 9.0, -0.2]} \ No newline at end of file diff --git a/annotations_filtered/pdwGNiv2q4U_filtered.json b/annotations_filtered/pdwGNiv2q4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7cc6608983bcf3e10e70106d438e84c873b74ae4 --- /dev/null +++ b/annotations_filtered/pdwGNiv2q4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.76], [23.0, 23.58], [27.0, 27.36], [29.0, 29.78], [31.0, 31.13], [32.0, 33.89], [36.0, 36.8], [38.0, 38.48], [40.0, 46.4], [47.0, 48.19], [51.0, 53.69], [55.0, 58.21], [58.0, 60.1], [60.0, 61.69], [63.0, 63.78], [71.0, 71.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 90.43, 90.6, 71.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.76, 0.58, 0.36, 0.78, 0.13, 1.89, 0.8, 0.48, 6.4, 1.19, 2.69, 3.21, 2.1, 1.69, 0.78, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/pe8vv-fGpWk_filtered.json b/annotations_filtered/pe8vv-fGpWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..272cc08e46146e37f298403a81166f6d2ba0985b --- /dev/null +++ b/annotations_filtered/pe8vv-fGpWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 25.52], [26.0, 42.18], [43.0, 50.65]], "keep_status": [false, false, false], "silence_prob": [100.0, 99.8, 100.0], "audiomae_on_audioset": [null, null, null], "duration": [11.52, 16.18, 7.65]} \ No newline at end of file diff --git a/annotations_filtered/peBuMWtkw8s_filtered.json b/annotations_filtered/peBuMWtkw8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a5fc5405b6876bd247dfaa2d3c979fe43b990a4 --- /dev/null +++ b/annotations_filtered/peBuMWtkw8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.27], [26.0, 36.19], [40.0, 47.22], [49.0, 50.21], [58.0, 58.77], [67.0, 68.91], [82.0, 83.13], [87.0, 88.43]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [0.0, 31.08, 31.25, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 63.84], ["groan", 14.46], ["speech", 5.54]], [["speech", 39.01], ["sidetone", 15.81], ["music", 12.37]], null, null, null, null, null], "duration": [1.27, 10.19, 7.22, 1.21, 0.77, 1.91, 1.13, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/peUyLXrgYZ0_filtered.json b/annotations_filtered/peUyLXrgYZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b697d653629cd2ad91f9c08dc110eddc316b4154 --- /dev/null +++ b/annotations_filtered/peUyLXrgYZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.46], [17.0, 18.77], [20.0, 20.53], [21.0, 22.18], [29.0, 35.65], [38.0, 50.67], [52.0, 52.44], [54.0, 54.7], [60.0, 60.03], [61.0, 62.31], [66.0, 65.65], [71.0, 72.32], [78.0, 79.54], [81.0, 81.62], [84.0, 84.1], [86.0, 96.52], [97.0, 97.34], [98.0, 100.21], [114.0, 114.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 54.1, 50.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.31, 0.0, 35.62, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["ding", 44.69], ["clang", 17.57], ["boing", 14.84]], null, [["throbbing", 34.98], ["hum", 17.79], ["music", 10.2]], null], "duration": [0.46, 1.77, 0.53, 1.18, 6.65, 12.67, 0.44, 0.7, 0.03, 1.31, -0.35, 1.32, 1.54, 0.62, 0.1, 10.52, 0.34, 2.21, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/pesYeCruSyI_filtered.json b/annotations_filtered/pesYeCruSyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f077aa459b363b01b15322763f3695d70bf5858 --- /dev/null +++ b/annotations_filtered/pesYeCruSyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.18], [30.0, 31.08], [32.0, 42.48], [46.0, 46.99], [49.0, 48.84], [51.0, 50.8], [52.0, 53.49], [56.0, 57.6], [58.0, 61.11], [62.0, 63.58], [68.0, 69.18], [71.0, 72.01], [74.0, 79.54], [83.0, 86.49], [88.0, 102.54], [105.0, 109.98], [111.0, 112.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 99.85, 99.88, 97.64, 99.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 1.08, 10.48, 0.99, -0.16, -0.2, 1.49, 1.6, 3.11, 1.58, 1.18, 1.01, 5.54, 3.49, 14.54, 4.98, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/petKvkHfPJo_filtered.json b/annotations_filtered/petKvkHfPJo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b15d2a464e94e52ae0c8142bb2b457041e627105 --- /dev/null +++ b/annotations_filtered/petKvkHfPJo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.51], [21.0, 21.93], [26.0, 26.4], [28.0, 29.46], [31.0, 31.53], [39.0, 38.7], [43.0, 44.54], [46.0, 48.44], [50.0, 49.79], [51.0, 51.71], [52.0, 51.98], [54.0, 54.01], [59.0, 59.41], [61.0, 62.87], [64.0, 64.13], [65.0, 65.21], [65.0, 65.25], [70.0, 70.01], [80.0, 83.81], [85.0, 85.36], [94.0, 93.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["breaking", 51.99], ["music", 16.17], ["reverberation", 4.32]], null, null, null, null, null, null, null, null, null, null, [["breaking", 90.78], ["smash, crash", 1.41], ["crack", 1.22]], null, null], "duration": [0.51, 0.93, 0.4, 1.46, 0.53, -0.3, 1.54, 2.44, -0.21, 0.71, -0.02, 0.01, 0.41, 1.87, 0.13, 0.21, 0.25, 0.01, 3.81, 0.36, -0.17]} \ No newline at end of file diff --git a/annotations_filtered/pf0erXl4pwQ_filtered.json b/annotations_filtered/pf0erXl4pwQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80e706b49008f659dfa19bf39f568f825e03fdf4 --- /dev/null +++ b/annotations_filtered/pf0erXl4pwQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.27], [7.0, 8.97], [10.0, 11.21], [15.0, 16.17], [26.0, 26.79], [39.0, 39.19], [41.0, 42.48], [44.0, 45.06], [59.0, 59.21], [72.0, 73.25], [77.0, 77.84], [78.0, 86.61], [88.0, 88.25], [90.0, 92.87], [94.0, 94.85], [99.0, 99.18], [100.0, 101.82], [107.0, 108.18], [112.0, 111.89], [113.0, 116.41], [117.0, 119.52], [123.0, 122.82], [131.0, 133.83], [135.0, 138.97], [139.0, 140.12], [144.0, 144.29], [147.0, 148.8], [153.0, 153.12], [155.0, 156.42], [164.0, 165.2], [172.0, 177.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.4, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 51.6, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.15], ["thunk", 21.92], ["thump, thud", 1.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.27, 1.97, 1.21, 1.17, 0.79, 0.19, 1.48, 1.06, 0.21, 1.25, 0.84, 8.61, 0.25, 2.87, 0.85, 0.18, 1.82, 1.18, -0.11, 3.41, 2.52, -0.18, 2.83, 3.97, 1.12, 0.29, 1.8, 0.12, 1.42, 1.2, 5.33]} \ No newline at end of file diff --git a/annotations_filtered/pf2q0HemaFs_filtered.json b/annotations_filtered/pf2q0HemaFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95a0913e775780301fa5e2109e4ce22c7466c586 --- /dev/null +++ b/annotations_filtered/pf2q0HemaFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.41], [5.0, 6.34], [9.0, 9.07], [36.0, 36.95], [39.0, 39.75], [40.0, 40.93], [110.0, 111.1], [112.0, 112.87], [114.0, 114.29], [120.0, 120.16], [122.0, 123.69], [139.0, 139.43], [144.0, 144.31], [148.0, 148.29], [150.0, 150.69], [165.0, 166.04], [213.0, 213.44], [215.0, 215.94], [234.0, 233.9], [234.0, 235.5], [237.0, 237.05], [247.0, 247.87], [253.0, 253.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, 1.34, 0.07, 0.95, 0.75, 0.93, 1.1, 0.87, 0.29, 0.16, 1.69, 0.43, 0.31, 0.29, 0.69, 1.04, 0.44, 0.94, -0.1, 1.5, 0.05, 0.87, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/pfLTbzU0FXo_filtered.json b/annotations_filtered/pfLTbzU0FXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c6aed44233e4f1be818a0860452f593faae4f02 --- /dev/null +++ b/annotations_filtered/pfLTbzU0FXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 70.92], [72.0, 113.71], [115.0, 115.96], [117.0, 118.23], [118.0, 118.86], [122.0, 123.33]], "keep_status": [false, false, false, false, false, false], "silence_prob": [29.63, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 52.54], ["trombone", 12.1], ["speech", 11.98]], null, null, null, null, null], "duration": [10.92, 41.71, 0.96, 1.23, 0.86, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/pfOJfhbqJhY_filtered.json b/annotations_filtered/pfOJfhbqJhY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d44e348145e9c9a6fb3f1bdccb54d1a43e82322d --- /dev/null +++ b/annotations_filtered/pfOJfhbqJhY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.18], [27.0, 29.29], [31.0, 32.17], [35.0, 39.63], [40.0, 45.76], [46.0, 53.94], [55.0, 61.6], [62.0, 62.43], [65.0, 71.71], [84.0, 85.04], [85.0, 85.67], [91.0, 92.97]], "keep_status": [false, true, false, true, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 34.06, 0.0, 39.58, 34.09, 34.67, 31.07, 0.0, 31.75, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["whale vocalization", 45.64], ["fart", 11.74], ["creak", 4.72]], null, [["speech", 29.42], ["honk", 11.5], ["hum", 8.88]], [["speech", 53.24], ["animal", 11.61], ["horse", 4.1]], [["horse", 27.51], ["speech", 24.46], ["clip-clop", 12.76]], [["music", 58.54], ["brass instrument", 7.42], ["trombone", 6.17]], null, [["cattle, bovinae", 43.54], ["livestock, farm animals, working animals", 21.69], ["moo", 19.87]], null, null, null], "duration": [0.18, 2.29, 1.17, 4.63, 5.76, 7.94, 6.6, 0.43, 6.71, 1.04, 0.67, 1.97]} \ No newline at end of file diff --git a/annotations_filtered/pfVP6HBoflg_filtered.json b/annotations_filtered/pfVP6HBoflg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8397316835506dae0f219cba08bf91ad086836f7 --- /dev/null +++ b/annotations_filtered/pfVP6HBoflg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.21], [6.0, 6.08], [10.0, 29.05], [30.0, 37.34], [42.0, 44.73], [58.0, 58.35], [62.0, 65.35], [68.0, 69.42], [73.0, 103.65], [105.0, 122.23], [123.0, 123.45], [123.0, 123.74], [124.0, 132.21], [149.0, 150.03], [154.0, 157.99], [169.0, 169.06], [170.0, 170.73], [172.0, 177.89]], "keep_status": [false, false, false, true, true, false, false, false, false, true, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 38.6, 33.17, 35.7, 0.0, 33.88, 0.0, 0.0, 39.46, 0.0, 0.0, 32.48, 0.0, 46.83, 0.0, 0.0, 46.43], "audiomae_on_audioset": [null, null, [["music", 49.09], ["speech", 15.47], ["hum", 6.28]], [["cattle, bovinae", 23.85], ["speech", 22.28], ["livestock, farm animals, working animals", 15.55]], [["music", 23.34], ["cattle, bovinae", 21.67], ["moo", 15.65]], null, [["foghorn", 36.24], ["music", 31.52], ["trombone", 6.18]], null, null, [["speech", 31.28], ["radio", 16.02], ["vehicle", 6.9]], null, null, [["speech", 67.62], ["splash, splatter", 4.46], ["explosion", 4.13]], null, [["music", 39.1], ["whale vocalization", 11.74], ["hum", 11.16]], null, null, [["music", 41.41], ["hum", 13.64], ["mains hum", 7.86]]], "duration": [0.21, 0.08, 19.05, 7.34, 2.73, 0.35, 3.35, 1.42, 30.65, 17.23, 0.45, 0.74, 8.21, 1.03, 3.99, 0.06, 0.73, 5.89]} \ No newline at end of file diff --git a/annotations_filtered/pgL4IvoR7tw_filtered.json b/annotations_filtered/pgL4IvoR7tw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13f49773c9d8b22a50f065e73ba46c6d18809ecf --- /dev/null +++ b/annotations_filtered/pgL4IvoR7tw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.67], [7.0, 7.74], [8.0, 11.31], [14.0, 15.04], [16.0, 17.24], [22.0, 23.84], [28.0, 108.65]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 41.18, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 50.13], ["musical instrument", 5.6], ["synthesizer", 5.48]], null, null, null, null], "duration": [1.67, 0.74, 3.31, 1.04, 1.24, 1.84, 80.65]} \ No newline at end of file diff --git a/annotations_filtered/ph2dq-pPBnA_filtered.json b/annotations_filtered/ph2dq-pPBnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9c0aaaecd8d3c7072ae27f8de727715fe556e73 --- /dev/null +++ b/annotations_filtered/ph2dq-pPBnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.93], [8.0, 8.46], [15.0, 16.36], [19.0, 23.84], [27.0, 32.88], [34.0, 34.28], [37.0, 38.77], [47.0, 47.98], [51.0, 54.19], [55.0, 64.29], [68.0, 69.36], [71.0, 71.09], [71.0, 72.77], [77.0, 77.21], [78.0, 79.15], [96.0, 96.52], [106.0, 107.15], [114.0, 117.95], [120.0, 121.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.36, 0.0, 0.0, 96.04, 97.73, 0.0, 0.0, 0.0, 85.9, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.93, 0.46, 1.36, 4.84, 5.88, 0.28, 1.77, 0.98, 3.19, 9.29, 1.36, 0.09, 1.77, 0.21, 1.15, 0.52, 1.15, 3.95, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/phGwatUEyzc_filtered.json b/annotations_filtered/phGwatUEyzc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5258e7c8fcbfbf4e84bf8ab01b2e7c0bd3dcaeb --- /dev/null +++ b/annotations_filtered/phGwatUEyzc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [4.0, 4.83], [17.0, 17.22], [19.0, 19.03], [26.0, 27.09], [34.0, 34.26], [37.0, 39.72], [40.0, 40.2], [79.0, 80.52], [84.0, 86.46], [90.0, 90.0], [90.0, 90.53], [94.0, 94.36], [95.0, 96.16], [102.0, 101.8], [103.0, 103.82], [105.0, 106.39], [110.0, 113.48], [115.0, 126.33], [128.0, 129.68], [133.0, 137.24], [138.0, 145.44], [146.0, 146.87], [164.0, 166.08], [168.0, 169.37]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.4, 0.0, 0.0, 36.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.98, 29.39, 0.0, 29.37, 28.92, 0.0, 47.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 27.23], ["speech", 17.38], ["musical instrument", 4.03]], null, null, [["music", 46.17], ["saxophone", 8.12], ["musical instrument", 6.79]], null, null, null, null, null, null, null, [["music", 64.74], ["electronic tuner", 3.41], ["boing", 3.35]], [["music", 71.32], ["carnatic music", 7.22], ["musical instrument", 2.67]], null, [["music", 57.03], ["boing", 5.79], ["harmonic", 3.09]], [["music", 83.14], ["carnatic music", 4.2], ["singing", 1.61]], null, [["foghorn", 19.79], ["music", 14.7], ["speech", 12.61]], null], "duration": [1.1, 0.83, 0.22, 0.03, 1.09, 0.26, 2.72, 0.2, 1.52, 2.46, 0.0, 0.53, 0.36, 1.16, -0.2, 0.82, 1.39, 3.48, 11.33, 1.68, 4.24, 7.44, 0.87, 2.08, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/phJJFbxyino_filtered.json b/annotations_filtered/phJJFbxyino_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0db2fd4f981197a22e26cf8563983d7fc761aa85 --- /dev/null +++ b/annotations_filtered/phJJFbxyino_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.05], [16.0, 16.41], [23.0, 24.83], [26.0, 26.62], [41.0, 41.64], [43.0, 42.99], [43.0, 43.7], [47.0, 47.48], [49.0, 49.71], [54.0, 54.43], [55.0, 56.52], [57.0, 66.68], [73.0, 88.91], [129.0, 131.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.51, 59.42, 66.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.05, 0.41, 1.83, 0.62, 0.64, -0.01, 0.7, 0.48, 0.71, 0.43, 1.52, 9.68, 15.91, 2.55]} \ No newline at end of file diff --git a/annotations_filtered/phKe4peWFG8_filtered.json b/annotations_filtered/phKe4peWFG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0695d8a461f636361cf959678ae25486cd51a2b --- /dev/null +++ b/annotations_filtered/phKe4peWFG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.4], [7.0, 7.86], [10.0, 10.47], [19.0, 21.32], [24.0, 24.44], [29.0, 30.35], [35.0, 36.68], [38.0, 39.95], [41.0, 41.98], [43.0, 43.34], [50.0, 51.09], [54.0, 56.19], [57.0, 59.46], [70.0, 76.5], [78.0, 78.65], [81.0, 82.32], [83.0, 82.97], [84.0, 84.0], [86.0, 86.97], [87.0, 88.74], [91.0, 91.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 58.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 100.0, 74.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 0.86, 0.47, 2.32, 0.44, 1.35, 1.68, 1.95, 0.98, 0.34, 1.09, 2.19, 2.46, 6.5, 0.65, 1.32, -0.03, 0.0, 0.97, 1.74, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/phzJ2Iam214_filtered.json b/annotations_filtered/phzJ2Iam214_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb6ceea221bf731d3aed7d71fec6e66536ed126d --- /dev/null +++ b/annotations_filtered/phzJ2Iam214_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.15], [14.0, 14.23], [16.0, 16.65], [17.0, 18.54], [19.0, 21.47], [22.0, 26.01], [27.0, 26.82], [27.0, 28.07], [31.0, 33.54], [36.0, 36.56], [37.0, 39.38], [43.0, 44.02], [46.0, 50.95], [52.0, 75.3], [76.0, 77.62], [78.0, 79.14], [85.0, 85.89], [87.0, 89.01], [97.0, 98.22], [101.0, 101.82], [103.0, 103.38], [104.0, 103.82], [107.0, 107.62], [108.0, 108.68], [109.0, 109.54], [110.0, 112.19], [114.0, 115.11], [116.0, 116.63], [118.0, 119.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 96.42, 97.11, 0.0, 0.0, 89.19, 0.0, 73.21, 0.0, 97.73, 56.18, 0.0, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.23, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.15, 0.23, 0.65, 1.54, 2.47, 4.01, -0.18, 1.07, 2.54, 0.56, 2.38, 1.02, 4.95, 23.3, 1.62, 1.14, 0.89, 2.01, 1.22, 0.82, 0.38, -0.18, 0.62, 0.68, 0.54, 2.19, 1.11, 0.63, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/pi6SInyE0sw_filtered.json b/annotations_filtered/pi6SInyE0sw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47c73673bc80e743b2d9400e1228661c19856489 --- /dev/null +++ b/annotations_filtered/pi6SInyE0sw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.54], [13.0, 14.34], [15.0, 15.94], [19.0, 19.06], [20.0, 20.8], [22.0, 22.42], [26.0, 26.35], [29.0, 30.25], [31.0, 31.97], [33.0, 33.27], [39.0, 39.58], [41.0, 41.44], [43.0, 44.02], [46.0, 46.65], [51.0, 52.07], [56.0, 56.88], [58.0, 58.21], [59.0, 60.71], [62.0, 63.98], [64.0, 64.69], [69.0, 69.26], [71.0, 71.39], [73.0, 74.04], [77.0, 77.82], [82.0, 82.78], [83.0, 83.4], [85.0, 85.87], [87.0, 87.0], [88.0, 89.19], [90.0, 90.46], [97.0, 98.69], [101.0, 103.01], [104.0, 106.32], [117.0, 117.59], [122.0, 122.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 97.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.07], ["telephone", 19.44], ["radio", 12.0]], null, null, null], "duration": [1.54, 1.34, 0.94, 0.06, 0.8, 0.42, 0.35, 1.25, 0.97, 0.27, 0.58, 0.44, 1.02, 0.65, 1.07, 0.88, 0.21, 1.71, 1.98, 0.69, 0.26, 0.39, 1.04, 0.82, 0.78, 0.4, 0.87, 0.0, 1.19, 0.46, 1.69, 2.01, 2.32, 0.59, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/piFTKwqrqYA_filtered.json b/annotations_filtered/piFTKwqrqYA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8594e4470a2c63e10bd07ef3c0b3d4bf2439746d --- /dev/null +++ b/annotations_filtered/piFTKwqrqYA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.92], [4.0, 6.1], [7.0, 8.18], [9.0, 13.07], [16.0, 21.95], [24.0, 25.12], [29.0, 31.24], [33.0, 34.91]], "keep_status": [false, true, false, true, true, false, true, false], "silence_prob": [0.0, 32.31, 0.0, 39.55, 37.84, 0.0, 34.43, 0.0], "audiomae_on_audioset": [null, [["speech", 26.93], ["music", 12.8], ["hum", 5.43]], null, [["music", 28.02], ["hum", 17.64], ["musical instrument", 4.54]], [["music", 18.19], ["hum", 15.61], ["whale vocalization", 15.54]], null, [["music", 35.72], ["hum", 17.46], ["throbbing", 10.72]], null], "duration": [1.92, 2.1, 1.18, 4.07, 5.95, 1.12, 2.24, 1.91]} \ No newline at end of file diff --git a/annotations_filtered/piOTzME87Dg_filtered.json b/annotations_filtered/piOTzME87Dg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb5e4865d1e7626331f631f9d754924a2cdca0d5 --- /dev/null +++ b/annotations_filtered/piOTzME87Dg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 83.02], [86.0, 93.14], [93.0, 93.34], [96.0, 103.94], [104.0, 110.37], [112.0, 114.15]], "keep_status": [false, false, false, true, false, true], "silence_prob": [0.0, 31.3, 0.0, 30.41, 30.38, 30.03], "audiomae_on_audioset": [null, [["music", 75.11], ["throbbing", 3.86], ["theremin", 3.71]], null, [["music", 45.57], ["fart", 7.92], ["speech", 4.89]], [["music", 85.52], ["electronic music", 2.77], ["ambient music", 2.66]], [["music", 38.63], ["hum", 25.01], ["electronic music", 5.78]]], "duration": [51.02, 7.14, 0.34, 7.94, 6.37, 2.15]} \ No newline at end of file diff --git a/annotations_filtered/piTAjb8dd2Y_filtered.json b/annotations_filtered/piTAjb8dd2Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d5d8186ad74a9a93394de50f9e6f534b6cbff11 --- /dev/null +++ b/annotations_filtered/piTAjb8dd2Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [4.0, 4.06], [11.0, 11.01], [20.0, 23.7], [28.0, 39.5], [44.0, 46.97], [48.0, 58.68], [61.0, 61.59], [64.0, 102.12], [107.0, 106.95], [107.0, 107.05], [107.0, 125.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.85, 55.04, 76.37, 56.03, 0.0, 0.0, 0.0, 0.0, 39.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 43.09], ["speech", 27.85], ["musical instrument", 2.67]]], "duration": [0.35, 0.06, 0.01, 3.7, 11.5, 2.97, 10.68, 0.59, 38.12, -0.05, 0.05, 18.47]} \ No newline at end of file diff --git a/annotations_filtered/pikAt8prREE_filtered.json b/annotations_filtered/pikAt8prREE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c5ae227f8cae20f2083a563e0b3c4825576e58f --- /dev/null +++ b/annotations_filtered/pikAt8prREE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 58.43], [61.0, 62.5], [72.0, 73.2], [74.0, 73.7], [74.0, 74.33], [75.0, 75.76], [77.0, 78.78], [84.0, 88.48], [97.0, 97.53], [114.0, 114.86], [133.0, 133.29], [141.0, 143.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 29.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["moo", 19.25], ["livestock, farm animals, working animals", 18.65], ["cattle, bovinae", 18.09]]], "duration": [1.43, 1.5, 1.2, -0.3, 0.33, 0.76, 1.78, 4.48, 0.53, 0.86, 0.29, 2.33]} \ No newline at end of file diff --git a/annotations_filtered/pizMaFdtY-s_filtered.json b/annotations_filtered/pizMaFdtY-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be4c995b7b60445743893dd577fcb6851455939c --- /dev/null +++ b/annotations_filtered/pizMaFdtY-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.55], [9.0, 9.26], [13.0, 13.83], [15.0, 15.5], [17.0, 18.06], [20.0, 19.6], [20.0, 20.95], [23.0, 23.73], [25.0, 25.49], [29.0, 29.47], [31.0, 31.65], [32.0, 33.32], [34.0, 36.56], [38.0, 40.39], [45.0, 45.47], [46.0, 47.49], [49.0, 51.02], [53.0, 53.11], [54.0, 55.41], [56.0, 57.15], [58.0, 59.86], [61.0, 65.67], [67.0, 67.73], [70.0, 72.54], [74.0, 81.14], [83.0, 89.65], [92.0, 93.68], [100.0, 101.29], [102.0, 102.95], [103.0, 103.45], [103.0, 103.72], [107.0, 109.58], [110.0, 112.13], [118.0, 118.64], [124.0, 126.12], [129.0, 129.68], [131.0, 130.96], [136.0, 136.43], [137.0, 137.93], [141.0, 176.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.13, 31.13, 0.0, 0.0, 32.62, 0.0, 0.0, 0.0, 0.0, 32.84, 0.0, 32.58, 32.49, 32.06, 0.0, 0.0, 0.0, 0.0, 0.0, 45.43, 49.82, 0.0, 35.93, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 61.18], ["hum", 7.33], ["throbbing", 5.64]], [["music", 68.11], ["electronic music", 4.22], ["guitar", 3.32]], null, null, [["music", 69.88], ["musical instrument", 4.99], ["electronic music", 3.9]], null, null, null, null, [["music", 34.01], ["throbbing", 17.79], ["hum", 6.88]], null, [["music", 68.52], ["electronic music", 9.29], ["hum", 2.36]], [["music", 37.35], ["hum", 24.71], ["throbbing", 15.65]], [["hum", 38.38], ["mains hum", 37.02], ["throbbing", 10.11]], null, null, null, null, null, [["music", 56.36], ["whale vocalization", 3.78], ["hum", 2.99]], [["music", 31.17], ["ambient music", 10.49], ["hum", 10.2]], null, [["music", 48.8], ["electronic music", 12.76], ["whale vocalization", 8.71]], null, null, null, null, null], "duration": [0.55, 0.26, 0.83, 0.5, 1.06, -0.4, 0.95, 0.73, 0.49, 0.47, 0.65, 1.32, 2.56, 2.39, 0.47, 1.49, 2.02, 0.11, 1.41, 1.15, 1.86, 4.67, 0.73, 2.54, 7.14, 6.65, 1.68, 1.29, 0.95, 0.45, 0.72, 2.58, 2.13, 0.64, 2.12, 0.68, -0.04, 0.43, 0.93, 35.59]} \ No newline at end of file diff --git a/annotations_filtered/pjF6bofXAvQ_filtered.json b/annotations_filtered/pjF6bofXAvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7980a3d6a95d5fcc7dfd6b9134e37bf1fa66321 --- /dev/null +++ b/annotations_filtered/pjF6bofXAvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.16], [0.0, 3.06], [10.0, 11.55], [22.0, 23.11], [24.0, 26.55], [30.0, 31.5], [34.0, 33.86], [46.0, 46.65], [49.0, 51.07], [55.0, 57.3], [59.0, 59.63], [67.0, 68.55], [70.0, 73.74], [79.0, 78.78], [83.0, 84.27], [98.0, 98.46], [101.0, 103.22], [106.0, 107.47], [109.0, 111.74], [112.0, 113.61], [127.0, 127.77], [130.0, 130.0], [131.0, 136.16], [137.0, 138.35], [144.0, 145.0], [149.0, 149.52], [152.0, 152.61], [155.0, 155.44], [158.0, 158.8], [161.0, 161.4], [163.0, 163.39], [164.0, 164.44]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 57.89, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 48.91, 37.84, 0.0, 0.0, 40.61, 0.0, 0.0, 0.0, 42.08, 0.0, 54.7, 0.0, 0.0, 0.0, 42.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 37.6], ["creak", 8.57], ["musical instrument", 3.78]], [["music", 40.7], ["breaking", 10.98], ["screaming", 9.05]], null, null, [["speech", 67.68], ["music", 7.79], ["breaking", 2.53]], null, null, null, [["music", 10.84], ["livestock, farm animals, working animals", 9.59], ["sheep", 8.17]], null, null, null, null, null, [["music", 43.43], ["screaming", 9.26], ["speech", 8.74]], null, null, null, null, null, null, null, null, null], "duration": [0.16, 3.06, 1.55, 1.11, 2.55, 1.5, -0.14, 0.65, 2.07, 2.3, 0.63, 1.55, 3.74, -0.22, 1.27, 0.46, 2.22, 1.47, 2.74, 1.61, 0.77, 0.0, 5.16, 1.35, 1.0, 0.52, 0.61, 0.44, 0.8, 0.4, 0.39, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/pjX20gL-rnc_filtered.json b/annotations_filtered/pjX20gL-rnc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..217b38211c65084b34fdf89e1f669fe49f17bed7 --- /dev/null +++ b/annotations_filtered/pjX20gL-rnc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.92], [9.0, 10.61], [23.0, 23.41], [27.0, 27.45], [29.0, 28.85], [36.0, 36.86], [40.0, 41.07], [42.0, 42.7], [46.0, 46.45], [48.0, 52.71], [55.0, 55.54], [56.0, 56.67], [63.0, 63.49], [66.0, 67.73], [69.0, 69.26], [77.0, 77.7], [82.0, 84.25], [85.0, 85.82], [88.0, 89.33], [92.0, 92.89], [100.0, 100.38], [105.0, 105.49], [107.0, 108.08], [109.0, 113.12], [114.0, 114.98], [116.0, 116.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.5, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 23.42], ["didgeridoo", 12.05], ["boing", 10.53]], null, null, null, null, null, null, [["gasp", 11.96], ["echo", 7.93], ["snort", 7.07]], null, null], "duration": [1.92, 1.61, 0.41, 0.45, -0.15, 0.86, 1.07, 0.7, 0.45, 4.71, 0.54, 0.67, 0.49, 1.73, 0.26, 0.7, 2.25, 0.82, 1.33, 0.89, 0.38, 0.49, 1.08, 4.12, 0.98, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/pjmRcGHqKZ0_filtered.json b/annotations_filtered/pjmRcGHqKZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecae4c33f98ffbcfd809e405c049d3d0f69ce630 --- /dev/null +++ b/annotations_filtered/pjmRcGHqKZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.13], [20.0, 20.92], [25.0, 25.19], [26.0, 26.42], [30.0, 31.89], [32.0, 61.1], [64.0, 83.67], [84.0, 90.29]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.47, 31.89, 59.33], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 50.47], ["hum", 12.63], ["mains hum", 3.83]], [["explosion", 44.52], ["speech", 25.7], ["burst, pop", 7.57]], null], "duration": [0.13, 0.92, 0.19, 0.42, 1.89, 29.1, 19.67, 6.29]} \ No newline at end of file diff --git a/annotations_filtered/pkfyn6mYlCg_filtered.json b/annotations_filtered/pkfyn6mYlCg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ecd83f838516b274ee9e8d81b46393a057fe099 --- /dev/null +++ b/annotations_filtered/pkfyn6mYlCg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.86], [23.0, 40.53], [44.0, 49.0], [52.0, 57.79], [58.0, 59.05], [63.0, 64.77], [66.0, 72.22], [73.0, 74.31], [76.0, 76.91], [78.0, 80.2], [81.0, 99.2], [100.0, 103.44], [104.0, 110.67], [112.0, 125.02], [126.0, 127.97], [131.0, 133.61]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, true, true, false, false, false], "silence_prob": [0.0, 33.53, 30.51, 30.6, 0.0, 0.0, 42.04, 0.0, 0.0, 41.32, 44.87, 40.93, 38.27, 31.09, 0.0, 30.14], "audiomae_on_audioset": [null, [["music", 69.86], ["didgeridoo", 5.24], ["speech", 5.23]], [["music", 72.43], ["groan", 7.0], ["didgeridoo", 6.84]], [["music", 52.98], ["groan", 17.48], ["whimper", 4.58]], null, null, [["music", 35.73], ["didgeridoo", 22.5], ["musical instrument", 8.44]], null, null, [["music", 59.58], ["synthesizer", 8.98], ["hum", 2.95]], [["music", 19.94], ["synthesizer", 12.8], ["hum", 6.45]], [["music", 22.3], ["whale vocalization", 14.14], ["mains hum", 10.59]], [["music", 36.02], ["synthesizer", 8.37], ["ambient music", 6.86]], [["music", 44.51], ["theremin", 21.99], ["ambient music", 10.45]], null, [["hum", 45.47], ["throbbing", 26.06], ["mains hum", 10.33]]], "duration": [0.86, 17.53, 5.0, 5.79, 1.05, 1.77, 6.22, 1.31, 0.91, 2.2, 18.2, 3.44, 6.67, 13.02, 1.97, 2.61]} \ No newline at end of file diff --git a/annotations_filtered/pkogDQ3CK9E_filtered.json b/annotations_filtered/pkogDQ3CK9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4702f308054e484980d805afdb9c09492cd45a3 --- /dev/null +++ b/annotations_filtered/pkogDQ3CK9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.62], [18.0, 18.91], [41.0, 42.62], [46.0, 47.7], [56.0, 59.14], [75.0, 75.39], [86.0, 89.9], [105.0, 108.45], [113.0, 113.43], [123.0, 124.12], [140.0, 142.1], [146.0, 151.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.81, 0.0, 31.75, 31.57, 0.0, 0.0, 31.11, 30.36], "audiomae_on_audioset": [null, null, null, null, [["music", 44.82], ["grunt", 28.06], ["synthesizer", 5.65]], null, [["music", 62.07], ["grunt", 5.63], ["sound effect", 3.88]], [["music", 40.34], ["throbbing", 20.88], ["hum", 18.53]], null, null, [["hum", 19.79], ["rumble", 13.2], ["music", 11.5]], [["music", 71.5], ["animal", 3.54], ["speech", 1.61]]], "duration": [1.62, 0.91, 1.62, 1.7, 3.14, 0.39, 3.9, 3.45, 0.43, 1.12, 2.1, 5.98]} \ No newline at end of file diff --git a/annotations_filtered/pkqyDC9YnfM_filtered.json b/annotations_filtered/pkqyDC9YnfM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cb43da0568cdf2928c5eef29c41e11dabfdcac1 --- /dev/null +++ b/annotations_filtered/pkqyDC9YnfM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[59.0, 58.89], [60.0, 71.42], [73.0, 74.11], [75.0, 79.54], [82.0, 85.23], [87.0, 88.32], [92.0, 114.35], [115.0, 122.28], [124.0, 137.27], [137.0, 137.3], [139.0, 142.82], [146.0, 146.45], [151.0, 152.31], [153.0, 153.84], [155.0, 175.39]], "keep_status": [false, true, false, false, true, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 35.3, 0.0, 35.2, 36.7, 0.0, 32.25, 33.23, 38.0, 0.0, 71.0, 0.0, 0.0, 0.0, 32.24], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 16.93], ["electric shaver, electric razor", 16.91], ["music", 11.09]], null, [["music", 62.64], ["didgeridoo", 10.0], ["musical instrument", 5.4]], [["music", 47.22], ["speech", 15.67], ["didgeridoo", 5.81]], null, [["speech", 67.19], ["music", 20.64], ["basketball bounce", 1.56]], [["mains hum", 33.87], ["hum", 20.97], ["speech", 12.81]], [["speech", 62.42], ["explosion", 9.23], ["hum", 5.01]], null, null, null, null, null, [["music", 50.73], ["fly, housefly", 6.66], ["animal", 5.72]]], "duration": [-0.11, 11.42, 1.11, 4.54, 3.23, 1.32, 22.35, 7.28, 13.27, 0.3, 3.82, 0.45, 1.31, 0.84, 20.39]} \ No newline at end of file diff --git a/annotations_filtered/pkwGEagSVT0_filtered.json b/annotations_filtered/pkwGEagSVT0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8cdf91906ae498a58ec0714d0c36881374908663 --- /dev/null +++ b/annotations_filtered/pkwGEagSVT0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 15.74], [18.0, 50.8], [52.0, 52.69], [68.0, 68.47], [92.0, 92.84], [97.0, 130.74]], "keep_status": [false, false, false, false, false, false], "silence_prob": [29.93, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 74.02], ["throbbing", 6.44], ["mantra", 4.13]], null, null, null, null, null], "duration": [12.74, 32.8, 0.69, 0.47, 0.84, 33.74]} \ No newline at end of file diff --git a/annotations_filtered/pkylHxUSxLM_filtered.json b/annotations_filtered/pkylHxUSxLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..644ebdcbd04af6c7d543c94ccd3440f95360d8ad --- /dev/null +++ b/annotations_filtered/pkylHxUSxLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.59], [8.0, 7.74], [9.0, 17.74], [20.0, 20.04], [22.0, 22.11], [24.0, 24.76], [28.0, 28.63], [29.0, 29.47], [31.0, 31.97], [32.0, 40.78], [42.0, 42.85], [45.0, 45.71], [47.0, 47.39], [49.0, 49.06], [53.0, 52.89], [53.0, 53.76], [55.0, 55.32], [58.0, 58.41], [60.0, 60.51], [65.0, 66.34], [68.0, 69.38], [71.0, 75.36], [76.0, 76.49], [77.0, 80.54], [81.0, 83.79], [85.0, 86.85], [88.0, 92.18], [93.0, 105.85], [107.0, 108.4], [110.0, 116.48], [118.0, 119.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 90.25, 0.0, 100.0, 100.0, 0.0, 93.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.59, -0.26, 8.74, 0.04, 0.11, 0.76, 0.63, 0.47, 0.97, 8.78, 0.85, 0.71, 0.39, 0.06, -0.11, 0.76, 0.32, 0.41, 0.51, 1.34, 1.38, 4.36, 0.49, 3.54, 2.79, 1.85, 4.18, 12.85, 1.4, 6.48, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/pl7JzW6eGZg_filtered.json b/annotations_filtered/pl7JzW6eGZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9612fa865ea34e116fa65a14f9cfb47d33998fbe --- /dev/null +++ b/annotations_filtered/pl7JzW6eGZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 36.48], [37.0, 37.79], [38.0, 39.61]], "keep_status": [false, false, false], "silence_prob": [52.22, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [5.48, 0.79, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/plUXguATsTQ_filtered.json b/annotations_filtered/plUXguATsTQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6dd238a110e68a35e34d1d982b066150f9ce7719 --- /dev/null +++ b/annotations_filtered/plUXguATsTQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.99], [7.0, 8.07], [12.0, 24.48], [27.0, 87.81], [95.0, 107.62], [109.0, 109.19], [110.0, 154.5]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.03, 0.0, 34.15, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 76.94], ["guitar", 2.17], ["bass guitar", 1.97]], null, [["music", 77.96], ["sidetone", 4.29], ["speech", 2.14]], null, null], "duration": [1.99, 1.07, 12.48, 60.81, 12.62, 0.19, 44.5]} \ No newline at end of file diff --git a/annotations_filtered/plcl4YShR5Q_filtered.json b/annotations_filtered/plcl4YShR5Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4087b4ac07a41a9e4dbd67ee07bc76e83c4cfcb5 --- /dev/null +++ b/annotations_filtered/plcl4YShR5Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.78], [25.0, 25.89], [27.0, 28.0], [29.0, 30.74], [33.0, 33.05], [35.0, 44.78], [46.0, 46.68], [51.0, 56.07], [65.0, 71.12], [74.0, 74.46], [75.0, 81.33], [83.0, 84.2], [86.0, 87.44], [93.0, 95.08], [96.0, 96.6], [98.0, 106.59], [109.0, 114.84], [118.0, 150.53]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.43, 0.0, 29.2, 37.27, 0.0, 32.97, 0.0, 0.0, 67.51, 0.0, 31.21, 46.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 48.71], ["hum", 19.94], ["mains hum", 7.43]], null, [["speech", 61.52], ["gunshot, gunfire", 14.62], ["explosion", 8.33]], [["music", 21.86], ["hum", 13.02], ["throbbing", 8.19]], null, [["speech", 17.41], ["hum", 17.09], ["mains hum", 8.69]], null, null, null, null, [["mains hum", 63.65], ["hum", 29.05], ["speech", 1.38]], [["music", 28.81], ["hum", 15.91], ["mains hum", 6.17]], null], "duration": [0.78, 0.89, 1.0, 1.74, 0.05, 9.78, 0.68, 5.07, 6.12, 0.46, 6.33, 1.2, 1.44, 2.08, 0.6, 8.59, 5.84, 32.53]} \ No newline at end of file diff --git a/annotations_filtered/plovZLxlpGk_filtered.json b/annotations_filtered/plovZLxlpGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58094fd26a0dc8527ab382bde170651416fe1e48 --- /dev/null +++ b/annotations_filtered/plovZLxlpGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.86], [33.0, 34.15], [35.0, 35.14], [41.0, 44.85], [74.0, 75.74], [88.0, 91.13], [95.0, 97.87], [107.0, 107.38], [108.0, 125.05], [127.0, 127.62]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 52.51, 0.0, 95.51, 94.07, 0.0, 43.48, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 29.47], ["music", 16.93], ["bee, wasp, etc.", 11.6]], null], "duration": [0.86, 1.15, 0.14, 3.85, 1.74, 3.13, 2.87, 0.38, 17.05, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/plqzeUB9B-w_filtered.json b/annotations_filtered/plqzeUB9B-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/plqzeUB9B-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/plu5YA3t2l8_filtered.json b/annotations_filtered/plu5YA3t2l8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cb6526bcbb08c47cd8543880c481e48acd092ec --- /dev/null +++ b/annotations_filtered/plu5YA3t2l8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 26.33], [27.0, 69.62]], "keep_status": [false, false], "silence_prob": [32.91, 0.0], "audiomae_on_audioset": [[["music", 54.68], ["singing bowl", 10.04], ["ambient music", 6.32]], null], "duration": [19.33, 42.62]} \ No newline at end of file diff --git a/annotations_filtered/pm7LihLP7kQ_filtered.json b/annotations_filtered/pm7LihLP7kQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf02871a3cd2c1e47aeaf935db8b5d824ccf601c --- /dev/null +++ b/annotations_filtered/pm7LihLP7kQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.73], [6.0, 13.58], [14.0, 18.81], [20.0, 20.31], [21.0, 23.38], [25.0, 27.45], [28.0, 28.41], [29.0, 30.87], [32.0, 33.49], [35.0, 37.72], [38.0, 40.42], [42.0, 43.6], [44.0, 44.91], [47.0, 53.2], [54.0, 55.9], [57.0, 57.55], [61.0, 60.98], [66.0, 66.66], [70.0, 71.09], [74.0, 75.03], [93.0, 94.14], [95.0, 98.66], [100.0, 103.08], [108.0, 110.93], [112.0, 114.29], [119.0, 120.55], [124.0, 124.23], [129.0, 128.9], [134.0, 136.51], [142.0, 144.24], [145.0, 145.91], [148.0, 151.68], [153.0, 153.6], [154.0, 156.27], [158.0, 159.09], [163.0, 162.78], [163.0, 163.05], [164.0, 164.76], [165.0, 166.78], [168.0, 168.72], [169.0, 170.55], [171.0, 173.03], [173.0, 174.48], [176.0, 176.35], [179.0, 181.33], [182.0, 185.13]], "keep_status": [false, true, true, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 48.44, 44.96, 0.0, 50.21, 57.32, 0.0, 0.0, 0.0, 44.43, 84.62, 0.0, 0.0, 44.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.44, 97.73, 56.4, 49.54, 0.0, 0.0, 0.0, 56.4, 99.4, 0.0, 56.55, 0.0, 42.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 38.19, 43.13], "audiomae_on_audioset": [null, [["speech", 34.71], ["cattle, bovinae", 17.5], ["livestock, farm animals, working animals", 11.47]], [["speech", 52.73], ["telephone", 9.24], ["inside, small room", 7.7]], null, null, null, null, null, null, [["dial tone", 9.44], ["hum", 9.27], ["tuning fork", 8.93]], null, null, null, [["gasp", 21.98], ["speech", 19.65], ["sigh", 13.96]], null, null, null, null, null, null, null, null, null, null, [["crow", 21.63], ["caw", 11.44], ["gasp", 7.59]], null, null, null, null, null, null, null, null, [["speech", 36.11], ["sine wave", 26.17], ["chirp tone", 13.4]], null, null, null, null, null, null, null, null, null, null, [["speech", 45.44], ["sidetone", 10.48], ["chirp tone", 5.51]], [["speech", 52.29], ["sidetone", 25.63], ["telephone", 3.63]]], "duration": [1.73, 7.58, 4.81, 0.31, 2.38, 2.45, 0.41, 1.87, 1.49, 2.72, 2.42, 1.6, 0.91, 6.2, 1.9, 0.55, -0.02, 0.66, 1.09, 1.03, 1.14, 3.66, 3.08, 2.93, 2.29, 1.55, 0.23, -0.1, 2.51, 2.24, 0.91, 3.68, 0.6, 2.27, 1.09, -0.22, 0.05, 0.76, 1.78, 0.72, 1.55, 2.03, 1.48, 0.35, 2.33, 3.13]} \ No newline at end of file diff --git a/annotations_filtered/pmAZlEkONa0_filtered.json b/annotations_filtered/pmAZlEkONa0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..347fcb800e5696bb7cbd9b7c3aaa04c557362439 --- /dev/null +++ b/annotations_filtered/pmAZlEkONa0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 38.16], [38.0, 40.32], [44.0, 45.84], [46.0, 47.48], [52.0, 52.98], [56.0, 57.11], [58.0, 73.45], [75.0, 78.66], [79.0, 78.98], [79.0, 85.53], [86.0, 87.4], [89.0, 93.72], [94.0, 95.44], [97.0, 98.76], [100.0, 100.09], [101.0, 103.82], [105.0, 128.75], [134.0, 134.67], [136.0, 136.95], [138.0, 150.55]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 40.79, 0.0, 0.0, 0.0, 0.0, 31.02, 30.56, 0.0, 31.39, 0.0, 36.52, 0.0, 0.0, 0.0, 36.49, 30.18, 0.0, 0.0, 29.49], "audiomae_on_audioset": [null, [["music", 26.38], ["didgeridoo", 11.54], ["mains hum", 11.01]], null, null, null, null, [["music", 62.34], ["hum", 7.49], ["throbbing", 7.35]], [["music", 34.07], ["speech", 20.85], ["fart", 18.37]], null, [["music", 51.76], ["throbbing", 6.84], ["breaking", 4.87]], null, [["music", 27.78], ["hum", 12.13], ["noise", 10.84]], null, null, null, [["music", 30.26], ["didgeridoo", 19.17], ["mains hum", 12.86]], [["music", 19.51], ["hum", 15.51], ["speech", 11.73]], null, null, [["speech", 17.36], ["music", 16.74], ["hum", 11.45]]], "duration": [30.16, 2.32, 1.84, 1.48, 0.98, 1.11, 15.45, 3.66, -0.02, 6.53, 1.4, 4.72, 1.44, 1.76, 0.09, 2.82, 23.75, 0.67, 0.95, 12.55]} \ No newline at end of file diff --git a/annotations_filtered/pmC3rsgHD9E_filtered.json b/annotations_filtered/pmC3rsgHD9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..558455e8bd4726fb7376bdd7694ddd646fed6d7e --- /dev/null +++ b/annotations_filtered/pmC3rsgHD9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 46.7], [54.0, 56.17], [57.0, 58.33], [61.0, 62.11], [63.0, 64.15], [65.0, 66.18], [67.0, 69.03], [75.0, 77.48], [79.0, 80.4], [82.0, 82.71], [88.0, 89.16], [90.0, 98.46], [102.0, 104.21], [107.0, 108.46], [109.0, 111.38], [112.0, 113.12], [114.0, 115.3], [116.0, 121.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 40.95, 100.0, 0.0, 0.0, 0.0, 84.07, 99.36, 0.0, 64.18, 0.0, 0.0, 86.64], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 67.57], ["fart", 3.19], ["animal", 3.07]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.7, 2.17, 1.33, 1.11, 1.15, 1.18, 2.03, 2.48, 1.4, 0.71, 1.16, 8.46, 2.21, 1.46, 2.38, 1.12, 1.3, 5.68]} \ No newline at end of file diff --git a/annotations_filtered/pmLP0QQPqFw_filtered.json b/annotations_filtered/pmLP0QQPqFw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f09eb9ff8216ec6f6d60980b9c4ef2853427de60 --- /dev/null +++ b/annotations_filtered/pmLP0QQPqFw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.77], [11.0, 29.59]], "keep_status": [true, true], "silence_prob": [33.02, 31.47], "audiomae_on_audioset": [[["music", 33.18], ["explosion", 22.22], ["hum", 4.33]], [["music", 26.2], ["hum", 12.57], ["cacophony", 8.91]]], "duration": [2.77, 18.59]} \ No newline at end of file diff --git a/annotations_filtered/pmqBmTWq420_filtered.json b/annotations_filtered/pmqBmTWq420_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2183d317a013d49d8e2c9a5089fc90327a652fc1 --- /dev/null +++ b/annotations_filtered/pmqBmTWq420_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.8], [16.0, 16.41], [21.0, 22.23], [29.0, 31.6], [38.0, 38.21], [38.0, 38.26], [38.0, 39.56], [42.0, 52.96], [56.0, 58.26], [67.0, 71.19], [78.0, 87.83], [90.0, 91.47], [95.0, 95.99], [99.0, 101.92], [110.0, 110.03], [121.0, 123.33], [128.0, 129.52], [132.0, 136.71], [145.0, 145.94], [149.0, 150.97], [153.0, 153.5]], "keep_status": [false, false, false, false, false, false, false, true, true, true, true, false, false, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.22, 0.0, 0.0, 0.0, 28.62, 28.52, 28.6, 28.71, 0.0, 0.0, 28.89, 0.0, 44.34, 0.0, 30.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["livestock, farm animals, working animals", 58.89], ["cattle, bovinae", 20.69], ["moo", 10.59]], null, null, null, [["speech", 26.95], ["music", 15.14], ["explosion", 11.22]], [["speech", 16.25], ["mains hum", 14.88], ["fly, housefly", 9.04]], [["speech", 20.25], ["insect", 16.29], ["fly, housefly", 11.17]], [["music", 61.46], ["buzz", 5.64], ["didgeridoo", 2.71]], null, null, [["music", 48.18], ["groan", 4.44], ["didgeridoo", 4.34]], null, [["music", 49.31], ["speech", 9.68], ["sine wave", 8.15]], null, [["speech", 51.54], ["music", 8.85], ["electric shaver, electric razor", 6.42]], null, null, null], "duration": [0.8, 0.41, 1.23, 2.6, 0.21, 0.26, 1.56, 10.96, 2.26, 4.19, 9.83, 1.47, 0.99, 2.92, 0.03, 2.33, 1.52, 4.71, 0.94, 1.97, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/pnTtzyItCQA_filtered.json b/annotations_filtered/pnTtzyItCQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2ed6d2e1f64826d8128635eece88610b5ebf3f0 --- /dev/null +++ b/annotations_filtered/pnTtzyItCQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.06], [10.0, 23.23], [25.0, 25.46], [26.0, 29.0], [31.0, 31.4], [45.0, 45.32], [47.0, 47.22], [48.0, 78.44], [82.0, 103.18], [109.0, 108.87], [109.0, 109.04], [111.0, 112.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.16, 0.0, 47.74, 0.0, 0.0, 0.0, 0.0, 31.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 34.86], ["music", 33.78], ["animal", 3.83]], null, [["music", 65.75], ["musical instrument", 4.94], ["theremin", 2.63]], null, null, null, null, [["music", 49.98], ["didgeridoo", 13.73], ["theremin", 9.07]], null, null, null], "duration": [1.06, 13.23, 0.46, 3.0, 0.4, 0.32, 0.22, 30.44, 21.18, -0.13, 0.04, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/pnaWqq2eRcc_filtered.json b/annotations_filtered/pnaWqq2eRcc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc9b163855292f1a85c83ef5a6b07d35f47a7a60 --- /dev/null +++ b/annotations_filtered/pnaWqq2eRcc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.61], [15.0, 21.68], [35.0, 37.69], [48.0, 48.07], [49.0, 50.79], [60.0, 68.86], [71.0, 82.02], [91.0, 92.3], [94.0, 94.59], [99.0, 105.54], [106.0, 110.56], [113.0, 113.81], [115.0, 124.04], [137.0, 137.37], [144.0, 144.48], [149.0, 149.86], [155.0, 158.5], [165.0, 169.72]], "keep_status": [false, true, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 38.35, 56.18, 0.0, 0.0, 31.39, 37.57, 0.0, 0.0, 39.94, 43.1, 0.0, 38.49, 0.0, 0.0, 0.0, 33.71, 32.3], "audiomae_on_audioset": [null, [["telephone bell ringing", 14.98], ["telephone", 14.05], ["speech", 13.14]], null, null, null, [["music", 45.02], ["speech", 21.7], ["musical instrument", 4.07]], [["speech", 60.01], ["music", 17.44], ["fart", 4.48]], null, null, [["music", 41.3], ["theremin", 23.12], ["hum", 4.81]], [["music", 50.52], ["speech", 4.25], ["synthesizer", 4.18]], null, [["music", 44.39], ["telephone", 11.78], ["speech", 9.01]], null, null, null, [["music", 63.71], ["thunk", 21.03], ["crack", 2.31]], [["music", 51.31], ["theremin", 5.04], ["musical instrument", 4.74]]], "duration": [-0.39, 6.68, 2.69, 0.07, 1.79, 8.86, 11.02, 1.3, 0.59, 6.54, 4.56, 0.81, 9.04, 0.37, 0.48, 0.86, 3.5, 4.72]} \ No newline at end of file diff --git a/annotations_filtered/pnvy9q4UpZw_filtered.json b/annotations_filtered/pnvy9q4UpZw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d03bec3f13ab08ffb3542d5509bbd442e95e8ced --- /dev/null +++ b/annotations_filtered/pnvy9q4UpZw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.04], [5.0, 6.96], [7.0, 9.98], [11.0, 11.94], [14.0, 22.15], [23.0, 23.68], [44.0, 45.64], [50.0, 50.41], [55.0, 56.1], [57.0, 59.09], [61.0, 61.96], [63.0, 63.12], [64.0, 66.33], [84.0, 84.72], [86.0, 87.22], [89.0, 90.59], [94.0, 98.17], [101.0, 101.19]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [97.43, 0.0, 42.0, 0.0, 45.59, 0.0, 0.0, 0.0, 0.0, 99.52, 0.0, 0.0, 60.89, 0.0, 0.0, 0.0, 33.51, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 21.42], ["heart sounds, heartbeat", 18.49], ["speech", 16.91]], null, [["speech", 48.47], ["dog", 8.71], ["animal", 7.7]], null, null, null, null, null, null, null, null, null, null, null, [["music", 55.75], ["synthesizer", 3.85], ["musical instrument", 3.82]], null], "duration": [2.04, 1.96, 2.98, 0.94, 8.15, 0.68, 1.64, 0.41, 1.1, 2.09, 0.96, 0.12, 2.33, 0.72, 1.22, 1.59, 4.17, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/po0Gj897Tmk_filtered.json b/annotations_filtered/po0Gj897Tmk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52d8aa7fec272913bbdb203e958892ae34d8d595 --- /dev/null +++ b/annotations_filtered/po0Gj897Tmk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.59], [7.0, 7.84], [11.0, 19.7], [20.0, 20.56], [29.0, 29.49], [34.0, 34.26], [52.0, 53.94], [55.0, 55.97], [56.0, 57.16], [65.0, 65.7], [68.0, 72.99], [80.0, 83.42], [87.0, 94.47], [99.0, 112.43], [113.0, 123.47], [124.0, 125.85], [128.0, 147.93], [152.0, 152.27]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 44.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.78, 36.23, 34.57, 30.78, 30.21, 0.0, 31.92, 0.0], "audiomae_on_audioset": [null, null, [["music", 12.55], ["telephone dialing, dtmf", 12.42], ["speech", 12.37]], null, null, null, null, null, null, null, [["music", 36.67], ["throbbing", 22.14], ["hum", 14.44]], [["throbbing", 21.21], ["speech", 17.28], ["hum", 14.81]], [["throbbing", 35.38], ["music", 26.39], ["hum", 16.38]], [["hum", 23.61], ["gong", 17.55], ["music", 17.32]], [["music", 36.05], ["gong", 26.52], ["ambient music", 9.68]], null, [["music", 48.59], ["noise", 8.73], ["hum", 7.04]], null], "duration": [0.59, 0.84, 8.7, 0.56, 0.49, 0.26, 1.94, 0.97, 1.16, 0.7, 4.99, 3.42, 7.47, 13.43, 10.47, 1.85, 19.93, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/poAxbGphYmA_filtered.json b/annotations_filtered/poAxbGphYmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68c0a3c3648772bdbab21c9554c8ff8ee313212f --- /dev/null +++ b/annotations_filtered/poAxbGphYmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.19], [4.0, 4.38], [9.0, 9.49], [19.0, 19.6], [28.0, 28.48], [36.0, 110.07]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.19, 0.38, 0.49, 0.6, 0.48, 74.07]} \ No newline at end of file diff --git a/annotations_filtered/poTqVcSgFRE_filtered.json b/annotations_filtered/poTqVcSgFRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09486fde35d0080283da62ff71ece04c9e2f064f --- /dev/null +++ b/annotations_filtered/poTqVcSgFRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [2.0, 2.94], [4.0, 4.95], [7.0, 7.69], [9.0, 10.96], [12.0, 13.32], [15.0, 15.55], [16.0, 17.9], [21.0, 22.42], [36.0, 37.59], [46.0, 47.39], [61.0, 61.42], [64.0, 65.58], [72.0, 73.13], [76.0, 78.04], [80.0, 80.4], [82.0, 83.73], [87.0, 87.25], [98.0, 98.34], [100.0, 100.3], [104.0, 104.6], [106.0, 106.2], [107.0, 107.91], [110.0, 110.47], [113.0, 112.67], [114.0, 122.18], [123.0, 123.92], [125.0, 125.96], [143.0, 144.44], [151.0, 151.09], [164.0, 165.35], [168.0, 168.03], [171.0, 170.85], [172.0, 173.11], [176.0, 177.45], [180.0, 181.11], [183.0, 183.59], [193.0, 194.43], [203.0, 204.53], [205.0, 205.46], [206.0, 206.15], [207.0, 208.47], [209.0, 210.81], [213.0, 213.36], [217.0, 217.43], [218.0, 220.13], [223.0, 224.16], [226.0, 226.61], [230.0, 230.1], [231.0, 232.5], [234.0, 235.84], [242.0, 243.68], [244.0, 245.37], [246.0, 249.18], [250.0, 251.18], [253.0, 254.2], [257.0, 259.78], [260.0, 261.22], [262.0, 264.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 99.31, 0.0, 97.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.94, 0.95, 0.69, 1.96, 1.32, 0.55, 1.9, 1.42, 1.59, 1.39, 0.42, 1.58, 1.13, 2.04, 0.4, 1.73, 0.25, 0.34, 0.3, 0.6, 0.2, 0.91, 0.47, -0.33, 8.18, 0.92, 0.96, 1.44, 0.09, 1.35, 0.03, -0.15, 1.11, 1.45, 1.11, 0.59, 1.43, 1.53, 0.46, 0.15, 1.47, 1.81, 0.36, 0.43, 2.13, 1.16, 0.61, 0.1, 1.5, 1.84, 1.68, 1.37, 3.18, 1.18, 1.2, 2.78, 1.22, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/poU8QxFJjbo_filtered.json b/annotations_filtered/poU8QxFJjbo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..375b908f5784cfe88aef591726f8c962555b9876 --- /dev/null +++ b/annotations_filtered/poU8QxFJjbo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 42.84], [44.0, 45.6], [46.0, 66.21], [68.0, 67.93], [69.0, 70.33], [72.0, 108.18], [109.0, 109.59], [112.0, 166.43], [167.0, 169.32], [170.0, 171.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 28.98, 0.0, 0.0, 0.0, 0.0, 0.0, 56.86, 0.0], "audiomae_on_audioset": [null, null, [["music", 81.4], ["hum", 2.51], ["electronic music", 1.78]], null, null, null, null, null, null, null], "duration": [40.84, 1.6, 20.21, -0.07, 1.33, 36.18, 0.59, 54.43, 2.32, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/pobSophb2UE_filtered.json b/annotations_filtered/pobSophb2UE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..263b411ddf84ae693b174e167c16a0e4b832e5fa --- /dev/null +++ b/annotations_filtered/pobSophb2UE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.12], [3.0, 4.75], [6.0, 6.32], [6.0, 6.49], [13.0, 14.27], [16.0, 16.97], [18.0, 18.49], [20.0, 20.12], [24.0, 23.95], [26.0, 29.71], [30.0, 31.4], [33.0, 33.79], [36.0, 36.34], [37.0, 37.81], [43.0, 44.37], [47.0, 48.56], [50.0, 50.58], [52.0, 52.83], [54.0, 55.85], [57.0, 59.05]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 24.51], ["throbbing", 12.55], ["music", 8.74]], null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 1.75, 0.32, 0.49, 1.27, 0.97, 0.49, 0.12, -0.05, 3.71, 1.4, 0.79, 0.34, 0.81, 1.37, 1.56, 0.58, 0.83, 1.85, 2.05]} \ No newline at end of file diff --git a/annotations_filtered/poswRRB_2i0_filtered.json b/annotations_filtered/poswRRB_2i0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0539aecb10e696cfeaa13dec41e32d7b119b592b --- /dev/null +++ b/annotations_filtered/poswRRB_2i0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.21], [11.0, 11.55], [16.0, 22.0], [23.0, 24.19], [27.0, 29.96], [38.0, 45.27], [48.0, 51.41], [52.0, 58.45], [59.0, 61.96], [65.0, 67.49], [76.0, 77.89], [78.0, 78.39], [81.0, 81.09], [81.0, 85.02], [86.0, 86.36], [88.0, 87.86], [93.0, 96.33], [99.0, 109.11], [111.0, 121.47], [123.0, 126.52], [129.0, 129.66], [131.0, 131.6], [134.0, 134.91], [136.0, 138.28], [142.0, 150.28], [159.0, 160.0], [165.0, 166.8], [168.0, 168.69], [170.0, 170.95], [173.0, 173.57], [179.0, 178.6], [179.0, 179.07], [180.0, 180.17], [181.0, 184.45], [185.0, 185.18], [186.0, 186.56], [193.0, 193.46], [195.0, 196.05], [197.0, 205.68], [209.0, 208.8], [213.0, 213.76], [231.0, 230.79], [231.0, 233.25], [238.0, 240.44], [242.0, 243.19], [244.0, 259.01], [259.0, 261.6], [264.0, 268.74], [271.0, 280.4]], "keep_status": [true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false], "silence_prob": [44.07, 0.0, 44.63, 0.0, 44.32, 49.45, 39.52, 38.83, 55.6, 45.95, 0.0, 0.0, 0.0, 52.56, 0.0, 0.0, 54.76, 67.0, 68.93, 72.01, 0.0, 0.0, 0.0, 57.09, 70.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.5, 0.0, 0.0, 0.0, 0.0, 30.57, 0.0, 0.0, 0.0, 35.14, 39.67, 0.0, 32.44, 37.27, 32.42, 32.21], "audiomae_on_audioset": [[["music", 27.74], ["humming", 7.4], ["theremin", 5.93]], null, [["music", 38.46], ["carnatic music", 8.44], ["vocal music", 8.03]], null, [["music", 33.92], ["humming", 10.02], ["chant", 8.67]], [["music", 66.32], ["carnatic music", 10.55], ["singing", 2.17]], [["music", 75.82], ["singing", 3.35], ["humming", 1.98]], [["music", 46.47], ["speech", 20.45], ["boing", 6.61]], null, [["music", 73.24], ["singing", 1.34], ["song", 1.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 71.03], ["singing", 2.87], ["gospel music", 2.03]], null, null, null, null, [["music", 79.87], ["carnatic music", 3.17], ["singing", 2.62]], null, null, null, [["music", 29.38], ["burping, eructation", 16.06], ["guitar", 4.99]], [["music", 61.27], ["quack", 4.87], ["synthesizer", 2.2]], null, [["music", 89.46], ["singing", 1.18], ["musical instrument", 0.88]], [["music", 35.39], ["guitar", 8.41], ["plucked string instrument", 6.17]], [["music", 76.37], ["gospel music", 1.87], ["carnatic music", 1.84]], [["music", 81.99], ["singing", 2.34], ["musical instrument", 1.98]]], "duration": [4.21, 0.55, 6.0, 1.19, 2.96, 7.27, 3.41, 6.45, 2.96, 2.49, 1.89, 0.39, 0.09, 4.02, 0.36, -0.14, 3.33, 10.11, 10.47, 3.52, 0.66, 0.6, 0.91, 2.28, 8.28, 1.0, 1.8, 0.69, 0.95, 0.57, -0.4, 0.07, 0.17, 3.45, 0.18, 0.56, 0.46, 1.05, 8.68, -0.2, 0.76, -0.21, 2.25, 2.44, 1.19, 15.01, 2.6, 4.74, 9.4]} \ No newline at end of file diff --git a/annotations_filtered/ppGd-2nEOVQ_filtered.json b/annotations_filtered/ppGd-2nEOVQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e9c53be392435b7b2a9ac299b70d39ad4cefa0d --- /dev/null +++ b/annotations_filtered/ppGd-2nEOVQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.38], [8.0, 8.48], [10.0, 10.3], [12.0, 12.72], [14.0, 15.67], [20.0, 22.49], [26.0, 25.93], [31.0, 31.63], [37.0, 37.56], [39.0, 39.73], [41.0, 41.67], [43.0, 44.27], [47.0, 47.39], [49.0, 50.33], [52.0, 53.47], [56.0, 57.33], [61.0, 63.9], [64.0, 65.11], [67.0, 74.29], [76.0, 78.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.41, 0.0, 35.79, 34.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["rumble", 33.38], ["whale vocalization", 12.79], ["gong", 5.86]], null, [["hum", 63.82], ["throbbing", 22.77], ["mains hum", 5.91]], [["music", 18.79], ["vehicle", 9.42], ["rumble", 5.66]]], "duration": [0.38, 0.48, 0.3, 0.72, 1.67, 2.49, -0.07, 0.63, 0.56, 0.73, 0.67, 1.27, 0.39, 1.33, 1.47, 1.33, 2.9, 1.11, 7.29, 2.56]} \ No newline at end of file diff --git a/annotations_filtered/ppWi_bhS2eQ_filtered.json b/annotations_filtered/ppWi_bhS2eQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..931059077a255fd5c5c3da2764b117390e2d6486 --- /dev/null +++ b/annotations_filtered/ppWi_bhS2eQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [6.0, 7.28], [8.0, 8.13], [10.0, 10.27], [16.0, 16.53], [29.0, 29.22], [30.0, 32.7], [36.0, 38.23], [41.0, 44.1], [49.0, 49.37], [50.0, 51.56], [53.0, 53.11], [55.0, 55.76], [58.0, 58.41], [61.0, 61.91], [64.0, 64.96], [70.0, 70.92], [77.0, 77.16], [79.0, 88.8], [97.0, 99.32], [100.0, 104.77], [108.0, 108.28]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.99, 58.55, 42.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.12, 64.18, 31.85, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 44.08], ["music", 37.38], ["hum", 2.51]], null, [["frog", 20.04], ["hum", 13.52], ["mains hum", 11.13]], null, null, null, null, null, null, null, null, null, [["music", 20.6], ["speech", 13.83], ["fart", 12.94]], null, [["sound effect", 49.32], ["music", 10.18], ["whoosh, swoosh, swish", 4.95]], null], "duration": [0.57, 1.28, 0.13, 0.27, 0.53, 0.22, 2.7, 2.23, 3.1, 0.37, 1.56, 0.11, 0.76, 0.41, 0.91, 0.96, 0.92, 0.16, 9.8, 2.32, 4.77, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/ppjyB2MpxBU_filtered.json b/annotations_filtered/ppjyB2MpxBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5c0bab5f0699d90b7cf9d11c5161168ec81f279 --- /dev/null +++ b/annotations_filtered/ppjyB2MpxBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.65], [5.0, 8.95], [11.0, 19.9], [21.0, 32.12], [33.0, 67.78], [71.0, 86.66], [87.0, 90.26], [92.0, 92.67], [94.0, 96.6], [98.0, 100.8], [102.0, 102.59], [104.0, 105.46], [107.0, 108.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 80.64, 60.7, 97.92, 0.0, 97.0, 88.1, 0.0, 100.0, 99.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 3.95, 8.9, 11.12, 34.78, 15.66, 3.26, 0.67, 2.6, 2.8, 0.59, 1.46, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/pppK-fl9a2E_filtered.json b/annotations_filtered/pppK-fl9a2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dd92b9f1f60822e1d02c104ca33689b5ad2a063 --- /dev/null +++ b/annotations_filtered/pppK-fl9a2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.75], [4.0, 5.66], [7.0, 8.23], [9.0, 9.58], [11.0, 13.73], [15.0, 16.55], [17.0, 20.6], [22.0, 22.18], [22.0, 23.45], [42.0, 41.89], [44.0, 47.09], [48.0, 51.26], [54.0, 55.26], [56.0, 56.34], [69.0, 69.79], [75.0, 75.66], [76.0, 79.41], [80.0, 83.05], [85.0, 85.16], [87.0, 95.28], [97.0, 97.58], [103.0, 103.47], [107.0, 106.98], [117.0, 118.22], [126.0, 127.26], [134.0, 133.81], [134.0, 134.76], [136.0, 137.15], [138.0, 138.5], [140.0, 141.84], [145.0, 145.3], [147.0, 147.56], [149.0, 149.15], [150.0, 150.58]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.9, 0.0, 38.67, 0.0, 0.0, 0.0, 30.78, 28.64, 0.0, 0.0, 0.0, 0.0, 36.75, 33.12, 0.0, 33.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 25.65], ["quack", 7.48], ["croak", 6.29]], null, [["speech", 37.21], ["music", 30.06], ["hum", 3.74]], null, null, null, [["music", 62.8], ["theremin", 7.61], ["ambient music", 7.31]], [["thunk", 27.51], ["whack, thwack", 17.88], ["music", 10.35]], null, null, null, null, [["hum", 21.38], ["music", 19.78], ["mains hum", 15.55]], [["speech", 45.5], ["sidetone", 25.18], ["telephone", 11.9]], null, [["music", 69.87], ["synthesizer", 7.0], ["musical instrument", 5.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.25, 1.66, 1.23, 0.58, 2.73, 1.55, 3.6, 0.18, 1.45, -0.11, 3.09, 3.26, 1.26, 0.34, 0.79, 0.66, 3.41, 3.05, 0.16, 8.28, 0.58, 0.47, -0.02, 1.22, 1.26, -0.19, 0.76, 1.15, 0.5, 1.84, 0.3, 0.56, 0.15, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/pq9dj2Q6edw_filtered.json b/annotations_filtered/pq9dj2Q6edw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91879429e2006e9fa693a33ba4f8b6443348c198 --- /dev/null +++ b/annotations_filtered/pq9dj2Q6edw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.43], [14.0, 28.66], [30.0, 33.1], [34.0, 41.96], [43.0, 44.81], [47.0, 52.39], [54.0, 56.71], [59.0, 60.89], [62.0, 65.31], [68.0, 70.92], [73.0, 74.19], [77.0, 79.98], [89.0, 91.5], [96.0, 99.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.37, 80.82, 93.6, 77.2, 0.0, 87.19, 90.43, 0.0, 60.98, 78.89, 0.0, 96.89, 64.18, 84.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.43, 14.66, 3.1, 7.96, 1.81, 5.39, 2.71, 1.89, 3.31, 2.92, 1.19, 2.98, 2.5, 3.27]} \ No newline at end of file diff --git a/annotations_filtered/pqDU_EJrb2g_filtered.json b/annotations_filtered/pqDU_EJrb2g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a455635eb8fed626176b8c4242c4c503a5bac827 --- /dev/null +++ b/annotations_filtered/pqDU_EJrb2g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 30.01], [30.0, 31.56], [37.0, 46.45], [47.0, 48.19], [53.0, 130.33]], "keep_status": [false, false, false, false, false], "silence_prob": [41.09, 0.0, 52.16, 0.0, 0.0], "audiomae_on_audioset": [[["music", 69.24], ["speech", 5.69], ["throbbing", 3.22]], null, null, null, null], "duration": [7.01, 1.56, 9.45, 1.19, 77.33]} \ No newline at end of file diff --git a/annotations_filtered/pqLAni94IEI_filtered.json b/annotations_filtered/pqLAni94IEI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f2e6c43256557608382e5616bbf7d96f30e14a7 --- /dev/null +++ b/annotations_filtered/pqLAni94IEI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.22], [11.0, 14.08], [16.0, 17.81], [20.0, 24.97], [26.0, 29.88], [33.0, 36.61], [37.0, 40.49], [42.0, 48.81], [51.0, 89.09], [90.0, 92.62], [93.0, 92.94]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [62.68, 58.47, 0.0, 54.7, 52.92, 50.56, 38.72, 42.24, 0.0, 31.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 51.45], ["hum", 9.04], ["whale vocalization", 4.65]], [["hum", 43.57], ["mains hum", 16.45], ["heart sounds, heartbeat", 6.22]], null, [["music", 62.69], ["musical instrument", 6.06], ["hum", 4.99]], null], "duration": [2.22, 3.08, 1.81, 4.97, 3.88, 3.61, 3.49, 6.81, 38.09, 2.62, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/prAOME_9oP8_filtered.json b/annotations_filtered/prAOME_9oP8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e87585b153cf746fd7a6473d352b883e3893fc52 --- /dev/null +++ b/annotations_filtered/prAOME_9oP8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 30.94], [32.0, 37.2], [42.0, 42.35], [46.0, 73.72], [76.0, 76.45], [77.0, 78.04], [80.0, 87.81], [89.0, 90.09], [92.0, 121.1], [122.0, 126.45], [129.0, 130.65], [133.0, 142.01], [149.0, 161.45], [166.0, 170.53], [171.0, 175.95]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [30.86, 50.02, 0.0, 42.58, 0.0, 0.0, 38.25, 0.0, 42.51, 33.79, 0.0, 28.96, 32.6, 34.97, 34.42], "audiomae_on_audioset": [[["machine gun", 24.31], ["speech", 23.13], ["music", 17.3]], null, null, [["music", 51.01], ["throbbing", 22.92], ["hum", 8.37]], null, null, [["hum", 40.15], ["speech", 18.52], ["throbbing", 15.28]], null, [["hum", 36.5], ["speech", 24.69], ["throbbing", 15.44]], [["music", 31.69], ["hum", 17.62], ["throbbing", 8.14]], null, [["music", 60.91], ["throbbing", 4.87], ["hum", 4.36]], [["car", 17.36], ["music", 13.51], ["explosion", 11.85]], [["fart", 38.56], ["speech", 28.94], ["noise", 13.62]], [["music", 21.48], ["noise", 7.15], ["thunk", 5.63]]], "duration": [10.94, 5.2, 0.35, 27.72, 0.45, 1.04, 7.81, 1.09, 29.1, 4.45, 1.65, 9.01, 12.45, 4.53, 4.95]} \ No newline at end of file diff --git a/annotations_filtered/prLok_8YD8w_filtered.json b/annotations_filtered/prLok_8YD8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ab00587c4ba1c877faed3927d4af135f5e78672 --- /dev/null +++ b/annotations_filtered/prLok_8YD8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.33], [6.0, 9.22], [14.0, 15.16], [16.0, 17.51], [19.0, 20.16], [22.0, 22.55], [25.0, 25.95], [27.0, 34.74], [36.0, 37.77], [40.0, 40.59], [43.0, 46.01], [47.0, 46.89], [47.0, 47.21], [48.0, 49.11], [50.0, 53.76], [54.0, 65.11], [66.0, 71.42], [73.0, 81.19], [83.0, 91.17], [92.0, 121.37], [122.0, 122.57], [125.0, 126.4], [127.0, 128.56], [137.0, 139.33], [141.0, 145.57], [146.0, 145.93], [147.0, 154.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 99.36, 0.0, 0.0, 0.0, 100.0, 99.84, 100.0, 98.19, 44.6, 39.96, 0.0, 0.0, 0.0, 85.54, 43.9, 0.0, 99.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 76.8], ["noise", 6.75], ["sidetone", 1.86]], [["grunt", 27.95], ["animal", 16.69], ["groan", 15.95]], null, null, null, null, [["grunt", 44.46], ["groan", 29.34], ["sound effect", 4.51]], null, null], "duration": [1.33, 3.22, 1.16, 1.51, 1.16, 0.55, 0.95, 7.74, 1.77, 0.59, 3.01, -0.11, 0.21, 1.11, 3.76, 11.11, 5.42, 8.19, 8.17, 29.37, 0.57, 1.4, 1.56, 2.33, 4.57, -0.07, 7.9]} \ No newline at end of file diff --git a/annotations_filtered/prTlJO34AHE_filtered.json b/annotations_filtered/prTlJO34AHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7f514216433bcaddc20e2b7ad8b3a1d4332a91b --- /dev/null +++ b/annotations_filtered/prTlJO34AHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 22.1], [23.0, 22.89], [25.0, 24.71], [25.0, 27.65], [37.0, 37.22], [43.0, 45.64], [46.0, 52.41], [55.0, 56.32], [59.0, 61.13], [65.0, 66.73], [71.0, 79.98], [80.0, 88.6], [95.0, 96.67], [98.0, 98.83], [99.0, 104.19], [107.0, 107.7], [113.0, 115.99], [119.0, 121.0], [125.0, 128.04], [130.0, 131.55], [134.0, 135.5], [142.0, 145.29], [147.0, 152.71], [154.0, 156.57], [157.0, 158.89], [159.0, 167.09], [169.0, 174.06], [174.0, 176.99]], "keep_status": [true, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, false, true, false, true, false, true, false, true], "silence_prob": [34.58, 0.0, 0.0, 37.85, 0.0, 74.76, 75.88, 0.0, 61.77, 0.0, 31.85, 31.58, 0.0, 0.0, 37.9, 0.0, 50.81, 35.95, 46.43, 0.0, 0.0, 32.92, 32.47, 37.28, 0.0, 34.34, 34.85, 33.65], "audiomae_on_audioset": [[["music", 24.84], ["speech", 20.71], ["didgeridoo", 6.39]], null, null, [["grunt", 32.69], ["speech", 18.82], ["music", 12.71]], null, null, null, null, null, null, [["music", 23.55], ["hum", 19.73], ["throbbing", 11.75]], [["music", 46.42], ["groan", 14.6], ["speech", 9.62]], null, null, [["speech", 50.23], ["music", 32.82], ["groan", 4.14]], null, null, [["music", 29.3], ["sheep", 21.48], ["bleat", 18.25]], [["music", 37.73], ["throbbing", 13.83], ["synthesizer", 7.03]], null, null, [["music", 50.91], ["honk", 9.78], ["goose", 8.01]], [["music", 47.27], ["groan", 22.84], ["speech", 9.05]], [["music", 29.05], ["bow-wow", 10.8], ["animal", 10.44]], null, [["music", 28.08], ["animal", 19.63], ["speech", 9.04]], [["music", 43.53], ["speech", 40.63], ["brass instrument", 2.59]], [["music", 38.4], ["speech", 27.61], ["didgeridoo", 3.4]]], "duration": [5.1, -0.11, -0.29, 2.65, 0.22, 2.64, 6.41, 1.32, 2.13, 1.73, 8.98, 8.6, 1.67, 0.83, 5.19, 0.7, 2.99, 2.0, 3.04, 1.55, 1.5, 3.29, 5.71, 2.57, 1.89, 8.09, 5.06, 2.99]} \ No newline at end of file diff --git a/annotations_filtered/prnQLmVg5V8_filtered.json b/annotations_filtered/prnQLmVg5V8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..021f240d77821cf45d1b26a7ba49d9a0e1079091 --- /dev/null +++ b/annotations_filtered/prnQLmVg5V8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [19.0, 26.28], [27.0, 36.24], [39.0, 39.39], [41.0, 43.33], [46.0, 46.28], [48.0, 57.69], [60.0, 60.2], [61.0, 61.87], [63.0, 63.41], [102.0, 102.96], [106.0, 107.11], [111.0, 113.04], [117.0, 117.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 53.59, 68.28, 0.0, 75.72, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.04, 7.28, 9.24, 0.39, 2.33, 0.28, 9.69, 0.2, 0.87, 0.41, 0.96, 1.11, 2.04, 0.09]} \ No newline at end of file diff --git a/annotations_filtered/psB3Ta-5XWY_filtered.json b/annotations_filtered/psB3Ta-5XWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd033e72c4bed3a548c24779ab11166e3216165b --- /dev/null +++ b/annotations_filtered/psB3Ta-5XWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.81], [5.0, 6.99], [9.0, 10.22], [12.0, 12.51], [14.0, 14.62], [16.0, 20.16], [21.0, 26.76], [31.0, 31.41], [32.0, 33.05], [43.0, 43.73], [44.0, 45.69], [48.0, 49.92], [51.0, 51.46], [54.0, 57.75], [60.0, 61.13], [62.0, 62.63], [66.0, 69.18], [70.0, 72.39], [74.0, 75.91], [79.0, 79.29], [80.0, 80.52], [81.0, 81.09], [82.0, 83.69], [84.0, 84.3], [85.0, 86.86], [89.0, 90.73], [97.0, 99.2], [101.0, 102.27], [104.0, 104.6], [107.0, 108.16], [110.0, 117.22], [121.0, 129.86], [131.0, 150.96], [153.0, 156.22], [158.0, 164.52], [165.0, 167.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.4, 0.0, 0.0, 0.0, 0.0, 63.21, 60.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 99.98, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.74, 0.0, 0.0, 0.0, 47.16, 31.75, 30.96, 31.33, 31.41, 32.53], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 72.69], ["guitar", 3.33], ["acoustic guitar", 2.74]], [["music", 66.45], ["firecracker", 5.39], ["speech", 4.17]], [["music", 63.39], ["musical instrument", 6.19], ["guitar", 5.01]], [["skateboard", 47.7], ["music", 26.77], ["speech", 2.3]], [["music", 58.0], ["didgeridoo", 11.89], ["skateboard", 2.87]], [["music", 73.76], ["guitar", 5.2], ["musical instrument", 4.15]]], "duration": [2.81, 1.99, 1.22, 0.51, 0.62, 4.16, 5.76, 0.41, 1.05, 0.73, 1.69, 1.92, 0.46, 3.75, 1.13, 0.63, 3.18, 2.39, 1.91, 0.29, 0.52, 0.09, 1.69, 0.3, 1.86, 1.73, 2.2, 1.27, 0.6, 1.16, 7.22, 8.86, 19.96, 3.22, 6.52, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/psDnYKqgVT8_filtered.json b/annotations_filtered/psDnYKqgVT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ed212efa258570d5502b2a7ad68fabf0ef4c3ce --- /dev/null +++ b/annotations_filtered/psDnYKqgVT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 96.74], [98.0, 98.32]], "keep_status": [false, false], "silence_prob": [30.41, 0.0], "audiomae_on_audioset": [[["music", 71.26], ["didgeridoo", 2.56], ["throbbing", 2.4]], null], "duration": [29.74, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/psDtqypK3hI_filtered.json b/annotations_filtered/psDtqypK3hI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..056061cc88be3e3136c3ff2dc13f4760e5b1639c --- /dev/null +++ b/annotations_filtered/psDtqypK3hI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [11.0, 11.91], [16.0, 17.69], [21.0, 20.66], [27.0, 27.65], [32.0, 32.76], [35.0, 36.12], [47.0, 47.17], [57.0, 58.14], [62.0, 62.31], [65.0, 70.68], [73.0, 97.66], [103.0, 183.66], [185.0, 185.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.45, 42.51, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 42.84], ["livestock, farm animals, working animals", 9.99], ["cattle, bovinae", 9.63]], [["music", 69.8], ["wind instrument, woodwind instrument", 10.59], ["flute", 6.73]], null, null], "duration": [0.43, 0.91, 1.69, -0.34, 0.65, 0.76, 1.12, 0.17, 1.14, 0.31, 5.68, 24.66, 80.66, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/psW7sLoNutA_filtered.json b/annotations_filtered/psW7sLoNutA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75a000369b50b05ee8cd6a2f78542b86d4eda597 --- /dev/null +++ b/annotations_filtered/psW7sLoNutA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.12], [3.0, 3.28], [9.0, 9.9], [11.0, 12.19], [20.0, 20.88], [24.0, 27.24], [31.0, 33.3], [37.0, 37.86], [38.0, 39.8], [41.0, 42.89], [45.0, 45.69], [47.0, 52.08], [53.0, 53.76], [55.0, 55.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 89.01, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 0.28, 0.9, 1.19, 0.88, 3.24, 2.3, 0.86, 1.8, 1.89, 0.69, 5.08, 0.76, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/pt-Ir7xS29Y_filtered.json b/annotations_filtered/pt-Ir7xS29Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/pt-Ir7xS29Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/ptAdtShJa_0_filtered.json b/annotations_filtered/ptAdtShJa_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57e90ff83d001ae3e8440e611fd51b29d3d77adb --- /dev/null +++ b/annotations_filtered/ptAdtShJa_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.51], [19.0, 20.49], [21.0, 21.09], [22.0, 21.63], [23.0, 26.1], [27.0, 27.87], [28.0, 29.25], [32.0, 32.71], [34.0, 37.39], [38.0, 38.7], [42.0, 42.8], [49.0, 49.84], [50.0, 50.62], [51.0, 52.15], [53.0, 53.55], [56.0, 58.04], [58.0, 59.16], [62.0, 62.63], [64.0, 65.7], [68.0, 69.33], [71.0, 73.97], [86.0, 86.49], [90.0, 91.0], [93.0, 94.68], [98.0, 100.89], [101.0, 103.94], [104.0, 105.22], [106.0, 106.79], [108.0, 109.63], [114.0, 131.45], [133.0, 148.64], [152.0, 162.89], [166.0, 167.43], [168.0, 170.77], [172.0, 172.34], [174.0, 174.19], [176.0, 176.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.88, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 41.95, 0.0, 0.0, 0.0, 88.64, 38.75, 0.0, 0.0, 0.0, 44.29, 45.46, 37.24, 0.0, 35.94, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 38.34], ["speech", 21.07], ["music", 13.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.7], ["sidetone", 14.42], ["radio", 3.77]], null, null, null, null, [["speech", 60.77], ["telephone dialing, dtmf", 16.36], ["telephone", 14.44]], null, null, null, [["hum", 27.36], ["music", 19.78], ["mains hum", 19.54]], [["music", 74.58], ["theremin", 3.92], ["cello", 2.35]], [["music", 55.04], ["crack", 4.24], ["thunk", 2.57]], null, [["speech", 46.79], ["music", 21.96], ["radio", 19.33]], null, null, null], "duration": [1.51, 1.49, 0.09, -0.37, 3.1, 0.87, 1.25, 0.71, 3.39, 0.7, 0.8, 0.84, 0.62, 1.15, 0.55, 2.04, 1.16, 0.63, 1.7, 1.33, 2.97, 0.49, 1.0, 1.68, 2.89, 2.94, 1.22, 0.79, 1.63, 17.45, 15.64, 10.89, 1.43, 2.77, 0.34, 0.19, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/ptBGusJjkTU_filtered.json b/annotations_filtered/ptBGusJjkTU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7996028a8ad68b18d5993f9ba564719a711110c --- /dev/null +++ b/annotations_filtered/ptBGusJjkTU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.59], [16.0, 16.5], [20.0, 24.75], [25.0, 27.33], [29.0, 30.94], [33.0, 33.96], [35.0, 36.19], [37.0, 37.49], [38.0, 39.11], [40.0, 40.42], [42.0, 47.49], [48.0, 47.88], [48.0, 49.22], [50.0, 53.23], [54.0, 55.71], [58.0, 62.29], [65.0, 66.8], [68.0, 72.55], [78.0, 80.18], [89.0, 90.66]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [96.89, 0.0, 94.07, 43.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 97.54, 0.0, 99.91, 0.0, 48.14, 61.37, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 52.02], ["music", 9.54], ["frog", 5.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["radio", 16.22], ["noise", 15.39], ["speech", 10.07]], null, null], "duration": [10.59, 0.5, 4.75, 2.33, 1.94, 0.96, 1.19, 0.49, 1.11, 0.42, 5.49, -0.12, 1.22, 3.23, 1.71, 4.29, 1.8, 4.55, 2.18, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/ptJ8x9AERwA_filtered.json b/annotations_filtered/ptJ8x9AERwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f22c9b0f59a3c0e21d0bf860930d5c3235cf1337 --- /dev/null +++ b/annotations_filtered/ptJ8x9AERwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.32], [12.0, 18.39], [19.0, 20.41], [23.0, 24.53], [25.0, 26.3], [28.0, 30.15], [31.0, 31.63], [33.0, 34.86], [39.0, 40.91], [42.0, 43.7], [50.0, 50.67], [52.0, 53.79], [56.0, 57.86], [60.0, 66.72], [70.0, 78.58], [81.0, 82.56], [89.0, 90.93], [95.0, 96.33], [98.0, 98.58], [104.0, 104.99], [107.0, 108.57], [111.0, 112.53], [113.0, 114.17], [115.0, 116.5], [118.0, 119.4], [123.0, 124.58], [125.0, 126.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 100.0, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.32, 6.39, 1.41, 1.53, 1.3, 2.15, 0.63, 1.86, 1.91, 1.7, 0.67, 1.79, 1.86, 6.72, 8.58, 1.56, 1.93, 1.33, 0.58, 0.99, 1.57, 1.53, 1.17, 1.5, 1.4, 1.58, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/ptOc-HdvEW0_filtered.json b/annotations_filtered/ptOc-HdvEW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06dce4b5b22997da4a03a8c49522fa717e418958 --- /dev/null +++ b/annotations_filtered/ptOc-HdvEW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.57], [8.0, 8.68], [11.0, 11.21], [11.0, 13.73], [28.0, 28.68], [33.0, 33.47], [46.0, 46.99], [48.0, 48.59], [56.0, 56.73], [58.0, 58.92], [87.0, 87.89], [90.0, 90.41], [99.0, 98.96], [109.0, 109.85], [115.0, 115.4], [123.0, 125.02], [126.0, 126.4], [128.0, 129.19], [131.0, 132.26], [138.0, 140.17], [143.0, 148.66], [149.0, 149.18], [150.0, 150.4], [155.0, 155.38], [161.0, 160.78], [162.0, 162.31], [163.0, 163.11], [166.0, 167.75], [169.0, 168.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 0.0, 96.04, 44.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 85.97], ["radio", 3.67], ["telephone", 2.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 76.96], ["radio", 2.79], ["telephone", 1.86]], null, null, null, null, null, null, null, null], "duration": [0.57, 0.68, 0.21, 2.73, 0.68, 0.47, 0.99, 0.59, 0.73, 0.92, 0.89, 0.41, -0.04, 0.85, 0.4, 2.02, 0.4, 1.19, 1.26, 2.17, 5.66, 0.18, 0.4, 0.38, -0.22, 0.31, 0.11, 1.75, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/ptcDoIfzLtI_filtered.json b/annotations_filtered/ptcDoIfzLtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97ba3493b119242333aaf1a6e0d7a5b3f89b8093 --- /dev/null +++ b/annotations_filtered/ptcDoIfzLtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 22.87], [36.0, 36.54]], "keep_status": [false, false], "silence_prob": [53.72, 0.0], "audiomae_on_audioset": [null, null], "duration": [2.87, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/ptgpK6nH-5g_filtered.json b/annotations_filtered/ptgpK6nH-5g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce16a9fcb57c9b62762c6f616924b20ae51202a9 --- /dev/null +++ b/annotations_filtered/ptgpK6nH-5g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.77], [35.0, 37.12], [38.0, 43.06], [46.0, 48.98], [53.0, 75.41]], "keep_status": [false, true, true, true, false], "silence_prob": [0.0, 30.67, 34.13, 46.47, 30.17], "audiomae_on_audioset": [null, [["speech", 30.77], ["radio", 4.49], ["crowd", 4.42]], [["speech", 33.17], ["hum", 14.91], ["mains hum", 7.7]], [["speech", 25.69], ["fly, housefly", 17.09], ["buzz", 13.54]], [["speech", 61.02], ["music", 6.05], ["livestock, farm animals, working animals", 5.51]]], "duration": [0.77, 2.12, 5.06, 2.98, 22.41]} \ No newline at end of file diff --git a/annotations_filtered/ptiXfr5lJl8_filtered.json b/annotations_filtered/ptiXfr5lJl8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..222a518d3148a86592feb523939b8cca37d839a3 --- /dev/null +++ b/annotations_filtered/ptiXfr5lJl8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.59], [12.0, 46.14], [49.0, 53.13], [55.0, 57.94], [59.0, 64.44], [66.0, 69.21], [70.0, 88.26], [90.0, 94.14], [95.0, 98.19], [99.0, 114.4]], "keep_status": [true, false, false, false, false, true, false, false, false, false], "silence_prob": [35.22, 0.0, 82.61, 73.06, 54.04, 49.92, 34.87, 50.81, 55.67, 34.89], "audiomae_on_audioset": [[["speech", 24.65], ["cattle, bovinae", 19.69], ["moo", 9.37]], null, null, null, null, [["fly, housefly", 25.28], ["mains hum", 15.68], ["hum", 13.87]], [["music", 33.36], ["hum", 27.71], ["mains hum", 13.23]], null, null, [["hum", 46.61], ["mains hum", 19.64], ["music", 19.33]]], "duration": [6.59, 34.14, 4.13, 2.94, 5.44, 3.21, 18.26, 4.14, 3.19, 15.4]} \ No newline at end of file diff --git a/annotations_filtered/pu2ArBfwZcA_filtered.json b/annotations_filtered/pu2ArBfwZcA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6466e8d995b902e629e37789843bf42ba890c224 --- /dev/null +++ b/annotations_filtered/pu2ArBfwZcA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.98], [21.0, 22.03], [25.0, 27.51], [31.0, 144.31], [145.0, 151.93]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 0.0, 69.47, 0.0, 39.07], "audiomae_on_audioset": [null, null, null, null, [["mosquito", 22.09], ["fly, housefly", 20.09], ["music", 11.51]]], "duration": [0.98, 1.03, 2.51, 113.31, 6.93]} \ No newline at end of file diff --git a/annotations_filtered/pu523TrIMpg_filtered.json b/annotations_filtered/pu523TrIMpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a72f3dfa355ad2bcfb63f97d47f7f3435f69fbc9 --- /dev/null +++ b/annotations_filtered/pu523TrIMpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 80.55], [85.0, 92.79], [95.0, 95.32], [96.0, 97.73], [99.0, 99.5], [104.0, 104.31], [105.0, 109.8], [110.0, 110.74], [111.0, 119.33], [120.0, 121.66], [123.0, 124.36], [127.0, 129.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.89, 88.28, 0.0, 0.0, 0.0, 0.0, 80.64, 0.0, 97.64, 0.0, 0.0, 99.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [14.55, 7.79, 0.32, 1.73, 0.5, 0.31, 4.8, 0.74, 8.33, 1.66, 1.36, 2.12]} \ No newline at end of file diff --git a/annotations_filtered/puXEHhZgXaY_filtered.json b/annotations_filtered/puXEHhZgXaY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cc66f3c6af57b1dd233a1c111d09f5ac67393e3 --- /dev/null +++ b/annotations_filtered/puXEHhZgXaY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 64.03], [66.0, 71.88], [76.0, 89.24], [90.0, 98.96], [102.0, 102.27], [103.0, 116.16], [121.0, 129.15], [130.0, 138.47], [140.0, 145.79], [148.0, 149.71], [150.0, 152.63], [154.0, 154.65], [159.0, 162.45]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 37.88, 41.85, 42.0, 0.0, 48.23, 71.43, 99.92, 72.31, 0.0, 75.39, 0.0, 37.97], "audiomae_on_audioset": [null, [["speech", 53.18], ["electric shaver, electric razor", 6.23], ["livestock, farm animals, working animals", 3.74]], [["speech", 36.03], ["livestock, farm animals, working animals", 20.07], ["music", 6.63]], [["speech", 43.62], ["music", 32.18], ["fart", 5.44]], null, [["speech", 54.79], ["electric shaver, electric razor", 11.19], ["music", 11.03]], null, null, null, null, null, null, [["music", 10.92], ["vehicle", 10.71], ["whale vocalization", 8.6]]], "duration": [1.03, 5.88, 13.24, 8.96, 0.27, 13.16, 8.15, 8.47, 5.79, 1.71, 2.63, 0.65, 3.45]} \ No newline at end of file diff --git a/annotations_filtered/puXiyRw_L6g_filtered.json b/annotations_filtered/puXiyRw_L6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70bca5df6bf49a41b7e340b0f25282d60b720c30 --- /dev/null +++ b/annotations_filtered/puXiyRw_L6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.72], [11.0, 14.27], [17.0, 18.59], [27.0, 27.85], [29.0, 29.08], [32.0, 32.32], [34.0, 38.87], [39.0, 40.1], [41.0, 42.65], [44.0, 45.18], [49.0, 49.89], [59.0, 59.86], [61.0, 63.54], [69.0, 68.93], [71.0, 72.49], [79.0, 86.64], [90.0, 108.48], [110.0, 111.79], [113.0, 116.11], [120.0, 126.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 87.19, 0.0, 0.0, 0.0, 0.0, 0.0, 77.87, 0.0, 0.0, 93.91, 97.73, 0.0, 65.44, 69.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 3.27, 1.59, 0.85, 0.08, 0.32, 4.87, 1.1, 1.65, 1.18, 0.89, 0.86, 2.54, -0.07, 1.49, 7.64, 18.48, 1.79, 3.11, 6.96]} \ No newline at end of file diff --git a/annotations_filtered/puyN3edOOUY_filtered.json b/annotations_filtered/puyN3edOOUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f5c2c30aaa85e3a7463543e92311184a8b120b1 --- /dev/null +++ b/annotations_filtered/puyN3edOOUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.81], [16.0, 90.91]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.81, 74.91]} \ No newline at end of file diff --git a/annotations_filtered/pvACjy-tYFE_filtered.json b/annotations_filtered/pvACjy-tYFE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..172530cf7e618c97817157cd340a7d6a94e512ca --- /dev/null +++ b/annotations_filtered/pvACjy-tYFE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.46], [20.0, 27.97], [33.0, 33.56], [34.0, 43.56], [49.0, 48.96], [56.0, 56.59], [62.0, 63.34], [65.0, 67.39], [70.0, 72.99], [75.0, 76.89], [79.0, 83.79], [85.0, 89.95], [92.0, 107.94]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, true, true], "silence_prob": [30.26, 35.48, 0.0, 35.22, 0.0, 0.0, 0.0, 40.21, 29.87, 0.0, 29.16, 29.28, 29.07], "audiomae_on_audioset": [[["speech", 38.75], ["music", 27.85], ["whack, thwack", 4.44]], [["mains hum", 28.95], ["hum", 25.99], ["throbbing", 12.71]], null, [["speech", 30.79], ["hum", 22.08], ["music", 17.45]], null, null, null, [["music", 68.64], ["musical instrument", 8.64], ["synthesizer", 5.16]], [["music", 21.26], ["vehicle", 4.35], ["synthesizer", 4.02]], null, [["music", 43.53], ["throbbing", 20.11], ["static", 6.69]], [["music", 26.01], ["throbbing", 24.66], ["mains hum", 16.89]], [["music", 28.08], ["vehicle", 14.64], ["hum", 9.91]]], "duration": [9.46, 7.97, 0.56, 9.56, -0.04, 0.59, 1.34, 2.39, 2.99, 1.89, 4.79, 4.95, 15.94]} \ No newline at end of file diff --git a/annotations_filtered/pvNA2JkMfSI_filtered.json b/annotations_filtered/pvNA2JkMfSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d34429c242754d93329a8978744c6e3bbcab705e --- /dev/null +++ b/annotations_filtered/pvNA2JkMfSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.06], [12.0, 13.24], [17.0, 17.74], [20.0, 20.6], [21.0, 22.11], [25.0, 25.62], [29.0, 29.94], [33.0, 33.2], [36.0, 36.17], [37.0, 39.26], [47.0, 47.16], [49.0, 49.52], [51.0, 54.11], [55.0, 56.74], [58.0, 58.99], [61.0, 61.53], [64.0, 64.64], [65.0, 66.21], [83.0, 84.74], [86.0, 86.66], [87.0, 88.75], [91.0, 92.3], [95.0, 98.44], [100.0, 100.95], [102.0, 102.12], [104.0, 104.7], [106.0, 107.18], [109.0, 109.68], [110.0, 111.1], [113.0, 113.51], [114.0, 115.32], [116.0, 123.04], [126.0, 128.85], [131.0, 130.77], [135.0, 137.07], [139.0, 140.75], [145.0, 146.11], [148.0, 150.33], [153.0, 154.68], [156.0, 156.2], [157.0, 158.5], [163.0, 165.03], [168.0, 169.97], [173.0, 181.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 82.97, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 97.83, 0.0, 99.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.06, 1.24, 0.74, 0.6, 1.11, 0.62, 0.94, 0.2, 0.17, 2.26, 0.16, 0.52, 3.11, 1.74, 0.99, 0.53, 0.64, 1.21, 1.74, 0.66, 1.75, 1.3, 3.44, 0.95, 0.12, 0.7, 1.18, 0.68, 1.1, 0.51, 1.32, 7.04, 2.85, -0.23, 2.07, 1.75, 1.11, 2.33, 1.68, 0.2, 1.5, 2.03, 1.97, 8.06]} \ No newline at end of file diff --git a/annotations_filtered/pvS3j8VtanM_filtered.json b/annotations_filtered/pvS3j8VtanM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56c566591e9ce9eea5e3b0a866db887c2d9f8a89 --- /dev/null +++ b/annotations_filtered/pvS3j8VtanM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.22], [6.0, 6.1], [7.0, 7.5], [20.0, 20.85], [23.0, 24.16], [28.0, 32.05], [36.0, 36.63], [40.0, 40.1], [41.0, 43.26], [44.0, 46.47], [47.0, 47.73], [48.0, 48.91], [50.0, 51.78], [53.0, 54.36], [56.0, 55.7], [58.0, 60.83], [63.0, 68.01], [69.0, 69.99], [73.0, 75.76], [79.0, 82.43], [89.0, 88.87], [93.0, 93.36], [95.0, 95.0], [96.0, 96.79], [97.0, 97.71], [100.0, 100.65], [102.0, 102.44], [114.0, 117.93], [119.0, 119.3], [121.0, 122.86], [126.0, 128.6], [142.0, 142.35], [146.0, 147.23], [149.0, 149.93], [152.0, 152.32], [154.0, 153.99], [156.0, 156.36], [157.0, 157.0], [158.0, 158.41], [162.0, 163.9]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 39.05, 96.29, 0.0, 0.0, 0.0, 0.0, 0.0, 77.87, 46.15, 0.0, 51.5, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.86, 0.0, 0.0, 48.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 36.91], ["mains hum", 12.56], ["music", 9.47]], null, null, null, null, null, null, null, [["speech", 66.99], ["music", 7.63], ["synthesizer", 2.25]], null, null, null, null, null, null, null, null, null, null, [["speech", 60.6], ["music", 13.64], ["synthesizer", 2.89]], null, null, [["music", 63.91], ["synthesizer", 10.86], ["musical instrument", 5.24]], null, null, null, null, null, null, null, null, null], "duration": [1.22, 0.1, 0.5, 0.85, 1.16, 4.05, 0.63, 0.1, 2.26, 2.47, 0.73, 0.91, 1.78, 1.36, -0.3, 2.83, 5.01, 0.99, 2.76, 3.43, -0.13, 0.36, 0.0, 0.79, 0.71, 0.65, 0.44, 3.93, 0.3, 1.86, 2.6, 0.35, 1.23, 0.93, 0.32, -0.01, 0.36, 0.0, 0.41, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/pvZXE-e5Yo4_filtered.json b/annotations_filtered/pvZXE-e5Yo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b81e32ad496f570cd218cadf15e60787d3166e0a --- /dev/null +++ b/annotations_filtered/pvZXE-e5Yo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [6.0, 6.62], [11.0, 11.45], [14.0, 32.61], [33.0, 58.14], [59.0, 60.18], [62.0, 62.73], [67.0, 68.42], [70.0, 70.34], [72.0, 83.08], [85.0, 86.27], [88.0, 93.04], [96.0, 96.52], [102.0, 102.42], [104.0, 105.19], [106.0, 107.25], [108.0, 109.07], [110.0, 110.35], [111.0, 112.58], [114.0, 114.37], [116.0, 116.88], [118.0, 119.23], [120.0, 120.75], [122.0, 123.16], [126.0, 125.98], [129.0, 129.12], [132.0, 132.41], [134.0, 139.78], [141.0, 142.77], [145.0, 145.74], [147.0, 165.13], [166.0, 166.24], [167.0, 167.8], [169.0, 169.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.99, 99.65, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 99.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 0.0, 36.79, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 41.48], ["mains hum", 40.57], ["throbbing", 2.8]], null, null, null], "duration": [0.62, 0.62, 0.45, 18.61, 25.14, 1.18, 0.73, 1.42, 0.34, 11.08, 1.27, 5.04, 0.52, 0.42, 1.19, 1.25, 1.07, 0.35, 1.58, 0.37, 0.88, 1.23, 0.75, 1.16, -0.02, 0.12, 0.41, 5.78, 1.77, 0.74, 18.13, 0.24, 0.8, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/pw46kpxHbls_filtered.json b/annotations_filtered/pw46kpxHbls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8ecb957566f1c266e351c8ec11df124b157fb71 --- /dev/null +++ b/annotations_filtered/pw46kpxHbls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.5], [9.0, 9.69], [14.0, 16.78], [18.0, 18.45], [21.0, 21.73], [24.0, 25.02], [29.0, 31.75], [33.0, 33.1], [33.0, 33.99], [36.0, 36.85], [37.0, 38.8], [41.0, 48.41], [50.0, 50.04], [52.0, 52.79], [58.0, 58.48], [60.0, 61.37], [62.0, 63.27], [64.0, 67.42], [68.0, 69.42], [74.0, 77.89], [78.0, 80.28], [96.0, 95.91], [99.0, 99.44], [104.0, 104.43], [105.0, 107.3], [109.0, 112.01]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 46.05, 0.0, 0.0, 0.0, 0.0, 49.68, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 56.48, 51.34, 0.0, 0.0, 0.0, 54.23, 58.55], "audiomae_on_audioset": [null, null, null, null, null, null, [["boing", 32.24], ["speech", 18.34], ["beatboxing", 5.46]], null, null, null, null, [["speech", 68.87], ["busy signal", 10.38], ["sidetone", 4.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.69, 2.78, 0.45, 0.73, 1.02, 2.75, 0.1, 0.99, 0.85, 1.8, 7.41, 0.04, 0.79, 0.48, 1.37, 1.27, 3.42, 1.42, 3.89, 2.28, -0.09, 0.44, 0.43, 2.3, 3.01]} \ No newline at end of file diff --git a/annotations_filtered/pw5Y_7wtJmk_filtered.json b/annotations_filtered/pw5Y_7wtJmk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b9696e94c533e7594853e5b342a51e46ec5f18e --- /dev/null +++ b/annotations_filtered/pw5Y_7wtJmk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.74], [9.0, 9.68], [12.0, 12.5], [16.0, 16.02], [17.0, 18.0], [20.0, 19.84], [22.0, 22.77], [23.0, 23.4], [25.0, 24.95], [27.0, 26.96], [28.0, 28.27], [44.0, 47.58], [49.0, 49.94], [60.0, 60.02], [60.0, 60.34], [60.0, 60.42], [60.0, 60.51], [61.0, 62.01], [67.0, 67.61], [69.0, 69.42], [71.0, 71.88], [77.0, 77.48], [79.0, 79.03], [86.0, 89.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 66.15], ["sidetone", 4.82], ["clip-clop", 4.38]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 0.68, 0.5, 0.02, 1.0, -0.16, 0.77, 0.4, -0.05, -0.04, 0.27, 3.58, 0.94, 0.02, 0.34, 0.42, 0.51, 1.01, 0.61, 0.42, 0.88, 0.48, 0.03, 3.36]} \ No newline at end of file diff --git a/annotations_filtered/pwL0PcIHtxQ_filtered.json b/annotations_filtered/pwL0PcIHtxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80794b2822e30eaebf2eefe6562176447ca0e493 --- /dev/null +++ b/annotations_filtered/pwL0PcIHtxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 60.34], [88.0, 95.47], [97.0, 106.44], [108.0, 111.0], [111.0, 128.07], [129.0, 152.31], [152.0, 152.95], [154.0, 155.04], [155.0, 156.24], [157.0, 166.63], [171.0, 171.1], [174.0, 174.28]], "keep_status": [false, false, true, true, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 83.88, 33.44, 35.84, 32.79, 30.93, 0.0, 0.0, 0.0, 30.94, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.99], ["speech", 14.06], ["hum", 5.64]], [["speech", 40.17], ["animal", 7.05], ["music", 5.06]], [["hum", 39.49], ["mains hum", 10.73], ["music", 9.87]], [["mains hum", 45.01], ["hum", 40.82], ["throbbing", 4.47]], null, null, null, [["music", 19.96], ["hum", 12.74], ["mains hum", 10.4]], null, null], "duration": [44.34, 7.47, 9.44, 3.0, 17.07, 23.31, 0.95, 1.04, 1.24, 9.63, 0.1, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/pwOhqGhP-mk_filtered.json b/annotations_filtered/pwOhqGhP-mk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fda57e72df73224bcb1d1dfa305b2721ec3e66a --- /dev/null +++ b/annotations_filtered/pwOhqGhP-mk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 57.45], [62.0, 94.1], [95.0, 96.85], [98.0, 138.94], [143.0, 142.52], [143.0, 148.58], [149.0, 149.5], [152.0, 168.29], [172.0, 176.93]], "keep_status": [true, false, false, false, false, false, false, true, false], "silence_prob": [39.34, 0.0, 0.0, 0.0, 0.0, 31.31, 0.0, 33.06, 89.72], "audiomae_on_audioset": [[["throbbing", 17.45], ["hum", 12.42], ["animal", 7.0]], null, null, null, null, [["noise", 71.54], ["music", 3.82], ["speech", 3.42]], null, [["noise", 43.02], ["sidetone", 7.1], ["radio", 6.48]], null], "duration": [12.45, 32.1, 1.85, 40.94, -0.48, 5.58, 0.5, 16.29, 4.93]} \ No newline at end of file diff --git a/annotations_filtered/pwSkfvXD_ug_filtered.json b/annotations_filtered/pwSkfvXD_ug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96eb9c54f226d00f1dd83991a0118f880b23da4a --- /dev/null +++ b/annotations_filtered/pwSkfvXD_ug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.41], [17.0, 17.59], [19.0, 169.62], [176.0, 177.31], [179.0, 178.92]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.41, 0.59, 150.62, 1.31, -0.08]} \ No newline at end of file diff --git a/annotations_filtered/pwdhau_agX0_filtered.json b/annotations_filtered/pwdhau_agX0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1e16717ed07857b19f7e4893aea8aa4e868b461 --- /dev/null +++ b/annotations_filtered/pwdhau_agX0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 18.5], [22.0, 23.01], [25.0, 26.55], [27.0, 28.98], [32.0, 46.41], [54.0, 54.62], [58.0, 58.82], [59.0, 68.1], [70.0, 72.08], [75.0, 75.37], [76.0, 76.89], [80.0, 81.7], [83.0, 84.18], [88.0, 89.07], [95.0, 98.05], [98.0, 102.02], [105.0, 105.29], [107.0, 109.21], [111.0, 117.75], [119.0, 120.48], [123.0, 127.23], [131.0, 131.79], [133.0, 133.34], [136.0, 138.37], [138.0, 138.47], [138.0, 138.5], [139.0, 147.65], [149.0, 149.93], [154.0, 159.07], [162.0, 163.0], [163.0, 163.97]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false], "silence_prob": [42.67, 0.0, 0.0, 0.0, 39.52, 0.0, 0.0, 35.01, 52.22, 0.0, 0.0, 0.0, 0.0, 0.0, 47.98, 33.21, 0.0, 54.56, 55.53, 0.0, 30.45, 0.0, 0.0, 31.93, 0.0, 0.0, 43.38, 0.0, 47.78, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.83], ["electric shaver, electric razor", 39.13], ["hum", 3.43]], null, null, null, [["music", 55.93], ["electric shaver, electric razor", 13.34], ["buzz", 6.71]], null, null, [["speech", 22.55], ["hum", 12.31], ["insect", 9.72]], null, null, null, null, null, null, [["chirp tone", 38.93], ["sine wave", 29.35], ["hum", 9.25]], [["insect", 29.23], ["animal", 12.46], ["speech", 12.05]], null, null, null, null, [["speech", 28.3], ["electric shaver, electric razor", 13.86], ["insect", 12.72]], null, null, [["speech", 42.73], ["radio", 24.99], ["music", 8.08]], null, null, [["speech", 14.59], ["insect", 10.64], ["electric shaver, electric razor", 9.94]], null, [["hum", 21.05], ["whale vocalization", 17.08], ["mains hum", 13.4]], null, null], "duration": [12.5, 1.01, 1.55, 1.98, 14.41, 0.62, 0.82, 9.1, 2.08, 0.37, 0.89, 1.7, 1.18, 1.07, 3.05, 4.02, 0.29, 2.21, 6.75, 1.48, 4.23, 0.79, 0.34, 2.37, 0.47, 0.5, 8.65, 0.93, 5.07, 1.0, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/pwqOYWnLxBo_filtered.json b/annotations_filtered/pwqOYWnLxBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ae8b04ed92c0055e81ed755bb1f79fa7ec37194 --- /dev/null +++ b/annotations_filtered/pwqOYWnLxBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.41], [6.0, 8.46], [9.0, 10.88], [11.0, 27.09], [28.0, 95.13], [95.0, 95.2], [95.0, 109.04], [110.0, 110.64]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 75.55, 0.0, 52.92, 0.0, 0.0, 57.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.41, 2.46, 1.88, 16.09, 67.13, 0.2, 14.04, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/pwt49IF0uG0_filtered.json b/annotations_filtered/pwt49IF0uG0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59de0e52d8f021ba28291b5986afb2d4276c25c1 --- /dev/null +++ b/annotations_filtered/pwt49IF0uG0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.82], [8.0, 9.56], [14.0, 14.69], [25.0, 28.04], [29.0, 30.0], [30.0, 30.82], [31.0, 31.36], [34.0, 33.99], [35.0, 35.75], [37.0, 37.18], [40.0, 40.59], [42.0, 43.41], [46.0, 47.66], [50.0, 50.52], [51.0, 51.58], [52.0, 52.66], [55.0, 55.78], [60.0, 60.86], [63.0, 64.52], [67.0, 68.81], [72.0, 74.02], [80.0, 80.69], [81.0, 81.11], [92.0, 92.15], [94.0, 94.07], [95.0, 97.58], [99.0, 99.74], [106.0, 106.02], [107.0, 108.19], [109.0, 109.21], [111.0, 112.19], [113.0, 114.25], [116.0, 116.14], [116.0, 117.17]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.17, 0.0, 0.0, 56.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.14, 0.0, 0.0, 0.0, 0.0, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["thump, thud", 17.31], ["speech", 10.41], ["groan", 8.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 70.12], ["inside, small room", 4.71], ["crumpling, crinkling", 2.15]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.82, 1.56, 0.69, 3.04, 1.0, 0.82, 0.36, -0.01, 0.75, 0.18, 0.59, 1.41, 1.66, 0.52, 0.58, 0.66, 0.78, 0.86, 1.52, 1.81, 2.02, 0.69, 0.11, 0.15, 0.07, 2.58, 0.74, 0.02, 1.19, 0.21, 1.19, 1.25, 0.14, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/px2rxAmJNHU_filtered.json b/annotations_filtered/px2rxAmJNHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e2c51f00c43aed38709c29d575344c1b8c822c2 --- /dev/null +++ b/annotations_filtered/px2rxAmJNHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [6.0, 6.62], [9.0, 12.39], [12.0, 13.37], [16.0, 20.24], [24.0, 24.48], [28.0, 28.24], [39.0, 39.65], [42.0, 42.9], [44.0, 44.17], [47.0, 47.19], [57.0, 57.69], [64.0, 65.25], [69.0, 71.29], [76.0, 76.38], [78.0, 78.78], [84.0, 84.55], [85.0, 85.36], [87.0, 89.48], [94.0, 93.93], [95.0, 95.0], [96.0, 97.01], [98.0, 98.27], [105.0, 105.71], [113.0, 114.0], [122.0, 122.66], [123.0, 124.43], [125.0, 128.21], [130.0, 133.02], [134.0, 144.32], [146.0, 148.36], [150.0, 152.73], [154.0, 160.02], [162.0, 162.41], [168.0, 170.09]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, true, false, false], "silence_prob": [0.0, 0.0, 45.59, 0.0, 57.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 0.0, 37.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.05, 30.09, 29.19, 48.14, 38.66, 36.11, 0.0, 44.4], "audiomae_on_audioset": [null, null, [["speech", 33.94], ["music", 27.81], ["radio", 5.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.43], ["grunt", 14.29], ["burping, eructation", 12.18]], null, null, null, null, null, null, null, null, [["speech", 32.9], ["livestock, farm animals, working animals", 9.5], ["moo", 8.69]], [["speech", 27.59], ["music", 23.44], ["crowd", 4.77]], [["cattle, bovinae", 34.92], ["moo", 32.43], ["livestock, farm animals, working animals", 28.95]], [["speech", 53.72], ["fly, housefly", 8.62], ["insect", 4.52]], [["music", 46.15], ["speech", 16.73], ["drum machine", 6.98]], [["music", 35.24], ["speech", 23.63], ["sidetone", 9.75]], null, [["music", 68.69], ["synthesizer", 5.75], ["electronic music", 3.97]]], "duration": [0.84, 0.62, 3.39, 1.37, 4.24, 0.48, 0.24, 0.65, 0.9, 0.17, 0.19, 0.69, 1.25, 2.29, 0.38, 0.78, 0.55, 0.36, 2.48, -0.07, 0.0, 1.01, 0.27, 0.71, 1.0, 0.66, 1.43, 3.21, 3.02, 10.32, 2.36, 2.73, 6.02, 0.41, 2.09]} \ No newline at end of file diff --git a/annotations_filtered/pxQNKJWZ-t0_filtered.json b/annotations_filtered/pxQNKJWZ-t0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb36fd80a038d10d39e03c6c16807ce2890c1b11 --- /dev/null +++ b/annotations_filtered/pxQNKJWZ-t0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 20.85], [21.0, 35.83], [41.0, 53.54], [54.0, 62.8], [64.0, 76.05], [77.0, 89.9], [90.0, 90.44], [90.0, 134.05], [138.0, 146.62]], "keep_status": [true, false, false, true, false, true, false, false, true], "silence_prob": [28.96, 29.43, 29.23, 28.51, 29.33, 28.58, 0.0, 0.0, 29.76], "audiomae_on_audioset": [[["speech", 22.53], ["music", 15.97], ["roar", 9.83]], [["music", 26.99], ["hum", 25.54], ["throbbing", 19.09]], [["music", 69.68], ["throbbing", 7.4], ["theremin", 2.58]], [["speech", 16.59], ["music", 14.76], ["rumble", 6.14]], [["music", 41.08], ["speech", 27.92], ["didgeridoo", 3.31]], [["music", 29.56], ["hum", 21.45], ["mains hum", 18.39]], null, null, [["grunt", 53.3], ["roaring cats (lions, tigers)", 7.26], ["sound effect", 5.01]]], "duration": [19.85, 14.83, 12.54, 8.8, 12.05, 12.9, 0.44, 44.05, 8.62]} \ No newline at end of file diff --git a/annotations_filtered/pxSjP6JkAis_filtered.json b/annotations_filtered/pxSjP6JkAis_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35b0b27b7e9ae8e451fe562a639f35be50a8753f --- /dev/null +++ b/annotations_filtered/pxSjP6JkAis_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.59], [4.0, 4.9], [5.0, 6.72], [9.0, 9.66], [10.0, 12.21], [14.0, 14.59], [15.0, 15.75], [19.0, 27.09], [30.0, 31.63], [32.0, 38.84], [40.0, 40.46], [41.0, 51.21], [52.0, 56.03], [57.0, 64.45], [67.0, 69.57], [72.0, 73.21], [74.0, 74.55], [76.0, 77.58], [80.0, 85.97], [87.0, 87.71], [89.0, 90.88], [91.0, 91.03], [91.0, 91.86], [94.0, 96.21], [97.0, 97.23], [98.0, 98.69], [102.0, 104.52], [106.0, 107.3], [109.0, 115.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 99.88, 0.0, 71.0, 0.0, 62.89, 55.39, 43.25, 53.28, 0.0, 0.0, 0.0, 47.7, 0.0, 0.0, 0.0, 0.0, 47.2, 0.0, 0.0, 44.4, 0.0, 42.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.96], ["musical instrument", 5.39], ["plucked string instrument", 3.21]], null, null, null, null, [["music", 52.87], ["electric piano", 7.25], ["keyboard (musical)", 5.61]], null, null, null, null, [["music", 54.96], ["lullaby", 6.3], ["vibraphone", 4.81]], null, null, [["music", 39.71], ["electric piano", 12.7], ["keyboard (musical)", 8.31]], null, [["music", 63.37], ["guitar", 5.58], ["plucked string instrument", 4.84]]], "duration": [1.59, 0.9, 1.72, 0.66, 2.21, 0.59, 0.75, 8.09, 1.63, 6.84, 0.46, 10.21, 4.03, 7.45, 2.57, 1.21, 0.55, 1.58, 5.97, 0.71, 1.88, 0.03, 0.86, 2.21, 0.23, 0.69, 2.52, 1.3, 6.91]} \ No newline at end of file diff --git a/annotations_filtered/pxiwqleE9Do_filtered.json b/annotations_filtered/pxiwqleE9Do_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a1858dd0ab1fd69959f0e20409bf50247d5ad31 --- /dev/null +++ b/annotations_filtered/pxiwqleE9Do_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.8], [8.0, 14.08], [18.0, 18.06], [19.0, 42.72], [46.0, 53.22], [54.0, 54.7], [55.0, 55.68], [56.0, 57.69], [58.0, 59.39], [60.0, 60.98], [62.0, 63.09], [64.0, 68.2], [70.0, 70.85], [71.0, 71.98], [73.0, 75.34], [76.0, 76.32], [79.0, 80.38], [82.0, 83.29], [84.0, 84.86], [85.0, 87.72], [88.0, 100.4], [101.0, 134.43]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [52.16, 36.57, 0.0, 48.31, 41.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.66, 0.0, 0.0, 69.2, 0.0, 0.0, 0.0, 0.0, 47.2, 37.41, 0.0], "audiomae_on_audioset": [null, [["hum", 29.86], ["throbbing", 29.85], ["music", 6.83]], null, [["speech", 29.25], ["hum", 12.5], ["mains hum", 10.18]], [["fly, housefly", 56.28], ["insect", 14.1], ["mosquito", 9.21]], null, null, null, null, null, null, [["speech", 41.01], ["music", 17.5], ["fly, housefly", 6.01]], null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 16.58], ["moo", 15.74], ["cattle, bovinae", 14.36]], [["speech", 58.18], ["fart", 12.57], ["whale vocalization", 3.11]], null], "duration": [3.8, 6.08, 0.06, 23.72, 7.22, 0.7, 0.68, 1.69, 1.39, 0.98, 1.09, 4.2, 0.85, 0.98, 2.34, 0.32, 1.38, 1.29, 0.86, 2.72, 12.4, 33.43]} \ No newline at end of file diff --git a/annotations_filtered/pxy0q9dp1GA_filtered.json b/annotations_filtered/pxy0q9dp1GA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95e924d680916db239b914332dd6592d20c0ecf1 --- /dev/null +++ b/annotations_filtered/pxy0q9dp1GA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.24], [14.0, 17.51], [26.0, 26.27], [31.0, 30.65], [41.0, 42.28], [45.0, 48.2], [53.0, 53.27], [57.0, 57.59], [58.0, 58.58], [60.0, 60.05], [61.0, 62.48], [64.0, 64.84], [67.0, 66.78], [71.0, 72.87]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [40.95, 88.64, 0.0, 0.0, 0.0, 33.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.98], ["speech", 9.29], ["musical instrument", 5.72]], null, null, null, null, [["speech", 29.29], ["whack, thwack", 19.43], ["thunk", 11.75]], null, null, null, null, null, null, null, null], "duration": [8.24, 3.51, 0.27, -0.35, 1.28, 3.2, 0.27, 0.59, 0.58, 0.05, 1.48, 0.84, -0.22, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/py7xqlpvCIk_filtered.json b/annotations_filtered/py7xqlpvCIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ceae0447940da73a9b7236b5c4396bfe2c8ac632 --- /dev/null +++ b/annotations_filtered/py7xqlpvCIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [6.0, 39.16], [40.0, 55.54], [56.0, 67.63], [69.0, 101.41], [102.0, 105.48]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.31, 33.43, 0.0, 30.32], "audiomae_on_audioset": [null, null, [["hum", 52.52], ["mains hum", 32.25], ["music", 8.38]], [["music", 40.73], ["hum", 36.47], ["mains hum", 5.36]], null, [["fly, housefly", 45.85], ["insect", 28.17], ["speech", 7.25]]], "duration": [1.13, 33.16, 15.54, 11.63, 32.41, 3.48]} \ No newline at end of file diff --git a/annotations_filtered/pyXdB_AYiDs_filtered.json b/annotations_filtered/pyXdB_AYiDs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..336204354457d6bae82e99a88c5f06de867ed748 --- /dev/null +++ b/annotations_filtered/pyXdB_AYiDs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.2], [7.0, 7.8], [10.0, 10.34], [12.0, 12.31], [13.0, 13.81], [15.0, 15.26], [16.0, 16.04], [17.0, 16.92], [19.0, 25.08], [26.0, 28.07], [29.0, 30.84], [31.0, 46.92], [47.0, 88.69], [89.0, 91.4], [93.0, 97.02], [99.0, 105.07], [106.0, 117.49], [119.0, 120.72], [123.0, 123.33], [123.0, 124.14], [127.0, 135.51], [137.0, 140.37], [142.0, 143.63], [145.0, 157.4], [159.0, 165.01], [167.0, 176.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 100.0, 0.0, 43.82, 0.0, 79.24, 88.64, 82.61, 76.53, 0.0, 0.0, 0.0, 33.28, 38.11, 0.0, 49.0, 30.72, 29.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 35.37], ["mains hum", 21.36], ["music", 20.1]], null, null, null, null, null, null, null, null, [["music", 38.46], ["hum", 9.88], ["throbbing", 7.08]], [["music", 29.65], ["whale vocalization", 16.39], ["didgeridoo", 8.84]], null, [["music", 62.62], ["hum", 10.06], ["didgeridoo", 6.31]], [["music", 43.78], ["cacophony", 15.45], ["synthesizer", 7.39]], [["cacophony", 35.38], ["music", 24.78], ["smash, crash", 6.25]]], "duration": [1.2, 0.8, 0.34, 0.31, 0.81, 0.26, 0.04, -0.08, 6.08, 2.07, 1.84, 15.92, 41.69, 2.4, 4.02, 6.07, 11.49, 1.72, 0.33, 1.14, 8.51, 3.37, 1.63, 12.4, 6.01, 9.67]} \ No newline at end of file diff --git a/annotations_filtered/pyvthgZdQhc_filtered.json b/annotations_filtered/pyvthgZdQhc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99779233def9959fcfd234055a60a201c6f65120 --- /dev/null +++ b/annotations_filtered/pyvthgZdQhc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.41], [26.0, 40.86], [43.0, 43.48], [51.0, 51.71], [53.0, 61.79], [64.0, 67.26], [76.0, 76.44], [81.0, 81.6], [82.0, 84.91], [92.0, 92.43], [95.0, 127.11]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 53.84, 0.0, 0.0, 62.47, 33.49, 0.0, 0.0, 51.12, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 35.77], ["speech", 26.61], ["theremin", 4.05]], null, null, null, null, null], "duration": [1.41, 14.86, 0.48, 0.71, 8.79, 3.26, 0.44, 0.6, 2.91, 0.43, 32.11]} \ No newline at end of file diff --git a/annotations_filtered/pz0R9XJciO0_filtered.json b/annotations_filtered/pz0R9XJciO0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b42f66b48f86ceac269751d0ac28fa489780548 --- /dev/null +++ b/annotations_filtered/pz0R9XJciO0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 83.03], [86.0, 101.88], [104.0, 121.12], [121.0, 123.21]], "keep_status": [false, true, false, true], "silence_prob": [31.48, 32.96, 34.46, 32.29], "audiomae_on_audioset": [[["music", 58.94], ["speech", 17.06], ["didgeridoo", 2.72]], [["music", 50.68], ["smash, crash", 9.26], ["trombone", 6.1]], [["music", 70.49], ["didgeridoo", 3.0], ["whack, thwack", 2.99]], [["music", 31.34], ["speech", 10.41], ["groan", 6.17]]], "duration": [12.03, 15.88, 17.12, 2.21]} \ No newline at end of file diff --git a/annotations_filtered/pz6wAzZlnhE_filtered.json b/annotations_filtered/pz6wAzZlnhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..019b55ce7ef3b45a306bee4b1f921c7099f4e6d6 --- /dev/null +++ b/annotations_filtered/pz6wAzZlnhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.59], [11.0, 18.08], [19.0, 21.19], [24.0, 25.93], [28.0, 30.62], [34.0, 36.46], [39.0, 39.5], [42.0, 49.79], [51.0, 52.69], [54.0, 54.78], [56.0, 56.05], [57.0, 57.45], [58.0, 58.06], [59.0, 84.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 100.0, 0.0, 98.44, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.59, 7.08, 2.19, 1.93, 2.62, 2.46, 0.5, 7.79, 1.69, 0.78, 0.05, 0.45, 0.06, 25.86]} \ No newline at end of file diff --git a/annotations_filtered/pzE6SVUHAYE_filtered.json b/annotations_filtered/pzE6SVUHAYE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1411acf4ccd42e255252174482656c82ee145ae8 --- /dev/null +++ b/annotations_filtered/pzE6SVUHAYE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.18], [5.0, 6.83], [13.0, 13.58], [16.0, 17.32], [24.0, 26.81], [31.0, 31.82], [91.0, 98.29], [99.0, 102.41]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.18, 1.83, 0.58, 1.32, 2.81, 0.82, 7.29, 3.41]} \ No newline at end of file diff --git a/annotations_filtered/pzG1ckuBqpg_filtered.json b/annotations_filtered/pzG1ckuBqpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afc73124e4d90e22e7ff7a021932e31027dcafbc --- /dev/null +++ b/annotations_filtered/pzG1ckuBqpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.56], [32.0, 49.47], [76.0, 87.96], [90.0, 98.1], [101.0, 104.36], [113.0, 117.15], [125.0, 128.29], [131.0, 131.5], [133.0, 134.54], [135.0, 135.46], [138.0, 139.75], [140.0, 143.19]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [66.39, 31.1, 42.28, 78.04, 78.21, 78.38, 30.67, 0.0, 0.0, 0.0, 0.0, 52.39], "audiomae_on_audioset": [null, [["speech", 83.06], ["boing", 2.28], ["whack, thwack", 1.23]], [["hum", 21.84], ["music", 13.01], ["musical instrument", 10.83]], null, null, null, [["speech", 73.99], ["radio", 11.49], ["speech synthesizer", 3.36]], null, null, null, null, null], "duration": [5.56, 17.47, 11.96, 8.1, 3.36, 4.15, 3.29, 0.5, 1.54, 0.46, 1.75, 3.19]} \ No newline at end of file diff --git a/annotations_filtered/pzZ9UdUTRNA_filtered.json b/annotations_filtered/pzZ9UdUTRNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc822d4e1c94bc77ce61c6cc6271fbd89602f873 --- /dev/null +++ b/annotations_filtered/pzZ9UdUTRNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.54], [5.0, 5.73], [15.0, 16.17], [17.0, 25.69], [27.0, 27.84], [29.0, 29.71], [31.0, 31.78], [32.0, 41.52], [42.0, 43.58], [45.0, 46.79], [50.0, 72.28], [79.0, 80.42], [91.0, 94.27], [99.0, 106.83], [113.0, 131.75], [138.0, 140.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 50.97, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 35.91, 0.0, 76.04, 53.1, 64.97, 45.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["machine gun", 58.25], ["speech", 14.24], ["gunshot, gunfire", 8.49]], null, null, null, null, [["music", 48.37], ["electronic music", 6.48], ["scary music", 4.18]]], "duration": [1.54, 0.73, 1.17, 8.69, 0.84, 0.71, 0.78, 9.52, 1.58, 1.79, 22.28, 1.42, 3.27, 7.83, 18.75, 2.88]} \ No newline at end of file