Spaces:
Build error
Build error
Adds files 2
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- annotations_2/--Jiv5iYqT8_filtered.json +1 -0
- annotations_2/--aqjaJyZLk_filtered.json +1 -0
- annotations_2/--oCWVOBuvA_filtered.json +1 -0
- annotations_2/--uyzf7X_0c_filtered.json +1 -0
- annotations_2/--vFXH3mH3A_filtered.json +1 -0
- annotations_2/-0f67QE-HP8_filtered.json +1 -0
- annotations_2/-1U0LH6dPfw_filtered.json +1 -0
- annotations_2/-37Mhsak-XI_filtered.json +1 -0
- annotations_2/-3KCgSpt3hU_filtered.json +1 -0
- annotations_2/-3RMOO6mHr4_filtered.json +1 -0
- annotations_2/-4Q-MS_oFkw_filtered.json +1 -0
- annotations_2/-4QqksHXUCc_filtered.json +1 -0
- annotations_2/-4_rMqeyOJY_filtered.json +1 -0
- annotations_2/-5be_UPkLRw_filtered.json +1 -0
- annotations_2/-64q4HpZyaY_filtered.json +1 -0
- annotations_2/-78FgmNwyD4_filtered.json +1 -0
- annotations_2/-7krYJUfFv4_filtered.json +1 -0
- annotations_2/-9DrPi3ki0g_filtered.json +1 -0
- annotations_2/-9P7Ge1KmTY_filtered.json +1 -0
- annotations_2/-ASYRiRflDM_filtered.json +1 -0
- annotations_2/-BOt25-zf8Q_filtered.json +1 -0
- annotations_2/-CKzCdneg04_filtered.json +1 -0
- annotations_2/-CXBIAH4Kgo_filtered.json +1 -0
- annotations_2/-DF-MgSuhQ0_filtered.json +1 -0
- annotations_2/-GSZwG_s-8A_filtered.json +1 -0
- annotations_2/-G_I8dQHN5s_filtered.json +1 -0
- annotations_2/-GaJPgI3jh4_filtered.json +1 -0
- annotations_2/-HPjEz0u-9Q_filtered.json +1 -0
- annotations_2/-HTF_tAUtkQ_filtered.json +1 -0
- annotations_2/-HwMH2_-oKA_filtered.json +1 -0
- annotations_2/-IIHYIZSFbk_filtered.json +1 -0
- annotations_2/-JERO2LQSKc_filtered.json +1 -0
- annotations_2/-Jzi-2lYWEw_filtered.json +1 -0
- annotations_2/-Kd5zqw24S4_filtered.json +1 -0
- annotations_2/-Luy502C920_filtered.json +1 -0
- annotations_2/-N2mhlvygq0_filtered.json +1 -0
- annotations_2/-NeY5tqk1N8_filtered.json +1 -0
- annotations_2/-Nr56-RD_g8_filtered.json +1 -0
- annotations_2/-O3_WO63fhU_filtered.json +1 -0
- annotations_2/-Ot948zIr0s_filtered.json +1 -0
- annotations_2/-PFdr0SiAEw_filtered.json +1 -0
- annotations_2/-Pf1f0pZdnQ_filtered.json +1 -0
- annotations_2/-QJsljIDKkk_filtered.json +1 -0
- annotations_2/-QNxYSDdpig_filtered.json +1 -0
- annotations_2/-QOahlrO8Yo_filtered.json +1 -0
- annotations_2/-QWL-FwX4t4_filtered.json +1 -0
- annotations_2/-RuK7XKbefY_filtered.json +1 -0
- annotations_2/-SJAzpHg4s8_filtered.json +1 -0
- annotations_2/-TLCaDbBv_s_filtered.json +1 -0
- annotations_2/-TzrPYcpPvY_filtered.json +1 -0
annotations_2/--Jiv5iYqT8_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 5.14], [7.0, 8.21], [9.0, 12.63], [13.0, 15.26], [17.0, 19.16], [20.0, 23.95], [25.0, 30.32], [31.0, 41.57], [43.0, 54.11], [55.0, 58.31], [59.0, 61.94], [64.0, 99.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.52, 0.0, 100.0, 100.0, 100.0, 100.0, 99.93, 99.95, 99.98, 77.53, 81.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.14, 1.21, 3.63, 2.26, 2.16, 3.95, 5.32, 10.57, 11.11, 3.31, 2.94, 35.55]}
|
annotations_2/--aqjaJyZLk_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[8.0, 15.62], [19.0, 22.18], [24.0, 25.74], [26.0, 26.6], [29.0, 33.02], [41.0, 42.13], [46.0, 46.55], [47.0, 48.63], [50.0, 51.17], [54.0, 55.27], [56.0, 57.32], [58.0, 59.81], [63.0, 63.49], [69.0, 69.21], [70.0, 72.59], [75.0, 75.64], [77.0, 78.58], [81.0, 81.77], [83.0, 83.69], [85.0, 85.83], [87.0, 88.38], [89.0, 90.8], [91.0, 91.88], [92.0, 92.64], [95.0, 97.17], [98.0, 106.57], [108.0, 109.51], [110.0, 111.52], [112.0, 115.32], [118.0, 120.87]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [52.27, 54.97, 0.0, 0.0, 49.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.55, 37.26, 0.0, 0.0, 31.3, 58.72], "audiomae_on_audioset": [null, null, null, null, [["noise", 17.53], ["hum", 14.74], ["music", 12.08]], null, null, null, null, null, null, null, null, null, [["music", 42.85], ["speech", 9.51], ["hum", 6.87]], null, null, null, null, null, null, null, null, null, [["tuning fork", 85.18], ["coin (dropping)", 2.94], ["gong", 2.22]], [["music", 39.36], ["mechanisms", 7.52], ["hum", 6.54]], null, null, [["music", 14.77], ["clang", 10.79], ["fly, housefly", 8.68]], null], "duration": [7.62, 3.18, 1.74, 0.6, 4.02, 1.13, 0.55, 1.63, 1.17, 1.27, 1.32, 1.81, 0.49, 0.21, 2.59, 0.64, 1.58, 0.77, 0.69, 0.83, 1.38, 1.8, 0.88, 0.64, 2.17, 8.57, 1.51, 1.52, 3.32, 2.87]}
|
annotations_2/--oCWVOBuvA_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 2.42], [4.0, 5.46], [7.0, 7.35], [9.0, 12.02], [13.0, 14.1], [16.0, 17.66], [20.0, 21.22], [24.0, 26.03], [27.0, 28.41], [32.0, 32.81], [36.0, 36.37], [38.0, 38.4], [41.0, 47.61], [49.0, 51.41], [55.0, 56.3], [58.0, 58.21], [60.0, 64.56], [66.0, 66.36], [67.0, 68.35], [70.0, 72.81], [74.0, 75.02], [77.0, 78.65], [80.0, 81.68], [83.0, 83.17], [84.0, 87.4], [88.0, 92.03], [94.0, 95.12], [98.0, 99.33], [102.0, 101.78], [103.0, 105.87], [106.0, 106.83], [109.0, 109.81], [112.0, 113.04], [118.0, 119.72], [121.0, 121.34], [126.0, 126.22], [129.0, 129.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 94.95, 0.0, 0.0, 67.13, 0.0, 0.0, 0.0, 0.0, 100.0, 99.98, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 1.46, 0.35, 3.02, 1.1, 1.66, 1.22, 2.03, 1.41, 0.81, 0.37, 0.4, 6.61, 2.41, 1.3, 0.21, 4.56, 0.36, 1.35, 2.81, 1.02, 1.65, 1.68, 0.17, 3.4, 4.03, 1.12, 1.33, -0.22, 2.87, 0.83, 0.81, 1.04, 1.72, 0.34, 0.22, 0.73]}
|
annotations_2/--uyzf7X_0c_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[3.0, 3.45], [5.0, 5.07], [8.0, 8.16], [13.0, 12.78], [20.0, 20.21], [24.0, 24.07], [26.0, 26.52], [35.0, 35.53], [40.0, 40.29], [48.0, 48.36], [51.0, 51.54], [54.0, 54.72], [70.0, 69.72], [71.0, 71.68], [74.0, 74.43], [77.0, 76.92], [78.0, 78.51], [82.0, 82.24], [83.0, 83.03], [85.0, 85.31], [88.0, 88.8], [90.0, 90.86], [95.0, 95.47], [100.0, 100.31], [105.0, 105.33], [107.0, 107.01], [111.0, 111.92], [115.0, 115.06], [115.0, 115.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.07, 0.16, -0.22, 0.21, 0.07, 0.52, 0.53, 0.29, 0.36, 0.54, 0.72, -0.28, 0.68, 0.43, -0.08, 0.51, 0.24, 0.03, 0.31, 0.8, 0.86, 0.47, 0.31, 0.33, 0.01, 0.92, 0.06, 0.7]}
|
annotations_2/--vFXH3mH3A_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[9.0, 16.01], [18.0, 36.73], [38.0, 41.69], [49.0, 51.97], [58.0, 59.56], [61.0, 65.1], [74.0, 82.44], [83.0, 89.94], [90.0, 90.98], [96.0, 98.64], [103.0, 103.92], [108.0, 107.97], [108.0, 109.88], [112.0, 114.1], [118.0, 130.54], [132.0, 133.14], [134.0, 144.76], [147.0, 160.37], [161.0, 166.53], [168.0, 167.9], [170.0, 170.83], [173.0, 172.84]], "keep_status": [true, true, true, false, false, false, true, false, false, true, false, false, false, true, true, false, false, false, true, false, false, false], "silence_prob": [28.92, 29.82, 29.42, 29.02, 0.0, 30.59, 29.01, 29.08, 0.0, 29.77, 0.0, 0.0, 0.0, 28.94, 29.1, 0.0, 29.24, 28.93, 30.87, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whack, thwack", 11.06], ["mosquito", 7.33], ["speech", 6.95]], [["rumble", 29.07], ["hum", 13.01], ["mains hum", 12.77]], [["speech", 17.98], ["whale vocalization", 16.64], ["groan", 16.12]], [["music", 63.1], ["speech", 7.17], ["electronic music", 1.88]], null, [["didgeridoo", 33.1], ["speech", 24.81], ["music", 22.07]], [["music", 52.24], ["vehicle", 9.53], ["motorcycle", 2.87]], [["music", 50.65], ["cattle, bovinae", 18.06], ["moo", 9.87]], null, [["music", 25.05], ["cattle, bovinae", 23.46], ["moo", 18.88]], null, null, null, [["groan", 43.37], ["music", 6.03], ["grunt", 5.74]], [["music", 39.13], ["speech", 20.56], ["electronic music", 6.22]], null, [["music", 83.89], ["electronic music", 3.05], ["techno", 1.93]], [["music", 79.27], ["hum", 3.27], ["throbbing", 2.72]], [["fly, housefly", 28.0], ["explosion", 24.83], ["boom", 9.83]], null, null, null], "duration": [7.01, 18.73, 3.69, 2.97, 1.56, 4.1, 8.44, 6.94, 0.98, 2.64, 0.92, -0.03, 1.88, 2.1, 12.54, 1.14, 10.76, 13.37, 5.53, -0.1, 0.83, -0.16]}
|
annotations_2/-0f67QE-HP8_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[0.0, 0.85], [2.0, 3.06], [4.0, 7.08], [9.0, 35.92], [38.0, 41.82], [44.0, 45.98], [48.0, 57.75], [58.0, 57.86], [58.0, 93.53], [98.0, 105.11], [110.0, 113.12], [114.0, 115.65], [118.0, 121.74], [132.0, 139.5], [143.0, 142.79], [143.0, 143.9], [148.0, 148.56], [152.0, 157.91], [160.0, 159.92], [161.0, 164.03], [169.0, 169.53], [171.0, 172.02], [181.0, 182.46]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.97, 30.71, 34.35, 0.0, 32.99, 0.0, 0.0, 29.01, 30.45, 0.0, 29.66, 30.04, 0.0, 0.0, 0.0, 31.53, 0.0, 30.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 72.72], ["music", 8.61], ["sidetone", 2.77]], [["music", 57.26], ["throbbing", 8.84], ["hum", 6.68]], null, [["whale vocalization", 88.55], ["music", 6.54], ["musical instrument", 0.81]], null, null, [["speech", 24.98], ["music", 16.76], ["whack, thwack", 8.37]], [["whale vocalization", 77.84], ["mosquito", 3.38], ["moo", 2.41]], null, [["explosion", 30.95], ["burst, pop", 13.91], ["speech", 9.44]], [["speech", 27.71], ["music", 15.41], ["cattle, bovinae", 6.74]], null, null, null, [["music", 32.22], ["electronic music", 12.21], ["dubstep", 7.19]], null, [["speech", 74.27], ["sound effect", 3.57], ["fart", 2.7]], null, null, null], "duration": [0.85, 1.06, 3.08, 26.92, 3.82, 1.98, 9.75, -0.14, 35.53, 7.11, 3.12, 1.65, 3.74, 7.5, -0.21, 0.9, 0.56, 5.91, -0.08, 3.03, 0.53, 1.02, 1.46]}
|
annotations_2/-1U0LH6dPfw_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 2.61], [3.0, 3.11], [3.0, 4.31], [13.0, 14.22], [22.0, 24.88], [26.0, 31.73], [35.0, 38.31], [39.0, 42.03], [46.0, 56.1], [61.0, 85.5], [98.0, 98.49], [100.0, 107.32], [108.0, 108.38], [120.0, 120.63]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.28, 30.67, 30.45, 30.48, 30.16, 30.01, 0.0, 33.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 61.12], ["didgeridoo", 4.8], ["sidetone", 4.55]], [["music", 62.74], ["hum", 9.5], ["throbbing", 5.24]], [["music", 45.36], ["speech", 19.03], ["boing", 5.23]], [["music", 53.7], ["boing", 15.98], ["fly, housefly", 3.21]], [["music", 60.24], ["speech", 11.81], ["boing", 9.62]], [["music", 68.45], ["boing", 10.58], ["speech", 6.01]], null, [["music", 42.75], ["speech", 18.11], ["mains hum", 12.3]], null, null], "duration": [0.61, 0.11, 1.31, 1.22, 2.88, 5.73, 3.31, 3.03, 10.1, 24.5, 0.49, 7.32, 0.38, 0.63]}
|
annotations_2/-37Mhsak-XI_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[44.0, 44.73], [48.0, 65.79], [68.0, 86.9], [88.0, 96.03], [97.0, 119.35], [120.0, 123.89], [125.0, 127.58]], "keep_status": [false, false, false, false, true, false, true], "silence_prob": [0.0, 31.97, 35.22, 58.05, 45.75, 58.98, 46.79], "audiomae_on_audioset": [null, [["music", 75.5], ["theremin", 5.06], ["scary music", 3.28]], [["music", 40.89], ["speech", 25.7], ["boing", 12.51]], null, [["music", 36.75], ["guitar", 18.42], ["plucked string instrument", 8.13]], null, [["music", 51.17], ["boing", 10.19], ["didgeridoo", 3.32]]], "duration": [0.73, 17.79, 18.9, 8.03, 22.35, 3.89, 2.58]}
|
annotations_2/-3KCgSpt3hU_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[0.0, 0.26], [2.0, 3.81], [7.0, 6.88], [11.0, 10.98], [14.0, 16.56], [21.0, 21.47], [28.0, 28.24], [31.0, 32.36], [36.0, 37.34], [39.0, 40.07], [44.0, 46.47], [48.0, 48.44], [53.0, 54.99], [56.0, 56.88], [57.0, 58.53], [66.0, 68.28], [71.0, 72.1], [73.0, 73.55], [74.0, 78.63], [81.0, 81.43], [83.0, 84.79], [86.0, 86.05], [90.0, 91.77], [95.0, 95.66], [99.0, 100.94], [102.0, 103.57], [105.0, 105.85], [107.0, 108.28], [111.0, 112.83], [114.0, 119.4], [120.0, 121.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 1.81, -0.12, -0.02, 2.56, 0.47, 0.24, 1.36, 1.34, 1.07, 2.47, 0.44, 1.99, 0.88, 1.53, 2.28, 1.1, 0.55, 4.63, 0.43, 1.79, 0.05, 1.77, 0.66, 1.94, 1.57, 0.85, 1.28, 1.83, 5.4, 1.05]}
|
annotations_2/-3RMOO6mHr4_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[32.0, 32.24], [33.0, 32.98], [38.0, 37.61], [39.0, 39.99], [47.0, 49.03], [49.0, 49.08], [78.0, 81.3], [89.0, 90.56], [99.0, 113.17]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.33, 0.0, 30.81, 0.0, 30.68], "audiomae_on_audioset": [null, null, null, null, [["livestock, farm animals, working animals", 36.74], ["moo", 21.51], ["cattle, bovinae", 13.9]], null, [["music", 20.01], ["moo", 13.1], ["speech", 11.05]], null, [["music", 72.64], ["electronic music", 5.15], ["techno", 3.8]]], "duration": [0.24, -0.02, -0.39, 0.99, 2.03, 0.08, 3.3, 1.56, 14.17]}
|
annotations_2/-4Q-MS_oFkw_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[11.0, 11.03], [13.0, 13.14], [16.0, 19.82], [24.0, 24.0], [24.0, 25.22], [28.0, 31.28], [33.0, 45.86], [48.0, 50.08], [53.0, 54.19], [57.0, 67.07], [72.0, 72.99], [73.0, 86.34], [99.0, 113.97], [118.0, 125.14]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 93.6, 0.0, 0.0, 51.88, 43.56, 93.76, 0.0, 81.0, 0.0, 48.31, 42.06, 33.06], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 38.94], ["synthesizer", 14.42], ["theremin", 3.43]], null, null, null, null, [["music", 47.22], ["speech", 21.31], ["theremin", 7.97]], [["music", 46.21], ["theremin", 24.05], ["synthesizer", 4.34]], [["music", 29.76], ["foghorn", 27.27], ["brass instrument", 3.53]]], "duration": [0.03, 0.14, 3.82, 0.0, 1.22, 3.28, 12.86, 2.08, 1.19, 10.07, 0.99, 13.34, 14.97, 7.14]}
|
annotations_2/-4QqksHXUCc_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[6.0, 6.91], [8.0, 13.36], [19.0, 20.43], [22.0, 24.17], [27.0, 27.38], [43.0, 46.65], [52.0, 57.62], [58.0, 61.52], [66.0, 68.44], [72.0, 72.52], [76.0, 77.55], [90.0, 89.78], [99.0, 100.2], [107.0, 107.87], [119.0, 119.97], [121.0, 122.76], [123.0, 125.02]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 34.59, 0.0, 36.53, 0.0, 32.91, 37.86, 36.06, 34.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.59], "audiomae_on_audioset": [null, [["music", 55.86], ["throbbing", 11.97], ["electronic music", 4.41]], null, [["hum", 30.96], ["throbbing", 30.29], ["music", 20.06]], null, [["music", 59.22], ["hum", 9.81], ["throbbing", 5.74]], [["music", 60.68], ["didgeridoo", 4.99], ["moo", 3.55]], [["music", 35.65], ["speech", 24.35], ["hum", 4.25]], [["fly, housefly", 22.19], ["music", 18.42], ["insect", 14.12]], null, null, null, null, null, null, null, [["music", 23.99], ["boing", 15.45], ["didgeridoo", 13.58]]], "duration": [0.91, 5.36, 1.43, 2.17, 0.38, 3.65, 5.62, 3.52, 2.44, 0.52, 1.55, -0.22, 1.2, 0.87, 0.97, 1.76, 2.02]}
|
annotations_2/-4_rMqeyOJY_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[4.0, 4.99], [7.0, 13.02], [14.0, 14.57], [15.0, 16.07], [17.0, 18.4], [19.0, 20.65], [24.0, 28.92], [31.0, 32.14], [33.0, 35.72], [36.0, 37.72], [45.0, 46.35], [51.0, 51.63], [55.0, 55.59], [60.0, 60.86], [63.0, 63.73], [64.0, 64.4], [68.0, 69.03], [78.0, 79.19], [80.0, 85.9], [88.0, 89.72], [92.0, 93.21], [95.0, 107.42], [109.0, 113.54], [114.0, 121.71], [123.0, 124.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 45.72, 37.88, 43.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 67.89], ["frog", 5.36], ["insect", 3.47]], [["speech", 27.14], ["dial tone", 23.51], ["busy signal", 6.93]], [["speech", 51.05], ["throat clearing", 5.81], ["noise", 4.84]], null], "duration": [0.99, 6.02, 0.57, 1.07, 1.4, 1.65, 4.92, 1.14, 2.72, 1.72, 1.35, 0.63, 0.59, 0.86, 0.73, 0.4, 1.03, 1.19, 5.9, 1.72, 1.21, 12.42, 4.54, 7.71, 1.02]}
|
annotations_2/-5be_UPkLRw_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 4.06], [6.0, 6.29], [9.0, 12.5], [14.0, 16.61], [19.0, 20.55], [24.0, 30.74], [31.0, 32.48], [34.0, 33.76], [35.0, 35.63], [36.0, 40.47], [42.0, 44.19], [45.0, 46.9], [49.0, 49.62], [51.0, 52.59], [53.0, 55.44], [58.0, 58.31], [60.0, 60.81], [63.0, 63.42], [65.0, 65.94], [68.0, 68.39], [70.0, 70.63], [72.0, 72.94], [74.0, 75.36], [77.0, 77.63], [79.0, 79.93], [80.0, 83.71], [84.0, 87.1], [89.0, 89.45], [92.0, 91.83], [93.0, 102.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 0.0, 67.38, 99.99, 0.0, 99.62, 0.0, 0.0, 0.0, 100.0, 99.8, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 100.0, 0.0, 0.0, 99.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.06, 0.29, 3.5, 2.61, 1.55, 6.74, 1.48, -0.24, 0.63, 4.47, 2.19, 1.9, 0.62, 1.59, 2.44, 0.31, 0.81, 0.42, 0.94, 0.39, 0.63, 0.94, 1.36, 0.63, 0.93, 3.71, 3.1, 0.45, -0.17, 9.32]}
|
annotations_2/-64q4HpZyaY_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[3.0, 10.61], [12.0, 12.16], [13.0, 79.49], [80.0, 109.46], [111.0, 112.77], [116.0, 117.36], [119.0, 124.24]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [31.4, 0.0, 0.0, 69.07, 0.0, 0.0, 63.96], "audiomae_on_audioset": [[["fly, housefly", 24.9], ["mains hum", 24.38], ["hum", 14.07]], null, null, null, null, null, null], "duration": [7.61, 0.16, 66.49, 29.46, 1.77, 1.36, 5.24]}
|
annotations_2/-78FgmNwyD4_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[1.0, 1.0], [1.0, 1.16], [16.0, 16.8], [36.0, 36.1], [36.0, 37.08], [39.0, 41.34], [48.0, 48.9], [50.0, 50.38], [56.0, 56.52], [58.0, 58.78], [64.0, 64.3], [66.0, 66.85], [67.0, 76.86], [82.0, 82.63], [83.0, 83.62], [84.0, 84.59], [100.0, 101.29], [102.0, 102.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.14, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.84], ["groan", 22.6], ["screaming", 2.61]], null, null, null, null, null], "duration": [0.0, 0.16, 0.8, 0.1, 1.08, 2.34, 0.9, 0.38, 0.52, 0.78, 0.3, 0.85, 9.86, 0.63, 0.62, 0.59, 1.29, 0.12]}
|
annotations_2/-7krYJUfFv4_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[7.0, 8.58], [9.0, 10.77], [11.0, 11.94], [13.0, 14.71], [15.0, 16.53], [18.0, 19.45], [20.0, 20.78], [31.0, 31.26], [34.0, 34.37], [41.0, 41.52], [42.0, 42.4], [43.0, 43.65], [45.0, 45.25], [47.0, 47.73], [49.0, 49.59], [50.0, 50.63], [53.0, 54.16], [56.0, 56.03], [62.0, 63.31], [65.0, 65.69], [68.0, 68.22], [81.0, 81.48], [92.0, 92.75], [106.0, 107.37], [109.0, 109.34], [110.0, 111.01], [112.0, 112.08], [113.0, 113.48], [114.0, 114.15], [119.0, 119.03], [124.0, 126.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.58, 1.77, 0.94, 1.71, 1.53, 1.45, 0.78, 0.26, 0.37, 0.52, 0.4, 0.65, 0.25, 0.73, 0.59, 0.63, 1.16, 0.03, 1.31, 0.69, 0.22, 0.48, 0.75, 1.37, 0.34, 1.01, 0.08, 0.48, 0.15, 0.03, 2.66]}
|
annotations_2/-9DrPi3ki0g_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[12.0, 20.28], [22.0, 45.76]], "keep_status": [false, true], "silence_prob": [34.74, 33.61], "audiomae_on_audioset": [[["music", 49.81], ["theremin", 33.23], ["vehicle", 1.7]], [["music", 44.88], ["brass instrument", 11.34], ["trombone", 7.67]]], "duration": [8.28, 23.76]}
|
annotations_2/-9P7Ge1KmTY_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[4.0, 4.02], [5.0, 4.7], [5.0, 5.78], [7.0, 8.72], [32.0, 33.22], [38.0, 39.5], [41.0, 42.06], [47.0, 48.24], [51.0, 50.75], [51.0, 52.86], [54.0, 54.65], [65.0, 65.82], [69.0, 68.99], [76.0, 76.65], [79.0, 78.98], [81.0, 80.94], [84.0, 85.06], [87.0, 89.92], [91.0, 91.72], [92.0, 93.43], [95.0, 97.58], [106.0, 107.76], [111.0, 111.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.32, 0.0, 0.0, 96.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 65.48], ["telephone", 13.06], ["hum", 5.47]], null, null, null, null, null], "duration": [0.02, -0.3, 0.78, 1.72, 1.22, 1.5, 1.06, 1.24, -0.25, 1.86, 0.65, 0.82, -0.01, 0.65, -0.02, -0.06, 1.06, 2.92, 0.72, 1.43, 2.58, 1.76, 0.35]}
|
annotations_2/-ASYRiRflDM_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 2.96], [5.0, 5.0], [6.0, 6.96], [8.0, 8.68], [10.0, 10.96], [14.0, 14.4], [15.0, 16.77], [19.0, 20.97], [22.0, 22.99], [27.0, 27.23], [28.0, 29.74], [31.0, 33.59], [36.0, 36.83], [37.0, 38.97], [45.0, 45.28], [47.0, 47.46], [49.0, 49.84], [51.0, 51.22], [56.0, 57.87], [58.0, 58.75], [60.0, 60.98], [61.0, 61.99], [64.0, 64.1], [65.0, 65.79], [66.0, 66.6], [68.0, 68.91], [70.0, 71.22], [73.0, 73.03], [82.0, 85.29], [87.0, 87.62], [89.0, 89.21], [104.0, 103.64], [105.0, 106.96], [115.0, 114.78], [116.0, 116.51], [120.0, 120.61], [122.0, 122.93], [124.0, 124.95], [126.0, 127.38], [128.0, 129.19], [130.0, 130.11], [131.0, 131.57], [133.0, 134.27], [136.0, 136.38], [144.0, 144.63], [145.0, 147.6], [150.0, 150.21], [153.0, 153.49], [155.0, 155.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 0.0, 0.96, 0.68, 0.96, 0.4, 1.77, 1.97, 0.99, 0.23, 1.74, 2.59, 0.83, 1.97, 0.28, 0.46, 0.84, 0.22, 1.87, 0.75, 0.98, 0.99, 0.1, 0.79, 0.6, 0.91, 1.22, 0.03, 3.29, 0.62, 0.21, -0.36, 1.96, -0.22, 0.51, 0.61, 0.93, 0.95, 1.38, 1.19, 0.11, 0.57, 1.27, 0.38, 0.63, 2.6, 0.21, 0.49, 0.24]}
|
annotations_2/-BOt25-zf8Q_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[10.0, 10.49], [11.0, 11.99], [13.0, 13.36], [15.0, 15.7], [23.0, 24.43], [29.0, 29.12], [38.0, 40.31], [43.0, 42.8], [44.0, 49.74], [51.0, 50.95], [52.0, 57.08], [59.0, 61.2], [64.0, 68.2], [69.0, 69.45], [72.0, 77.48], [87.0, 87.56], [89.0, 96.18], [98.0, 99.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 40.7, 0.0, 45.21, 49.18, 40.36, 0.0, 47.39, 0.0, 39.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 53.99], ["speech", 15.3], ["guitar", 5.89]], null, [["music", 51.1], ["didgeridoo", 10.0], ["theremin", 6.33]], [["music", 51.86], ["guitar", 6.97], ["bass guitar", 5.58]], [["cattle, bovinae", 24.9], ["livestock, farm animals, working animals", 24.55], ["moo", 18.7]], null, [["music", 27.41], ["speech", 10.79], ["hum", 5.84]], null, [["mains hum", 55.58], ["hum", 19.35], ["speech", 6.47]], null], "duration": [0.49, 0.99, 0.36, 0.7, 1.43, 0.12, 2.31, -0.2, 5.74, -0.05, 5.08, 2.2, 4.2, 0.45, 5.48, 0.56, 7.18, 1.72]}
|
annotations_2/-CKzCdneg04_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[3.0, 2.98], [4.0, 5.48], [28.0, 27.94], [29.0, 29.15], [31.0, 31.14], [32.0, 33.51], [36.0, 35.72], [36.0, 36.93], [39.0, 39.55], [46.0, 45.79], [50.0, 50.03], [54.0, 53.92], [56.0, 60.59], [61.0, 63.04], [69.0, 73.55], [78.0, 87.08], [99.0, 99.37], [103.0, 109.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 44.87, 42.3, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.34], ["door", 2.71], ["telephone", 2.64]], [["speech", 61.25], ["ding", 11.35], ["thunk", 10.3]], null, null], "duration": [-0.02, 1.48, -0.06, 0.15, 0.14, 1.51, -0.28, 0.93, 0.55, -0.21, 0.03, -0.08, 4.59, 2.04, 4.55, 9.08, 0.37, 6.98]}
|
annotations_2/-CXBIAH4Kgo_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[3.0, 4.01], [5.0, 6.44], [9.0, 13.1], [18.0, 19.62], [20.0, 23.01], [25.0, 25.27], [26.0, 39.75], [41.0, 44.64], [46.0, 47.28], [49.0, 51.11], [53.0, 56.0], [57.0, 58.95], [60.0, 61.42], [64.0, 66.14], [67.0, 71.24], [72.0, 74.34], [75.0, 76.65], [78.0, 79.68], [80.0, 87.93], [91.0, 92.94], [96.0, 97.12], [99.0, 102.25], [104.0, 105.17], [106.0, 108.11], [109.0, 129.44], [133.0, 134.79], [136.0, 137.66], [139.0, 140.95], [144.0, 145.96], [148.0, 150.25], [152.0, 154.95], [156.0, 156.44], [158.0, 158.4], [159.0, 161.86]], "keep_status": [false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 29.1, 0.0, 37.35, 0.0, 47.66, 54.83, 0.0, 73.36, 58.81, 0.0, 0.0, 62.58, 60.7, 74.92, 0.0, 0.0, 42.17, 0.0, 0.0, 68.15, 0.0, 67.89, 66.76, 0.0, 0.0, 0.0, 0.0, 65.79, 37.73, 0.0, 0.0, 40.9], "audiomae_on_audioset": [null, null, [["speech", 31.48], ["explosion", 20.57], ["music", 11.66]], null, [["fly, housefly", 30.96], ["fowl", 9.91], ["creak", 7.03]], null, [["hum", 15.79], ["rumble", 14.23], ["music", 11.52]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.88], ["speech", 22.85], ["mains hum", 17.54]], null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 24.8], ["music", 24.74], ["hum", 4.13]], null, null, [["music", 45.36], ["speech", 39.28], ["whale vocalization", 2.24]]], "duration": [1.01, 1.44, 4.1, 1.62, 3.01, 0.27, 13.75, 3.64, 1.28, 2.11, 3.0, 1.95, 1.42, 2.14, 4.24, 2.34, 1.65, 1.68, 7.93, 1.94, 1.12, 3.25, 1.17, 2.11, 20.44, 1.79, 1.66, 1.95, 1.96, 2.25, 2.95, 0.44, 0.4, 2.86]}
|
annotations_2/-DF-MgSuhQ0_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[7.0, 9.73], [13.0, 14.4], [16.0, 17.31], [18.0, 18.71], [19.0, 20.83], [24.0, 24.31], [27.0, 29.34], [31.0, 34.8], [35.0, 36.75], [38.0, 39.31], [41.0, 50.11], [51.0, 52.05], [54.0, 54.68], [56.0, 57.4], [58.0, 59.59], [63.0, 64.81], [66.0, 70.04], [71.0, 127.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [58.55, 0.0, 0.0, 0.0, 0.0, 0.0, 77.53, 73.06, 0.0, 0.0, 34.61, 0.0, 0.0, 0.0, 0.0, 0.0, 29.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 28.83], ["music", 26.22], ["throbbing", 24.55]], null, null, null, null, null, [["hum", 17.16], ["rumble", 15.7], ["mains hum", 12.19]], null], "duration": [2.73, 1.4, 1.31, 0.71, 1.83, 0.31, 2.34, 3.8, 1.75, 1.31, 9.11, 1.05, 0.68, 1.4, 1.59, 1.81, 4.04, 56.06]}
|
annotations_2/-GSZwG_s-8A_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[1.0, 2.44], [3.0, 4.26], [7.0, 9.54], [10.0, 12.87], [13.0, 13.39], [17.0, 17.25], [20.0, 23.23], [24.0, 28.97], [29.0, 40.56], [41.0, 43.71], [45.0, 58.67], [59.0, 60.76], [61.0, 63.29], [64.0, 65.31], [67.0, 71.14], [72.0, 74.7], [75.0, 75.73], [77.0, 78.6], [80.0, 82.22], [84.0, 90.17], [90.0, 90.21], [94.0, 96.48], [98.0, 114.37], [117.0, 142.94], [146.0, 167.85], [171.0, 180.91], [181.0, 182.66], [183.0, 195.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 99.99, 94.81, 0.0, 0.0, 100.0, 97.43, 75.55, 100.0, 85.17, 0.0, 85.72, 0.0, 99.98, 100.0, 0.0, 0.0, 100.0, 98.01, 0.0, 50.11, 39.91, 37.24, 38.84, 52.86, 0.0, 38.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["ding", 21.15], ["cattle, bovinae", 20.11], ["livestock, farm animals, working animals", 16.65]], [["clang", 18.96], ["ding", 15.69], ["fly, housefly", 13.34]], [["fly, housefly", 56.08], ["insect", 19.37], ["mosquito", 9.11]], null, null, [["speech", 43.07], ["explosion", 7.66], ["buzz", 7.05]]], "duration": [1.44, 1.26, 2.54, 2.87, 0.39, 0.25, 3.23, 4.97, 11.56, 2.71, 13.67, 1.76, 2.29, 1.31, 4.14, 2.7, 0.73, 1.6, 2.22, 6.17, 0.21, 2.48, 16.37, 25.94, 21.85, 9.91, 1.66, 12.0]}
|
annotations_2/-G_I8dQHN5s_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[19.0, 19.31], [20.0, 20.29], [33.0, 33.71], [35.0, 36.98], [38.0, 39.53], [40.0, 44.63], [46.0, 47.28], [48.0, 48.51], [49.0, 51.38], [54.0, 55.81], [57.0, 57.55], [60.0, 60.18], [62.0, 66.29], [70.0, 71.96], [76.0, 76.5], [79.0, 78.8], [81.0, 82.83], [83.0, 85.87], [87.0, 88.23], [90.0, 91.45], [94.0, 93.92], [105.0, 104.6], [105.0, 105.83], [107.0, 107.18], [108.0, 108.48], [113.0, 113.0], [115.0, 116.68], [121.0, 120.85], [123.0, 128.02], [129.0, 129.46], [142.0, 141.67], [147.0, 150.2], [152.0, 152.66], [154.0, 156.52], [161.0, 173.03], [187.0, 187.62], [193.0, 193.21], [193.0, 193.41], [193.0, 194.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 78.38, 0.0, 0.0, 0.0, 0.0, 49.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.78, 0.0, 0.0, 59.96, 0.0, 64.18, 55.11, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 22.34], ["mains hum", 18.99], ["hum", 7.49]], null, null, null, null, null, null, null, null, null, null, [["mains hum", 50.48], ["hum", 24.6], ["music", 16.73]], null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 0.29, 0.71, 1.98, 1.53, 4.63, 1.28, 0.51, 2.38, 1.81, 0.55, 0.18, 4.29, 1.96, 0.5, -0.2, 1.83, 2.87, 1.23, 1.45, -0.08, -0.4, 0.83, 0.18, 0.48, 0.0, 1.68, -0.15, 5.02, 0.46, -0.33, 3.2, 0.66, 2.52, 12.03, 0.62, 0.21, 0.41, 1.86]}
|
annotations_2/-GaJPgI3jh4_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[0.0, 0.45], [17.0, 17.36], [22.0, 22.01], [27.0, 27.5], [30.0, 33.29], [48.0, 48.27], [74.0, 74.56], [77.0, 79.41], [106.0, 105.6], [107.0, 108.58], [114.0, 113.71], [129.0, 130.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 0.0, 93.29, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.36, 0.01, 0.5, 3.29, 0.27, 0.56, 2.41, -0.4, 1.58, -0.29, 1.42]}
|
annotations_2/-HPjEz0u-9Q_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[38.0, 38.57], [40.0, 40.49], [42.0, 41.72], [45.0, 46.25], [48.0, 57.18], [61.0, 62.72], [65.0, 65.13], [67.0, 67.19], [67.0, 67.22], [67.0, 71.83], [73.0, 74.14], [83.0, 92.16], [94.0, 115.52], [116.0, 117.41], [119.0, 119.35], [121.0, 123.85]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 53.53, 0.0, 0.0, 0.0, 0.0, 36.97, 0.0, 39.12, 37.65, 0.0, 0.0, 81.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["sidetone", 33.75], ["speech", 26.88], ["electric shaver, electric razor", 3.88]], null, [["speech", 51.44], ["music", 13.26], ["hum", 5.03]], [["speech", 27.98], ["thump, thud", 15.85], ["whack, thwack", 7.97]], null, null, null], "duration": [0.57, 0.49, -0.28, 1.25, 9.18, 1.72, 0.13, 0.19, 0.22, 4.83, 1.14, 9.16, 21.52, 1.41, 0.35, 2.85]}
|
annotations_2/-HTF_tAUtkQ_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[11.0, 12.56], [16.0, 16.7], [24.0, 25.49], [37.0, 37.74], [42.0, 44.02], [49.0, 49.55], [60.0, 61.55], [65.0, 66.5], [85.0, 86.61], [89.0, 96.99], [105.0, 107.99], [108.0, 108.82], [116.0, 120.75]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 49.87, 0.0, 0.0, 0.0, 0.0, 30.8, 31.19, 0.0, 31.46], "audiomae_on_audioset": [null, null, null, null, [["music", 42.14], ["throbbing", 7.54], ["hum", 7.23]], null, null, null, null, [["speech", 38.58], ["music", 33.33], ["musical instrument", 2.41]], [["music", 30.55], ["speech", 12.0], ["fly, housefly", 9.55]], null, [["speech", 33.82], ["music", 24.08], ["musical instrument", 9.47]]], "duration": [1.56, 0.7, 1.49, 0.74, 2.02, 0.55, 1.55, 1.5, 1.61, 7.99, 2.99, 0.82, 4.75]}
|
annotations_2/-HwMH2_-oKA_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []}
|
annotations_2/-IIHYIZSFbk_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[14.0, 15.31], [16.0, 16.65], [18.0, 18.32], [20.0, 22.0], [24.0, 25.14], [26.0, 29.02], [30.0, 31.62], [33.0, 35.58], [39.0, 40.61], [42.0, 42.04], [43.0, 44.49], [45.0, 45.32], [46.0, 46.6], [48.0, 49.4], [50.0, 50.63], [55.0, 56.03], [57.0, 58.41], [61.0, 62.33], [63.0, 66.8], [68.0, 68.54], [71.0, 85.16], [86.0, 86.97], [90.0, 91.61], [93.0, 93.66], [97.0, 98.49], [100.0, 100.18]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.68, 0.0, 48.27, 0.0, 56.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 63.96, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["tuning fork", 56.11], ["speech", 7.42], ["singing bowl", 4.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.31, 0.65, 0.32, 2.0, 1.14, 3.02, 1.62, 2.58, 1.61, 0.04, 1.49, 0.32, 0.6, 1.4, 0.63, 1.03, 1.41, 1.33, 3.8, 0.54, 14.16, 0.97, 1.61, 0.66, 1.49, 0.18]}
|
annotations_2/-JERO2LQSKc_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 1.93], [4.0, 7.53], [8.0, 10.66], [12.0, 15.62], [17.0, 17.76], [21.0, 21.88], [35.0, 37.71], [44.0, 44.91], [73.0, 74.12], [76.0, 76.25], [77.0, 76.99], [87.0, 89.36], [90.0, 92.11], [105.0, 105.76], [106.0, 111.28], [112.0, 116.87], [119.0, 119.62], [120.0, 121.78], [125.0, 126.17], [128.0, 130.15], [131.0, 132.04], [138.0, 139.63], [140.0, 140.39], [147.0, 149.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 96.17, 89.54, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 77.7, 87.74, 0.0, 99.8, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.07, 3.53, 2.66, 3.62, 0.76, 0.88, 2.71, 0.91, 1.12, 0.25, -0.01, 2.36, 2.11, 0.76, 5.28, 4.87, 0.62, 1.78, 1.17, 2.15, 1.04, 1.63, 0.39, 2.17]}
|
annotations_2/-Jzi-2lYWEw_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 2.66], [11.0, 12.65], [13.0, 13.29], [16.0, 16.85], [22.0, 21.78], [25.0, 26.16], [27.0, 27.26], [29.0, 29.83], [31.0, 31.82], [32.0, 33.02], [36.0, 37.88], [39.0, 42.28], [44.0, 43.73], [50.0, 51.53], [61.0, 63.36], [66.0, 67.0], [75.0, 77.52], [91.0, 93.48], [98.0, 97.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 100.0, 0.0, 99.84, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.66, 1.65, 0.29, 0.85, -0.22, 1.16, 0.26, 0.83, 0.82, 1.02, 1.88, 3.28, -0.27, 1.53, 2.36, 1.0, 2.52, 2.48, -0.05]}
|
annotations_2/-Kd5zqw24S4_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[4.0, 10.61], [11.0, 12.63], [14.0, 15.26], [18.0, 18.74], [22.0, 22.25], [25.0, 26.42], [31.0, 34.1], [35.0, 37.03], [38.0, 41.4], [44.0, 44.29], [44.0, 47.55], [48.0, 49.1], [50.0, 55.9], [58.0, 62.18], [63.0, 70.04], [70.0, 74.61], [76.0, 79.19], [80.0, 81.18], [82.0, 88.69], [90.0, 92.37], [93.0, 95.39], [96.0, 97.53], [98.0, 100.28], [102.0, 105.97], [108.0, 110.02], [114.0, 119.18], [122.0, 125.61], [127.0, 141.07], [142.0, 146.97], [149.0, 151.78], [153.0, 153.71], [155.0, 156.49], [157.0, 159.46], [160.0, 166.94]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.65, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 93.45, 100.0, 0.0, 100.0, 0.0, 100.0, 99.99, 100.0, 96.04, 100.0, 0.0, 100.0, 100.0, 98.01, 0.0, 99.99, 100.0, 100.0, 99.98, 99.48, 99.76, 96.54, 99.73, 0.0, 0.0, 99.1, 99.52], "audiomae_on_audioset": [[["music", 19.87], ["smash, crash", 11.37], ["whack, thwack", 9.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.61, 1.63, 1.26, 0.74, 0.25, 1.42, 3.1, 2.03, 3.4, 0.29, 3.55, 1.1, 5.9, 4.18, 7.04, 4.61, 3.19, 1.18, 6.69, 2.37, 2.39, 1.53, 2.28, 3.97, 2.02, 5.18, 3.61, 14.07, 4.97, 2.78, 0.71, 1.49, 2.46, 6.94]}
|
annotations_2/-Luy502C920_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[22.0, 23.57], [29.0, 29.66], [49.0, 49.69], [57.0, 58.35], [62.0, 62.55], [67.0, 71.07], [72.0, 72.4], [78.0, 93.34], [94.0, 122.05]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 50.66, 0.0, 32.88, 31.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 59.67], ["trance music", 7.81], ["techno", 5.64]], [["music", 35.67], ["skidding", 18.6], ["vehicle", 13.64]]], "duration": [1.57, 0.66, 0.69, 1.35, 0.55, 4.07, 0.4, 15.34, 28.05]}
|
annotations_2/-N2mhlvygq0_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[6.0, 7.8], [12.0, 16.65], [24.0, 27.16], [36.0, 36.05], [36.0, 38.15], [45.0, 45.74], [56.0, 57.01], [69.0, 75.0], [75.0, 109.05], [121.0, 121.68], [122.0, 122.82], [125.0, 125.04], [126.0, 125.98]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.98, 66.51, 0.0, 87.37, 0.0, 0.0, 78.89, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 23.09], ["cattle, bovinae", 22.59], ["animal", 16.78]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 4.65, 3.16, 0.05, 2.15, 0.74, 1.01, 6.0, 34.05, 0.68, 0.82, 0.04, -0.02]}
|
annotations_2/-NeY5tqk1N8_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 2.57], [3.0, 4.56], [9.0, 15.72], [17.0, 18.54], [19.0, 21.86], [23.0, 25.0], [29.0, 30.74], [36.0, 36.93], [38.0, 39.39], [42.0, 43.24], [44.0, 44.98], [53.0, 54.16], [55.0, 58.24], [61.0, 64.37], [68.0, 68.77], [70.0, 69.74], [73.0, 74.98], [77.0, 78.46], [80.0, 84.87], [85.0, 86.86], [90.0, 91.12], [96.0, 95.82], [98.0, 98.1], [98.0, 99.3], [106.0, 105.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.99, 0.0, 91.47, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.44, 62.37, 0.0, 0.0, 0.0, 0.0, 98.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 1.56, 6.72, 1.54, 2.86, 2.0, 1.74, 0.93, 1.39, 1.24, 0.98, 1.16, 3.24, 3.37, 0.77, -0.26, 1.98, 1.46, 4.87, 1.86, 1.12, -0.18, 0.1, 1.3, -0.39]}
|
annotations_2/-Nr56-RD_g8_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[6.0, 6.44], [14.0, 14.91], [16.0, 15.84], [29.0, 37.56], [53.0, 55.14], [64.0, 65.15]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 91.3, 62.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.44, 0.91, -0.16, 8.56, 2.14, 1.15]}
|
annotations_2/-O3_WO63fhU_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 2.96], [6.0, 5.81], [11.0, 11.48], [15.0, 14.79], [23.0, 28.34], [35.0, 38.77], [41.0, 43.11], [50.0, 54.35], [59.0, 61.91], [67.0, 72.91], [75.0, 75.74], [78.0, 78.73], [80.0, 87.57], [89.0, 89.16], [95.0, 97.93], [101.0, 101.56], [107.0, 115.45], [119.0, 121.22], [125.0, 126.23], [130.0, 130.22], [133.0, 133.29], [134.0, 135.7], [140.0, 176.47], [178.0, 178.19], [182.0, 185.33], [187.0, 191.17], [192.0, 192.94], [194.0, 194.85], [204.0, 204.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.07, 44.99, 37.25, 39.18, 40.38, 37.86, 0.0, 0.0, 40.38, 0.0, 40.88, 0.0, 38.09, 38.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.11, 36.88, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 79.66], ["musical instrument", 2.0], ["didgeridoo", 0.96]], [["music", 65.05], ["hum", 8.31], ["musical instrument", 2.7]], [["music", 68.88], ["synthesizer", 4.56], ["musical instrument", 2.29]], [["music", 61.69], ["carnatic music", 11.77], ["singing", 2.48]], [["music", 74.92], ["didgeridoo", 1.85], ["middle eastern music", 1.02]], [["music", 78.6], ["middle eastern music", 2.74], ["singing", 1.72]], null, null, [["music", 78.02], ["didgeridoo", 1.96], ["throbbing", 1.77]], null, [["music", 54.3], ["synthesizer", 5.09], ["hum", 4.18]], null, [["music", 84.71], ["synthetic singing", 2.81], ["male singing", 1.42]], [["music", 83.54], ["singing", 2.6], ["christian music", 0.79]], null, null, null, null, null, null, [["music", 57.63], ["didgeridoo", 7.66], ["theremin", 4.37]], [["music", 65.22], ["carnatic music", 15.29], ["musical instrument", 4.53]], null, null, null], "duration": [0.96, -0.19, 0.48, -0.21, 5.34, 3.77, 2.11, 4.35, 2.91, 5.91, 0.74, 0.73, 7.57, 0.16, 2.93, 0.56, 8.45, 2.22, 1.23, 0.22, 0.29, 1.7, 36.47, 0.19, 3.33, 4.17, 0.94, 0.85, 0.11]}
|
annotations_2/-Ot948zIr0s_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 2.79], [4.0, 4.46], [13.0, 13.61], [16.0, 16.61], [17.0, 17.76], [19.0, 18.94], [20.0, 20.75], [23.0, 24.22], [26.0, 28.92], [30.0, 30.1], [32.0, 32.12], [47.0, 48.84], [55.0, 56.08], [59.0, 59.44], [62.0, 63.66], [69.0, 69.03], [84.0, 84.84], [88.0, 88.77], [94.0, 94.91], [97.0, 97.97], [103.0, 103.13], [106.0, 107.01], [109.0, 110.37], [116.0, 117.56], [119.0, 120.41], [123.0, 124.75], [127.0, 128.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 0.46, 0.61, 0.61, 0.76, -0.06, 0.75, 1.22, 2.92, 0.1, 0.12, 1.84, 1.08, 0.44, 1.66, 0.03, 0.84, 0.77, 0.91, 0.97, 0.13, 1.01, 1.37, 1.56, 1.41, 1.75, 1.75]}
|
annotations_2/-PFdr0SiAEw_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[9.0, 9.21], [10.0, 11.33], [13.0, 12.66], [26.0, 26.08], [28.0, 28.86], [30.0, 30.94], [34.0, 35.23], [36.0, 40.73], [41.0, 41.5], [43.0, 44.02], [45.0, 45.74], [49.0, 49.33], [52.0, 53.27], [56.0, 56.39], [58.0, 94.22], [96.0, 96.28], [97.0, 101.33], [102.0, 103.15], [104.0, 106.51], [116.0, 116.51], [118.0, 120.24], [123.0, 125.09], [128.0, 129.51], [136.0, 137.54], [145.0, 148.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 98.8, 0.0, 65.67, 90.95, 0.0, 0.0, 86.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 49.53], ["double bass", 17.3], ["musical instrument", 7.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.21, 1.33, -0.34, 0.08, 0.86, 0.94, 1.23, 4.73, 0.5, 1.02, 0.74, 0.33, 1.27, 0.39, 36.22, 0.28, 4.33, 1.15, 2.51, 0.51, 2.24, 2.09, 1.51, 1.54, 3.53]}
|
annotations_2/-Pf1f0pZdnQ_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 101.44], [103.0, 103.62], [105.0, 106.83], [107.0, 107.69], [111.0, 124.53]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 44.12], "audiomae_on_audioset": [null, null, null, null, [["music", 47.32], ["hum", 8.78], ["synthesizer", 7.92]]], "duration": [99.44, 0.62, 1.83, 0.69, 13.53]}
|
annotations_2/-QJsljIDKkk_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[1.0, 5.46], [9.0, 9.32], [12.0, 12.82], [20.0, 21.05], [22.0, 23.08], [24.0, 25.62], [27.0, 27.67], [29.0, 29.89], [31.0, 31.6], [33.0, 33.47], [37.0, 37.45], [42.0, 42.89], [44.0, 44.1], [50.0, 50.79], [51.0, 52.66], [53.0, 54.6], [55.0, 56.35], [61.0, 62.24], [63.0, 64.83], [67.0, 66.65], [76.0, 78.39], [80.0, 80.7], [82.0, 82.73], [84.0, 84.67], [85.0, 86.36], [88.0, 89.28], [90.0, 90.85], [95.0, 96.48], [99.0, 99.99], [100.0, 105.12], [107.0, 108.35], [110.0, 110.07], [111.0, 112.56], [113.0, 113.66], [116.0, 116.5], [118.0, 119.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.46, 0.32, 0.82, 1.05, 1.08, 1.62, 0.67, 0.89, 0.6, 0.47, 0.45, 0.89, 0.1, 0.79, 1.66, 1.6, 1.35, 1.24, 1.83, -0.35, 2.39, 0.7, 0.73, 0.67, 1.36, 1.28, 0.85, 1.48, 0.99, 5.12, 1.35, 0.07, 1.56, 0.66, 0.5, 1.58]}
|
annotations_2/-QNxYSDdpig_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[3.0, 4.97], [9.0, 8.73], [19.0, 20.98], [22.0, 25.22], [26.0, 28.49], [31.0, 31.7], [35.0, 35.14], [36.0, 38.74], [41.0, 43.17], [44.0, 44.54], [46.0, 46.36], [48.0, 48.0], [50.0, 50.45], [51.0, 51.58], [56.0, 56.32], [60.0, 60.44], [66.0, 66.31], [71.0, 71.2], [72.0, 72.79], [76.0, 75.88], [78.0, 78.65], [91.0, 91.64], [92.0, 92.6], [93.0, 95.01], [108.0, 109.05], [110.0, 111.72], [113.0, 115.05], [118.0, 118.79], [125.0, 125.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.73, 89.19, 0.0, 0.0, 69.74, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 0.0, 0.0, 43.35, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.31], ["sidetone", 25.91], ["dial tone", 6.77]], null, null], "duration": [1.97, -0.27, 1.98, 3.22, 2.49, 0.7, 0.14, 2.74, 2.17, 0.54, 0.36, 0.0, 0.45, 0.58, 0.32, 0.44, 0.31, 0.2, 0.79, -0.12, 0.65, 0.64, 0.6, 2.01, 1.05, 1.72, 2.05, 0.79, 0.15]}
|
annotations_2/-QOahlrO8Yo_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[6.0, 46.85], [48.0, 55.66], [56.0, 55.8], [56.0, 55.95], [56.0, 154.8]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 30.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["noise", 24.48], ["music", 20.3], ["speech", 9.45]], null, null, null], "duration": [40.85, 7.66, -0.2, -0.05, 98.8]}
|
annotations_2/-QWL-FwX4t4_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[24.0, 26.25], [27.0, 29.24], [30.0, 34.38], [35.0, 35.45], [36.0, 37.29], [38.0, 39.31], [40.0, 44.25], [45.0, 52.74], [54.0, 56.64], [58.0, 60.64], [61.0, 61.92], [63.0, 64.84], [67.0, 68.67], [70.0, 72.62], [75.0, 76.27], [77.0, 77.8], [78.0, 80.2], [80.0, 88.87], [100.0, 100.16], [101.0, 101.51], [110.0, 112.35], [113.0, 118.02]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [68.41, 63.64, 87.0, 0.0, 0.0, 0.0, 49.36, 71.57, 90.25, 68.02, 0.0, 0.0, 0.0, 92.8, 0.0, 0.0, 61.47, 62.99, 0.0, 0.0, 90.25, 45.3], "audiomae_on_audioset": [null, null, null, null, null, null, [["sidetone", 20.14], ["noise", 10.95], ["hum", 9.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 36.91], ["hum", 21.39], ["music", 9.18]]], "duration": [2.25, 2.24, 4.38, 0.45, 1.29, 1.31, 4.25, 7.74, 2.64, 2.64, 0.92, 1.84, 1.67, 2.62, 1.27, 0.8, 2.2, 8.87, 0.16, 0.51, 2.35, 5.02]}
|
annotations_2/-RuK7XKbefY_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[3.0, 5.27], [6.0, 8.7], [12.0, 14.44], [17.0, 19.04], [23.0, 25.37], [27.0, 28.95], [31.0, 33.98], [43.0, 43.75], [48.0, 48.12], [73.0, 110.79], [113.0, 113.64], [118.0, 118.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.68, 99.96, 94.66, 98.51, 90.08, 0.0, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.27, 2.7, 2.44, 2.04, 2.37, 1.95, 2.98, 0.75, 0.12, 37.79, 0.64, 0.0]}
|
annotations_2/-SJAzpHg4s8_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []}
|
annotations_2/-TLCaDbBv_s_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[5.0, 7.74], [9.0, 10.42], [12.0, 13.61], [16.0, 16.6], [18.0, 18.71], [20.0, 21.46], [22.0, 23.6], [26.0, 26.33], [29.0, 30.47], [31.0, 32.48], [34.0, 35.75], [38.0, 38.77], [41.0, 42.48], [45.0, 45.49], [47.0, 47.38], [49.0, 49.81], [51.0, 52.07], [54.0, 55.17], [61.0, 61.67], [65.0, 67.56], [69.0, 71.22], [74.0, 74.36], [76.0, 76.44], [77.0, 77.04], [77.0, 79.3], [82.0, 82.22], [94.0, 95.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 57.72, 0.0, 0.0, 0.0, 45.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.55], ["music", 22.67], ["hum", 3.02]], null, null], "duration": [2.74, 1.42, 1.61, 0.6, 0.71, 1.46, 1.6, 0.33, 1.47, 1.48, 1.75, 0.77, 1.48, 0.49, 0.38, 0.81, 1.07, 1.17, 0.67, 2.56, 2.22, 0.36, 0.44, 0.04, 2.3, 0.22, 1.86]}
|
annotations_2/-TzrPYcpPvY_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[19.0, 21.07], [23.0, 24.63], [25.0, 25.14], [29.0, 37.81], [49.0, 57.82], [60.0, 60.83], [68.0, 68.54], [69.0, 76.45], [78.0, 89.45], [93.0, 92.65], [95.0, 96.72], [105.0, 121.69], [124.0, 132.73]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.52, 0.0, 0.0, 39.98, 38.9, 0.0, 0.0, 44.55, 40.66, 0.0, 0.0, 42.15, 69.34], "audiomae_on_audioset": [[["music", 25.92], ["musical instrument", 14.38], ["guitar", 10.44]], null, null, [["music", 74.16], ["theremin", 4.42], ["musical instrument", 2.98]], [["music", 82.24], ["theremin", 4.65], ["musical instrument", 1.81]], null, null, [["music", 69.25], ["musical instrument", 6.25], ["guitar", 2.75]], [["music", 77.09], ["musical instrument", 3.0], ["theremin", 2.49]], null, null, [["music", 79.09], ["theremin", 4.04], ["singing", 2.97]], null], "duration": [2.07, 1.63, 0.14, 8.81, 8.82, 0.83, 0.54, 7.45, 11.45, -0.35, 1.72, 16.69, 8.73]}
|