bpiyush commited on
Commit
aed1af4
·
1 Parent(s): a271ceb
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. annotations_filtered/d-2r0wMjfrY_filtered.json +1 -0
  2. annotations_filtered/d-RR_vV7qDU_filtered.json +1 -0
  3. annotations_filtered/d-kcczAff40_filtered.json +1 -0
  4. annotations_filtered/d-nJUGK8ABk_filtered.json +1 -0
  5. annotations_filtered/d0ZOz1i5-PE_filtered.json +1 -0
  6. annotations_filtered/d0c6KWKMAF8_filtered.json +1 -0
  7. annotations_filtered/d0hM2Ekkk-8_filtered.json +1 -0
  8. annotations_filtered/d0x7-oo9NAk_filtered.json +1 -0
  9. annotations_filtered/d1ZUnCbVoZQ_filtered.json +1 -0
  10. annotations_filtered/d1lql0Z0e-E_filtered.json +1 -0
  11. annotations_filtered/d2uvpiz5up0_filtered.json +1 -0
  12. annotations_filtered/d3-AXjkz3Pk_filtered.json +1 -0
  13. annotations_filtered/d35M7d-E_PY_filtered.json +1 -0
  14. annotations_filtered/d3GeSiD2HIs_filtered.json +1 -0
  15. annotations_filtered/d3HAOZbAj1Q_filtered.json +1 -0
  16. annotations_filtered/d3ZUSI1_lOc_filtered.json +1 -0
  17. annotations_filtered/d3hs2M_0vLE_filtered.json +1 -0
  18. annotations_filtered/d46cDtFv_Rw_filtered.json +1 -0
  19. annotations_filtered/d4Ljj8W1hE8_filtered.json +1 -0
  20. annotations_filtered/d4MZPbERTFs_filtered.json +1 -0
  21. annotations_filtered/d4ftmOI5NnI_filtered.json +1 -0
  22. annotations_filtered/d5MJBYofzhs_filtered.json +1 -0
  23. annotations_filtered/d5Pc-tNsvT4_filtered.json +1 -0
  24. annotations_filtered/d5gSQLPcya0_filtered.json +1 -0
  25. annotations_filtered/d5jxXkpstv4_filtered.json +1 -0
  26. annotations_filtered/d5nAgnojNgk_filtered.json +1 -0
  27. annotations_filtered/d6263F3UkWo_filtered.json +1 -0
  28. annotations_filtered/d68yRIE9OvQ_filtered.json +1 -0
  29. annotations_filtered/d6HReoQl6Mo_filtered.json +1 -0
  30. annotations_filtered/d6NOGc2Dymo_filtered.json +1 -0
  31. annotations_filtered/d6zX6-Rf4JY_filtered.json +1 -0
  32. annotations_filtered/d7-pWfZgFKU_filtered.json +1 -0
  33. annotations_filtered/d76CwsWbV2E_filtered.json +1 -0
  34. annotations_filtered/d79o09D8cuo_filtered.json +1 -0
  35. annotations_filtered/d7Aot4Wr-Yo_filtered.json +1 -0
  36. annotations_filtered/d7RrYVI3Xw0_filtered.json +1 -0
  37. annotations_filtered/d7V9liYn-IA_filtered.json +1 -0
  38. annotations_filtered/d7WraA-roN8_filtered.json +1 -0
  39. annotations_filtered/d7_F5P5PygM_filtered.json +1 -0
  40. annotations_filtered/d7c4TXqkMso_filtered.json +1 -0
  41. annotations_filtered/d7he8f2L_BE_filtered.json +1 -0
  42. annotations_filtered/d7pioagkX5k_filtered.json +1 -0
  43. annotations_filtered/d7ye5zFyuso_filtered.json +1 -0
  44. annotations_filtered/d87eHGVaoc8_filtered.json +1 -0
  45. annotations_filtered/d8Ff_W4-4VE_filtered.json +1 -0
  46. annotations_filtered/d8Gg9rPHKNU_filtered.json +1 -0
  47. annotations_filtered/d8WHOiQZGok_filtered.json +1 -0
  48. annotations_filtered/d8sDpSZeDBE_filtered.json +1 -0
  49. annotations_filtered/d9-DFXwcmFI_filtered.json +1 -0
  50. annotations_filtered/d921M-ACMM4_filtered.json +1 -0
annotations_filtered/d-2r0wMjfrY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.29], [3.0, 3.08], [5.0, 22.57]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 30.4], "audiomae_on_audioset": [null, null, [["music", 58.47], ["speech", 17.54], ["musical instrument", 3.9]]], "duration": [0.29, 0.08, 17.57]}
annotations_filtered/d-RR_vV7qDU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 10.99], [16.0, 19.48], [22.0, 23.03], [27.0, 28.75], [30.0, 35.09], [41.0, 53.23], [55.0, 85.6], [87.0, 93.39], [96.0, 99.52], [102.0, 105.31], [108.0, 108.82], [109.0, 118.2], [125.0, 127.06], [129.0, 131.13]], "keep_status": [true, false, false, false, true, true, false, false, true, true, false, false, false, true], "silence_prob": [31.64, 30.83, 0.0, 0.0, 31.61, 32.3, 0.0, 31.11, 31.77, 32.18, 0.0, 31.62, 32.23, 33.24], "audiomae_on_audioset": [[["cacophony", 23.96], ["vehicle", 9.44], ["music", 8.97]], [["sidetone", 32.38], ["music", 29.07], ["speech", 17.33]], null, null, [["music", 38.68], ["hum", 16.72], ["throbbing", 9.88]], [["music", 24.24], ["speech", 23.55], ["sonar", 9.01]], null, [["speech", 46.38], ["sidetone", 20.62], ["music", 12.17]], [["music", 30.9], ["electronic music", 11.26], ["cacophony", 7.68]], [["music", 38.97], ["speech", 16.23], ["sidetone", 6.9]], null, [["speech", 79.81], ["music", 8.27], ["cacophony", 2.73]], [["music", 76.3], ["musical instrument", 5.27], ["theremin", 2.64]], [["speech", 38.32], ["music", 13.44], ["synthesizer", 5.86]]], "duration": [3.99, 3.48, 1.03, 1.75, 5.09, 12.23, 30.6, 6.39, 3.52, 3.31, 0.82, 9.2, 2.06, 2.13]}
annotations_filtered/d-kcczAff40_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[101.0, 101.46], [102.0, 103.1], [104.0, 105.17], [106.0, 106.44]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.46, 1.1, 1.17, 0.44]}
annotations_filtered/d-nJUGK8ABk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 5.91], [10.0, 10.45], [16.0, 32.12], [32.0, 32.16], [33.0, 33.2], [34.0, 35.16], [36.0, 46.97], [51.0, 90.78], [97.0, 98.15], [102.0, 102.74], [108.0, 108.87], [111.0, 112.16], [115.0, 115.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.44, 0.0, 0.0, 0.0, 33.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 65.94], ["drum machine", 13.79], ["speech", 12.33]], null, null, null, [["music", 61.13], ["speech", 17.13], ["drum machine", 2.44]], null, null, null, null, null, null], "duration": [0.91, 0.45, 16.12, 0.16, 0.2, 1.16, 10.97, 39.78, 1.15, 0.74, 0.87, 1.16, 0.45]}
annotations_filtered/d0ZOz1i5-PE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[19.0, 20.53], [23.0, 24.8], [26.0, 26.22], [28.0, 29.3], [31.0, 36.14], [37.0, 37.23], [40.0, 40.46], [44.0, 46.06], [46.0, 46.6], [49.0, 49.11], [54.0, 54.43], [59.0, 59.48], [63.0, 68.88], [69.0, 70.17], [72.0, 72.15], [84.0, 86.59], [90.0, 91.18], [93.0, 96.3], [103.0, 103.89], [107.0, 109.21], [117.0, 118.34], [122.0, 125.56]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 43.15, 0.0, 0.0, 34.96, 0.0, 0.0, 0.0, 0.0, 33.86, 0.0, 0.0, 36.11, 0.0, 31.57, 0.0, 36.76, 0.0, 39.55], "audiomae_on_audioset": [null, null, null, null, [["speech", 39.08], ["fly, housefly", 17.56], ["insect", 13.84]], null, null, [["music", 32.73], ["speech", 19.45], ["timpani", 8.0]], null, null, null, null, [["music", 47.04], ["speech", 22.91], ["boing", 11.62]], null, null, [["speech", 26.29], ["boing", 17.4], ["music", 15.57]], null, [["music", 14.96], ["speech", 14.4], ["moo", 13.19]], null, [["music", 39.33], ["speech", 9.48], ["didgeridoo", 5.21]], null, [["music", 49.65], ["boing", 3.43], ["sampler", 2.9]]], "duration": [1.53, 1.8, 0.22, 1.3, 5.14, 0.23, 0.46, 2.06, 0.6, 0.11, 0.43, 0.48, 5.88, 1.17, 0.15, 2.59, 1.18, 3.3, 0.89, 2.21, 1.34, 3.56]}
annotations_filtered/d0c6KWKMAF8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 6.35], [7.0, 7.69], [9.0, 11.2], [12.0, 20.8], [22.0, 47.97], [49.0, 50.6], [52.0, 53.18], [55.0, 56.15], [57.0, 62.46], [64.0, 65.57], [66.0, 67.26], [68.0, 68.39], [80.0, 93.93], [96.0, 103.32], [106.0, 106.86], [109.0, 114.91], [116.0, 117.22]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [38.15, 0.0, 84.25, 44.55, 36.2, 0.0, 0.0, 0.0, 36.47, 0.0, 0.0, 0.0, 31.59, 53.1, 0.0, 90.43, 0.0], "audiomae_on_audioset": [[["speech", 56.49], ["music", 8.86], ["synthesizer", 2.92]], null, null, [["hum", 46.55], ["throbbing", 30.95], ["mains hum", 16.7]], [["hum", 41.44], ["throbbing", 40.18], ["mains hum", 7.96]], null, null, null, [["throbbing", 27.99], ["music", 26.95], ["hum", 19.67]], null, null, null, [["hum", 33.15], ["speech", 15.04], ["throbbing", 14.93]], null, null, null, null], "duration": [3.35, 0.69, 2.2, 8.8, 25.97, 1.6, 1.18, 1.15, 5.46, 1.57, 1.26, 0.39, 13.93, 7.32, 0.86, 5.91, 1.22]}
annotations_filtered/d0hM2Ekkk-8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[19.0, 20.28], [24.0, 24.33], [33.0, 49.08], [77.0, 76.79], [101.0, 101.39], [135.0, 135.82]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.52, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.28, 0.33, 16.08, -0.21, 0.39, 0.82]}
annotations_filtered/d0x7-oo9NAk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[85.0, 85.85], [88.0, 87.83], [90.0, 100.82], [103.0, 106.05], [107.0, 120.41], [121.0, 122.76], [123.0, 140.53], [142.0, 142.92], [147.0, 183.22], [184.0, 185.53], [186.0, 194.43], [198.0, 203.5]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 29.67, 40.55, 29.93, 0.0, 32.82, 0.0, 0.0, 0.0, 33.46, 33.63], "audiomae_on_audioset": [null, null, [["hum", 33.27], ["throbbing", 24.19], ["music", 18.59]], [["music", 58.6], ["throbbing", 6.78], ["theme music", 3.25]], [["throbbing", 41.88], ["music", 28.89], ["hum", 16.73]], null, [["speech", 26.93], ["hum", 22.73], ["music", 14.61]], null, null, null, [["grunt", 67.15], ["speech", 4.83], ["sound effect", 4.43]], [["music", 30.39], ["effects unit", 26.24], ["musical instrument", 10.2]]], "duration": [0.85, -0.17, 10.82, 3.05, 13.41, 1.76, 17.53, 0.92, 36.22, 1.53, 8.43, 5.5]}
annotations_filtered/d1ZUnCbVoZQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 5.58], [6.0, 9.66], [11.0, 14.17], [15.0, 15.7], [16.0, 16.09], [17.0, 17.37], [19.0, 21.57], [22.0, 23.36], [25.0, 25.78], [27.0, 29.49], [30.0, 39.73], [43.0, 42.79], [43.0, 45.35], [51.0, 51.54], [57.0, 57.33], [58.0, 58.48], [59.0, 60.35], [63.0, 63.36], [65.0, 71.52], [76.0, 76.1], [76.0, 78.24], [79.0, 80.01], [82.0, 82.58], [85.0, 86.83], [87.0, 88.32], [89.0, 90.14], [94.0, 95.77], [101.0, 102.63], [104.0, 105.48], [107.0, 107.7], [109.0, 109.75], [112.0, 112.8], [114.0, 114.44], [117.0, 117.37], [122.0, 123.63], [125.0, 126.15], [128.0, 128.97], [134.0, 133.88], [154.0, 154.09], [159.0, 161.06], [163.0, 164.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.07, 99.05, 93.29, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 57.4, 96.42, 0.0, 51.55, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 79.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.58, 3.66, 3.17, 0.7, 0.09, 0.37, 2.57, 1.36, 0.78, 2.49, 9.73, -0.21, 2.35, 0.54, 0.33, 0.48, 1.35, 0.36, 6.52, 0.1, 2.24, 1.01, 0.58, 1.83, 1.32, 1.14, 1.77, 1.63, 1.48, 0.7, 0.75, 0.8, 0.44, 0.37, 1.63, 1.15, 0.97, -0.12, 0.09, 2.06, 1.46]}
annotations_filtered/d1lql0Z0e-E_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.98], [6.0, 7.28], [13.0, 13.71], [16.0, 19.33], [20.0, 27.24], [29.0, 49.45], [50.0, 49.55], [50.0, 57.5], [58.0, 72.69], [76.0, 86.9], [89.0, 91.13], [92.0, 92.43], [93.0, 94.31], [96.0, 98.25], [101.0, 102.52], [104.0, 104.68], [108.0, 108.85], [111.0, 111.94]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.63, 32.98, 37.89, 0.0, 38.19, 55.39, 41.72, 61.08, 0.0, 0.0, 77.03, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["crowd", 31.19], ["cheering", 19.04], ["cattle, bovinae", 16.75]], [["music", 44.16], ["theremin", 30.2], ["didgeridoo", 4.5]], [["music", 42.04], ["musical instrument", 13.75], ["gong", 8.69]], null, [["speech", 80.42], ["sidetone", 4.27], ["hum", 2.55]], null, [["didgeridoo", 44.64], ["music", 37.06], ["musical instrument", 3.67]], null, null, null, null, null, null, null, null], "duration": [0.98, 1.28, 0.71, 3.33, 7.24, 20.45, -0.45, 7.5, 14.69, 10.9, 2.13, 0.43, 1.31, 2.25, 1.52, 0.68, 0.85, 0.94]}
annotations_filtered/d2uvpiz5up0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 16.16], [17.0, 30.81], [34.0, 68.66], [70.0, 103.82], [107.0, 118.37]], "keep_status": [true, false, false, false, true], "silence_prob": [32.14, 31.49, 0.0, 0.0, 30.63], "audiomae_on_audioset": [[["hum", 27.24], ["speech", 25.41], ["mains hum", 15.35]], [["speech", 68.8], ["vehicle", 9.05], ["helicopter", 3.48]], null, null, [["hum", 36.31], ["music", 19.79], ["mains hum", 8.46]]], "duration": [9.16, 13.81, 34.66, 33.82, 11.37]}
annotations_filtered/d3-AXjkz3Pk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 6.4], [8.0, 7.99], [9.0, 10.08], [10.0, 11.91], [13.0, 20.92], [28.0, 29.25], [31.0, 34.16], [36.0, 39.63], [42.0, 44.91], [53.0, 53.96], [55.0, 56.24], [57.0, 60.44], [69.0, 69.8], [71.0, 71.44], [72.0, 73.09], [87.0, 87.61], [88.0, 88.23], [90.0, 91.47], [103.0, 107.55], [110.0, 110.89]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.0, 0.0, 0.0, 0.0, 33.97, 0.0, 57.89, 49.36, 66.51, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0], "audiomae_on_audioset": [[["music", 44.32], ["whip", 6.97], ["musical instrument", 4.6]], null, null, null, [["cattle, bovinae", 33.94], ["moo", 26.72], ["fly, housefly", 9.45]], null, null, [["mosquito", 22.84], ["fly, housefly", 10.68], ["insect", 7.64]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.4, -0.01, 1.08, 1.91, 7.92, 1.25, 3.16, 3.63, 2.91, 0.96, 1.24, 3.44, 0.8, 0.44, 1.09, 0.61, 0.23, 1.47, 4.55, 0.89]}
annotations_filtered/d35M7d-E_PY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 2.24], [7.0, 7.65], [9.0, 9.69], [10.0, 11.23], [18.0, 18.32], [30.0, 30.67], [33.0, 33.17], [38.0, 39.5], [43.0, 43.04], [44.0, 44.59], [48.0, 49.59], [51.0, 51.11], [53.0, 53.82], [54.0, 55.53], [59.0, 59.81], [65.0, 65.42], [70.0, 70.55], [74.0, 74.36], [87.0, 87.54], [94.0, 95.01], [99.0, 99.72], [102.0, 102.54], [107.0, 107.62], [109.0, 109.26], [117.0, 118.5], [121.0, 121.86], [125.0, 125.58], [128.0, 129.03], [131.0, 131.68], [132.0, 132.34], [132.0, 133.68], [135.0, 136.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.24, 0.65, 0.69, 1.23, 0.32, 0.67, 0.17, 1.5, 0.04, 0.59, 1.59, 0.11, 0.82, 1.53, 0.81, 0.42, 0.55, 0.36, 0.54, 1.01, 0.72, 0.54, 0.62, 0.26, 1.5, 0.86, 0.58, 1.03, 0.68, 0.34, 1.68, 1.19]}
annotations_filtered/d3GeSiD2HIs_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[18.0, 32.09], [37.0, 37.44], [39.0, 121.81], [122.0, 123.16], [124.0, 125.2], [128.0, 171.04]], "keep_status": [true, false, false, false, false, false], "silence_prob": [49.64, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 12.36], ["roaring cats (lions, tigers)", 12.33], ["stomach rumble", 9.94]], null, null, null, null, null], "duration": [14.09, 0.44, 82.81, 1.16, 1.2, 43.04]}
annotations_filtered/d3HAOZbAj1Q_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[20.0, 23.94], [25.0, 25.46], [30.0, 36.85], [45.0, 45.69], [53.0, 53.45], [53.0, 69.4]], "keep_status": [true, false, true, false, false, true], "silence_prob": [29.84, 0.0, 30.51, 0.0, 0.0, 29.74], "audiomae_on_audioset": [[["music", 28.79], ["hum", 14.97], ["mains hum", 14.13]], null, [["rumble", 22.82], ["speech", 16.18], ["hum", 13.03]], null, null, [["music", 51.69], ["hum", 11.58], ["grunt", 6.59]]], "duration": [3.94, 0.46, 6.85, 0.69, 0.45, 16.4]}
annotations_filtered/d3ZUSI1_lOc_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[30.0, 30.47], [37.0, 38.15], [44.0, 43.87], [53.0, 55.97]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 30.38], "audiomae_on_audioset": [null, null, null, [["noise", 38.03], ["music", 9.97], ["livestock, farm animals, working animals", 6.98]]], "duration": [0.47, 1.15, -0.13, 2.97]}
annotations_filtered/d3hs2M_0vLE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[10.0, 10.08], [12.0, 13.09], [25.0, 27.51], [28.0, 29.52], [31.0, 31.18], [32.0, 32.29], [37.0, 37.77], [45.0, 46.06], [48.0, 50.85], [66.0, 66.51], [69.0, 69.36], [73.0, 83.54], [84.0, 84.96], [97.0, 100.79], [106.0, 107.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 75.07, 0.0, 0.0, 100.0, 0.0, 84.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.08, 1.09, 2.51, 1.52, 0.18, 0.29, 0.77, 1.06, 2.85, 0.51, 0.36, 10.54, 0.96, 3.79, 1.7]}
annotations_filtered/d46cDtFv_Rw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.55], [6.0, 6.45], [8.0, 9.04], [9.0, 10.37], [11.0, 12.83], [19.0, 21.81], [22.0, 23.65], [28.0, 31.46], [38.0, 40.29], [43.0, 43.95], [46.0, 50.99], [52.0, 54.3], [55.0, 57.11], [59.0, 60.57], [62.0, 65.26], [66.0, 67.24], [69.0, 73.84], [76.0, 79.29], [81.0, 82.81], [85.0, 95.61], [99.0, 108.31], [110.0, 111.45], [113.0, 112.78], [115.0, 116.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 97.43, 72.16, 0.0, 77.36, 65.55, 49.13, 0.0, 99.16, 0.0, 76.2, 65.67, 0.0, 72.31, 71.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.8], ["insect", 3.49], ["hum", 3.27]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 0.45, 1.04, 1.37, 1.83, 2.81, 1.65, 3.46, 2.29, 0.95, 4.99, 2.3, 2.11, 1.57, 3.26, 1.24, 4.84, 3.29, 1.81, 10.61, 9.31, 1.45, -0.22, 1.9]}
annotations_filtered/d4Ljj8W1hE8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 11.16], [18.0, 18.76], [19.0, 20.17], [24.0, 24.02], [32.0, 33.45], [35.0, 36.0], [37.0, 37.45], [38.0, 41.0], [43.0, 53.91], [55.0, 58.97], [61.0, 72.64], [73.0, 72.69], [73.0, 75.59], [76.0, 77.97], [79.0, 79.37], [80.0, 81.65], [84.0, 84.35], [88.0, 90.31], [91.0, 95.18], [96.0, 101.22], [102.0, 102.81], [105.0, 105.56], [109.0, 109.66], [110.0, 114.64], [116.0, 126.59], [129.0, 129.07], [132.0, 136.98], [138.0, 138.65]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [39.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.12, 36.0, 95.51, 36.71, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 88.28, 97.22, 65.91, 0.0, 0.0, 0.0, 70.44, 62.17, 0.0, 40.55, 0.0], "audiomae_on_audioset": [[["speech", 82.42], ["fart", 5.38], ["radio", 2.72]], null, null, null, null, null, null, [["chirp tone", 49.29], ["sine wave", 17.16], ["noise", 11.24]], [["mains hum", 24.24], ["hum", 17.67], ["music", 17.07]], null, [["creak", 19.25], ["percussion", 15.43], ["tabla", 14.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 43.27], ["speech", 7.1], ["hiccup", 4.23]], null], "duration": [3.16, 0.76, 1.17, 0.02, 1.45, 1.0, 0.45, 3.0, 10.91, 3.97, 11.64, -0.31, 2.59, 1.97, 0.37, 1.65, 0.35, 2.31, 4.18, 5.22, 0.81, 0.56, 0.66, 4.64, 10.59, 0.07, 4.98, 0.65]}
annotations_filtered/d4MZPbERTFs_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 1.81], [4.0, 3.62], [4.0, 5.04], [6.0, 6.54], [7.0, 7.45], [8.0, 10.72], [11.0, 12.33], [15.0, 15.48], [16.0, 17.61], [18.0, 19.84], [20.0, 23.55], [24.0, 26.0], [27.0, 27.97], [29.0, 32.27], [33.0, 34.25], [42.0, 42.11], [43.0, 43.95], [44.0, 45.05], [46.0, 45.76], [46.0, 55.39], [66.0, 66.01], [71.0, 72.47], [73.0, 79.52], [81.0, 83.32], [84.0, 84.91], [87.0, 88.94], [92.0, 92.16], [94.0, 97.38], [103.0, 104.89], [107.0, 107.55], [108.0, 109.44], [112.0, 119.94], [121.0, 124.34], [127.0, 127.3], [128.0, 132.12], [135.0, 135.51], [141.0, 142.21], [145.0, 146.3], [147.0, 146.97], [149.0, 150.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 0.0, 84.8, 93.29, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 32.25, 0.0, 0.0, 32.95, 52.92, 0.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 30.58, 56.86, 0.0, 42.51, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.47], ["music", 18.97], ["hum", 4.54]], null, null, [["hum", 25.88], ["mains hum", 15.84], ["speech", 15.61]], null, null, null, null, [["hum", 49.32], ["throbbing", 33.4], ["stomach rumble", 3.31]], null, null, null, [["hum", 19.8], ["whip", 10.36], ["explosion", 10.24]], null, null, [["mains hum", 35.26], ["hum", 25.43], ["speech", 8.37]], null, null, null, null, null], "duration": [0.81, -0.38, 1.04, 0.54, 0.45, 2.72, 1.33, 0.48, 1.61, 1.84, 3.55, 2.0, 0.97, 3.27, 1.25, 0.11, 0.95, 1.05, -0.24, 9.39, 0.01, 1.47, 6.52, 2.32, 0.91, 1.94, 0.16, 3.38, 1.89, 0.55, 1.44, 7.94, 3.34, 0.3, 4.12, 0.51, 1.21, 1.3, -0.03, 1.26]}
annotations_filtered/d4ftmOI5NnI_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 1.41], [2.0, 1.98], [2.0, 2.91], [4.0, 4.8], [6.0, 5.97], [8.0, 8.75], [9.0, 10.0], [16.0, 17.78], [19.0, 19.52], [21.0, 22.65], [25.0, 26.27], [27.0, 28.02], [36.0, 36.68], [38.0, 38.1], [39.0, 41.07], [52.0, 53.67], [55.0, 54.73], [63.0, 63.04], [64.0, 64.23], [66.0, 72.47], [73.0, 74.02], [76.0, 75.71], [78.0, 78.39], [81.0, 85.68], [87.0, 86.85], [87.0, 89.09], [92.0, 92.52], [94.0, 93.7], [96.0, 96.96], [125.0, 125.29], [155.0, 156.07], [159.0, 159.54], [161.0, 163.21], [169.0, 173.87], [175.0, 175.8], [189.0, 189.89], [194.0, 194.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.27, 0.0, 0.0, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 100.0, 0.0, 68.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 87.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 11.32], ["boing", 8.13], ["animal", 7.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, -0.02, 0.91, 0.8, -0.03, 0.75, 1.0, 1.78, 0.52, 1.65, 1.27, 1.02, 0.68, 0.1, 2.07, 1.67, -0.27, 0.04, 0.23, 6.47, 1.02, -0.29, 0.39, 4.68, -0.15, 2.09, 0.52, -0.3, 0.96, 0.29, 1.07, 0.54, 2.21, 4.87, 0.8, 0.89, 0.05]}
annotations_filtered/d5MJBYofzhs_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[17.0, 57.69]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [40.69]}
annotations_filtered/d5Pc-tNsvT4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 4.23], [5.0, 5.54], [7.0, 7.21], [16.0, 17.22], [19.0, 19.77], [22.0, 23.95], [33.0, 33.15], [38.0, 38.64], [49.0, 49.47], [53.0, 54.08], [59.0, 59.54], [70.0, 70.02], [73.0, 72.91], [75.0, 75.19], [79.0, 79.88], [82.0, 82.53], [101.0, 107.59], [110.0, 110.96], [115.0, 115.05], [117.0, 116.95], [121.0, 121.58], [129.0, 128.82], [139.0, 145.15], [151.0, 156.63], [159.0, 160.32], [162.0, 165.87]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [40.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 29.29, 42.44, 0.0, 45.75], "audiomae_on_audioset": [[["music", 27.05], ["hum", 20.14], ["speech", 10.98]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.64], ["trombone", 10.17], ["brass instrument", 5.23]], [["hum", 40.68], ["mains hum", 14.25], ["rumble", 14.17]], null, [["music", 24.48], ["whale vocalization", 11.18], ["sidetone", 8.62]]], "duration": [2.23, 0.54, 0.21, 1.22, 0.77, 1.95, 0.15, 0.64, 0.47, 1.08, 0.54, 0.02, -0.09, 0.19, 0.88, 0.53, 6.59, 0.96, 0.05, -0.05, 0.58, -0.18, 6.15, 5.63, 1.32, 3.87]}
annotations_filtered/d5gSQLPcya0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 14.37], [15.0, 17.12], [18.0, 33.78], [37.0, 57.6], [60.0, 82.29], [84.0, 96.85], [98.0, 104.19], [106.0, 107.28], [111.0, 112.5], [123.0, 127.99], [131.0, 134.45], [138.0, 141.32], [143.0, 165.67]], "keep_status": [false, true, false, true, true, true, true, false, false, true, false, true, false], "silence_prob": [30.27, 46.94, 78.21, 30.87, 35.64, 31.96, 36.21, 0.0, 0.0, 31.29, 30.82, 30.15, 50.51], "audiomae_on_audioset": [[["music", 29.9], ["hum", 23.69], ["throbbing", 19.61]], [["speech", 20.15], ["sonar", 10.51], ["music", 9.41]], null, [["speech", 30.81], ["buzz", 13.54], ["livestock, farm animals, working animals", 7.68]], [["music", 36.4], ["hum", 17.42], ["throbbing", 6.06]], [["speech", 34.02], ["music", 14.55], ["hum", 9.58]], [["speech", 45.62], ["music", 9.59], ["sidetone", 6.24]], null, null, [["speech", 41.25], ["vehicle", 10.17], ["mains hum", 5.22]], [["speech", 48.47], ["music", 13.0], ["vehicle", 9.08]], [["speech", 21.31], ["music", 16.95], ["noise", 5.82]], null], "duration": [9.37, 2.12, 15.78, 20.6, 22.29, 12.85, 6.19, 1.28, 1.5, 4.99, 3.45, 3.32, 22.67]}
annotations_filtered/d5jxXkpstv4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 17.37], [20.0, 43.39], [48.0, 48.78], [50.0, 50.94], [53.0, 53.22], [55.0, 55.88], [57.0, 57.25], [58.0, 58.75], [61.0, 61.84], [63.0, 63.54], [68.0, 68.44], [74.0, 88.4], [90.0, 93.82], [97.0, 107.87], [115.0, 124.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [55.96, 52.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.45, 51.02, 41.03, 30.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 40.7], ["speech", 16.89], ["throbbing", 16.5]], null, [["speech", 35.36], ["music", 30.94], ["buzz", 2.03]], [["speech", 38.39], ["music", 17.25], ["cacophony", 9.03]]], "duration": [13.37, 23.39, 0.78, 0.94, 0.22, 0.88, 0.25, 0.75, 0.84, 0.54, 0.44, 14.4, 3.82, 10.87, 9.95]}
annotations_filtered/d5nAgnojNgk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 6.51], [8.0, 10.25], [11.0, 14.49], [15.0, 19.99], [22.0, 28.0], [37.0, 44.51], [48.0, 70.51], [72.0, 101.97], [107.0, 108.87], [110.0, 137.15], [138.0, 139.04], [141.0, 146.21], [147.0, 147.12]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 99.71, 77.7, 99.82, 99.88, 34.43, 38.56, 43.61, 0.0, 47.9, 0.0, 52.68, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 63.98], ["singing bowl", 15.83], ["ambient music", 6.12]], [["music", 54.89], ["singing bowl", 10.56], ["musical instrument", 4.91]], [["fly, housefly", 46.69], ["insect", 23.94], ["music", 7.17]], null, [["fly, housefly", 21.33], ["speech", 13.45], ["music", 11.62]], null, null, null], "duration": [1.51, 2.25, 3.49, 4.99, 6.0, 7.51, 22.51, 29.97, 1.87, 27.15, 1.04, 5.21, 0.12]}
annotations_filtered/d6263F3UkWo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[30.0, 29.73], [30.0, 29.89], [31.0, 33.79], [36.0, 36.04], [37.0, 39.09], [40.0, 43.56], [44.0, 43.6], [44.0, 49.23], [50.0, 88.11], [89.0, 91.93], [94.0, 104.46], [105.0, 109.22], [112.0, 122.59], [124.0, 131.11], [133.0, 135.21], [138.0, 146.23], [147.0, 169.5], [171.0, 178.56], [184.0, 185.53], [186.0, 186.39]], "keep_status": [false, false, false, false, false, false, false, true, false, true, true, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 29.31, 0.0, 30.17, 31.18, 0.0, 30.84, 0.0, 29.99, 31.1, 29.49, 31.59, 49.36, 82.61, 79.24, 50.81, 46.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["boing", 66.53], ["music", 20.82], ["didgeridoo", 1.16]], null, [["music", 58.91], ["livestock, farm animals, working animals", 7.1], ["cattle, bovinae", 4.92]], [["music", 61.79], ["speech", 9.67], ["throbbing", 5.51]], null, [["music", 36.66], ["livestock, farm animals, working animals", 16.91], ["cattle, bovinae", 13.36]], null, [["whip", 38.3], ["music", 6.15], ["whack, thwack", 5.92]], [["music", 36.43], ["speech", 27.97], ["synthesizer", 3.52]], [["music", 15.84], ["buzz", 10.95], ["speech", 10.69]], [["music", 69.09], ["speech", 3.45], ["musical instrument", 2.64]], [["speech", 46.91], ["music", 25.64], ["foghorn", 15.04]], null, null, null, [["insect", 23.03], ["music", 21.98], ["fly, housefly", 16.5]], null, null], "duration": [-0.27, -0.11, 2.79, 0.04, 2.09, 3.56, -0.4, 5.23, 38.11, 2.93, 10.46, 4.22, 10.59, 7.11, 2.21, 8.23, 22.5, 7.56, 1.53, 0.39]}
annotations_filtered/d68yRIE9OvQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 54.72], [56.0, 57.59], [61.0, 61.47], [65.0, 80.54], [82.0, 81.87], [111.0, 111.28], [112.0, 112.11]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 58.91], ["synthesizer", 5.83], ["cacophony", 3.8]], null, null, null], "duration": [51.72, 1.59, 0.47, 15.54, -0.13, 0.28, 0.11]}
annotations_filtered/d6HReoQl6Mo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 26.4], [31.0, 43.98], [48.0, 48.76], [53.0, 53.89], [56.0, 60.0], [63.0, 71.52], [72.0, 74.11], [75.0, 77.19], [78.0, 77.94], [79.0, 80.28], [86.0, 87.07], [90.0, 92.16], [94.0, 96.28], [98.0, 99.94], [102.0, 104.4], [106.0, 108.3], [115.0, 118.59], [119.0, 120.34], [122.0, 123.58], [130.0, 135.06], [136.0, 136.9], [138.0, 142.94], [144.0, 161.0], [165.0, 165.01], [166.0, 165.99], [166.0, 166.06], [166.0, 166.09], [166.0, 166.13], [166.0, 166.16], [166.0, 166.19], [166.0, 169.35], [170.0, 171.07], [176.0, 176.77], [178.0, 181.28], [185.0, 190.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [30.86, 32.25, 0.0, 0.0, 63.74, 42.15, 64.41, 73.82, 0.0, 0.0, 0.0, 82.97, 48.91, 0.0, 69.47, 48.52, 58.81, 0.0, 0.0, 57.17, 0.0, 74.29, 33.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.22, 0.0, 0.0, 38.56, 34.85], "audiomae_on_audioset": [[["theremin", 58.17], ["music", 27.23], ["clarinet", 3.04]], [["theremin", 70.01], ["music", 24.25], ["musical instrument", 1.26]], null, null, null, [["theremin", 35.94], ["music", 31.99], ["wind instrument, woodwind instrument", 4.0]], null, null, null, null, null, null, [["music", 42.39], ["theremin", 20.9], ["whale vocalization", 6.15]], null, null, [["music", 30.99], ["domestic animals, pets", 10.03], ["animal", 7.15]], null, null, null, null, null, null, [["music", 56.01], ["theremin", 27.28], ["musical instrument", 3.81]], null, null, null, null, null, null, null, [["music", 30.19], ["speech", 20.21], ["radio", 9.03]], null, null, [["hum", 21.55], ["music", 21.41], ["mains hum", 14.45]], [["music", 45.13], ["theremin", 30.91], ["effects unit", 3.33]]], "duration": [18.4, 12.98, 0.76, 0.89, 4.0, 8.52, 2.11, 2.19, -0.06, 1.28, 1.07, 2.16, 2.28, 1.94, 2.4, 2.3, 3.59, 1.34, 1.58, 5.06, 0.9, 4.94, 17.0, 0.01, -0.01, 0.06, 0.09, 0.13, 0.16, 0.19, 3.35, 1.07, 0.77, 3.28, 5.56]}
annotations_filtered/d6NOGc2Dymo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 20.24], [22.0, 27.08], [27.0, 36.53]], "keep_status": [false, true, false], "silence_prob": [31.5, 30.51, 32.26], "audiomae_on_audioset": [[["music", 45.0], ["speech", 39.69], ["whack, thwack", 3.15]], [["music", 21.73], ["speech", 20.67], ["fly, housefly", 10.19]], [["music", 59.43], ["electronic music", 6.5], ["hum", 5.15]]], "duration": [18.24, 5.08, 9.53]}
annotations_filtered/d6zX6-Rf4JY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.76], [4.0, 8.8], [10.0, 25.47], [26.0, 26.97], [28.0, 47.16], [48.0, 59.32], [68.0, 73.57], [74.0, 75.44]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 77.36, 0.0, 77.03, 70.02, 73.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.76, 4.8, 15.47, 0.97, 19.16, 11.32, 5.57, 1.44]}
annotations_filtered/d7-pWfZgFKU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 5.05], [7.0, 8.88], [9.0, 13.04], [13.0, 23.33], [25.0, 38.57], [39.0, 41.91], [43.0, 47.01], [48.0, 49.05], [51.0, 90.37], [91.0, 94.66], [96.0, 96.06], [102.0, 103.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 99.16, 57.09, 64.63, 94.07, 99.1, 0.0, 0.0, 82.61, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.05, 1.88, 4.04, 10.33, 13.57, 2.91, 4.01, 1.05, 39.37, 3.66, 0.06, 1.65]}
annotations_filtered/d76CwsWbV2E_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 6.12], [9.0, 9.1], [16.0, 16.44], [18.0, 18.54], [19.0, 20.7], [22.0, 22.89], [24.0, 25.66], [26.0, 27.03]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.12, 0.1, 0.44, 0.54, 1.7, 0.89, 1.66, 1.03]}
annotations_filtered/d79o09D8cuo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 4.18], [5.0, 12.19], [18.0, 19.63], [20.0, 21.19], [22.0, 24.16], [25.0, 26.25], [27.0, 29.35], [35.0, 36.75], [40.0, 41.22], [49.0, 49.23], [70.0, 71.05], [86.0, 86.05], [90.0, 91.02], [97.0, 98.12], [100.0, 100.58], [101.0, 102.12], [104.0, 109.83], [111.0, 111.25], [113.0, 115.42], [117.0, 119.26], [120.0, 121.71], [123.0, 123.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 78.38, 0.0, 0.0, 49.68, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.87, 0.0, 66.39, 83.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 76.78], ["speech", 4.07], ["radio", 2.89]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 53.84], ["music", 18.39], ["bang", 4.75]], null, null, null, null, null], "duration": [0.18, 7.19, 1.63, 1.19, 2.16, 1.25, 2.35, 1.75, 1.22, 0.23, 1.05, 0.05, 1.02, 1.12, 0.58, 1.12, 5.83, 0.25, 2.42, 2.26, 1.71, 0.97]}
annotations_filtered/d7Aot4Wr-Yo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[9.0, 34.69], [35.0, 120.01], [121.0, 132.43], [135.0, 135.62], [136.0, 158.75], [159.0, 162.4], [167.0, 169.67], [170.0, 169.84], [170.0, 171.27], [173.0, 173.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.71, 0.0, 99.88, 0.0, 78.04, 99.31, 50.21, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [25.69, 85.01, 11.43, 0.62, 22.75, 3.4, 2.67, -0.16, 1.27, 0.23]}
annotations_filtered/d7RrYVI3Xw0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[26.0, 26.64], [29.0, 29.46], [32.0, 32.85], [41.0, 41.86], [43.0, 43.04], [43.0, 44.02], [47.0, 48.47], [50.0, 51.9], [61.0, 65.67], [66.0, 69.26], [71.0, 72.03], [74.0, 76.38], [78.0, 78.46], [79.0, 80.67], [83.0, 84.45]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.78, 47.39, 0.0, 88.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 57.15], ["theremin", 10.52], ["musical instrument", 5.16]], [["music", 31.17], ["theremin", 10.78], ["speech", 10.08]], null, null, null, null, null], "duration": [0.64, 0.46, 0.85, 0.86, 0.04, 1.02, 1.47, 1.9, 4.67, 3.26, 1.03, 2.38, 0.46, 1.67, 1.45]}
annotations_filtered/d7V9liYn-IA_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 8.9], [10.0, 14.1], [19.0, 19.8], [21.0, 38.01], [39.0, 66.07], [67.0, 121.32], [123.0, 122.98], [126.0, 126.96], [128.0, 128.31], [129.0, 130.01], [132.0, 132.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 82.79, 0.0, 45.78, 35.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 59.19], ["synthesizer", 14.41], ["musical instrument", 4.15]], [["music", 52.59], ["theremin", 19.13], ["synthesizer", 12.02]], null, null, null, null, null, null], "duration": [1.9, 4.1, 0.8, 17.01, 27.07, 54.32, -0.02, 0.96, 0.31, 1.01, 0.04]}
annotations_filtered/d7WraA-roN8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 5.56], [7.0, 7.4], [8.0, 11.11], [12.0, 12.97], [14.0, 15.77], [16.0, 18.52], [23.0, 25.07], [34.0, 39.24], [41.0, 52.05], [54.0, 58.04], [61.0, 61.7], [65.0, 65.87], [67.0, 96.72], [98.0, 102.47], [105.0, 105.7], [107.0, 110.15], [111.0, 111.55], [112.0, 117.09]], "keep_status": [false, false, true, false, false, true, false, true, true, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.02, 0.0, 0.0, 45.95, 39.21, 41.62, 28.82, 28.38, 0.0, 0.0, 32.85, 36.44, 0.0, 32.09, 0.0, 34.53], "audiomae_on_audioset": [null, null, [["hum", 19.0], ["sidetone", 17.9], ["speech", 15.49]], null, null, [["speech", 32.69], ["music", 11.39], ["mains hum", 8.17]], [["didgeridoo", 36.6], ["music", 24.77], ["trombone", 9.79]], [["speech", 38.5], ["hum", 17.19], ["throbbing", 7.34]], [["speech", 43.3], ["music", 10.99], ["whack, thwack", 7.03]], [["livestock, farm animals, working animals", 22.19], ["breaking", 16.03], ["cowbell", 8.28]], null, null, [["fly, housefly", 17.86], ["hum", 13.51], ["mosquito", 8.34]], [["music", 73.21], ["guitar", 3.82], ["effects unit", 3.57]], null, [["music", 64.51], ["speech", 9.64], ["guitar", 4.0]], null, [["music", 66.85], ["guitar", 7.46], ["musical instrument", 5.54]]], "duration": [1.56, 0.4, 3.11, 0.97, 1.77, 2.52, 2.07, 5.24, 11.05, 4.04, 0.7, 0.87, 29.72, 4.47, 0.7, 3.15, 0.55, 5.09]}
annotations_filtered/d7_F5P5PygM_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[10.0, 13.04], [14.0, 14.2], [17.0, 19.3], [20.0, 20.41], [22.0, 23.52], [24.0, 25.56], [26.0, 33.47], [35.0, 35.7], [36.0, 37.98], [40.0, 45.1], [46.0, 53.43], [55.0, 58.04]], "keep_status": [true, false, true, false, false, false, false, false, false, true, true, true], "silence_prob": [31.92, 0.0, 32.3, 0.0, 0.0, 0.0, 33.23, 0.0, 0.0, 30.43, 34.45, 49.59], "audiomae_on_audioset": [[["hum", 23.66], ["music", 22.98], ["mains hum", 18.91]], null, [["white noise", 17.77], ["mains hum", 9.26], ["explosion", 8.34]], null, null, null, [["music", 65.19], ["synthesizer", 8.44], ["hum", 6.49]], null, null, [["music", 29.13], ["synthesizer", 13.11], ["speech", 9.85]], [["music", 39.39], ["mains hum", 13.94], ["hum", 12.49]], [["music", 38.7], ["ambient music", 9.26], ["synthesizer", 8.45]]], "duration": [3.04, 0.2, 2.3, 0.41, 1.52, 1.56, 7.47, 0.7, 1.98, 5.1, 7.43, 3.04]}
annotations_filtered/d7c4TXqkMso_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 12.73], [14.0, 13.66], [24.0, 29.39], [32.0, 42.87], [44.0, 44.88], [48.0, 48.49], [50.0, 50.48], [51.0, 51.68], [53.0, 53.06], [54.0, 54.65], [57.0, 58.21], [59.0, 59.73], [64.0, 65.11], [68.0, 67.9], [69.0, 70.07], [71.0, 71.52], [74.0, 74.61], [76.0, 76.28], [85.0, 85.19], [88.0, 88.3], [91.0, 91.23], [94.0, 94.19], [96.0, 97.83], [99.0, 99.22], [100.0, 101.12], [102.0, 103.1], [105.0, 106.1], [108.0, 108.46], [115.0, 116.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.02, 63.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, -0.34, 5.39, 10.87, 0.88, 0.49, 0.48, 0.68, 0.06, 0.65, 1.21, 0.73, 1.11, -0.1, 1.07, 0.52, 0.61, 0.28, 0.19, 0.3, 0.23, 0.19, 1.83, 0.22, 1.12, 1.1, 1.1, 0.46, 1.07]}
annotations_filtered/d7he8f2L_BE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []}
annotations_filtered/d7pioagkX5k_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []}
annotations_filtered/d7ye5zFyuso_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[0.0, 0.68], [3.0, 3.05], [9.0, 17.42], [18.0, 23.31], [38.0, 38.01], [40.0, 40.53], [42.0, 42.35], [43.0, 43.83], [51.0, 54.35], [56.0, 56.74], [68.0, 70.09], [77.0, 77.55], [80.0, 80.62], [83.0, 83.47], [84.0, 110.56]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 35.74, 44.81, 0.0, 0.0, 0.0, 0.0, 50.26, 0.0, 56.78, 0.0, 0.0, 0.0, 30.35], "audiomae_on_audioset": [null, null, [["speech", 31.63], ["music", 28.65], ["hum", 4.37]], [["music", 53.77], ["speech", 8.77], ["didgeridoo", 3.36]], null, null, null, null, null, null, null, null, null, null, [["music", 52.42], ["theremin", 12.29], ["speech", 3.87]]], "duration": [0.68, 0.05, 8.42, 5.31, 0.01, 0.53, 0.35, 0.83, 3.35, 0.74, 2.09, 0.55, 0.62, 0.47, 26.56]}
annotations_filtered/d87eHGVaoc8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[13.0, 15.2], [24.0, 23.94], [24.0, 27.08], [50.0, 50.3], [57.0, 60.39], [62.0, 63.12], [64.0, 71.66], [77.0, 77.25]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [96.77, 0.0, 54.5, 0.0, 47.78, 0.0, 34.42, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 69.45], ["electronic music", 3.71], ["timpani", 3.4]], null, [["speech", 56.78], ["music", 24.35], ["outside, rural or natural", 2.28]], null], "duration": [2.2, -0.06, 3.08, 0.3, 3.39, 1.12, 7.66, 0.25]}
annotations_filtered/d8Ff_W4-4VE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 5.97], [13.0, 14.18], [15.0, 15.96], [17.0, 17.93], [34.0, 34.48], [45.0, 45.0], [49.0, 50.01], [54.0, 54.16], [55.0, 54.92], [63.0, 65.26], [69.0, 69.09], [73.0, 74.16], [77.0, 77.97], [83.0, 83.76], [88.0, 88.18], [89.0, 90.12], [101.0, 100.62], [102.0, 102.24], [108.0, 110.96], [116.0, 116.63], [119.0, 119.77], [123.0, 124.36], [126.0, 127.09], [129.0, 129.86], [132.0, 132.83], [133.0, 133.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 67.95], ["musical instrument", 6.51], ["guitar", 3.8]], null, null, null, null, null, null, null, null, [["speech", 59.51], ["radio", 9.67], ["sidetone", 4.16]], null, null, null, null, null, null, null], "duration": [0.97, 1.18, 0.96, 0.93, 0.48, 0.0, 1.01, 0.16, -0.08, 2.26, 0.09, 1.16, 0.97, 0.76, 0.18, 1.12, -0.38, 0.24, 2.96, 0.63, 0.77, 1.36, 1.09, 0.86, 0.83, 0.73]}
annotations_filtered/d8Gg9rPHKNU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 6.17], [7.0, 8.36], [10.0, 47.73]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.17, 1.36, 37.73]}
annotations_filtered/d8WHOiQZGok_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 4.33], [8.0, 8.09], [8.0, 9.58], [10.0, 15.74], [17.0, 32.48], [34.0, 34.26], [35.0, 35.68], [37.0, 37.22], [45.0, 45.3], [51.0, 51.61], [53.0, 53.18], [56.0, 56.44], [58.0, 58.24], [59.0, 61.65], [66.0, 75.56], [76.0, 77.33], [78.0, 79.29], [79.0, 85.83], [95.0, 98.12], [99.0, 99.12], [102.0, 103.03], [104.0, 105.06], [108.0, 109.71], [111.0, 111.62], [117.0, 117.34], [118.0, 118.76], [119.0, 124.09], [125.0, 128.6], [129.0, 131.11], [132.0, 133.47], [135.0, 135.63], [137.0, 137.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.62, 31.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.55, 39.25, 0.0, 0.0, 32.96, 34.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.55, 43.69, 37.65, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 71.25], ["trance music", 1.71], ["electronic music", 1.7]], [["music", 71.78], ["psychedelic rock", 5.99], ["swing music", 1.2]], null, null, null, null, null, null, null, null, [["music", 36.53], ["didgeridoo", 27.78], ["musical instrument", 4.03]], [["music", 53.75], ["speech", 12.76], ["throbbing", 3.26]], null, null, [["music", 36.91], ["speech", 36.4], ["sidetone", 8.81]], [["music", 34.85], ["throbbing", 27.1], ["hum", 15.7]], null, null, null, null, null, null, null, [["music", 40.41], ["speech", 23.32], ["didgeridoo", 13.54]], [["fly, housefly", 15.92], ["music", 9.65], ["creak", 8.99]], [["cattle, bovinae", 39.92], ["moo", 29.68], ["livestock, farm animals, working animals", 26.59]], null, null, null], "duration": [0.33, 0.09, 1.58, 5.74, 15.48, 0.26, 0.68, 0.22, 0.3, 0.61, 0.18, 0.44, 0.24, 2.65, 9.56, 1.33, 1.29, 6.83, 3.12, 0.12, 1.03, 1.06, 1.71, 0.62, 0.34, 0.76, 5.09, 3.6, 2.11, 1.47, 0.63, 0.39]}
annotations_filtered/d8sDpSZeDBE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[17.0, 17.49], [19.0, 19.55], [21.0, 21.2], [23.0, 24.31], [28.0, 28.93], [30.0, 30.08], [31.0, 33.62], [39.0, 39.06], [41.0, 41.34], [45.0, 47.6], [49.0, 49.67], [50.0, 51.14], [52.0, 52.52], [53.0, 53.82], [55.0, 66.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.22, 0.0, 0.0, 92.31, 0.0, 0.0, 0.0, 0.0, 86.27], "audiomae_on_audioset": [null, null, null, null, null, null, [["fly, housefly", 54.11], ["bee, wasp, etc.", 21.52], ["insect", 13.31]], null, null, null, null, null, null, null, null], "duration": [0.49, 0.55, 0.2, 1.31, 0.93, 0.08, 2.62, 0.06, 0.34, 2.6, 0.67, 1.14, 0.52, 0.82, 11.11]}
annotations_filtered/d9-DFXwcmFI_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 8.06], [9.0, 9.54], [15.0, 16.68], [18.0, 18.62], [19.0, 20.68], [23.0, 23.97], [25.0, 25.86], [28.0, 29.32], [36.0, 38.01], [39.0, 40.36], [41.0, 41.82], [46.0, 47.06], [52.0, 52.17], [59.0, 59.97], [61.0, 62.55], [63.0, 64.27], [67.0, 68.01], [71.0, 73.04], [74.0, 74.65], [75.0, 76.86], [79.0, 79.71], [81.0, 83.51], [86.0, 87.27], [90.0, 90.59], [92.0, 93.21], [94.0, 95.03], [99.0, 106.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.06, 0.54, 1.68, 0.62, 1.68, 0.97, 0.86, 1.32, 2.01, 1.36, 0.82, 1.06, 0.17, 0.97, 1.55, 1.27, 1.01, 2.04, 0.65, 1.86, 0.71, 2.51, 1.27, 0.59, 1.21, 1.03, 7.95]}
annotations_filtered/d921M-ACMM4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.32], [5.0, 5.32], [7.0, 16.17], [20.0, 33.56], [36.0, 48.91], [53.0, 59.76], [60.0, 64.3], [69.0, 79.57], [80.0, 81.58], [83.0, 83.27], [85.0, 84.59], [85.0, 85.67], [97.0, 96.9], [114.0, 114.39], [116.0, 117.42], [119.0, 122.55], [125.0, 147.63], [148.0, 148.64]], "keep_status": [false, false, false, true, false, true, true, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 30.98, 46.02, 45.78, 38.41, 43.69, 37.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.97, 31.78, 0.0], "audiomae_on_audioset": [null, null, [["speech", 44.39], ["eruption", 19.09], ["explosion", 7.67]], [["speech", 15.47], ["animal", 14.93], ["livestock, farm animals, working animals", 10.13]], [["livestock, farm animals, working animals", 34.01], ["cattle, bovinae", 28.85], ["animal", 20.85]], [["speech", 53.48], ["hum", 5.2], ["buzz", 3.51]], [["animal", 30.94], ["domestic animals, pets", 17.19], ["dog", 11.0]], [["whale vocalization", 34.08], ["animal", 16.39], ["speech", 6.46]], null, null, null, null, null, null, null, null, [["frog", 46.28], ["insect", 11.0], ["fly, housefly", 8.44]], null], "duration": [0.32, 0.32, 9.17, 13.56, 12.91, 6.76, 4.3, 10.57, 1.58, 0.27, -0.41, 0.67, -0.1, 0.39, 1.42, 3.55, 22.63, 0.64]}