bpiyush commited on
Commit
1d59104
·
1 Parent(s): 2753972
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. annotations_filtered/f-3Bldu8BJ4_filtered.json +1 -0
  2. annotations_filtered/f-77xulkB_U_filtered.json +1 -0
  3. annotations_filtered/f-DgdMpSo7c_filtered.json +1 -0
  4. annotations_filtered/f-DiniX_1mI_filtered.json +1 -0
  5. annotations_filtered/f-EjBwpuVFI_filtered.json +1 -0
  6. annotations_filtered/f-PnGRaJaSA_filtered.json +1 -0
  7. annotations_filtered/f-vA6GMMKgQ_filtered.json +1 -0
  8. annotations_filtered/f0-Ea9Ki7YU_filtered.json +1 -0
  9. annotations_filtered/f06qimixOOI_filtered.json +1 -0
  10. annotations_filtered/f08pzusjWTQ_filtered.json +1 -0
  11. annotations_filtered/f0MBL-DyXaE_filtered.json +1 -0
  12. annotations_filtered/f0eTISgJ3Io_filtered.json +1 -0
  13. annotations_filtered/f0sDG0nnftw_filtered.json +1 -0
  14. annotations_filtered/f0wEV9jySXg_filtered.json +1 -0
  15. annotations_filtered/f187FGFi1AM_filtered.json +1 -0
  16. annotations_filtered/f1N8-L5cuWQ_filtered.json +1 -0
  17. annotations_filtered/f1Nh9DlkZ1w_filtered.json +1 -0
  18. annotations_filtered/f1bk5a_jaEA_filtered.json +1 -0
  19. annotations_filtered/f1fSmptANOU_filtered.json +1 -0
  20. annotations_filtered/f1mbRj3ejAk_filtered.json +1 -0
  21. annotations_filtered/f20aUH5IG9s_filtered.json +1 -0
  22. annotations_filtered/f2FzrfnfQPY_filtered.json +1 -0
  23. annotations_filtered/f2Hz2k2PcfI_filtered.json +1 -0
  24. annotations_filtered/f2SskRLd4F4_filtered.json +1 -0
  25. annotations_filtered/f2c-tMZSZtY_filtered.json +1 -0
  26. annotations_filtered/f2ugRkVMOuE_filtered.json +1 -0
  27. annotations_filtered/f39I-UCl9Qo_filtered.json +1 -0
  28. annotations_filtered/f3XcExCD3HM_filtered.json +1 -0
  29. annotations_filtered/f3tseBsU248_filtered.json +1 -0
  30. annotations_filtered/f3u4j0hVy8c_filtered.json +1 -0
  31. annotations_filtered/f48wH7l3c5I_filtered.json +1 -0
  32. annotations_filtered/f4LEgmt0roE_filtered.json +1 -0
  33. annotations_filtered/f4M5MT96FwY_filtered.json +1 -0
  34. annotations_filtered/f4gmgTebHog_filtered.json +1 -0
  35. annotations_filtered/f4ojzsvQhh0_filtered.json +1 -0
  36. annotations_filtered/f4wQCy4xIyY_filtered.json +1 -0
  37. annotations_filtered/f4wmj-Nq9xA_filtered.json +1 -0
  38. annotations_filtered/f4zl3CuJvt8_filtered.json +1 -0
  39. annotations_filtered/f505OHOUHoU_filtered.json +1 -0
  40. annotations_filtered/f57Vat6YZUI_filtered.json +1 -0
  41. annotations_filtered/f58Ba78abHg_filtered.json +1 -0
  42. annotations_filtered/f5e73A39TF4_filtered.json +1 -0
  43. annotations_filtered/f5f86alm7jk_filtered.json +1 -0
  44. annotations_filtered/f5mcMmE3RL8_filtered.json +1 -0
  45. annotations_filtered/f5umSa_YYX0_filtered.json +1 -0
  46. annotations_filtered/f6DDYCf80hw_filtered.json +1 -0
  47. annotations_filtered/f6Dan7z0p4c_filtered.json +1 -0
  48. annotations_filtered/f6F6MzMT2g8_filtered.json +1 -0
  49. annotations_filtered/f6hhVIV_LPs_filtered.json +1 -0
  50. annotations_filtered/f6m4J0AfEOo_filtered.json +1 -0
annotations_filtered/f-3Bldu8BJ4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 4.09], [8.0, 10.2], [12.0, 15.55], [17.0, 19.48], [21.0, 26.1], [27.0, 31.06], [33.0, 36.26], [37.0, 43.83], [44.0, 46.18], [46.0, 46.21], [64.0, 64.45], [66.0, 70.31], [75.0, 77.09], [82.0, 81.92], [85.0, 89.72], [93.0, 98.47], [100.0, 99.94], [103.0, 109.32], [110.0, 111.86], [113.0, 115.91], [117.0, 127.53], [128.0, 130.23], [132.0, 133.1], [137.0, 137.61], [138.0, 141.12], [144.0, 150.92], [153.0, 156.61], [157.0, 158.53], [159.0, 160.78], [162.0, 162.58], [164.0, 163.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [73.51, 87.92, 82.07, 81.35, 79.41, 78.38, 82.07, 94.81, 73.97, 0.0, 0.0, 62.68, 80.82, 0.0, 68.67, 74.44, 0.0, 57.64, 0.0, 99.59, 64.63, 84.98, 0.0, 0.0, 81.35, 68.8, 75.88, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.09, 2.2, 3.55, 2.48, 5.1, 4.06, 3.26, 6.83, 2.18, 0.21, 0.45, 4.31, 2.09, -0.08, 4.72, 5.47, -0.06, 6.32, 1.86, 2.91, 10.53, 2.23, 1.1, 0.61, 3.12, 6.92, 3.61, 1.53, 1.78, 0.58, -0.14]}
annotations_filtered/f-77xulkB_U_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 5.71], [11.0, 13.29], [15.0, 15.42], [17.0, 17.42], [21.0, 21.61], [25.0, 26.1], [27.0, 27.84], [29.0, 29.1], [31.0, 32.07], [35.0, 35.8], [38.0, 39.34], [40.0, 40.44], [41.0, 43.6], [45.0, 50.36], [54.0, 65.74], [67.0, 68.81], [91.0, 92.01], [101.0, 102.76], [107.0, 107.16], [108.0, 109.71], [110.0, 111.23], [112.0, 113.05], [119.0, 121.02], [123.0, 123.36], [126.0, 129.09], [130.0, 135.67], [136.0, 137.47], [139.0, 140.0], [147.0, 150.38], [151.0, 152.25], [154.0, 154.92], [159.0, 159.46], [161.0, 161.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [42.48, 38.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.4, 64.86, 31.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.74, 0.0, 47.23, 46.61, 0.0, 0.0, 45.21, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["sidetone", 60.55], ["speech", 22.86], ["radio", 4.85]], [["speech", 70.08], ["sidetone", 14.6], ["radio", 4.19]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 88.4], ["boing", 2.93], ["sidetone", 0.99]], null, null, null, null, null, null, null, [["speech", 64.18], ["telephone", 9.45], ["dial tone", 8.38]], null, [["music", 38.45], ["crushing", 28.34], ["musical instrument", 4.74]], [["music", 44.91], ["crushing", 11.43], ["effects unit", 10.28]], null, null, [["music", 49.38], ["didgeridoo", 8.44], ["theremin", 4.49]], null, null, null, null], "duration": [3.71, 2.29, 0.42, 0.42, 0.61, 1.1, 0.84, 0.1, 1.07, 0.8, 1.34, 0.44, 2.6, 5.36, 11.74, 1.81, 1.01, 1.76, 0.16, 1.71, 1.23, 1.05, 2.02, 0.36, 3.09, 5.67, 1.47, 1.0, 3.38, 1.25, 0.92, 0.46, 0.62]}
annotations_filtered/f-DgdMpSo7c_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 17.51], [28.0, 28.81], [29.0, 29.49], [30.0, 30.15], [31.0, 30.75], [32.0, 32.7], [33.0, 33.56], [35.0, 35.73], [37.0, 37.77], [39.0, 39.41], [40.0, 40.41], [41.0, 41.37], [42.0, 43.02], [47.0, 47.33], [49.0, 68.05], [76.0, 77.36], [84.0, 85.35], [92.0, 93.87], [98.0, 98.04], [100.0, 100.48], [110.0, 122.69], [123.0, 122.82], [126.0, 125.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.36, 0.0, 0.0, 0.0, 0.0, 0.0, 41.34, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 30.5], ["mosquito", 13.89], ["cattle, bovinae", 12.98]], null, null, null, null, null, [["music", 48.63], ["groan", 6.31], ["fart", 5.29]], null, null], "duration": [5.51, 0.81, 0.49, 0.15, -0.25, 0.7, 0.56, 0.73, 0.77, 0.41, 0.41, 0.37, 1.02, 0.33, 19.05, 1.36, 1.35, 1.87, 0.04, 0.48, 12.69, -0.18, -0.21]}
annotations_filtered/f-DiniX_1mI_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[16.0, 16.78], [17.0, 17.74], [18.0, 20.87], [28.0, 29.39], [30.0, 30.75], [33.0, 35.83], [37.0, 37.66], [39.0, 39.78], [41.0, 44.93], [48.0, 54.73], [69.0, 72.22]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 64.41, 0.0, 0.0, 31.25, 0.0, 0.0, 32.17, 29.61, 60.42], "audiomae_on_audioset": [null, null, null, null, null, [["explosion", 38.09], ["gunshot, gunfire", 18.54], ["burst, pop", 18.34]], null, null, [["explosion", 36.08], ["burst, pop", 14.05], ["gunshot, gunfire", 9.82]], [["gunshot, gunfire", 29.6], ["explosion", 13.98], ["clang", 9.46]], null], "duration": [0.78, 0.74, 2.87, 1.39, 0.75, 2.83, 0.66, 0.78, 3.93, 6.73, 3.22]}
annotations_filtered/f-EjBwpuVFI_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 23.82], [30.0, 43.38], [46.0, 49.06], [51.0, 51.31], [54.0, 56.74], [66.0, 66.99], [74.0, 75.71], [77.0, 76.96], [79.0, 80.43], [84.0, 86.26], [89.0, 99.25], [99.0, 103.98], [104.0, 118.42], [123.0, 134.65], [139.0, 141.72], [149.0, 149.93], [151.0, 152.76], [158.0, 158.43], [171.0, 173.94]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, true, true, false, false, false, false, true], "silence_prob": [34.94, 37.89, 43.56, 0.0, 37.98, 0.0, 0.0, 0.0, 0.0, 40.9, 38.84, 48.31, 37.31, 34.63, 44.55, 0.0, 0.0, 0.0, 39.61], "audiomae_on_audioset": [[["music", 56.38], ["hum", 8.73], ["musical instrument", 5.93]], [["music", 59.06], ["didgeridoo", 17.49], ["insect", 3.35]], [["music", 76.92], ["didgeridoo", 3.25], ["musical instrument", 2.48]], null, [["music", 67.29], ["electronic music", 6.86], ["synthesizer", 3.75]], null, null, null, null, [["speech", 32.91], ["music", 15.78], ["hum", 15.63]], [["music", 70.01], ["hum", 5.02], ["electronic music", 3.41]], [["music", 35.05], ["speech", 24.42], ["whale vocalization", 8.18]], [["music", 35.91], ["speech", 21.4], ["whale vocalization", 5.14]], [["music", 31.24], ["hum", 25.55], ["throbbing", 11.53]], [["music", 49.66], ["pulse", 18.57], ["theremin", 6.33]], null, null, null, [["music", 42.22], ["buzz", 9.42], ["didgeridoo", 4.76]]], "duration": [16.82, 13.38, 3.06, 0.31, 2.74, 0.99, 1.71, -0.04, 1.43, 2.26, 10.25, 4.98, 14.42, 11.65, 2.72, 0.93, 1.76, 0.43, 2.94]}
annotations_filtered/f-PnGRaJaSA_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 5.1], [6.0, 6.54], [7.0, 7.75], [9.0, 8.92], [13.0, 12.68], [14.0, 14.23], [35.0, 37.99], [49.0, 49.81], [52.0, 53.1], [56.0, 57.27], [66.0, 66.6], [68.0, 68.88], [73.0, 73.58], [75.0, 77.7], [90.0, 90.41], [105.0, 105.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.91, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 52.34], ["theremin", 23.65], ["throbbing", 3.55]], null, null, null, null, null, null, [["theremin", 40.58], ["music", 34.95], ["musical instrument", 4.81]], null, null], "duration": [1.1, 0.54, 0.75, -0.08, -0.32, 0.23, 2.99, 0.81, 1.1, 1.27, 0.6, 0.88, 0.58, 2.7, 0.41, 0.7]}
annotations_filtered/f-vA6GMMKgQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 3.1], [6.0, 7.28], [10.0, 10.57], [19.0, 19.94], [22.0, 22.23], [24.0, 24.61], [26.0, 26.62], [34.0, 34.5], [38.0, 37.76], [41.0, 41.54], [42.0, 42.38], [49.0, 53.08], [54.0, 54.65], [56.0, 57.11], [60.0, 60.91], [64.0, 64.66], [67.0, 67.46], [83.0, 83.22], [89.0, 90.04], [95.0, 95.1], [100.0, 99.89], [101.0, 101.73], [103.0, 107.06], [113.0, 114.07], [114.0, 115.5], [116.0, 116.4], [117.0, 117.37], [120.0, 120.16], [122.0, 122.34], [125.0, 124.87], [126.0, 126.37], [127.0, 127.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.1, 1.28, 0.57, 0.94, 0.23, 0.61, 0.62, 0.5, -0.24, 0.54, 0.38, 4.08, 0.65, 1.11, 0.91, 0.66, 0.46, 0.22, 1.04, 0.1, -0.11, 0.73, 4.06, 1.07, 1.5, 0.4, 0.37, 0.16, 0.34, -0.13, 0.37, 0.38]}
annotations_filtered/f0-Ea9Ki7YU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[9.0, 12.48], [15.0, 35.48], [40.0, 96.01], [97.0, 98.04], [100.0, 120.31], [121.0, 121.78], [127.0, 127.33], [129.0, 130.23], [132.0, 132.21], [133.0, 133.93], [138.0, 138.33], [139.0, 140.86], [141.0, 148.05], [149.0, 151.87], [153.0, 154.65], [156.0, 179.29], [180.0, 180.76]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [28.68, 28.37, 0.0, 0.0, 31.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.79, 64.52, 0.0, 29.87, 0.0], "audiomae_on_audioset": [[["music", 43.22], ["buzzer", 10.91], ["theremin", 8.38]], [["music", 71.47], ["didgeridoo", 8.21], ["musical instrument", 3.24]], null, null, [["trombone", 23.01], ["music", 22.49], ["brass instrument", 21.31]], null, null, null, null, null, null, null, null, null, null, [["theremin", 60.98], ["music", 30.85], ["musical instrument", 0.87]], null], "duration": [3.48, 20.48, 56.01, 1.04, 20.31, 0.78, 0.33, 1.23, 0.21, 0.93, 0.33, 1.86, 7.05, 2.87, 1.65, 23.29, 0.76]}
annotations_filtered/f06qimixOOI_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 4.31], [5.0, 6.67], [9.0, 18.32], [20.0, 28.16], [31.0, 51.14], [52.0, 51.71], [55.0, 55.05], [56.0, 65.67], [67.0, 69.21], [73.0, 83.49], [86.0, 91.59]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 81.53, 72.31, 33.6, 0.0, 0.0, 30.5, 50.56, 46.47, 29.07], "audiomae_on_audioset": [null, null, null, null, [["music", 61.82], ["musical instrument", 4.5], ["singing bowl", 2.76]], null, null, [["music", 18.4], ["livestock, farm animals, working animals", 17.67], ["cattle, bovinae", 10.12]], null, [["music", 61.56], ["effects unit", 9.36], ["guitar", 6.42]], [["didgeridoo", 33.32], ["speech", 28.02], ["music", 23.54]]], "duration": [1.31, 1.67, 9.32, 8.16, 20.14, -0.29, 0.05, 9.67, 2.21, 10.49, 5.59]}
annotations_filtered/f08pzusjWTQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 2.46], [4.0, 5.04], [9.0, 9.69], [11.0, 12.01], [15.0, 16.85], [18.0, 18.67], [20.0, 20.95], [23.0, 24.12], [25.0, 26.79], [28.0, 30.48], [32.0, 36.49], [38.0, 43.26], [47.0, 57.3], [59.0, 59.63], [63.0, 63.78], [70.0, 77.75], [79.0, 80.65], [82.0, 82.31], [83.0, 84.79], [86.0, 87.02], [88.0, 88.99], [96.0, 96.74], [100.0, 100.87], [107.0, 108.62], [110.0, 110.42], [111.0, 116.38], [118.0, 119.45], [123.0, 127.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07, 92.97, 98.44, 47.58, 0.0, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 41.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 44.34], ["music", 37.89], ["effects unit", 3.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 54.02], ["music", 18.27], ["speech", 9.82]]], "duration": [1.46, 1.04, 0.69, 1.01, 1.85, 0.67, 0.95, 1.12, 1.79, 2.48, 4.49, 5.26, 10.3, 0.63, 0.78, 7.75, 1.65, 0.31, 1.79, 1.02, 0.99, 0.74, 0.87, 1.62, 0.42, 5.38, 1.45, 4.36]}
annotations_filtered/f0MBL-DyXaE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 4.89], [5.0, 13.51], [14.0, 13.61], [16.0, 29.4], [33.0, 33.25], [39.0, 39.24], [49.0, 51.16], [53.0, 54.36], [55.0, 57.1], [58.0, 59.54], [62.0, 63.91], [66.0, 66.53], [75.0, 76.01], [77.0, 79.98], [81.0, 81.16], [82.0, 82.24], [85.0, 85.62]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [65.91, 37.51, 0.0, 36.31, 0.0, 0.0, 67.51, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 44.8], ["music", 10.92], ["explosion", 5.67]], null, [["motorboat, speedboat", 29.02], ["boat, water vehicle", 23.89], ["music", 9.57]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.89, 8.51, -0.39, 13.4, 0.25, 0.24, 2.16, 1.36, 2.1, 1.54, 1.91, 0.53, 1.01, 2.98, 0.16, 0.24, 0.62]}
annotations_filtered/f0eTISgJ3Io_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[54.0, 54.84], [57.0, 56.84], [61.0, 76.76], [78.0, 79.32], [85.0, 87.05], [88.0, 89.53]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.92, 0.0, 33.01, 0.0], "audiomae_on_audioset": [null, null, [["speech", 78.94], ["fart", 8.14], ["throbbing", 1.8]], null, [["hum", 29.92], ["mains hum", 25.36], ["throbbing", 17.83]], null], "duration": [0.84, -0.16, 15.76, 1.32, 2.05, 1.53]}
annotations_filtered/f0sDG0nnftw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 40.37], [51.0, 51.85], [53.0, 53.25], [54.0, 62.99], [79.0, 86.36], [91.0, 91.88], [95.0, 99.27], [101.0, 105.53]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.42, 80.82, 0.0, 78.21, 63.96], "audiomae_on_audioset": [null, null, null, [["music", 43.94], ["didgeridoo", 10.07], ["musical instrument", 9.0]], null, null, null, null], "duration": [33.37, 0.85, 0.25, 8.99, 7.36, 0.88, 4.27, 4.53]}
annotations_filtered/f0wEV9jySXg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 1.85], [5.0, 5.17], [6.0, 7.75], [9.0, 9.64], [12.0, 11.72], [16.0, 16.88], [20.0, 20.88], [21.0, 22.4], [33.0, 33.84], [34.0, 35.9], [38.0, 39.39], [51.0, 51.6], [60.0, 59.97], [60.0, 60.69], [62.0, 63.1], [69.0, 70.21], [75.0, 75.63], [78.0, 82.0], [83.0, 84.69], [86.0, 89.63], [91.0, 92.31], [93.0, 94.81], [96.0, 96.08], [100.0, 100.52], [103.0, 103.94], [105.0, 105.6], [108.0, 108.21], [110.0, 110.17], [118.0, 123.2], [124.0, 125.25], [127.0, 129.39], [129.0, 130.59], [133.0, 142.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.53, 0.0, 100.0, 0.0, 81.53], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.15, 0.17, 1.75, 0.64, -0.28, 0.88, 0.88, 1.4, 0.84, 1.9, 1.39, 0.6, -0.03, 0.69, 1.1, 1.21, 0.63, 4.0, 1.69, 3.63, 1.31, 1.81, 0.08, 0.52, 0.94, 0.6, 0.21, 0.17, 5.2, 1.25, 2.39, 1.59, 9.01]}
annotations_filtered/f187FGFi1AM_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 4.13], [8.0, 9.85], [11.0, 17.17], [18.0, 24.78], [25.0, 25.1], [25.0, 26.55], [27.0, 32.22], [32.0, 33.0], [34.0, 35.78], [36.0, 64.99], [66.0, 67.51], [69.0, 79.95], [81.0, 83.19], [84.0, 84.67], [86.0, 87.15], [89.0, 90.73], [91.0, 121.1], [122.0, 122.55], [124.0, 124.44], [125.0, 125.64]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [65.09, 0.0, 33.75, 38.6, 0.0, 0.0, 34.58, 0.0, 0.0, 46.79, 0.0, 33.49, 62.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.24], ["effects unit", 8.84], ["musical instrument", 8.26]], [["music", 68.13], ["theremin", 19.21], ["musical instrument", 2.65]], null, null, [["music", 42.66], ["theremin", 19.64], ["musical instrument", 9.06]], null, null, [["music", 51.97], ["mains hum", 18.42], ["hum", 13.39]], null, [["mains hum", 23.93], ["hum", 22.3], ["speech", 22.11]], null, null, null, null, null, null, null, null], "duration": [2.13, 1.85, 6.17, 6.78, 0.1, 1.55, 5.22, 1.0, 1.78, 28.99, 1.51, 10.95, 2.19, 0.67, 1.15, 1.73, 30.1, 0.55, 0.44, 0.64]}
annotations_filtered/f1N8-L5cuWQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 10.77], [13.0, 14.34], [18.0, 18.28], [19.0, 21.34], [25.0, 26.52], [30.0, 30.3], [34.0, 34.23], [35.0, 42.2], [43.0, 51.53], [54.0, 55.31], [58.0, 59.36], [67.0, 74.68], [75.0, 79.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.6, 0.0, 0.0, 43.74, 0.0, 0.0, 0.0, 45.36, 59.24, 0.0, 0.0, 32.9, 35.91], "audiomae_on_audioset": [[["speech", 38.31], ["music", 26.71], ["hum", 10.25]], null, null, [["music", 41.61], ["didgeridoo", 21.74], ["quack", 8.38]], null, null, null, [["music", 59.33], ["speech", 16.9], ["hum", 5.7]], null, null, null, [["music", 51.0], ["didgeridoo", 33.82], ["speech", 5.47]], [["music", 43.02], ["hum", 13.8], ["speech", 13.45]]], "duration": [8.77, 1.34, 0.28, 2.34, 1.52, 0.3, 0.23, 7.2, 8.53, 1.31, 1.36, 7.68, 4.15]}
annotations_filtered/f1Nh9DlkZ1w_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 22.44], [23.0, 23.45], [25.0, 49.44]], "keep_status": [true, false, true], "silence_prob": [32.4, 0.0, 41.42], "audiomae_on_audioset": [[["cattle, bovinae", 17.88], ["livestock, farm animals, working animals", 15.71], ["moo", 15.59]], null, [["clip-clop", 31.47], ["horse", 21.88], ["animal", 7.54]]], "duration": [15.44, 0.45, 24.44]}
annotations_filtered/f1bk5a_jaEA_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[16.0, 17.83], [31.0, 31.97], [34.0, 38.6], [40.0, 40.49], [41.0, 57.16], [58.0, 62.01], [77.0, 76.65], [79.0, 78.93], [83.0, 85.68], [89.0, 101.06], [102.0, 102.93], [103.0, 103.81], [104.0, 150.63], [152.0, 154.8], [157.0, 158.16], [161.0, 172.3], [177.0, 177.15], [177.0, 178.09], [179.0, 179.0], [180.0, 179.86], [188.0, 212.45], [218.0, 225.9]], "keep_status": [false, false, true, false, false, true, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 36.86, 0.0, 34.94, 30.54, 0.0, 0.0, 30.66, 31.95, 0.0, 0.0, 0.0, 31.69, 0.0, 29.96, 0.0, 0.0, 0.0, 0.0, 31.57, 30.94], "audiomae_on_audioset": [null, null, [["music", 48.99], ["marimba, xylophone", 6.3], ["glockenspiel", 4.12]], null, [["music", 71.17], ["brass instrument", 4.08], ["echo", 2.93]], [["music", 34.83], ["effects unit", 6.56], ["musical instrument", 5.73]], null, null, [["chant", 28.32], ["choir", 12.67], ["music", 12.61]], [["music", 46.92], ["musical instrument", 13.39], ["brass instrument", 5.44]], null, null, null, [["sidetone", 29.36], ["music", 12.03], ["fly, housefly", 10.36]], null, [["music", 73.8], ["theremin", 4.44], ["singing", 2.16]], null, null, null, null, [["music", 36.68], ["didgeridoo", 33.97], ["theremin", 14.9]], [["music", 42.67], ["animal", 11.55], ["noise", 10.9]]], "duration": [1.83, 0.97, 4.6, 0.49, 16.16, 4.01, -0.35, -0.07, 2.68, 12.06, 0.93, 0.81, 46.63, 2.8, 1.16, 11.3, 0.15, 1.09, 0.0, -0.14, 24.45, 7.9]}
annotations_filtered/f1fSmptANOU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[10.0, 11.2], [32.0, 32.56], [33.0, 38.6], [43.0, 52.54], [55.0, 56.22], [58.0, 64.45], [67.0, 72.17], [73.0, 73.09], [73.0, 74.01], [75.0, 75.76], [78.0, 78.97], [95.0, 95.32], [96.0, 96.67], [98.0, 98.39], [99.0, 99.33], [101.0, 100.84], [101.0, 101.76], [103.0, 104.14]], "keep_status": [false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.2, 30.89, 0.0, 30.59, 41.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 48.07], ["musical instrument", 7.22], ["noise", 6.32]], [["music", 85.03], ["cacophony", 2.72], ["didgeridoo", 2.32]], null, [["music", 45.42], ["cacophony", 12.36], ["sound effect", 5.73]], [["music", 36.98], ["didgeridoo", 20.6], ["synthesizer", 5.16]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.2, 0.56, 5.6, 9.54, 1.22, 6.45, 5.17, 0.09, 1.01, 0.76, 0.97, 0.32, 0.67, 0.39, 0.33, -0.16, 0.76, 1.14]}
annotations_filtered/f1mbRj3ejAk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[17.0, 19.45], [25.0, 26.62], [28.0, 28.31], [30.0, 31.53], [33.0, 33.08], [35.0, 35.19], [36.0, 36.61], [38.0, 38.37], [45.0, 50.4], [51.0, 51.93], [55.0, 57.77], [58.0, 58.13], [59.0, 61.33], [62.0, 76.59], [80.0, 83.1]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, true, true], "silence_prob": [56.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.31, 0.0, 34.73, 0.0, 32.89, 33.06, 32.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 27.47], ["music", 15.36], ["tick-tock", 5.7]], null, [["music", 30.57], ["throbbing", 29.6], ["hum", 13.84]], null, [["music", 50.36], ["didgeridoo", 12.81], ["speech", 3.37]], [["music", 26.82], ["hum", 19.1], ["throbbing", 14.77]], [["speech", 28.3], ["hum", 12.41], ["music", 11.35]]], "duration": [2.45, 1.62, 0.31, 1.53, 0.08, 0.19, 0.61, 0.37, 5.4, 0.93, 2.77, 0.13, 2.33, 14.59, 3.1]}
annotations_filtered/f20aUH5IG9s_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 4.23], [6.0, 6.32], [7.0, 7.43], [8.0, 11.53], [13.0, 14.08], [15.0, 19.36], [22.0, 23.19], [24.0, 25.44], [26.0, 26.11], [28.0, 28.49], [29.0, 32.49], [35.0, 36.17], [40.0, 40.85], [42.0, 42.35], [43.0, 43.39], [46.0, 47.65], [50.0, 50.6], [51.0, 51.27], [53.0, 54.06], [56.0, 57.75], [59.0, 62.83], [64.0, 65.96], [74.0, 73.97], [76.0, 77.52], [79.0, 80.23], [83.0, 82.83], [84.0, 84.92], [89.0, 91.86], [92.0, 96.28], [103.0, 104.45], [115.0, 115.94], [117.0, 117.93], [124.0, 124.28], [127.0, 127.68], [130.0, 130.38], [132.0, 133.08], [134.0, 136.83], [139.0, 141.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.51, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.23, 0.32, 0.43, 3.53, 1.08, 4.36, 1.19, 1.44, 0.11, 0.49, 3.49, 1.17, 0.85, 0.35, 0.39, 1.65, 0.6, 0.27, 1.06, 1.75, 3.83, 1.96, -0.03, 1.52, 1.23, -0.17, 0.92, 2.86, 4.28, 1.45, 0.94, 0.93, 0.28, 0.68, 0.38, 1.08, 2.83, 2.07]}
annotations_filtered/f2FzrfnfQPY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 7.55], [10.0, 11.21], [13.0, 13.8], [16.0, 17.46], [20.0, 21.95], [25.0, 25.14], [26.0, 26.25], [32.0, 31.95], [33.0, 33.54], [36.0, 37.32], [38.0, 38.52], [42.0, 42.74], [44.0, 45.96], [47.0, 48.9], [54.0, 54.8], [64.0, 65.43], [76.0, 79.15], [81.0, 84.2], [86.0, 88.03], [95.0, 106.95], [112.0, 112.24], [114.0, 116.16], [118.0, 121.17], [124.0, 128.17], [133.0, 135.38], [137.0, 139.04], [145.0, 146.4], [149.0, 150.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, true, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.31, 31.92, 38.16, 29.65, 0.0, 29.59, 32.8, 46.33, 28.92, 40.75, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.92], ["mains hum", 29.22], ["fly, housefly", 7.01]], [["whack, thwack", 14.03], ["vehicle", 10.43], ["car", 8.64]], [["throbbing", 24.06], ["music", 23.79], ["hum", 19.79]], [["music", 35.49], ["hum", 12.77], ["mains hum", 8.48]], null, [["music", 63.44], ["theremin", 4.51], ["sound effect", 3.46]], [["music", 25.91], ["hum", 10.22], ["pulse", 6.58]], [["music", 33.48], ["hum", 16.28], ["throbbing", 7.46]], [["music", 54.86], ["musical instrument", 3.91], ["whale vocalization", 3.62]], [["speech", 32.0], ["hum", 16.13], ["music", 15.54]], null, null], "duration": [1.55, 1.21, 0.8, 1.46, 1.95, 0.14, 0.25, -0.05, 0.54, 1.32, 0.52, 0.74, 1.96, 1.9, 0.8, 1.43, 3.15, 3.2, 2.03, 11.95, 0.24, 2.16, 3.17, 4.17, 2.38, 2.04, 1.4, 1.43]}
annotations_filtered/f2Hz2k2PcfI_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[18.0, 29.66], [30.0, 32.16], [35.0, 38.03], [39.0, 40.88], [61.0, 62.55], [64.0, 64.71], [74.0, 75.07], [81.0, 81.84], [84.0, 86.04], [90.0, 90.46], [96.0, 97.34], [99.0, 100.41], [102.0, 102.3], [116.0, 117.86], [119.0, 120.19], [121.0, 122.52], [123.0, 123.57], [125.0, 125.07], [136.0, 136.76], [143.0, 143.45], [145.0, 148.63], [150.0, 151.55], [153.0, 154.75], [159.0, 159.71], [164.0, 167.88], [170.0, 170.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.07, 87.37, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 95.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.66, 2.16, 3.03, 1.88, 1.55, 0.71, 1.07, 0.84, 2.04, 0.46, 1.34, 1.41, 0.3, 1.86, 1.19, 1.52, 0.57, 0.07, 0.76, 0.45, 3.63, 1.55, 1.75, 0.71, 3.88, 0.73]}
annotations_filtered/f2SskRLd4F4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 12.88], [18.0, 34.16], [35.0, 39.88], [41.0, 59.73], [60.0, 62.36], [64.0, 66.38], [68.0, 76.47], [79.0, 95.45]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 59.51, 99.96, 78.55, 99.99, 99.96, 90.08, 46.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 69.23], ["theremin", 7.42], ["musical instrument", 4.28]]], "duration": [0.88, 16.16, 4.88, 18.73, 2.36, 2.38, 8.47, 16.45]}
annotations_filtered/f2c-tMZSZtY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[31.0, 34.05], [34.0, 42.7], [49.0, 50.97], [58.0, 59.04], [60.0, 60.17], [63.0, 64.47], [66.0, 66.77], [73.0, 78.88], [81.0, 83.02], [86.0, 89.48], [97.0, 97.31], [97.0, 97.92], [98.0, 98.91], [99.0, 98.96], [100.0, 102.22], [113.0, 113.8], [119.0, 122.44], [123.0, 154.28]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true, false], "silence_prob": [58.81, 43.05, 0.0, 0.0, 0.0, 0.0, 0.0, 41.66, 53.22, 45.88, 0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 33.06, 0.0], "audiomae_on_audioset": [null, [["speech", 60.01], ["music", 10.89], ["electric shaver, electric razor", 4.18]], null, null, null, null, null, [["music", 52.11], ["hum", 6.59], ["throbbing", 4.05]], null, [["music", 18.22], ["moo", 16.91], ["cattle, bovinae", 16.21]], null, null, null, null, null, null, [["music", 36.73], ["speech", 22.46], ["animal", 2.85]], null], "duration": [3.05, 8.7, 1.97, 1.04, 0.17, 1.47, 0.77, 5.88, 2.02, 3.48, 0.31, 0.92, 0.91, -0.04, 2.22, 0.8, 3.44, 31.28]}
annotations_filtered/f2ugRkVMOuE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.79], [7.0, 7.45], [8.0, 9.81], [13.0, 15.36], [17.0, 17.05], [18.0, 20.19], [22.0, 22.92], [23.0, 24.27], [26.0, 27.08], [30.0, 30.28], [35.0, 35.36], [36.0, 40.31], [44.0, 49.32], [50.0, 59.8], [60.0, 61.28], [64.0, 64.08], [64.0, 66.19], [67.0, 68.66], [73.0, 80.28], [82.0, 82.19], [87.0, 93.36], [104.0, 110.1], [112.0, 115.48], [120.0, 122.96], [126.0, 126.91], [128.0, 128.58]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.93, 0.0, 59.96, 0.0, 0.0, 0.0, 0.0, 0.0, 75.55, 60.14, 42.42, 0.0, 0.0, 37.61, 0.0, 34.51, 0.0, 33.7, 34.76, 39.82, 37.89, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 34.65], ["animal", 10.3], ["whimper", 4.86]], null, null, null, null, null, null, null, null, null, [["music", 54.68], ["speech", 14.95], ["wind instrument, woodwind instrument", 7.27]], null, null, [["music", 78.02], ["musical instrument", 3.58], ["guitar", 1.29]], null, [["music", 72.24], ["singing", 2.81], ["musical instrument", 2.21]], null, [["music", 66.72], ["musical instrument", 6.11], ["guitar", 5.36]], [["music", 70.44], ["music of bollywood", 6.5], ["singing", 3.32]], [["music", 75.66], ["speech", 4.04], ["bleat", 1.1]], [["music", 35.62], ["sidetone", 26.31], ["speech", 12.79]], null, null], "duration": [0.79, 0.45, 1.81, 2.36, 0.05, 2.19, 0.92, 1.27, 1.08, 0.28, 0.36, 4.31, 5.32, 9.8, 1.28, 0.08, 2.19, 1.66, 7.28, 0.19, 6.36, 6.1, 3.48, 2.96, 0.91, 0.58]}
annotations_filtered/f39I-UCl9Qo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.74], [4.0, 4.7], [6.0, 6.59], [7.0, 8.99], [10.0, 10.67], [11.0, 11.62], [13.0, 36.9], [38.0, 39.77], [42.0, 47.83], [49.0, 54.65], [56.0, 59.76], [61.0, 62.19], [64.0, 64.71], [65.0, 66.82], [67.0, 70.98], [72.0, 77.11], [78.0, 88.52], [89.0, 90.58], [91.0, 94.46], [96.0, 99.72], [103.0, 119.67], [122.0, 128.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 100.0, 99.84, 94.95, 0.0, 0.0, 0.0, 100.0, 99.98, 100.0, 0.0, 93.91, 94.07, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 0.7, 0.59, 1.99, 0.67, 0.62, 23.9, 1.77, 5.83, 5.65, 3.76, 1.19, 0.71, 1.82, 3.98, 5.11, 10.52, 1.58, 3.46, 3.72, 16.67, 6.43]}
annotations_filtered/f3XcExCD3HM_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 12.09], [15.0, 15.69], [17.0, 17.98], [19.0, 20.19], [21.0, 22.25], [30.0, 30.42], [35.0, 36.64], [40.0, 40.04], [43.0, 43.06], [47.0, 48.54], [54.0, 53.97], [55.0, 55.26], [57.0, 57.92], [59.0, 60.56], [62.0, 64.0], [65.0, 66.43], [67.0, 68.44], [71.0, 71.2], [73.0, 73.95], [75.0, 75.41], [79.0, 80.37], [85.0, 86.36], [89.0, 90.83], [98.0, 99.49], [100.0, 100.18], [105.0, 105.93], [107.0, 108.41], [113.0, 114.39], [117.0, 125.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.09, 0.69, 0.98, 1.19, 1.25, 0.42, 1.64, 0.04, 0.06, 1.54, -0.03, 0.26, 0.92, 1.56, 2.0, 1.43, 1.44, 0.2, 0.95, 0.41, 1.37, 1.36, 1.83, 1.49, 0.18, 0.93, 1.41, 1.39, 8.29]}
annotations_filtered/f3tseBsU248_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 12.48], [29.0, 28.58], [52.0, 52.15], [55.0, 55.19], [55.0, 55.83], [56.0, 56.29], [57.0, 58.24], [61.0, 62.6], [63.0, 63.32], [70.0, 70.04], [75.0, 77.11], [83.0, 84.13], [85.0, 85.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, -0.42, 0.15, 0.19, 0.83, 0.29, 1.24, 1.6, 0.32, 0.04, 2.11, 1.13, 0.02]}
annotations_filtered/f3u4j0hVy8c_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 20.39], [24.0, 42.15], [43.0, 43.73], [44.0, 50.67], [54.0, 54.41], [56.0, 61.38], [64.0, 64.45], [67.0, 67.95], [69.0, 69.33], [71.0, 72.81], [77.0, 78.16], [82.0, 82.68], [84.0, 85.43], [86.0, 86.85], [94.0, 95.86], [98.0, 100.25], [105.0, 106.54], [109.0, 109.86], [112.0, 112.18], [113.0, 113.81], [116.0, 115.79], [116.0, 117.61], [119.0, 120.85], [121.0, 120.93], [121.0, 121.37], [123.0, 123.26], [124.0, 124.48], [127.0, 128.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.72, 45.95, 0.0, 41.07, 0.0, 38.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 65.35], ["didgeridoo", 15.72], ["musical instrument", 3.14]], [["music", 71.26], ["speech", 5.87], ["theremin", 3.15]], null, [["music", 84.93], ["didgeridoo", 7.01], ["musical instrument", 2.44]], null, [["music", 75.91], ["didgeridoo", 6.86], ["theremin", 3.02]], null, null, null, null, null, null, null, null, null, [["whale vocalization", 43.29], ["speech", 18.93], ["music", 11.09]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [15.39, 18.15, 0.73, 6.67, 0.41, 5.38, 0.45, 0.95, 0.33, 1.81, 1.16, 0.68, 1.43, 0.85, 1.86, 2.25, 1.54, 0.86, 0.18, 0.81, -0.21, 1.61, 1.85, -0.07, 0.37, 0.26, 0.48, 1.01]}
annotations_filtered/f48wH7l3c5I_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 6.49], [10.0, 11.08], [13.0, 14.71], [15.0, 18.13], [21.0, 21.63], [29.0, 30.2], [35.0, 35.16], [36.0, 38.18], [39.0, 45.28], [47.0, 57.3], [70.0, 74.75], [78.0, 79.05], [86.0, 90.24], [102.0, 104.18], [106.0, 108.78], [111.0, 116.29]], "keep_status": [false, false, false, false, false, false, false, true, true, false, true, false, true, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 33.39, 0.0, 0.0, 0.0, 30.11, 29.98, 30.67, 31.7, 0.0, 29.76, 32.77, 31.54, 30.76], "audiomae_on_audioset": [null, null, null, [["hum", 27.8], ["mains hum", 23.14], ["speech", 21.49]], null, null, null, [["hum", 19.99], ["mains hum", 10.55], ["sound effect", 9.36]], [["music", 20.18], ["vehicle", 14.5], ["hum", 12.35]], [["music", 60.04], ["synthesizer", 8.21], ["musical instrument", 6.06]], [["music", 45.83], ["hum", 12.53], ["throbbing", 8.43]], null, [["whale vocalization", 19.34], ["sound effect", 11.69], ["echo", 7.1]], [["music", 11.4], ["whale vocalization", 10.92], ["synthesizer", 7.71]], [["buzz", 23.65], ["mains hum", 17.67], ["hum", 11.27]], [["hum", 23.27], ["mains hum", 16.05], ["breaking", 14.76]]], "duration": [1.49, 1.08, 1.71, 3.13, 0.63, 1.2, 0.16, 2.18, 6.28, 10.3, 4.75, 1.05, 4.24, 2.18, 2.78, 5.29]}
annotations_filtered/f4LEgmt0roE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[10.0, 10.86], [18.0, 18.15], [22.0, 22.67], [79.0, 79.25], [88.0, 90.15], [95.0, 94.96], [99.0, 99.71], [106.0, 107.76], [108.0, 108.75]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.15, 0.67, 0.25, 2.15, -0.04, 0.71, 1.76, 0.75]}
annotations_filtered/f4M5MT96FwY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 6.44], [13.0, 13.73], [15.0, 22.2], [34.0, 35.97]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 32.51, 0.0], "audiomae_on_audioset": [null, null, [["music", 27.79], ["hum", 23.02], ["mains hum", 10.1]], null], "duration": [0.44, 0.73, 7.2, 1.97]}
annotations_filtered/f4gmgTebHog_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.94], [6.0, 6.96], [9.0, 25.51], [26.0, 64.93], [69.0, 71.09], [72.0, 74.53], [77.0, 78.68], [80.0, 87.57], [88.0, 89.04], [90.0, 94.95], [99.0, 140.54], [141.0, 155.22], [158.0, 158.57], [162.0, 161.99], [163.0, 164.62], [168.0, 169.67], [174.0, 175.41], [179.0, 180.76], [182.0, 182.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.9, 0.0, 75.23, 55.81, 0.0, 40.31, 0.0, 34.39, 0.0, 30.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.35], ["hum", 9.54], ["sonar", 6.95]], null, null, null, null, [["music", 65.75], ["hum", 8.59], ["throbbing", 4.94]], null, [["music", 73.53], ["musical instrument", 6.1], ["guitar", 2.16]], null, [["music", 80.6], ["theremin", 5.71], ["scary music", 2.48]], null, null, null, null, null, null, null], "duration": [0.94, 0.96, 16.51, 38.93, 2.09, 2.53, 1.68, 7.57, 1.04, 4.95, 41.54, 14.22, 0.57, -0.01, 1.62, 1.67, 1.41, 1.76, 0.28]}
annotations_filtered/f4ojzsvQhh0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 7.97], [11.0, 12.18], [13.0, 13.17], [13.0, 21.95], [24.0, 23.72], [28.0, 30.08], [35.0, 36.53], [42.0, 44.14], [46.0, 47.09], [50.0, 51.8], [55.0, 58.35], [59.0, 61.32], [62.0, 63.36], [66.0, 67.85], [70.0, 72.72]], "keep_status": [false, false, false, true, false, true, false, true, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.05, 0.0, 40.71, 0.0, 37.17, 0.0, 0.0, 37.57, 39.96, 0.0, 0.0, 33.1], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 44.11], ["noise", 14.32], ["throbbing", 6.48]], null, [["hum", 28.59], ["mains hum", 21.8], ["music", 8.83]], null, [["hum", 33.3], ["mains hum", 12.71], ["whale vocalization", 5.35]], null, null, [["music", 22.52], ["hum", 16.29], ["rumble", 11.1]], [["hum", 35.51], ["mains hum", 13.57], ["music", 10.6]], null, null, [["speech", 55.74], ["sidetone", 26.44], ["whale vocalization", 5.12]]], "duration": [0.97, 1.18, 0.17, 8.95, -0.28, 2.08, 1.53, 2.14, 1.09, 1.8, 3.35, 2.32, 1.36, 1.85, 2.72]}
annotations_filtered/f4wQCy4xIyY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[10.0, 12.24], [13.0, 18.15], [19.0, 19.55], [21.0, 20.93], [22.0, 22.35], [23.0, 35.67], [36.0, 37.5], [39.0, 103.57], [105.0, 113.14], [115.0, 128.44]], "keep_status": [true, false, false, false, false, true, false, false, true, true], "silence_prob": [39.0, 51.55, 0.0, 0.0, 0.0, 32.94, 0.0, 0.0, 30.39, 31.29], "audiomae_on_audioset": [[["hum", 14.98], ["music", 9.65], ["mains hum", 4.86]], null, null, null, null, [["whack, thwack", 45.92], ["quack", 8.91], ["speech", 8.16]], null, null, [["music", 44.07], ["electronic music", 13.89], ["synthesizer", 8.07]], [["music", 39.16], ["synthesizer", 9.99], ["car", 7.34]]], "duration": [2.24, 5.15, 0.55, -0.07, 0.35, 12.67, 1.5, 64.57, 8.14, 13.44]}
annotations_filtered/f4wmj-Nq9xA_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 12.26], [13.0, 13.44], [23.0, 22.79], [51.0, 51.49], [66.0, 66.77], [69.0, 69.72], [73.0, 75.57], [77.0, 78.44]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.3, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.26, 0.44, -0.21, 0.49, 0.77, 0.72, 2.57, 1.44]}
annotations_filtered/f4zl3CuJvt8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 3.84], [9.0, 41.89], [43.0, 44.07], [49.0, 53.27], [54.0, 73.11], [75.0, 83.93], [86.0, 89.02], [90.0, 92.04], [93.0, 98.49], [102.0, 108.31], [111.0, 111.05], [112.0, 112.53], [126.0, 137.17], [139.0, 139.29], [140.0, 144.24], [146.0, 147.41], [148.0, 150.18], [152.0, 166.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.6, 30.81, 58.13, 99.36, 89.19, 79.07, 36.88, 0.0, 0.0, 31.9, 0.0, 72.75, 0.0, 90.08, 32.37], "audiomae_on_audioset": [null, null, null, [["music", 30.72], ["throbbing", 21.43], ["hum", 20.26]], [["cattle, bovinae", 34.71], ["livestock, farm animals, working animals", 23.24], ["moo", 20.93]], null, null, null, null, [["music", 70.31], ["hum", 4.57], ["synthesizer", 4.0]], null, null, [["music", 63.22], ["didgeridoo", 6.42], ["synthesizer", 4.16]], null, null, null, null, [["music", 66.84], ["didgeridoo", 4.72], ["musical instrument", 3.75]]], "duration": [-0.16, 32.89, 1.07, 4.27, 19.11, 8.93, 3.02, 2.04, 5.49, 6.31, 0.05, 0.53, 11.17, 0.29, 4.24, 1.41, 2.18, 14.87]}
annotations_filtered/f505OHOUHoU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[97.0, 101.71], [107.0, 113.88], [116.0, 117.27], [119.0, 124.16], [126.0, 127.52]], "keep_status": [true, true, false, true, false], "silence_prob": [43.61, 45.05, 0.0, 38.15, 0.0], "audiomae_on_audioset": [[["music", 29.75], ["didgeridoo", 14.16], ["hum", 10.71]], [["music", 23.03], ["hum", 15.28], ["whale vocalization", 10.38]], null, [["music", 44.99], ["sonar", 7.4], ["electronic music", 6.32]], null], "duration": [4.71, 6.88, 1.27, 5.16, 1.52]}
annotations_filtered/f57Vat6YZUI_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 3.57], [8.0, 9.15], [12.0, 13.76], [18.0, 18.82], [22.0, 24.71], [26.0, 26.43], [31.0, 31.67], [44.0, 52.08], [54.0, 62.4], [64.0, 87.49], [92.0, 96.55], [99.0, 107.64], [108.0, 120.45], [124.0, 145.62], [147.0, 148.91]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.47, 0.0, 0.0, 32.99, 32.11, 32.18, 31.72, 31.8, 31.43, 30.86, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 31.73], ["hum", 20.46], ["mains hum", 17.22]], null, null, [["music", 42.8], ["hum", 25.81], ["throbbing", 16.19]], [["music", 81.6], ["singing", 0.98], ["music of bollywood", 0.9]], [["music", 80.16], ["throbbing", 3.88], ["hum", 2.89]], [["music", 58.77], ["throbbing", 5.17], ["hum", 4.6]], [["music", 46.69], ["hum", 11.18], ["mains hum", 7.27]], [["music", 64.44], ["hum", 9.92], ["throbbing", 8.0]], [["music", 87.48], ["musical instrument", 0.98], ["carnatic music", 0.73]], null], "duration": [1.57, 1.15, 1.76, 0.82, 2.71, 0.43, 0.67, 8.08, 8.4, 23.49, 4.55, 8.64, 12.45, 21.62, 1.91]}
annotations_filtered/f58Ba78abHg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 5.98], [6.0, 7.59], [9.0, 9.26], [15.0, 16.97], [19.0, 26.18], [27.0, 28.34], [32.0, 36.71], [38.0, 43.04], [44.0, 45.96], [47.0, 48.9], [50.0, 50.84], [53.0, 54.55], [58.0, 58.72], [59.0, 76.18], [77.0, 78.63]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 50.61, 0.0, 49.0, 58.81, 0.0, 0.0, 0.0, 0.0, 0.0, 32.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 24.26], ["gong", 23.41], ["singing bowl", 16.74]], null, null, null, null, null, null, [["music", 49.09], ["synthesizer", 13.45], ["ambient music", 7.68]], null], "duration": [0.98, 1.59, 0.26, 1.97, 7.18, 1.34, 4.71, 5.04, 1.96, 1.9, 0.84, 1.55, 0.72, 17.18, 1.63]}
annotations_filtered/f5e73A39TF4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.81], [5.0, 5.88], [20.0, 23.33], [26.0, 26.81], [32.0, 33.76], [35.0, 36.12], [40.0, 41.5], [49.0, 50.3], [51.0, 52.41], [57.0, 56.88], [60.0, 60.61], [64.0, 65.92], [74.0, 75.93], [77.0, 79.84], [100.0, 100.97], [106.0, 106.12], [107.0, 107.28], [110.0, 111.42], [115.0, 116.46], [121.0, 123.5], [126.0, 125.91], [129.0, 131.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.88, 3.33, 0.81, 1.76, 1.12, 1.5, 1.3, 1.41, -0.12, 0.61, 1.92, 1.93, 2.84, 0.97, 0.12, 0.28, 1.42, 1.46, 2.5, -0.09, 2.41]}
annotations_filtered/f5f86alm7jk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.52], [7.0, 7.25], [9.0, 9.17], [11.0, 11.26], [12.0, 12.77], [15.0, 16.09], [18.0, 18.54], [19.0, 22.23], [26.0, 28.51], [29.0, 33.03], [36.0, 36.54], [39.0, 40.39], [55.0, 56.2], [57.0, 57.94], [59.0, 61.69], [62.0, 63.51], [71.0, 71.52], [80.0, 83.07], [85.0, 85.43], [89.0, 88.7], [104.0, 104.35], [107.0, 107.79], [110.0, 111.03], [114.0, 114.86], [117.0, 117.69], [118.0, 119.75], [122.0, 123.92], [125.0, 126.5], [128.0, 128.78]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.36, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["thunk", 24.79], ["speech", 18.16], ["boing", 16.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.25, 0.17, 0.26, 0.77, 1.09, 0.54, 3.23, 2.51, 4.03, 0.54, 1.39, 1.2, 0.94, 2.69, 1.51, 0.52, 3.07, 0.43, -0.3, 0.35, 0.79, 1.03, 0.86, 0.69, 1.75, 1.92, 1.5, 0.78]}
annotations_filtered/f5mcMmE3RL8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 33.71], [35.0, 201.43], [202.0, 210.61], [212.0, 212.75]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 41.09, 0.0], "audiomae_on_audioset": [null, null, [["music", 35.85], ["didgeridoo", 20.38], ["mains hum", 6.89]], null], "duration": [30.71, 166.43, 8.61, 0.75]}
annotations_filtered/f5umSa_YYX0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 4.11], [6.0, 8.01], [12.0, 20.82], [22.0, 27.48], [34.0, 35.38], [46.0, 47.65], [57.0, 57.79], [61.0, 62.34], [82.0, 82.36], [84.0, 90.48], [92.0, 92.75], [93.0, 93.7], [96.0, 97.92], [98.0, 99.54], [100.0, 102.69], [105.0, 106.54], [107.0, 107.6], [108.0, 109.85], [110.0, 110.96], [112.0, 113.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.88, 100.0, 99.93, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.11, 2.01, 8.82, 5.48, 1.38, 1.65, 0.79, 1.34, 0.36, 6.48, 0.75, 0.7, 1.92, 1.54, 2.69, 1.54, 0.6, 1.85, 0.96, 1.8]}
annotations_filtered/f6DDYCf80hw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[9.0, 10.23], [14.0, 14.45], [16.0, 17.83], [19.0, 18.84], [21.0, 26.25], [30.0, 30.75], [33.0, 34.3], [36.0, 48.93], [50.0, 54.9], [56.0, 57.97], [59.0, 62.55], [64.0, 65.33], [69.0, 82.44], [84.0, 91.71], [96.0, 114.64], [117.0, 120.07], [124.0, 144.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 70.58, 0.0, 0.0, 78.04, 77.36, 0.0, 74.76, 0.0, 50.76, 42.58, 36.94, 31.15, 38.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.71], ["music", 9.21], ["throbbing", 7.89]], [["speech", 49.38], ["music", 18.35], ["beatboxing", 6.0]], [["speech", 30.85], ["music", 11.07], ["didgeridoo", 4.9]], [["speech", 52.62], ["music", 11.98], ["hum", 9.68]]], "duration": [1.23, 0.45, 1.83, -0.16, 5.25, 0.75, 1.3, 12.93, 4.9, 1.97, 3.55, 1.33, 13.44, 7.71, 18.64, 3.07, 20.21]}
annotations_filtered/f6Dan7z0p4c_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []}
annotations_filtered/f6F6MzMT2g8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 12.09], [13.0, 16.93], [18.0, 18.32], [19.0, 21.0], [24.0, 27.57], [28.0, 31.51], [35.0, 34.82], [43.0, 44.64], [46.0, 48.1], [57.0, 63.44], [72.0, 72.12], [74.0, 75.52], [78.0, 78.16], [80.0, 79.96], [82.0, 84.06], [92.0, 91.69], [95.0, 94.95], [96.0, 100.28], [113.0, 113.43], [114.0, 118.67], [120.0, 121.12], [122.0, 123.35], [126.0, 126.2], [130.0, 130.15], [144.0, 144.64]], "keep_status": [true, true, false, true, true, true, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [33.03, 32.04, 0.0, 44.72, 37.2, 38.27, 0.0, 0.0, 35.5, 34.92, 0.0, 0.0, 0.0, 0.0, 35.03, 0.0, 0.0, 32.3, 0.0, 35.62, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.26], ["speech", 20.99], ["throbbing", 11.58]], [["music", 43.75], ["speech", 15.22], ["hum", 3.44]], null, [["speech", 20.27], ["music", 14.68], ["fly, housefly", 7.36]], [["music", 19.69], ["foghorn", 18.88], ["speech", 10.07]], [["music", 30.89], ["speech", 26.63], ["radio", 7.85]], null, null, [["music", 55.66], ["speech", 10.33], ["musical instrument", 3.42]], [["music", 63.02], ["throbbing", 5.72], ["noise", 5.58]], null, null, null, null, [["music", 74.66], ["synthesizer", 10.35], ["musical instrument", 4.21]], null, null, [["music", 38.66], ["speech", 17.93], ["hum", 11.79]], null, [["speech", 36.69], ["music", 28.19], ["hum", 9.87]], null, null, null, null, null], "duration": [6.09, 3.93, 0.32, 2.0, 3.57, 3.51, -0.18, 1.64, 2.1, 6.44, 0.12, 1.52, 0.16, -0.04, 2.06, -0.31, -0.05, 4.28, 0.43, 4.67, 1.12, 1.35, 0.2, 0.15, 0.64]}
annotations_filtered/f6hhVIV_LPs_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 5.43], [11.0, 12.28], [14.0, 14.74], [16.0, 16.53], [17.0, 17.25], [20.0, 20.09], [22.0, 21.93], [25.0, 25.32], [26.0, 27.31], [29.0, 29.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [78.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [2.43, 1.28, 0.74, 0.53, 0.25, 0.09, -0.07, 0.32, 1.31, 0.29]}
annotations_filtered/f6m4J0AfEOo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[23.0, 24.38], [26.0, 28.19], [30.0, 31.73], [32.0, 32.48], [32.0, 32.51], [33.0, 32.54], [33.0, 32.58], [33.0, 32.61], [33.0, 32.64], [33.0, 32.68], [33.0, 32.71], [33.0, 32.75], [33.0, 32.78], [33.0, 32.81], [33.0, 33.24], [33.0, 33.27], [35.0, 36.76], [38.0, 38.23], [41.0, 47.22], [48.0, 48.68], [53.0, 58.33], [59.0, 58.72], [66.0, 72.57], [74.0, 74.56], [78.0, 78.49], [83.0, 83.84], [91.0, 91.62], [93.0, 93.6]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.05, 0.0, 50.61, 0.0, 82.79, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 7.73], ["moo", 6.22], ["vehicle", 5.84]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.59], ["buzz", 6.8], ["musical instrument", 5.8]], null, null, null, null, null, null, null, null, null], "duration": [1.38, 2.19, 1.73, 0.48, 0.51, -0.46, -0.42, -0.39, -0.36, -0.32, -0.29, -0.25, -0.22, -0.19, 0.24, 0.27, 1.76, 0.23, 6.22, 0.68, 5.33, -0.28, 6.57, 0.56, 0.49, 0.84, 0.62, 0.6]}