bpiyush commited on
Commit
a271ceb
·
1 Parent(s): 092fdf5
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. annotations_filtered/c--eNhRG5B4_filtered.json +1 -0
  2. annotations_filtered/c-NDI-HvYd4_filtered.json +1 -0
  3. annotations_filtered/c-ecbGNxEHM_filtered.json +1 -0
  4. annotations_filtered/c-ej3IOxBno_filtered.json +1 -0
  5. annotations_filtered/c-jOeDA-X0k_filtered.json +1 -0
  6. annotations_filtered/c-tGV96ceBM_filtered.json +1 -0
  7. annotations_filtered/c-unYxWW6ws_filtered.json +1 -0
  8. annotations_filtered/c-veUs6bPHY_filtered.json +1 -0
  9. annotations_filtered/c-zaHGYURv0_filtered.json +1 -0
  10. annotations_filtered/c0-3FQ-_SAg_filtered.json +1 -0
  11. annotations_filtered/c0JxgKT4jZc_filtered.json +1 -0
  12. annotations_filtered/c0N60xOU9yk_filtered.json +1 -0
  13. annotations_filtered/c0RlK3VAmzg_filtered.json +1 -0
  14. annotations_filtered/c0XTkj3PIWg_filtered.json +1 -0
  15. annotations_filtered/c0wH6YDfCzg_filtered.json +1 -0
  16. annotations_filtered/c17KWinVFss_filtered.json +1 -0
  17. annotations_filtered/c1EyN9xTK94_filtered.json +1 -0
  18. annotations_filtered/c1nmARXTuvE_filtered.json +1 -0
  19. annotations_filtered/c2HEnbmtknM_filtered.json +1 -0
  20. annotations_filtered/c2HZzrcEbZc_filtered.json +1 -0
  21. annotations_filtered/c2TcT9JairA_filtered.json +1 -0
  22. annotations_filtered/c2ecZiVEs70_filtered.json +1 -0
  23. annotations_filtered/c2k_kuU84ro_filtered.json +1 -0
  24. annotations_filtered/c2tWZFAL5t4_filtered.json +1 -0
  25. annotations_filtered/c35RsjYzAhY_filtered.json +1 -0
  26. annotations_filtered/c38HJR-9vhU_filtered.json +1 -0
  27. annotations_filtered/c3nJu9SBkis_filtered.json +1 -0
  28. annotations_filtered/c3uOWTAuaTQ_filtered.json +1 -0
  29. annotations_filtered/c3vmsUcknhY_filtered.json +1 -0
  30. annotations_filtered/c3zRfKmcqv8_filtered.json +1 -0
  31. annotations_filtered/c4Wls5pZlxQ_filtered.json +1 -0
  32. annotations_filtered/c4X58OjlVPo_filtered.json +1 -0
  33. annotations_filtered/c4ibjfBu1IY_filtered.json +1 -0
  34. annotations_filtered/c4ux2NclHoE_filtered.json +1 -0
  35. annotations_filtered/c4w-IE-Hsqc_filtered.json +1 -0
  36. annotations_filtered/c5BJJbtFP4E_filtered.json +1 -0
  37. annotations_filtered/c5Re3lGYUA0_filtered.json +1 -0
  38. annotations_filtered/c5WfxwnLlLU_filtered.json +1 -0
  39. annotations_filtered/c5ZiiE8fyGk_filtered.json +1 -0
  40. annotations_filtered/c5mAaBl_qqk_filtered.json +1 -0
  41. annotations_filtered/c5zKpr5gmgk_filtered.json +1 -0
  42. annotations_filtered/c6XHLe94SJA_filtered.json +1 -0
  43. annotations_filtered/c6dmj-WpTW4_filtered.json +1 -0
  44. annotations_filtered/c6ik-AA87Uo_filtered.json +1 -0
  45. annotations_filtered/c6mLa5_GvCQ_filtered.json +1 -0
  46. annotations_filtered/c7-u-fyUSkM_filtered.json +1 -0
  47. annotations_filtered/c77JrXbqqV0_filtered.json +1 -0
  48. annotations_filtered/c7AescgZzEg_filtered.json +1 -0
  49. annotations_filtered/c7RyGNzyGB4_filtered.json +1 -0
  50. annotations_filtered/c7tvfdSjRE4_filtered.json +1 -0
annotations_filtered/c--eNhRG5B4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[13.0, 12.75], [16.0, 17.24], [21.0, 24.0], [27.0, 27.03], [28.0, 29.71], [33.0, 33.18], [34.0, 34.3], [36.0, 38.08], [38.0, 38.84], [40.0, 40.02], [40.0, 40.66], [42.0, 45.32], [46.0, 46.75], [48.0, 47.97], [52.0, 53.87], [55.0, 57.06], [58.0, 58.99], [61.0, 61.5], [62.0, 64.79], [65.0, 68.23], [71.0, 75.93], [83.0, 86.93], [99.0, 99.99], [114.0, 130.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 50.86, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 75.55, 42.84, 34.5, 30.4, 0.0, 30.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.76], ["speech", 30.82], ["musical instrument", 4.26]], [["music", 38.03], ["effects unit", 9.21], ["musical instrument", 6.73]], [["music", 69.33], ["effects unit", 4.15], ["musical instrument", 3.77]], null, [["music", 43.41], ["effects unit", 9.97], ["theremin", 5.91]]], "duration": [-0.25, 1.24, 3.0, 0.03, 1.71, 0.18, 0.3, 2.08, 0.84, 0.02, 0.66, 3.32, 0.75, -0.03, 1.87, 2.06, 0.99, 0.5, 2.79, 3.23, 4.93, 3.93, 0.99, 16.59]}
annotations_filtered/c-NDI-HvYd4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[17.0, 17.95], [20.0, 29.0], [32.0, 51.93], [58.0, 113.16], [116.0, 128.36], [131.0, 131.84]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 30.7, 30.3, 0.0, 29.33, 0.0], "audiomae_on_audioset": [null, [["music", 67.8], ["speech", 8.21], ["musical instrument", 2.94]], [["speech", 38.27], ["buzz", 26.84], ["music", 15.7]], null, [["fly, housefly", 36.74], ["mosquito", 21.11], ["insect", 20.32]], null], "duration": [0.95, 9.0, 19.93, 55.16, 12.36, 0.84]}
annotations_filtered/c-ecbGNxEHM_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[17.0, 17.2], [21.0, 22.96], [23.0, 29.19], [35.0, 35.72], [39.0, 39.14], [39.0, 40.53], [41.0, 43.6], [45.0, 45.49], [47.0, 47.95], [60.0, 68.1], [75.0, 75.69], [79.0, 79.73], [81.0, 82.59], [87.0, 91.89], [95.0, 99.23], [101.0, 101.76], [103.0, 103.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 34.29, 0.0, 0.0, 0.0, 55.81, 0.0, 0.0, 41.7, 0.0, 0.0, 0.0, 38.05, 34.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 67.49], ["theremin", 7.38], ["ambient music", 6.2]], null, null, null, null, null, null, [["throbbing", 55.09], ["hum", 19.79], ["heart sounds, heartbeat", 7.4]], null, null, null, [["speech", 53.0], ["music", 12.31], ["hum", 5.12]], [["speech", 34.19], ["sidetone", 12.52], ["hum", 6.99]], null, null], "duration": [0.2, 1.96, 6.19, 0.72, 0.14, 1.53, 2.6, 0.49, 0.95, 8.1, 0.69, 0.73, 1.59, 4.89, 4.23, 0.76, 0.67]}
annotations_filtered/c-ej3IOxBno_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 2.4], [3.0, 4.48], [8.0, 8.43], [10.0, 11.2], [12.0, 14.22], [15.0, 16.92], [19.0, 20.61], [22.0, 29.84], [32.0, 32.86]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.4, 1.48, 0.43, 1.2, 2.22, 1.92, 1.61, 7.84, 0.86]}
annotations_filtered/c-jOeDA-X0k_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 4.01], [6.0, 8.02], [9.0, 10.27], [13.0, 15.62], [17.0, 33.62], [35.0, 35.18], [39.0, 39.5], [41.0, 43.31], [44.0, 44.9], [46.0, 50.67], [52.0, 51.7], [55.0, 56.03], [60.0, 66.87], [67.0, 70.11], [74.0, 75.52], [77.0, 77.16], [79.0, 78.78], [80.0, 81.67], [84.0, 84.87], [86.0, 86.27], [91.0, 114.71], [117.0, 117.37], [119.0, 119.94]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 99.71, 0.0, 99.44, 41.01, 0.0, 0.0, 35.32, 0.0, 39.64, 0.0, 0.0, 32.96, 36.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.92, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 62.67], ["music", 7.16], ["bouncing", 5.57]], null, null, [["didgeridoo", 52.55], ["mains hum", 10.61], ["sidetone", 6.89]], null, [["speech", 23.69], ["music", 22.55], ["mains hum", 10.27]], null, null, [["music", 31.26], ["didgeridoo", 30.99], ["hum", 6.33]], [["didgeridoo", 25.35], ["music", 18.32], ["speech", 15.31]], null, null, null, null, null, null, [["speech", 41.82], ["music", 18.51], ["effects unit", 5.27]], null, null], "duration": [1.01, 2.02, 1.27, 2.62, 16.62, 0.18, 0.5, 2.31, 0.9, 4.67, -0.3, 1.03, 6.87, 3.11, 1.52, 0.16, -0.22, 1.67, 0.87, 0.27, 23.71, 0.37, 0.94]}
annotations_filtered/c-tGV96ceBM_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[10.0, 13.42], [14.0, 15.53], [16.0, 18.96], [20.0, 21.86], [25.0, 25.95], [32.0, 32.61], [33.0, 33.64], [36.0, 35.92], [39.0, 39.82], [42.0, 43.38], [50.0, 51.44], [52.0, 55.05], [56.0, 56.64], [58.0, 58.5], [60.0, 62.28], [65.0, 65.37], [71.0, 71.19], [71.0, 72.84], [76.0, 76.05], [77.0, 78.06], [83.0, 84.25], [86.0, 98.07], [100.0, 102.24], [104.0, 105.31], [106.0, 106.81], [109.0, 109.53], [111.0, 111.91], [113.0, 114.42], [115.0, 118.66], [119.0, 121.22], [122.0, 134.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [81.35, 0.0, 76.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 45.4, 97.22, 99.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.58], ["rumble", 13.13], ["hum", 10.9]], null, null], "duration": [3.42, 1.53, 2.96, 1.86, 0.95, 0.61, 0.64, -0.08, 0.82, 1.38, 1.44, 3.05, 0.64, 0.5, 2.28, 0.37, 0.19, 1.84, 0.05, 1.06, 1.25, 12.07, 2.24, 1.31, 0.81, 0.53, 0.91, 1.42, 3.66, 2.22, 12.64]}
annotations_filtered/c-unYxWW6ws_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 8.02], [9.0, 9.66], [10.0, 13.51], [14.0, 14.96], [16.0, 18.35], [21.0, 23.38], [25.0, 26.2], [27.0, 28.95], [30.0, 30.92], [32.0, 31.95], [33.0, 33.91], [35.0, 41.1], [43.0, 46.47], [48.0, 54.46], [56.0, 57.52], [59.0, 61.69], [65.0, 67.83], [70.0, 71.98], [74.0, 75.63], [85.0, 88.65], [95.0, 99.87], [102.0, 103.52], [105.0, 109.58], [115.0, 119.06], [121.0, 122.32], [129.0, 132.76], [136.0, 138.67], [141.0, 144.51], [146.0, 150.43], [151.0, 152.85], [155.0, 157.08], [159.0, 159.9], [161.0, 166.04], [168.0, 174.8]], "keep_status": [true, false, true, false, true, true, false, false, false, false, false, true, true, true, false, true, true, false, false, true, false, false, false, true, false, true, true, true, true, false, false, false, false, false], "silence_prob": [41.34, 0.0, 39.72, 0.0, 48.31, 42.02, 0.0, 0.0, 0.0, 0.0, 0.0, 46.64, 44.87, 47.05, 0.0, 38.38, 41.32, 0.0, 0.0, 40.02, 38.28, 0.0, 40.99, 46.9, 0.0, 48.23, 39.15, 41.7, 38.84, 0.0, 39.94, 0.0, 36.8, 33.54], "audiomae_on_audioset": [[["hum", 25.59], ["mains hum", 12.82], ["throbbing", 8.37]], null, [["hum", 22.11], ["speech", 19.54], ["whale vocalization", 9.24]], null, [["hum", 35.17], ["throbbing", 11.11], ["music", 9.26]], [["music", 13.88], ["hum", 10.59], ["speech", 10.52]], null, null, null, null, null, [["rumble", 21.42], ["speech", 11.46], ["hum", 7.3]], [["speech", 43.64], ["hum", 13.17], ["rumble", 11.67]], [["music", 53.9], ["musical instrument", 4.2], ["theremin", 2.81]], null, [["music", 55.9], ["hum", 6.92], ["throbbing", 5.41]], [["music", 37.45], ["speech", 17.61], ["hum", 4.22]], null, null, [["music", 36.08], ["speech", 16.53], ["synthesizer", 3.43]], [["music", 61.53], ["ambient music", 7.05], ["harmonic", 4.26]], null, [["music", 50.05], ["ambient music", 16.0], ["whale vocalization", 6.53]], [["speech", 57.09], ["field recording", 6.19], ["rumble", 5.5]], null, [["speech", 16.8], ["fire", 6.47], ["vehicle", 6.14]], [["speech", 25.43], ["music", 21.33], ["hum", 20.62]], [["music", 35.49], ["hum", 7.98], ["electronic music", 5.13]], [["music", 49.43], ["didgeridoo", 5.18], ["speech", 5.13]], null, [["music", 48.16], ["synthesizer", 18.3], ["ambient music", 7.19]], null, [["music", 71.4], ["musical instrument", 3.32], ["gong", 3.0]], [["music", 64.7], ["musical instrument", 5.76], ["guitar", 4.98]]], "duration": [7.02, 0.66, 3.51, 0.96, 2.35, 2.38, 1.2, 1.95, 0.92, -0.05, 0.91, 6.1, 3.47, 6.46, 1.52, 2.69, 2.83, 1.98, 1.63, 3.65, 4.87, 1.52, 4.58, 4.06, 1.32, 3.76, 2.67, 3.51, 4.43, 1.85, 2.08, 0.9, 5.04, 6.8]}
annotations_filtered/c-veUs6bPHY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[0.0, 0.3], [0.0, 7.47], [9.0, 9.39], [12.0, 12.72], [14.0, 16.11], [22.0, 22.72], [24.0, 25.25], [32.0, 32.14], [37.0, 37.77], [38.0, 38.96], [40.0, 40.53], [51.0, 51.8], [52.0, 54.72], [66.0, 67.61], [69.0, 74.68], [76.0, 79.05], [81.0, 81.38], [82.0, 82.43], [83.0, 83.91], [92.0, 94.73], [97.0, 97.56], [103.0, 103.84], [109.0, 110.22], [111.0, 112.51], [113.0, 116.55], [131.0, 131.28]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 34.93, 0.0, 0.0, 36.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.08, 0.0, 33.67, 35.12, 0.0, 0.0, 0.0, 33.54, 0.0, 0.0, 0.0, 0.0, 34.82, 0.0], "audiomae_on_audioset": [null, [["noise", 46.75], ["hum", 6.66], ["whale vocalization", 5.04]], null, null, [["sine wave", 23.79], ["hum", 11.84], ["chirp tone", 8.58]], null, null, null, null, null, null, null, [["hum", 20.66], ["music", 17.31], ["speech", 14.34]], null, [["speech", 44.64], ["hum", 12.75], ["mains hum", 8.95]], [["hum", 45.97], ["mains hum", 19.85], ["throbbing", 12.65]], null, null, null, [["speech", 55.32], ["hum", 8.2], ["bee, wasp, etc.", 5.57]], null, null, null, null, [["hum", 52.14], ["mains hum", 23.69], ["throbbing", 17.08]], null], "duration": [0.3, 7.47, 0.39, 0.72, 2.11, 0.72, 1.25, 0.14, 0.77, 0.96, 0.53, 0.8, 2.72, 1.61, 5.68, 3.05, 0.38, 0.43, 0.91, 2.73, 0.56, 0.84, 1.22, 1.51, 3.55, 0.28]}
annotations_filtered/c-zaHGYURv0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 0.97], [1.0, 1.04], [5.0, 5.97], [11.0, 11.01], [12.0, 21.05], [22.0, 23.21], [28.0, 28.75], [32.0, 36.41], [37.0, 52.0], [54.0, 54.62], [55.0, 56.67], [60.0, 62.29], [64.0, 64.77], [65.0, 76.45], [78.0, 84.28], [91.0, 94.19], [95.0, 96.67], [98.0, 98.9], [101.0, 104.87], [107.0, 106.76], [107.0, 106.83], [107.0, 114.37], [115.0, 115.75], [117.0, 117.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 72.6, 0.0, 0.0, 43.2, 51.5, 0.0, 0.0, 69.61, 0.0, 45.3, 41.98, 61.87, 0.0, 0.0, 62.89, 0.0, 0.0, 31.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["mains hum", 48.17], ["hum", 29.27], ["speech", 4.95]], null, null, null, null, null, [["music", 56.67], ["musical instrument", 4.75], ["marimba, xylophone", 4.21]], [["music", 34.11], ["mains hum", 18.6], ["hum", 17.31]], null, null, null, null, null, null, [["mains hum", 36.41], ["hum", 16.38], ["music", 14.0]], null, null], "duration": [-0.03, 0.04, 0.97, 0.01, 9.05, 1.21, 0.75, 4.41, 15.0, 0.62, 1.67, 2.29, 0.77, 11.45, 6.28, 3.19, 1.67, 0.9, 3.87, -0.24, -0.17, 7.37, 0.75, 0.76]}
annotations_filtered/c0-3FQ-_SAg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 8.78], [10.0, 11.18], [17.0, 68.39], [69.0, 70.58], [73.0, 77.23], [80.0, 89.04], [93.0, 93.75], [96.0, 120.38], [123.0, 124.38], [129.0, 132.0], [133.0, 137.12], [139.0, 139.36], [140.0, 149.71]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.95, 31.52, 0.0, 29.68, 0.0, 78.38, 53.97, 0.0, 41.03], "audiomae_on_audioset": [null, null, null, null, [["fart", 37.84], ["sound effect", 10.16], ["groan", 9.5]], [["speech", 82.77], ["didgeridoo", 2.49], ["music", 1.61]], null, [["music", 24.27], ["livestock, farm animals, working animals", 15.7], ["speech", 12.7]], null, null, null, null, [["music", 65.3], ["speech", 11.15], ["thunk", 3.98]]], "duration": [0.78, 1.18, 51.39, 1.58, 4.23, 9.04, 0.75, 24.38, 1.38, 3.0, 4.12, 0.36, 9.71]}
annotations_filtered/c0JxgKT4jZc_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[31.0, 66.31], [68.0, 79.14], [81.0, 83.56]], "keep_status": [false, false, false], "silence_prob": [0.0, 99.1, 98.66], "audiomae_on_audioset": [null, null, null], "duration": [35.31, 11.14, 2.56]}
annotations_filtered/c0N60xOU9yk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[14.0, 14.82], [19.0, 21.14], [26.0, 26.4], [29.0, 29.54], [32.0, 31.7], [38.0, 38.15], [40.0, 41.18], [44.0, 45.37], [51.0, 52.27], [53.0, 54.19], [58.0, 58.04], [59.0, 59.02], [61.0, 61.43], [63.0, 62.78], [68.0, 68.88], [72.0, 72.81], [85.0, 84.69], [88.0, 88.59], [106.0, 106.07], [111.0, 113.14], [114.0, 114.76], [121.0, 120.66], [124.0, 127.13], [129.0, 129.3], [133.0, 133.22], [134.0, 134.32], [139.0, 139.68], [141.0, 141.74], [160.0, 160.3], [163.0, 168.47], [169.0, 172.64], [174.0, 176.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 59.96, 72.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.82, 2.14, 0.4, 0.54, -0.3, 0.15, 1.18, 1.37, 1.27, 1.19, 0.04, 0.02, 0.43, -0.22, 0.88, 0.81, -0.31, 0.59, 0.07, 2.14, 0.76, -0.34, 3.13, 0.3, 0.22, 0.32, 0.68, 0.74, 0.3, 5.47, 3.64, 2.32]}
annotations_filtered/c0RlK3VAmzg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 11.37], [16.0, 16.11], [17.0, 17.25], [24.0, 24.38], [26.0, 26.4], [34.0, 35.7], [37.0, 40.95], [42.0, 42.92], [53.0, 52.86], [53.0, 61.5], [63.0, 66.09], [68.0, 70.75], [71.0, 71.52], [96.0, 98.19], [106.0, 106.52], [125.0, 126.91]], "keep_status": [true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [42.81, 0.0, 0.0, 0.0, 0.0, 0.0, 49.31, 0.0, 0.0, 33.09, 99.16, 68.54, 0.0, 78.21, 0.0, 0.0], "audiomae_on_audioset": [[["sine wave", 12.59], ["hum", 11.63], ["throbbing", 10.25]], null, null, null, null, null, [["music", 54.09], ["speech", 10.06], ["hum", 4.92]], null, null, [["speech", 23.18], ["fart", 14.34], ["sidetone", 12.2]], null, null, null, null, null, null], "duration": [4.37, 0.11, 0.25, 0.38, 0.4, 1.7, 3.95, 0.92, -0.14, 8.5, 3.09, 2.75, 0.52, 2.19, 0.52, 1.91]}
annotations_filtered/c0XTkj3PIWg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 6.22], [22.0, 27.99], [29.0, 29.96], [34.0, 34.87], [36.0, 37.4], [38.0, 39.87], [41.0, 43.34], [45.0, 45.81], [50.0, 53.7], [55.0, 55.73], [56.0, 61.94], [65.0, 64.66], [65.0, 66.61], [67.0, 68.17], [80.0, 80.62], [81.0, 81.48], [83.0, 84.48], [88.0, 87.81], [99.0, 101.78], [103.0, 116.92], [117.0, 126.32], [127.0, 126.71], [129.0, 129.22], [131.0, 131.77], [133.0, 133.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 53.72, 0.0, 0.0, 0.0, 0.0, 57.01, 0.0, 64.07, 0.0, 57.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.14, 42.6, 48.1, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.73], ["thunk", 7.88], ["boing", 7.15]], [["music", 61.73], ["hum", 10.22], ["synthesizer", 4.69]], [["music", 35.0], ["speech", 11.13], ["fly, housefly", 7.93]], null, null, null, null], "duration": [0.22, 5.99, 0.96, 0.87, 1.4, 1.87, 2.34, 0.81, 3.7, 0.73, 5.94, -0.34, 1.61, 1.17, 0.62, 0.48, 1.48, -0.19, 2.78, 13.92, 9.32, -0.29, 0.22, 0.77, 0.08]}
annotations_filtered/c0wH6YDfCzg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.88], [8.0, 8.34], [11.0, 11.77], [13.0, 13.83], [15.0, 15.26], [17.0, 28.11], [30.0, 31.41], [35.0, 38.75], [39.0, 48.24], [49.0, 51.06], [58.0, 59.49], [73.0, 80.32], [85.0, 99.13], [103.0, 124.33], [127.0, 127.62], [133.0, 133.78], [138.0, 139.19], [144.0, 145.86], [151.0, 152.44], [157.0, 158.68], [167.0, 168.62]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, true, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 47.27, 34.88, 36.3, 0.0, 33.95, 37.24, 38.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 20.05], ["mains hum", 9.61], ["music", 7.84]], [["speech", 57.77], ["noise", 10.01], ["buzz", 8.07]], [["speech", 31.54], ["radio", 14.36], ["fly, housefly", 3.99]], null, [["mains hum", 22.85], ["hum", 19.54], ["buzz", 14.76]], [["music", 49.33], ["theremin", 11.1], ["buzz", 4.6]], [["music", 48.34], ["brass instrument", 13.65], ["wind instrument, woodwind instrument", 6.42]], null, null, null, null, null, null, null], "duration": [0.88, 0.34, 0.77, 0.83, 0.26, 11.11, 1.41, 3.75, 9.24, 2.06, 1.49, 7.32, 14.13, 21.33, 0.62, 0.78, 1.19, 1.86, 1.44, 1.68, 1.62]}
annotations_filtered/c17KWinVFss_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 11.77], [12.0, 13.88], [15.0, 16.36], [19.0, 20.26], [21.0, 21.24], [22.0, 24.06], [30.0, 30.06], [31.0, 31.46], [34.0, 34.59], [37.0, 38.28], [40.0, 41.96], [43.0, 44.9], [49.0, 81.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.25, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.77, 1.88, 1.36, 1.26, 0.24, 2.06, 0.06, 0.46, 0.59, 1.28, 1.96, 1.9, 32.97]}
annotations_filtered/c1EyN9xTK94_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[19.0, 19.01], [21.0, 21.29], [23.0, 23.92], [25.0, 25.35], [27.0, 27.08], [28.0, 28.73], [30.0, 30.47], [40.0, 43.11], [45.0, 45.23], [50.0, 50.94], [55.0, 55.85], [56.0, 58.82]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.21, 0.0, 0.0, 0.0, 84.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["tuning fork", 22.47], ["music", 18.33], ["chirp tone", 15.55]], null, null, null, null], "duration": [0.01, 0.29, 0.92, 0.35, 0.08, 0.73, 0.47, 3.11, 0.23, 0.94, 0.85, 2.82]}
annotations_filtered/c1nmARXTuvE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 7.65], [11.0, 12.63], [18.0, 19.08], [24.0, 29.15], [30.0, 32.61], [37.0, 37.13], [40.0, 42.84], [45.0, 46.41], [52.0, 58.68], [59.0, 62.29], [63.0, 65.4], [72.0, 79.39], [81.0, 84.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.26, 99.98, 0.0, 99.78, 0.0, 100.0, 86.64, 48.91, 93.6, 85.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 17.84], ["fly, housefly", 17.39], ["sine wave", 12.57]], null, null], "duration": [1.65, 1.63, 1.08, 5.15, 2.61, 0.13, 2.84, 1.41, 6.68, 3.29, 2.4, 7.39, 3.59]}
annotations_filtered/c2HEnbmtknM_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 10.59], [13.0, 47.44], [49.0, 53.03], [54.0, 62.06], [63.0, 91.03], [93.0, 95.47], [97.0, 98.52], [99.0, 117.32]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [30.56, 0.0, 99.96, 33.13, 31.0, 36.18, 0.0, 31.4], "audiomae_on_audioset": [[["mains hum", 39.47], ["hum", 17.27], ["music", 14.24]], null, null, [["music", 43.25], ["speech", 12.31], ["breaking", 5.26]], [["speech", 46.95], ["music", 12.61], ["hum", 12.6]], [["hum", 33.82], ["music", 21.11], ["throbbing", 15.93]], null, [["speech", 36.14], ["music", 24.38], ["breaking", 11.58]]], "duration": [4.59, 34.44, 4.03, 8.06, 28.03, 2.47, 1.52, 18.32]}
annotations_filtered/c2HZzrcEbZc_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[9.0, 9.54], [12.0, 13.22], [15.0, 14.61], [17.0, 18.05], [20.0, 21.68], [23.0, 51.44], [54.0, 55.41], [58.0, 67.71], [68.0, 69.16], [70.0, 70.48], [72.0, 73.01], [74.0, 85.35], [92.0, 105.29], [108.0, 109.36], [112.0, 121.76], [126.0, 126.6], [129.0, 136.76], [138.0, 140.83], [142.0, 190.38]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, true, false, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.03, 0.0, 37.39, 0.0, 0.0, 0.0, 34.72, 34.46, 0.0, 35.98, 0.0, 41.95, 33.75, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 27.5], ["speech", 24.94], ["whack, thwack", 12.92]], null, [["music", 30.94], ["cattle, bovinae", 15.18], ["livestock, farm animals, working animals", 11.0]], null, null, null, [["music", 56.59], ["hum", 5.55], ["speech", 4.89]], [["music", 80.04], ["throbbing", 2.88], ["didgeridoo", 2.76]], null, [["music", 38.16], ["hum", 13.03], ["throbbing", 8.83]], null, [["speech", 50.54], ["music", 8.39], ["hum", 4.56]], [["vehicle", 19.78], ["music", 17.42], ["car", 6.1]], null], "duration": [0.54, 1.22, -0.39, 1.05, 1.68, 28.44, 1.41, 9.71, 1.16, 0.48, 1.01, 11.35, 13.29, 1.36, 9.76, 0.6, 7.76, 2.83, 48.38]}
annotations_filtered/c2TcT9JairA_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[11.0, 11.5], [15.0, 23.11], [26.0, 25.86], [27.0, 29.0], [29.0, 30.0], [32.0, 32.9], [38.0, 43.44], [48.0, 59.61], [60.0, 60.44], [62.0, 62.04], [65.0, 71.42]], "keep_status": [false, true, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 48.02, 0.0, 46.83, 0.0, 0.0, 58.22, 48.23, 0.0, 0.0, 44.81], "audiomae_on_audioset": [null, [["music", 25.51], ["fly, housefly", 13.93], ["speech", 13.52]], null, [["music", 13.62], ["speech", 12.21], ["musical instrument", 2.22]], null, null, null, [["music", 25.18], ["livestock, farm animals, working animals", 15.53], ["speech", 13.25]], null, null, [["speech", 36.29], ["music", 23.59], ["trombone", 14.77]]], "duration": [0.5, 8.11, -0.14, 2.0, 1.0, 0.9, 5.44, 11.61, 0.44, 0.04, 6.42]}
annotations_filtered/c2ecZiVEs70_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[18.0, 18.62], [19.0, 21.44], [23.0, 25.71], [26.0, 100.21], [106.0, 105.97], [113.0, 113.21], [116.0, 125.54], [126.0, 131.73], [132.0, 133.08], [134.0, 134.96], [136.0, 136.65], [138.0, 138.03], [139.0, 140.59], [143.0, 143.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 72.01, 89.36, 0.0, 0.0, 0.0, 48.82, 36.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["telephone bell ringing", 41.71], ["music", 31.33], ["telephone", 7.55]], [["speech", 32.98], ["fart", 12.01], ["hum", 7.26]], null, null, null, null, null, null], "duration": [0.62, 2.44, 2.71, 74.21, -0.03, 0.21, 9.54, 5.73, 1.08, 0.96, 0.65, 0.03, 1.59, 0.94]}
annotations_filtered/c2k_kuU84ro_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[71.0, 139.94], [143.0, 147.99], [149.0, 152.39], [154.0, 172.56], [174.0, 182.28]], "keep_status": [false, true, false, false, true], "silence_prob": [0.0, 29.79, 28.88, 29.07, 28.61], "audiomae_on_audioset": [null, [["music", 21.98], ["rumble", 6.88], ["speech", 6.03]], [["speech", 35.31], ["music", 21.58], ["whip", 14.29]], [["speech", 45.54], ["music", 24.83], ["clang", 5.23]], [["music", 49.74], ["speech", 7.62], ["burst, pop", 2.76]]], "duration": [68.94, 4.99, 3.39, 18.56, 8.28]}
annotations_filtered/c2tWZFAL5t4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 12.06], [12.0, 12.45], [14.0, 55.05], [58.0, 82.75], [85.0, 85.19], [87.0, 101.61], [105.0, 113.81], [115.0, 115.87], [124.0, 124.73], [126.0, 126.01], [130.0, 130.94], [132.0, 150.7], [151.0, 163.7]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [29.78, 0.0, 0.0, 30.28, 0.0, 30.1, 31.12, 0.0, 0.0, 0.0, 0.0, 30.05, 30.54], "audiomae_on_audioset": [[["music", 47.17], ["synthesizer", 11.08], ["theremin", 10.78]], null, null, [["music", 75.19], ["musical instrument", 10.03], ["didgeridoo", 4.94]], null, [["music", 26.09], ["siren", 8.72], ["didgeridoo", 7.72]], [["music", 52.97], ["didgeridoo", 29.08], ["musical instrument", 4.06]], null, null, null, null, [["music", 37.94], ["didgeridoo", 33.06], ["musical instrument", 8.68]], [["music", 57.31], ["hum", 7.24], ["throbbing", 7.17]]], "duration": [10.06, 0.45, 41.05, 24.75, 0.19, 14.61, 8.81, 0.87, 0.73, 0.01, 0.94, 18.7, 12.7]}
annotations_filtered/c35RsjYzAhY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 4.21], [19.0, 19.84], [25.0, 25.98], [28.0, 29.07], [36.0, 36.12], [43.0, 45.01]], "keep_status": [true, false, false, false, false, true], "silence_prob": [35.86, 0.0, 0.0, 0.0, 0.0, 33.4], "audiomae_on_audioset": [[["hum", 25.92], ["mains hum", 24.36], ["speech", 17.95]], null, null, null, null, [["fly, housefly", 13.35], ["mosquito", 7.66], ["crowd", 6.98]]], "duration": [2.21, 0.84, 0.98, 1.07, 0.12, 2.01]}
annotations_filtered/c38HJR-9vhU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[31.0, 32.56], [34.0, 39.78], [41.0, 41.49], [43.0, 44.31], [45.0, 50.82], [52.0, 52.47], [54.0, 68.15], [70.0, 73.16], [73.0, 75.15], [77.0, 77.85], [79.0, 87.79], [90.0, 89.85], [91.0, 92.45], [95.0, 94.58], [95.0, 96.9], [99.0, 99.64], [103.0, 104.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.76, 0.0, 0.0, 99.98, 0.0, 99.85, 93.13, 100.0, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 5.78, 0.49, 1.31, 5.82, 0.47, 14.15, 3.16, 2.15, 0.85, 8.79, -0.15, 1.45, -0.42, 1.9, 0.64, 1.92]}
annotations_filtered/c3nJu9SBkis_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.29], [5.0, 5.21], [8.0, 8.23], [9.0, 10.59], [11.0, 16.5], [21.0, 22.5], [24.0, 24.17], [25.0, 25.59], [28.0, 30.13], [32.0, 37.91], [46.0, 47.46], [49.0, 49.32], [53.0, 52.83], [54.0, 54.36], [56.0, 56.3], [62.0, 62.36], [67.0, 72.72], [75.0, 75.96], [77.0, 77.26], [87.0, 94.12], [95.0, 95.3], [96.0, 97.61], [100.0, 107.37], [115.0, 114.98], [119.0, 135.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.22, 0.0, 0.0, 44.43, 0.0, 0.0, 35.49, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 86.58], ["knock", 1.77], ["hands", 1.49]], null, null, [["speech", 71.1], ["knock", 7.38], ["thunk", 2.51]], null, null, [["speech", 69.89], ["thunk", 10.47], ["whack, thwack", 5.11]], null, null], "duration": [0.29, 0.21, 0.23, 1.59, 5.5, 1.5, 0.17, 0.59, 2.13, 5.91, 1.46, 0.32, -0.17, 0.36, 0.3, 0.36, 5.72, 0.96, 0.26, 7.12, 0.3, 1.61, 7.37, -0.02, 16.45]}
annotations_filtered/c3uOWTAuaTQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 8.94], [14.0, 15.43], [26.0, 25.71], [35.0, 35.4]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.94, 1.43, -0.29, 0.4]}
annotations_filtered/c3vmsUcknhY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 11.25], [20.0, 20.43], [22.0, 22.72], [23.0, 31.31], [32.0, 37.44], [38.0, 39.36], [40.0, 40.19], [42.0, 44.88], [48.0, 66.78], [67.0, 66.95], [67.0, 87.51], [88.0, 107.45], [109.0, 108.99], [109.0, 118.54], [121.0, 122.91], [124.0, 125.27]], "keep_status": [true, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [33.3, 0.0, 0.0, 29.0, 28.93, 0.0, 0.0, 28.91, 31.42, 0.0, 29.01, 28.44, 0.0, 28.48, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 25.33], ["didgeridoo", 22.78], ["music", 15.84]], null, null, [["music", 48.23], ["speech", 8.63], ["buzz", 4.19]], [["music", 54.86], ["throbbing", 9.21], ["hum", 7.22]], null, null, [["music", 50.5], ["throbbing", 12.26], ["hum", 4.28]], [["music", 51.75], ["didgeridoo", 10.53], ["musical instrument", 7.95]], null, [["music", 45.51], ["throbbing", 25.0], ["didgeridoo", 6.0]], [["music", 38.42], ["speech", 25.6], ["hum", 6.28]], null, [["music", 31.53], ["speech", 15.19], ["buzz", 9.57]], null, null], "duration": [5.25, 0.43, 0.72, 8.31, 5.44, 1.36, 0.19, 2.88, 18.78, -0.05, 20.51, 19.45, -0.01, 9.54, 1.91, 1.27]}
annotations_filtered/c3zRfKmcqv8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 13.46], [15.0, 15.03], [19.0, 19.5], [21.0, 21.36], [23.0, 23.99], [36.0, 39.28], [41.0, 40.95], [42.0, 43.61], [44.0, 69.94], [73.0, 73.6], [81.0, 81.21], [83.0, 83.27], [86.0, 91.93], [94.0, 96.97], [98.0, 99.91], [101.0, 104.63], [107.0, 107.5], [108.0, 117.1], [121.0, 122.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 50.36, 0.0, 0.0, 96.17, 0.0, 0.0, 0.0, 84.25, 56.7, 0.0, 54.76, 0.0, 37.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 30.47], ["speech", 13.1], ["livestock, farm animals, working animals", 9.07]], null], "duration": [1.46, 0.03, 0.5, 0.36, 0.99, 3.28, -0.05, 1.61, 25.94, 0.6, 0.21, 0.27, 5.93, 2.97, 1.91, 3.63, 0.5, 9.1, 1.03]}
annotations_filtered/c4Wls5pZlxQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[11.0, 20.55], [23.0, 27.09], [27.0, 27.55], [31.0, 34.99], [37.0, 37.77], [38.0, 42.38], [46.0, 49.1], [55.0, 57.94], [60.0, 68.22], [71.0, 71.22], [74.0, 97.55], [98.0, 99.28], [99.0, 105.53], [106.0, 106.37], [107.0, 110.83], [115.0, 115.33], [116.0, 118.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.65, 82.43, 0.0, 96.77, 0.0, 62.07, 82.61, 86.64, 70.86, 0.0, 62.99, 0.0, 52.51, 0.0, 74.13, 0.0, 94.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.55, 4.09, 0.55, 3.99, 0.77, 4.38, 3.1, 2.94, 8.22, 0.22, 23.55, 1.28, 6.53, 0.37, 3.83, 0.33, 2.62]}
annotations_filtered/c4X58OjlVPo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 5.14], [6.0, 6.13], [11.0, 10.89], [24.0, 24.78], [30.0, 29.88], [31.0, 32.09], [33.0, 33.44], [35.0, 34.75], [41.0, 40.78], [43.0, 43.58], [45.0, 45.22], [47.0, 51.66], [56.0, 57.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.14, 0.13, -0.11, 0.78, -0.12, 1.09, 0.44, -0.25, -0.22, 0.58, 0.22, 4.66, 1.55]}
annotations_filtered/c4ibjfBu1IY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 2.93], [4.0, 3.84], [4.0, 7.01], [9.0, 9.58], [10.0, 12.46], [13.0, 15.58], [17.0, 31.99], [35.0, 44.02], [45.0, 45.37], [53.0, 54.73], [55.0, 61.82], [67.0, 68.67], [69.0, 76.54], [79.0, 79.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.58, 0.0, 53.78, 73.21, 71.87, 50.86, 0.0, 0.0, 28.22, 0.0, 29.53, 0.0], "audiomae_on_audioset": [null, null, [["music", 42.69], ["speech", 25.37], ["electric shaver, electric razor", 8.05]], null, null, null, null, null, null, null, [["speech", 45.99], ["music", 18.47], ["vehicle", 14.47]], null, [["speech", 50.68], ["music", 23.46], ["mains hum", 7.97]], null], "duration": [-0.07, -0.16, 3.01, 0.58, 2.46, 2.58, 14.99, 9.02, 0.37, 1.73, 6.82, 1.67, 7.54, 0.91]}
annotations_filtered/c4ux2NclHoE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[14.0, 14.44], [14.0, 50.55], [51.0, 50.85], [58.0, 60.22], [65.0, 82.75], [84.0, 88.64]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.22, 35.59, 33.61], "audiomae_on_audioset": [null, null, null, [["music", 38.86], ["whip", 6.86], ["speech", 5.02]], [["music", 64.36], ["effects unit", 8.35], ["synthesizer", 3.64]], [["music", 72.25], ["didgeridoo", 3.64], ["musical instrument", 3.57]]], "duration": [0.44, 36.55, -0.15, 2.22, 17.75, 4.64]}
annotations_filtered/c4w-IE-Hsqc_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[22.0, 23.3], [35.0, 35.45], [39.0, 39.85], [51.0, 53.01], [56.0, 55.97], [63.0, 71.68], [72.0, 72.5], [74.0, 74.07], [79.0, 82.44], [83.0, 83.2], [84.0, 84.69], [92.0, 93.07], [94.0, 95.4], [100.0, 100.04], [112.0, 112.68], [114.0, 114.98], [116.0, 116.92], [120.0, 121.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.44, 0.0, 65.2, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 0.45, 0.85, 2.01, -0.03, 8.68, 0.5, 0.07, 3.44, 0.2, 0.69, 1.07, 1.4, 0.04, 0.68, 0.98, 0.92, 1.46]}
annotations_filtered/c5BJJbtFP4E_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 4.24], [5.0, 9.0], [10.0, 10.37], [12.0, 32.78], [36.0, 37.08], [40.0, 42.63], [48.0, 48.37], [56.0, 64.44], [70.0, 92.03], [97.0, 101.17], [104.0, 104.52], [106.0, 108.36], [120.0, 125.32]], "keep_status": [false, true, false, false, false, true, false, false, true, true, false, true, false], "silence_prob": [0.0, 36.9, 0.0, 30.83, 0.0, 30.26, 0.0, 31.03, 30.74, 30.93, 0.0, 29.55, 30.39], "audiomae_on_audioset": [null, [["music", 19.71], ["cattle, bovinae", 18.37], ["moo", 15.89]], null, [["music", 53.77], ["cattle, bovinae", 10.64], ["crowd", 6.05]], null, [["moo", 24.43], ["speech", 22.6], ["cattle, bovinae", 18.32]], null, [["music", 47.46], ["livestock, farm animals, working animals", 13.79], ["cattle, bovinae", 10.33]], [["music", 34.75], ["cattle, bovinae", 8.31], ["crowd", 6.59]], [["music", 34.37], ["speech", 26.23], ["crowd", 3.53]], null, [["speech", 20.44], ["crowd", 19.14], ["cheering", 18.39]], [["cattle, bovinae", 45.24], ["moo", 27.05], ["livestock, farm animals, working animals", 15.56]]], "duration": [0.24, 4.0, 0.37, 20.78, 1.08, 2.63, 0.37, 8.44, 22.03, 4.17, 0.52, 2.36, 5.32]}
annotations_filtered/c5Re3lGYUA0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.61], [5.0, 5.34], [7.0, 21.76], [22.0, 33.67], [39.0, 86.85], [87.0, 88.59], [91.0, 112.78], [113.0, 115.94], [119.0, 122.98]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 66.63, 65.44, 0.0, 0.0, 73.97, 91.64, 65.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.61, 0.34, 14.76, 11.67, 47.85, 1.59, 21.78, 2.94, 3.98]}
annotations_filtered/c5WfxwnLlLU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 5.78], [30.0, 32.37]], "keep_status": [false, true], "silence_prob": [0.0, 36.11], "audiomae_on_audioset": [null, [["music", 11.9], ["explosion", 11.49], ["eruption", 9.88]]], "duration": [-0.22, 2.37]}
annotations_filtered/c5ZiiE8fyGk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.11], [7.0, 7.3], [8.0, 8.18], [9.0, 10.15], [12.0, 12.87], [14.0, 15.38], [24.0, 24.81], [26.0, 27.18], [28.0, 29.54], [34.0, 34.96], [36.0, 37.45], [38.0, 38.8], [42.0, 43.17], [45.0, 45.54], [47.0, 47.8], [48.0, 48.03], [52.0, 51.95], [54.0, 55.71], [57.0, 57.57], [62.0, 62.07], [73.0, 73.47], [89.0, 88.7], [93.0, 94.86], [103.0, 103.4], [105.0, 107.28], [108.0, 109.02], [110.0, 111.57], [115.0, 116.13], [120.0, 121.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.11, 0.3, 0.18, 1.15, 0.87, 1.38, 0.81, 1.18, 1.54, 0.96, 1.45, 0.8, 1.17, 0.54, 0.8, 0.03, -0.05, 1.71, 0.57, 0.07, 0.47, -0.3, 1.86, 0.4, 2.28, 1.02, 1.57, 1.13, 1.2]}
annotations_filtered/c5mAaBl_qqk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 3.52], [5.0, 12.48], [13.0, 13.74], [14.0, 15.13], [16.0, 16.93], [18.0, 20.53], [22.0, 62.19], [63.0, 63.54], [64.0, 86.48], [87.0, 95.44], [97.0, 130.86], [134.0, 134.49], [135.0, 136.92], [138.0, 139.16], [142.0, 144.49], [148.0, 151.17], [152.0, 152.74]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.78, 0.0, 0.0, 0.0, 46.26, 0.0, 0.0, 46.72, 46.15, 0.0, 0.0, 0.0, 0.0, 71.57, 52.45, 0.0], "audiomae_on_audioset": [null, [["music", 57.93], ["hum", 10.57], ["electronic music", 6.1]], null, null, null, [["hum", 31.19], ["mains hum", 16.52], ["music", 9.82]], null, null, [["speech", 53.35], ["music", 24.4], ["hum", 6.97]], [["hum", 36.72], ["throbbing", 35.2], ["music", 8.61]], null, null, null, null, null, null, null], "duration": [1.52, 7.48, 0.74, 1.13, 0.93, 2.53, 40.19, 0.54, 22.48, 8.44, 33.86, 0.49, 1.92, 1.16, 2.49, 3.17, 0.74]}
annotations_filtered/c5zKpr5gmgk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[11.0, 12.07], [12.0, 14.94], [15.0, 15.89], [22.0, 23.43], [24.0, 28.49], [29.0, 29.51], [30.0, 29.62], [33.0, 33.76], [49.0, 49.72], [51.0, 52.17], [57.0, 58.33], [67.0, 67.27], [71.0, 70.75], [82.0, 85.82]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 76.53, 0.0, 0.0, 49.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.71], "audiomae_on_audioset": [null, null, null, null, [["music", 37.51], ["noise", 15.79], ["whale vocalization", 9.7]], null, null, null, null, null, null, null, null, null], "duration": [1.07, 2.94, 0.89, 1.43, 4.49, 0.51, -0.38, 0.76, 0.72, 1.17, 1.33, 0.27, -0.25, 3.82]}
annotations_filtered/c6XHLe94SJA_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.05], [3.0, 41.69], [44.0, 46.68], [49.0, 50.23], [51.0, 51.95], [53.0, 60.29], [62.0, 96.65]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 31.38, 0.0, 0.0, 33.96, 0.0], "audiomae_on_audioset": [null, null, [["mains hum", 22.04], ["hum", 19.43], ["eruption", 7.3]], null, null, [["hum", 33.44], ["music", 24.75], ["mains hum", 13.65]], null], "duration": [0.05, 38.69, 2.68, 1.23, 0.95, 7.29, 34.65]}
annotations_filtered/c6dmj-WpTW4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 9.68], [11.0, 13.9], [15.0, 20.92], [22.0, 26.84], [27.0, 27.85], [30.0, 30.97], [34.0, 38.82], [40.0, 40.34], [42.0, 42.09], [43.0, 44.05], [54.0, 54.92], [56.0, 57.42], [61.0, 62.5], [64.0, 69.04], [73.0, 74.06], [77.0, 108.36], [111.0, 111.6], [112.0, 114.27], [115.0, 115.77], [116.0, 117.8], [119.0, 124.55]], "keep_status": [false, true, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [55.25, 44.84, 47.86, 35.71, 0.0, 0.0, 42.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.69, 0.0, 0.0, 0.0, 45.46, 0.0, 0.0, 40.43], "audiomae_on_audioset": [null, [["speech", 12.84], ["bee, wasp, etc.", 8.07], ["hum", 7.58]], [["bee, wasp, etc.", 19.8], ["fly, housefly", 16.44], ["mains hum", 11.21]], [["animal", 13.88], ["speech", 13.75], ["dog", 10.47]], null, null, [["speech", 54.53], ["hum", 4.59], ["sidetone", 4.43]], null, null, null, null, null, null, [["whistling", 50.28], ["music", 15.54], ["whistle", 10.43]], null, null, null, [["mosquito", 18.38], ["fart", 14.52], ["fly, housefly", 14.24]], null, null, [["hum", 39.79], ["speech", 28.42], ["mains hum", 9.35]]], "duration": [4.68, 2.9, 5.92, 4.84, 0.85, 0.97, 4.82, 0.34, 0.09, 1.05, 0.92, 1.42, 1.5, 5.04, 1.06, 31.36, 0.6, 2.27, 0.77, 1.8, 5.55]}
annotations_filtered/c6ik-AA87Uo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[33.0, 34.53], [38.0, 38.79], [42.0, 42.58], [49.0, 49.33], [55.0, 55.32], [59.0, 60.24], [63.0, 69.89], [72.0, 72.52], [75.0, 75.34], [76.0, 77.28], [82.0, 82.95], [94.0, 94.91], [98.0, 98.32]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 9.32], ["animal", 9.01], ["cattle, bovinae", 7.78]], null, null, null, null, null, null], "duration": [1.53, 0.79, 0.58, 0.33, 0.32, 1.24, 6.89, 0.52, 0.34, 1.28, 0.95, 0.91, 0.32]}
annotations_filtered/c6mLa5_GvCQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 10.07], [12.0, 14.39], [28.0, 39.63], [45.0, 44.71], [49.0, 49.84], [54.0, 54.35], [63.0, 64.3], [65.0, 65.82], [71.0, 71.27], [76.0, 76.76], [80.0, 79.84], [80.0, 80.0], [80.0, 80.05], [102.0, 104.72], [112.0, 116.56], [126.0, 125.95], [126.0, 126.99], [129.0, 129.37], [130.0, 131.14], [135.0, 135.7], [146.0, 146.53], [156.0, 156.61], [165.0, 168.02], [169.0, 170.29], [172.0, 172.13], [178.0, 179.1]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.95, 44.2, 30.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.51, 38.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.37], ["mains hum", 15.96], ["hum", 15.43]], [["music", 52.07], ["throbbing", 4.37], ["hum", 4.32]], [["music", 63.91], ["animal", 6.16], ["hum", 4.94]], null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 53.23], ["moo", 20.08], ["cattle, bovinae", 16.98]], [["speech", 44.66], ["music", 9.55], ["noise", 5.69]], null, null, null, null, null, null, null, [["mains hum", 31.62], ["hum", 28.64], ["speech", 16.24]], null, null, null], "duration": [7.07, 2.39, 11.63, -0.29, 0.84, 0.35, 1.3, 0.82, 0.27, 0.76, -0.16, 0.0, 0.05, 2.72, 4.56, -0.05, 0.99, 0.37, 1.14, 0.7, 0.53, 0.61, 3.02, 1.29, 0.13, 1.1]}
annotations_filtered/c7-u-fyUSkM_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 4.62], [5.0, 8.92], [10.0, 10.91], [12.0, 12.65], [15.0, 15.4], [17.0, 47.02], [48.0, 51.0], [51.0, 52.15], [54.0, 54.38], [55.0, 59.66], [60.0, 70.04], [71.0, 73.38], [77.0, 81.36], [82.0, 82.97], [85.0, 91.34], [92.0, 95.49], [97.0, 98.05]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.4, 0.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 60.89, 46.94, 79.07, 65.67, 0.0, 56.18, 56.63, 0.0], "audiomae_on_audioset": [null, [["speech", 32.27], ["hum", 16.64], ["rumble", 13.98]], null, null, null, null, [["wail, moan", 28.6], ["animal", 18.24], ["speech", 16.21]], null, null, null, [["speech", 72.24], ["beatboxing", 1.96], ["fart", 1.52]], null, null, null, null, null, null], "duration": [1.62, 3.92, 0.91, 0.65, 0.4, 30.02, 3.0, 1.15, 0.38, 4.66, 10.04, 2.38, 4.36, 0.97, 6.34, 3.49, 1.05]}
annotations_filtered/c77JrXbqqV0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 5.71], [7.0, 7.59], [9.0, 9.17], [10.0, 10.99], [15.0, 15.03], [18.0, 18.37], [20.0, 21.19], [22.0, 22.69], [23.0, 23.79], [26.0, 26.64], [31.0, 30.86], [32.0, 32.27], [32.0, 32.46], [32.0, 35.28], [38.0, 37.98], [40.0, 40.76], [42.0, 41.96], [43.0, 43.34], [44.0, 45.87], [51.0, 54.9], [56.0, 56.94], [60.0, 60.91], [64.0, 65.3], [74.0, 74.16], [76.0, 77.68], [91.0, 92.01], [110.0, 111.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.17], ["sidetone", 27.68], ["hum", 3.43]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.71, 0.59, 0.17, 0.99, 0.03, 0.37, 1.19, 0.69, 0.79, 0.64, -0.14, 0.27, 0.46, 3.28, -0.02, 0.76, -0.04, 0.34, 1.87, 3.9, 0.94, 0.91, 1.3, 0.16, 1.68, 1.01, 1.99]}
annotations_filtered/c7AescgZzEg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 10.88], [14.0, 19.8], [36.0, 36.59], [37.0, 37.13], [48.0, 49.92], [51.0, 58.21], [58.0, 58.41], [59.0, 76.17], [77.0, 78.22], [79.0, 79.64], [87.0, 87.05], [92.0, 91.69], [97.0, 97.39], [98.0, 98.91], [100.0, 101.22], [102.0, 102.12], [105.0, 106.73], [109.0, 108.92], [116.0, 116.95], [118.0, 119.75], [125.0, 129.66], [132.0, 133.96], [137.0, 137.79], [141.0, 143.68], [144.0, 145.32], [152.0, 154.63], [155.0, 155.73], [163.0, 165.64], [166.0, 168.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.37, 94.07, 0.0, 0.0, 0.0, 51.28, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0, 92.64, 0.0, 99.85, 0.0, 99.87, 98.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.88, 5.8, 0.59, 0.13, 1.92, 7.21, 0.41, 17.17, 1.22, 0.64, 0.05, -0.31, 0.39, 0.91, 1.22, 0.12, 1.73, -0.08, 0.95, 1.75, 4.66, 1.96, 0.79, 2.68, 1.32, 2.63, 0.73, 2.64, 2.71]}
annotations_filtered/c7RyGNzyGB4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[62.0, 62.11], [63.0, 103.0], [104.0, 104.77], [106.0, 112.45]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 35.28], "audiomae_on_audioset": [null, null, null, [["thunk", 31.03], ["music", 24.41], ["moo", 3.7]]], "duration": [0.11, 40.0, 0.77, 6.45]}
annotations_filtered/c7tvfdSjRE4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 5.09], [6.0, 7.94], [12.0, 16.43], [19.0, 26.25], [28.0, 33.0], [34.0, 38.35], [39.0, 39.58], [41.0, 42.09], [43.0, 47.01], [50.0, 53.5], [55.0, 80.16], [87.0, 92.13], [92.0, 92.23], [93.0, 93.46], [96.0, 103.87], [104.0, 104.45], [104.0, 104.85], [107.0, 109.76], [121.0, 129.41], [139.0, 140.19], [152.0, 154.84], [156.0, 156.44], [156.0, 156.59], [159.0, 160.17], [173.0, 172.94]], "keep_status": [false, false, false, false, true, true, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.82, 37.07, 36.8, 35.81, 0.0, 0.0, 32.1, 32.32, 30.21, 32.02, 0.0, 0.0, 31.41, 0.0, 0.0, 32.55, 30.64, 0.0, 35.85, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["bee, wasp, etc.", 31.17], ["fly, housefly", 27.36], ["insect", 12.21]], [["bee, wasp, etc.", 40.22], ["fly, housefly", 33.14], ["insect", 14.32]], [["vehicle", 22.3], ["fly, housefly", 13.36], ["speech", 10.75]], [["speech", 47.7], ["cattle, bovinae", 5.83], ["moo", 4.55]], null, null, [["cattle, bovinae", 39.57], ["moo", 24.31], ["livestock, farm animals, working animals", 21.24]], [["fly, housefly", 59.21], ["insect", 22.49], ["bee, wasp, etc.", 14.56]], [["mains hum", 24.04], ["music", 20.16], ["hum", 16.59]], [["speech", 34.63], ["fly, housefly", 15.39], ["fart", 8.73]], null, null, [["fly, housefly", 21.47], ["bee, wasp, etc.", 17.64], ["insect", 14.44]], null, null, [["vehicle", 43.63], ["car", 19.45], ["speech", 9.8]], [["fly, housefly", 42.26], ["insect", 20.41], ["bee, wasp, etc.", 9.0]], null, [["cattle, bovinae", 35.15], ["moo", 30.63], ["speech", 11.65]], null, null, null, null], "duration": [1.09, 1.94, 4.43, 7.25, 5.0, 4.35, 0.58, 1.09, 4.01, 3.5, 25.16, 5.13, 0.23, 0.46, 7.87, 0.45, 0.85, 2.76, 8.41, 1.19, 2.84, 0.44, 0.59, 1.17, -0.06]}