bpiyush commited on
Commit
6260a8b
·
1 Parent(s): 2dad76a
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. annotations_filtered/--ABd2SeIGE_filtered.json +1 -0
  2. annotations_filtered/--Jiv5iYqT8_filtered.json +1 -0
  3. annotations_filtered/--QCZKgJt6o_filtered.json +1 -0
  4. annotations_filtered/--aqjaJyZLk_filtered.json +1 -0
  5. annotations_filtered/--hendERqm0_filtered.json +1 -0
  6. annotations_filtered/--oCWVOBuvA_filtered.json +1 -0
  7. annotations_filtered/--uyzf7X_0c_filtered.json +1 -0
  8. annotations_filtered/--vFXH3mH3A_filtered.json +1 -0
  9. annotations_filtered/-0SHIbuEO3w_filtered.json +1 -0
  10. annotations_filtered/-0f67QE-HP8_filtered.json +1 -0
  11. annotations_filtered/-19d_T472co_filtered.json +1 -0
  12. annotations_filtered/-1U0LH6dPfw_filtered.json +1 -0
  13. annotations_filtered/-1W4xHNKvAk_filtered.json +1 -0
  14. annotations_filtered/-1eKufUP5XQ_filtered.json +1 -0
  15. annotations_filtered/-1gCG8m1SHU_filtered.json +1 -0
  16. annotations_filtered/-1zLU5N6uBU_filtered.json +1 -0
  17. annotations_filtered/-2KG4lLGEl0_filtered.json +1 -0
  18. annotations_filtered/-2KGPYEFnsU_filtered.json +1 -0
  19. annotations_filtered/-2QFIXEHnOY_filtered.json +1 -0
  20. annotations_filtered/-37Mhsak-XI_filtered.json +1 -0
  21. annotations_filtered/-3KCgSpt3hU_filtered.json +1 -0
  22. annotations_filtered/-3RMOO6mHr4_filtered.json +1 -0
  23. annotations_filtered/-3mo5CqjvWs_filtered.json +1 -0
  24. annotations_filtered/-3ywc_7_IE8_filtered.json +1 -0
  25. annotations_filtered/-4GsCEopbd4_filtered.json +1 -0
  26. annotations_filtered/-4Q-MS_oFkw_filtered.json +1 -0
  27. annotations_filtered/-4QqksHXUCc_filtered.json +1 -0
  28. annotations_filtered/-4_rMqeyOJY_filtered.json +1 -0
  29. annotations_filtered/-5798-VRVYA_filtered.json +1 -0
  30. annotations_filtered/-5Pku48YPFo_filtered.json +1 -0
  31. annotations_filtered/-5Rohhkg-7k_filtered.json +1 -0
  32. annotations_filtered/-5be_UPkLRw_filtered.json +1 -0
  33. annotations_filtered/-5twCD8tAMc_filtered.json +1 -0
  34. annotations_filtered/-64q4HpZyaY_filtered.json +1 -0
  35. annotations_filtered/-6fuDrAmhNc_filtered.json +1 -0
  36. annotations_filtered/-7-2-088LnM_filtered.json +1 -0
  37. annotations_filtered/-7-C6lSAfOs_filtered.json +1 -0
  38. annotations_filtered/-78FgmNwyD4_filtered.json +1 -0
  39. annotations_filtered/-7Sow81yi24_filtered.json +1 -0
  40. annotations_filtered/-7cV5cWQmxg_filtered.json +1 -0
  41. annotations_filtered/-7krYJUfFv4_filtered.json +1 -0
  42. annotations_filtered/-7mzQx0ebqk_filtered.json +1 -0
  43. annotations_filtered/-85ubSkzSWg_filtered.json +1 -0
  44. annotations_filtered/-8ajIeIeJpY_filtered.json +1 -0
  45. annotations_filtered/-98BSUhcZtY_filtered.json +1 -0
  46. annotations_filtered/-9DrPi3ki0g_filtered.json +1 -0
  47. annotations_filtered/-9IgLueodZA_filtered.json +1 -0
  48. annotations_filtered/-9P7Ge1KmTY_filtered.json +1 -0
  49. annotations_filtered/-A-fBbIXbPo_filtered.json +1 -0
  50. annotations_filtered/-A9rFt7ITy4_filtered.json +1 -0
annotations_filtered/--ABd2SeIGE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 12.75], [15.0, 23.94], [27.0, 37.12], [48.0, 47.83], [51.0, 51.43], [60.0, 60.0], [62.0, 69.42], [86.0, 86.32], [93.0, 96.79], [98.0, 98.36], [99.0, 99.6], [100.0, 102.39], [106.0, 113.46]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [31.94, 30.17, 46.33, 0.0, 0.0, 0.0, 68.15, 0.0, 61.97, 0.0, 0.0, 38.33, 39.55], "audiomae_on_audioset": [[["theremin", 29.79], ["music", 28.67], ["hum", 7.9]], [["speech", 57.27], ["explosion", 14.36], ["burst, pop", 7.06]], [["music", 62.43], ["theremin", 8.26], ["cello", 4.68]], null, null, null, null, null, null, null, null, [["music", 21.78], ["musical instrument", 6.05], ["didgeridoo", 5.51]], [["music", 76.58], ["musical instrument", 3.22], ["theremin", 2.27]]], "duration": [4.75, 8.94, 10.12, -0.17, 0.43, 0.0, 7.42, 0.32, 3.79, 0.36, 0.6, 2.39, 7.46]}
annotations_filtered/--Jiv5iYqT8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 5.14], [7.0, 8.21], [9.0, 12.63], [13.0, 15.26], [17.0, 19.16], [20.0, 23.95], [25.0, 30.32], [31.0, 41.57], [43.0, 54.11], [55.0, 58.31], [59.0, 61.94], [64.0, 99.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.52, 0.0, 100.0, 100.0, 100.0, 100.0, 99.93, 99.95, 99.98, 77.53, 81.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.14, 1.21, 3.63, 2.26, 2.16, 3.95, 5.32, 10.57, 11.11, 3.31, 2.94, 35.55]}
annotations_filtered/--QCZKgJt6o_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 3.3], [5.0, 6.37], [7.0, 9.76], [14.0, 16.93], [30.0, 31.36], [33.0, 33.54], [35.0, 35.72], [40.0, 46.94], [51.0, 50.68], [52.0, 61.47], [67.0, 69.9], [77.0, 77.35], [107.0, 108.08], [117.0, 117.19], [117.0, 118.18], [127.0, 128.22], [133.0, 134.74], [136.0, 136.24], [140.0, 142.8], [146.0, 149.35], [151.0, 151.31], [152.0, 153.35], [156.0, 156.61], [157.0, 159.6], [164.0, 165.43], [174.0, 175.02]], "keep_status": [false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 60.89, 45.59, 0.0, 0.0, 0.0, 35.85, 0.0, 34.71, 61.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 47.2, 0.0, 0.0, 0.0, 39.47, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 26.24], ["vocal music", 7.63], ["singing", 6.21]], null, null, null, [["speech", 18.36], ["moo", 9.75], ["livestock, farm animals, working animals", 8.42]], null, [["chant", 14.05], ["cattle, bovinae", 12.42], ["grunt", 10.88]], null, null, null, null, null, null, null, null, null, [["speech", 49.28], ["hum", 8.71], ["music", 5.69]], null, null, null, [["speech", 31.98], ["music", 6.36], ["hum", 5.44]], null, null], "duration": [1.3, 1.37, 2.76, 2.93, 1.36, 0.54, 0.72, 6.94, -0.32, 9.47, 2.9, 0.35, 1.08, 0.19, 1.18, 1.22, 1.74, 0.24, 2.8, 3.35, 0.31, 1.35, 0.61, 2.6, 1.43, 1.02]}
annotations_filtered/--aqjaJyZLk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 15.62], [19.0, 22.18], [24.0, 25.74], [26.0, 26.6], [29.0, 33.02], [41.0, 42.13], [46.0, 46.55], [47.0, 48.63], [50.0, 51.17], [54.0, 55.27], [56.0, 57.32], [58.0, 59.81], [63.0, 63.49], [69.0, 69.21], [70.0, 72.59], [75.0, 75.64], [77.0, 78.58], [81.0, 81.77], [83.0, 83.69], [85.0, 85.83], [87.0, 88.38], [89.0, 90.8], [91.0, 91.88], [92.0, 92.64], [95.0, 97.17], [98.0, 106.57], [108.0, 109.51], [110.0, 111.52], [112.0, 115.32], [118.0, 120.87]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [52.27, 54.97, 0.0, 0.0, 49.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.55, 37.26, 0.0, 0.0, 31.3, 58.72], "audiomae_on_audioset": [null, null, null, null, [["noise", 17.53], ["hum", 14.74], ["music", 12.08]], null, null, null, null, null, null, null, null, null, [["music", 42.85], ["speech", 9.51], ["hum", 6.87]], null, null, null, null, null, null, null, null, null, [["tuning fork", 85.18], ["coin (dropping)", 2.94], ["gong", 2.22]], [["music", 39.36], ["mechanisms", 7.52], ["hum", 6.54]], null, null, [["music", 14.77], ["clang", 10.79], ["fly, housefly", 8.68]], null], "duration": [7.62, 3.18, 1.74, 0.6, 4.02, 1.13, 0.55, 1.63, 1.17, 1.27, 1.32, 1.81, 0.49, 0.21, 2.59, 0.64, 1.58, 0.77, 0.69, 0.83, 1.38, 1.8, 0.88, 0.64, 2.17, 8.57, 1.51, 1.52, 3.32, 2.87]}
annotations_filtered/--hendERqm0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 12.56], [14.0, 14.22], [16.0, 21.17], [28.0, 28.76], [32.0, 32.95], [34.0, 34.42], [36.0, 36.15], [38.0, 38.06], [40.0, 40.63], [41.0, 51.34], [53.0, 56.84], [58.0, 59.12], [61.0, 62.31], [66.0, 67.93], [70.0, 71.29], [74.0, 74.75], [77.0, 78.38], [82.0, 84.72]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 30.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.77, 31.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.95], "audiomae_on_audioset": [null, null, [["music", 67.55], ["electronic music", 5.78], ["house music", 4.08]], null, null, null, null, null, null, [["music", 45.64], ["speech", 12.16], ["techno", 9.56]], [["music", 51.69], ["speech", 33.92], ["drum machine", 1.58]], null, null, null, null, null, null, [["music", 30.48], ["sonar", 30.27], ["electronic music", 9.0]]], "duration": [0.56, 0.22, 5.17, 0.76, 0.95, 0.42, 0.15, 0.06, 0.63, 10.34, 3.84, 1.12, 1.31, 1.93, 1.29, 0.75, 1.38, 2.72]}
annotations_filtered/--oCWVOBuvA_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.42], [4.0, 5.46], [7.0, 7.35], [9.0, 12.02], [13.0, 14.1], [16.0, 17.66], [20.0, 21.22], [24.0, 26.03], [27.0, 28.41], [32.0, 32.81], [36.0, 36.37], [38.0, 38.4], [41.0, 47.61], [49.0, 51.41], [55.0, 56.3], [58.0, 58.21], [60.0, 64.56], [66.0, 66.36], [67.0, 68.35], [70.0, 72.81], [74.0, 75.02], [77.0, 78.65], [80.0, 81.68], [83.0, 83.17], [84.0, 87.4], [88.0, 92.03], [94.0, 95.12], [98.0, 99.33], [102.0, 101.78], [103.0, 105.87], [106.0, 106.83], [109.0, 109.81], [112.0, 113.04], [118.0, 119.72], [121.0, 121.34], [126.0, 126.22], [129.0, 129.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 94.95, 0.0, 0.0, 67.13, 0.0, 0.0, 0.0, 0.0, 100.0, 99.98, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 1.46, 0.35, 3.02, 1.1, 1.66, 1.22, 2.03, 1.41, 0.81, 0.37, 0.4, 6.61, 2.41, 1.3, 0.21, 4.56, 0.36, 1.35, 2.81, 1.02, 1.65, 1.68, 0.17, 3.4, 4.03, 1.12, 1.33, -0.22, 2.87, 0.83, 0.81, 1.04, 1.72, 0.34, 0.22, 0.73]}
annotations_filtered/--uyzf7X_0c_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.45], [5.0, 5.07], [8.0, 8.16], [13.0, 12.78], [20.0, 20.21], [24.0, 24.07], [26.0, 26.52], [35.0, 35.53], [40.0, 40.29], [48.0, 48.36], [51.0, 51.54], [54.0, 54.72], [70.0, 69.72], [71.0, 71.68], [74.0, 74.43], [77.0, 76.92], [78.0, 78.51], [82.0, 82.24], [83.0, 83.03], [85.0, 85.31], [88.0, 88.8], [90.0, 90.86], [95.0, 95.47], [100.0, 100.31], [105.0, 105.33], [107.0, 107.01], [111.0, 111.92], [115.0, 115.06], [115.0, 115.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.07, 0.16, -0.22, 0.21, 0.07, 0.52, 0.53, 0.29, 0.36, 0.54, 0.72, -0.28, 0.68, 0.43, -0.08, 0.51, 0.24, 0.03, 0.31, 0.8, 0.86, 0.47, 0.31, 0.33, 0.01, 0.92, 0.06, 0.7]}
annotations_filtered/--vFXH3mH3A_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[9.0, 16.01], [18.0, 36.73], [38.0, 41.69], [49.0, 51.97], [58.0, 59.56], [61.0, 65.1], [74.0, 82.44], [83.0, 89.94], [90.0, 90.98], [96.0, 98.64], [103.0, 103.92], [108.0, 107.97], [108.0, 109.88], [112.0, 114.1], [118.0, 130.54], [132.0, 133.14], [134.0, 144.76], [147.0, 160.37], [161.0, 166.53], [168.0, 167.9], [170.0, 170.83], [173.0, 172.84]], "keep_status": [true, true, true, false, false, false, true, false, false, true, false, false, false, true, true, false, false, false, true, false, false, false], "silence_prob": [28.92, 29.82, 29.42, 29.02, 0.0, 30.59, 29.01, 29.08, 0.0, 29.77, 0.0, 0.0, 0.0, 28.94, 29.1, 0.0, 29.24, 28.93, 30.87, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whack, thwack", 11.06], ["mosquito", 7.33], ["speech", 6.95]], [["rumble", 29.07], ["hum", 13.01], ["mains hum", 12.77]], [["speech", 17.98], ["whale vocalization", 16.64], ["groan", 16.12]], [["music", 63.1], ["speech", 7.17], ["electronic music", 1.88]], null, [["didgeridoo", 33.1], ["speech", 24.81], ["music", 22.07]], [["music", 52.24], ["vehicle", 9.53], ["motorcycle", 2.87]], [["music", 50.65], ["cattle, bovinae", 18.06], ["moo", 9.87]], null, [["music", 25.05], ["cattle, bovinae", 23.46], ["moo", 18.88]], null, null, null, [["groan", 43.37], ["music", 6.03], ["grunt", 5.74]], [["music", 39.13], ["speech", 20.56], ["electronic music", 6.22]], null, [["music", 83.89], ["electronic music", 3.05], ["techno", 1.93]], [["music", 79.27], ["hum", 3.27], ["throbbing", 2.72]], [["fly, housefly", 28.0], ["explosion", 24.83], ["boom", 9.83]], null, null, null], "duration": [7.01, 18.73, 3.69, 2.97, 1.56, 4.1, 8.44, 6.94, 0.98, 2.64, 0.92, -0.03, 1.88, 2.1, 12.54, 1.14, 10.76, 13.37, 5.53, -0.1, 0.83, -0.16]}
annotations_filtered/-0SHIbuEO3w_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[56.0, 60.72], [63.0, 122.66], [127.0, 131.94]], "keep_status": [false, false, true], "silence_prob": [29.36, 0.0, 30.22], "audiomae_on_audioset": [[["music", 65.38], ["speech", 7.81], ["throbbing", 3.28]], null, [["speech", 22.67], ["music", 22.28], ["crowd", 5.83]]], "duration": [4.72, 59.66, 4.94]}
annotations_filtered/-0f67QE-HP8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[0.0, 0.85], [2.0, 3.06], [4.0, 7.08], [9.0, 35.92], [38.0, 41.82], [44.0, 45.98], [48.0, 57.75], [58.0, 57.86], [58.0, 93.53], [98.0, 105.11], [110.0, 113.12], [114.0, 115.65], [118.0, 121.74], [132.0, 139.5], [143.0, 142.79], [143.0, 143.9], [148.0, 148.56], [152.0, 157.91], [160.0, 159.92], [161.0, 164.03], [169.0, 169.53], [171.0, 172.02], [181.0, 182.46]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.97, 30.71, 34.35, 0.0, 32.99, 0.0, 0.0, 29.01, 30.45, 0.0, 29.66, 30.04, 0.0, 0.0, 0.0, 31.53, 0.0, 30.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 72.72], ["music", 8.61], ["sidetone", 2.77]], [["music", 57.26], ["throbbing", 8.84], ["hum", 6.68]], null, [["whale vocalization", 88.55], ["music", 6.54], ["musical instrument", 0.81]], null, null, [["speech", 24.98], ["music", 16.76], ["whack, thwack", 8.37]], [["whale vocalization", 77.84], ["mosquito", 3.38], ["moo", 2.41]], null, [["explosion", 30.95], ["burst, pop", 13.91], ["speech", 9.44]], [["speech", 27.71], ["music", 15.41], ["cattle, bovinae", 6.74]], null, null, null, [["music", 32.22], ["electronic music", 12.21], ["dubstep", 7.19]], null, [["speech", 74.27], ["sound effect", 3.57], ["fart", 2.7]], null, null, null], "duration": [0.85, 1.06, 3.08, 26.92, 3.82, 1.98, 9.75, -0.14, 35.53, 7.11, 3.12, 1.65, 3.74, 7.5, -0.21, 0.9, 0.56, 5.91, -0.08, 3.03, 0.53, 1.02, 1.46]}
annotations_filtered/-19d_T472co_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 47.21], [48.0, 48.57], [53.0, 53.25], [53.0, 166.8], [167.0, 167.7], [168.0, 173.04], [175.0, 177.45], [180.0, 201.29], [205.0, 205.17], [206.0, 212.75]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 31.68, 35.71, 0.0, 74.76], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 76.85], ["speech", 5.82], ["boing", 1.78]], [["music", 32.21], ["fly, housefly", 10.63], ["buzz", 6.42]], null, null], "duration": [46.21, 0.57, 0.25, 113.8, 0.7, 5.04, 2.45, 21.29, 0.17, 6.75]}
annotations_filtered/-1U0LH6dPfw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.61], [3.0, 3.11], [3.0, 4.31], [13.0, 14.22], [22.0, 24.88], [26.0, 31.73], [35.0, 38.31], [39.0, 42.03], [46.0, 56.1], [61.0, 85.5], [98.0, 98.49], [100.0, 107.32], [108.0, 108.38], [120.0, 120.63]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.28, 30.67, 30.45, 30.48, 30.16, 30.01, 0.0, 33.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 61.12], ["didgeridoo", 4.8], ["sidetone", 4.55]], [["music", 62.74], ["hum", 9.5], ["throbbing", 5.24]], [["music", 45.36], ["speech", 19.03], ["boing", 5.23]], [["music", 53.7], ["boing", 15.98], ["fly, housefly", 3.21]], [["music", 60.24], ["speech", 11.81], ["boing", 9.62]], [["music", 68.45], ["boing", 10.58], ["speech", 6.01]], null, [["music", 42.75], ["speech", 18.11], ["mains hum", 12.3]], null, null], "duration": [0.61, 0.11, 1.31, 1.22, 2.88, 5.73, 3.31, 3.03, 10.1, 24.5, 0.49, 7.32, 0.38, 0.63]}
annotations_filtered/-1W4xHNKvAk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 7.62], [16.0, 17.51], [35.0, 35.06], [36.0, 36.69], [50.0, 51.21], [52.0, 53.15], [73.0, 74.11], [85.0, 86.86], [100.0, 101.07], [102.0, 103.08], [114.0, 115.01], [117.0, 117.29], [120.0, 120.75], [135.0, 134.97], [150.0, 150.13], [208.0, 208.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 1.51, 0.06, 0.69, 1.21, 1.15, 1.11, 1.86, 1.07, 1.08, 1.01, 0.29, 0.75, -0.03, 0.13, 0.63]}
annotations_filtered/-1eKufUP5XQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 5.29], [11.0, 15.52], [20.0, 20.07], [24.0, 24.58], [40.0, 41.15], [44.0, 49.44], [50.0, 51.68], [53.0, 59.09], [64.0, 64.49], [65.0, 65.69], [66.0, 68.1], [79.0, 79.39], [80.0, 80.59], [83.0, 84.33], [89.0, 89.85], [91.0, 97.97], [99.0, 99.39], [100.0, 99.98], [100.0, 102.0], [104.0, 104.41], [105.0, 105.73], [106.0, 106.74], [107.0, 107.97], [110.0, 111.35], [112.0, 113.56], [114.0, 115.64], [116.0, 118.37], [119.0, 123.13]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.9, 0.0, 0.0, 0.0, 90.25, 0.0, 89.72, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 81.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.92, 94.66], "audiomae_on_audioset": [null, [["speech", 27.69], ["whack, thwack", 9.37], ["busy signal", 8.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 4.52, 0.07, 0.58, 1.15, 5.44, 1.68, 6.09, 0.49, 0.69, 2.1, 0.39, 0.59, 1.33, 0.85, 6.97, 0.39, -0.02, 2.0, 0.41, 0.73, 0.74, 0.97, 1.35, 1.56, 1.64, 2.37, 4.13]}
annotations_filtered/-1gCG8m1SHU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 21.51], [23.0, 29.44], [31.0, 32.14], [38.0, 40.2], [43.0, 44.31], [47.0, 46.79], [48.0, 50.19], [54.0, 53.77], [59.0, 59.85], [61.0, 61.05], [62.0, 63.46], [64.0, 64.57], [66.0, 66.75], [70.0, 70.95], [72.0, 73.08], [74.0, 74.8], [77.0, 77.3], [78.0, 79.47], [83.0, 84.65], [85.0, 96.15], [99.0, 113.75], [115.0, 123.8], [125.0, 126.12]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [40.95, 98.73, 0.0, 99.73, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.99, 31.55, 54.63, 0.0], "audiomae_on_audioset": [[["music", 35.95], ["hum", 13.7], ["noise", 5.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.38], ["theremin", 8.86], ["hum", 4.46]], [["music", 47.45], ["hum", 18.65], ["throbbing", 9.19]], null, null], "duration": [17.51, 6.44, 1.14, 2.2, 1.31, -0.21, 2.19, -0.23, 0.85, 0.05, 1.46, 0.57, 0.75, 0.95, 1.08, 0.8, 0.3, 1.47, 1.65, 11.15, 14.75, 8.8, 1.12]}
annotations_filtered/-1zLU5N6uBU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []}
annotations_filtered/-2KG4lLGEl0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[13.0, 13.27], [14.0, 15.26], [21.0, 21.66], [27.0, 27.48], [31.0, 32.09], [34.0, 34.03], [34.0, 34.96], [36.0, 36.54], [38.0, 39.01], [41.0, 42.52], [43.0, 43.6], [46.0, 46.41], [47.0, 49.2], [51.0, 51.33], [54.0, 55.85], [57.0, 58.55], [68.0, 68.88], [79.0, 79.73], [80.0, 80.94], [84.0, 84.54], [87.0, 87.52], [89.0, 90.24], [101.0, 101.85], [105.0, 105.51], [109.0, 109.65], [111.0, 112.77], [116.0, 116.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 1.26, 0.66, 0.48, 1.09, 0.03, 0.96, 0.54, 1.01, 1.52, 0.6, 0.41, 2.2, 0.33, 1.85, 1.55, 0.88, 0.73, 0.94, 0.54, 0.52, 1.24, 0.85, 0.51, 0.65, 1.77, 0.92]}
annotations_filtered/-2KGPYEFnsU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[14.0, 14.39], [15.0, 16.73], [17.0, 17.9], [19.0, 20.11], [24.0, 24.53], [25.0, 25.76], [29.0, 33.12], [38.0, 39.55], [41.0, 43.04], [44.0, 44.71], [46.0, 47.39], [50.0, 50.03], [52.0, 53.38], [55.0, 56.1], [59.0, 60.71], [66.0, 66.9], [73.0, 73.94], [78.0, 78.9], [81.0, 80.79], [110.0, 110.1], [116.0, 117.9], [120.0, 119.8], [125.0, 127.04], [129.0, 129.41], [132.0, 132.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.63, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 1.73, 0.9, 1.11, 0.53, 0.76, 4.12, 1.55, 2.04, 0.71, 1.39, 0.03, 1.38, 1.1, 1.71, 0.9, 0.94, 0.9, -0.21, 0.1, 1.9, -0.2, 2.04, 0.41, 0.97]}
annotations_filtered/-2QFIXEHnOY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 16.11], [19.0, 22.35], [24.0, 31.28], [33.0, 33.39], [34.0, 58.75], [59.0, 68.89]], "keep_status": [true, true, true, false, true, true], "silence_prob": [29.59, 29.9, 28.84, 0.0, 29.2, 29.4], "audiomae_on_audioset": [[["music", 34.03], ["buzz", 18.87], ["hum", 9.34]], [["hum", 17.0], ["mains hum", 12.84], ["throbbing", 7.47]], [["fly, housefly", 16.88], ["buzz", 13.34], ["mosquito", 12.24]], null, [["buzz", 13.81], ["hum", 12.07], ["electric shaver, electric razor", 6.64]], [["hum", 22.83], ["mains hum", 10.69], ["fly, housefly", 8.24]]], "duration": [10.11, 3.35, 7.28, 0.39, 24.75, 9.89]}
annotations_filtered/-37Mhsak-XI_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[44.0, 44.73], [48.0, 65.79], [68.0, 86.9], [88.0, 96.03], [97.0, 119.35], [120.0, 123.89], [125.0, 127.58]], "keep_status": [false, false, false, false, true, false, true], "silence_prob": [0.0, 31.97, 35.22, 58.05, 45.75, 58.98, 46.79], "audiomae_on_audioset": [null, [["music", 75.5], ["theremin", 5.06], ["scary music", 3.28]], [["music", 40.89], ["speech", 25.7], ["boing", 12.51]], null, [["music", 36.75], ["guitar", 18.42], ["plucked string instrument", 8.13]], null, [["music", 51.17], ["boing", 10.19], ["didgeridoo", 3.32]]], "duration": [0.73, 17.79, 18.9, 8.03, 22.35, 3.89, 2.58]}
annotations_filtered/-3KCgSpt3hU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[0.0, 0.26], [2.0, 3.81], [7.0, 6.88], [11.0, 10.98], [14.0, 16.56], [21.0, 21.47], [28.0, 28.24], [31.0, 32.36], [36.0, 37.34], [39.0, 40.07], [44.0, 46.47], [48.0, 48.44], [53.0, 54.99], [56.0, 56.88], [57.0, 58.53], [66.0, 68.28], [71.0, 72.1], [73.0, 73.55], [74.0, 78.63], [81.0, 81.43], [83.0, 84.79], [86.0, 86.05], [90.0, 91.77], [95.0, 95.66], [99.0, 100.94], [102.0, 103.57], [105.0, 105.85], [107.0, 108.28], [111.0, 112.83], [114.0, 119.4], [120.0, 121.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 1.81, -0.12, -0.02, 2.56, 0.47, 0.24, 1.36, 1.34, 1.07, 2.47, 0.44, 1.99, 0.88, 1.53, 2.28, 1.1, 0.55, 4.63, 0.43, 1.79, 0.05, 1.77, 0.66, 1.94, 1.57, 0.85, 1.28, 1.83, 5.4, 1.05]}
annotations_filtered/-3RMOO6mHr4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[32.0, 32.24], [33.0, 32.98], [38.0, 37.61], [39.0, 39.99], [47.0, 49.03], [49.0, 49.08], [78.0, 81.3], [89.0, 90.56], [99.0, 113.17]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.33, 0.0, 30.81, 0.0, 30.68], "audiomae_on_audioset": [null, null, null, null, [["livestock, farm animals, working animals", 36.74], ["moo", 21.51], ["cattle, bovinae", 13.9]], null, [["music", 20.01], ["moo", 13.1], ["speech", 11.05]], null, [["music", 72.64], ["electronic music", 5.15], ["techno", 3.8]]], "duration": [0.24, -0.02, -0.39, 0.99, 2.03, 0.08, 3.3, 1.56, 14.17]}
annotations_filtered/-3mo5CqjvWs_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.22], [7.0, 6.89], [9.0, 8.85], [25.0, 25.24], [28.0, 27.68], [31.0, 31.48]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.22, -0.11, -0.15, 0.24, -0.32, 0.48]}
annotations_filtered/-3ywc_7_IE8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[10.0, 12.68], [19.0, 37.59], [41.0, 41.98], [49.0, 63.66], [67.0, 114.02], [115.0, 123.55], [126.0, 126.84], [134.0, 134.45], [136.0, 137.25], [139.0, 138.96], [144.0, 144.83], [145.0, 145.47], [156.0, 156.44], [157.0, 157.18], [158.0, 158.57], [160.0, 161.0], [168.0, 168.49], [171.0, 173.43], [174.0, 176.01]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.31, 31.05, 0.0, 31.15, 0.0, 32.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 99.9], "audiomae_on_audioset": [[["cacophony", 9.36], ["fly, housefly", 5.02], ["cheering", 4.37]], [["fly, housefly", 54.14], ["insect", 15.95], ["bee, wasp, etc.", 11.82]], null, [["bee, wasp, etc.", 42.33], ["fly, housefly", 26.81], ["insect", 13.73]], null, [["speech", 21.02], ["whack, thwack", 12.44], ["livestock, farm animals, working animals", 5.97]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.68, 18.59, 0.98, 14.66, 47.02, 8.55, 0.84, 0.45, 1.25, -0.04, 0.83, 0.47, 0.44, 0.18, 0.57, 1.0, 0.49, 2.43, 2.01]}
annotations_filtered/-4GsCEopbd4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[32.0, 52.84], [53.0, 63.14], [64.0, 81.58], [83.0, 94.9], [97.0, 100.3], [102.0, 103.0], [104.0, 106.0], [107.0, 108.97], [110.0, 120.66], [123.0, 130.13], [132.0, 133.24], [137.0, 137.56], [139.0, 139.11], [139.0, 143.53], [144.0, 171.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [69.47, 98.51, 99.96, 100.0, 99.16, 0.0, 99.87, 0.0, 37.81, 35.33, 0.0, 0.0, 0.0, 32.88, 30.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 57.7], ["music", 12.4], ["theremin", 8.34]], [["speech", 61.66], ["explosion", 7.3], ["firecracker", 6.96]], null, null, null, [["speech", 42.44], ["fart", 13.31], ["explosion", 10.21]], [["speech", 52.19], ["fly, housefly", 9.28], ["music", 8.03]]], "duration": [20.84, 10.14, 17.58, 11.9, 3.3, 1.0, 2.0, 1.97, 10.66, 7.13, 1.24, 0.56, 0.11, 4.53, 27.59]}
annotations_filtered/-4Q-MS_oFkw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[11.0, 11.03], [13.0, 13.14], [16.0, 19.82], [24.0, 24.0], [24.0, 25.22], [28.0, 31.28], [33.0, 45.86], [48.0, 50.08], [53.0, 54.19], [57.0, 67.07], [72.0, 72.99], [73.0, 86.34], [99.0, 113.97], [118.0, 125.14]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 93.6, 0.0, 0.0, 51.88, 43.56, 93.76, 0.0, 81.0, 0.0, 48.31, 42.06, 33.06], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 38.94], ["synthesizer", 14.42], ["theremin", 3.43]], null, null, null, null, [["music", 47.22], ["speech", 21.31], ["theremin", 7.97]], [["music", 46.21], ["theremin", 24.05], ["synthesizer", 4.34]], [["music", 29.76], ["foghorn", 27.27], ["brass instrument", 3.53]]], "duration": [0.03, 0.14, 3.82, 0.0, 1.22, 3.28, 12.86, 2.08, 1.19, 10.07, 0.99, 13.34, 14.97, 7.14]}
annotations_filtered/-4QqksHXUCc_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 6.91], [8.0, 13.36], [19.0, 20.43], [22.0, 24.17], [27.0, 27.38], [43.0, 46.65], [52.0, 57.62], [58.0, 61.52], [66.0, 68.44], [72.0, 72.52], [76.0, 77.55], [90.0, 89.78], [99.0, 100.2], [107.0, 107.87], [119.0, 119.97], [121.0, 122.76], [123.0, 125.02]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 34.59, 0.0, 36.53, 0.0, 32.91, 37.86, 36.06, 34.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.59], "audiomae_on_audioset": [null, [["music", 55.86], ["throbbing", 11.97], ["electronic music", 4.41]], null, [["hum", 30.96], ["throbbing", 30.29], ["music", 20.06]], null, [["music", 59.22], ["hum", 9.81], ["throbbing", 5.74]], [["music", 60.68], ["didgeridoo", 4.99], ["moo", 3.55]], [["music", 35.65], ["speech", 24.35], ["hum", 4.25]], [["fly, housefly", 22.19], ["music", 18.42], ["insect", 14.12]], null, null, null, null, null, null, null, [["music", 23.99], ["boing", 15.45], ["didgeridoo", 13.58]]], "duration": [0.91, 5.36, 1.43, 2.17, 0.38, 3.65, 5.62, 3.52, 2.44, 0.52, 1.55, -0.22, 1.2, 0.87, 0.97, 1.76, 2.02]}
annotations_filtered/-4_rMqeyOJY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 4.99], [7.0, 13.02], [14.0, 14.57], [15.0, 16.07], [17.0, 18.4], [19.0, 20.65], [24.0, 28.92], [31.0, 32.14], [33.0, 35.72], [36.0, 37.72], [45.0, 46.35], [51.0, 51.63], [55.0, 55.59], [60.0, 60.86], [63.0, 63.73], [64.0, 64.4], [68.0, 69.03], [78.0, 79.19], [80.0, 85.9], [88.0, 89.72], [92.0, 93.21], [95.0, 107.42], [109.0, 113.54], [114.0, 121.71], [123.0, 124.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 45.72, 37.88, 43.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 67.89], ["frog", 5.36], ["insect", 3.47]], [["speech", 27.14], ["dial tone", 23.51], ["busy signal", 6.93]], [["speech", 51.05], ["throat clearing", 5.81], ["noise", 4.84]], null], "duration": [0.99, 6.02, 0.57, 1.07, 1.4, 1.65, 4.92, 1.14, 2.72, 1.72, 1.35, 0.63, 0.59, 0.86, 0.73, 0.4, 1.03, 1.19, 5.9, 1.72, 1.21, 12.42, 4.54, 7.71, 1.02]}
annotations_filtered/-5798-VRVYA_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.92], [5.0, 5.26], [6.0, 6.29], [9.0, 11.03], [11.0, 11.84], [14.0, 14.05], [17.0, 18.25], [19.0, 20.36], [21.0, 21.34], [23.0, 24.06], [27.0, 27.14], [28.0, 28.86], [30.0, 30.65], [32.0, 33.98], [37.0, 37.86], [39.0, 39.02], [40.0, 40.34], [44.0, 44.91], [46.0, 47.51], [48.0, 48.02], [49.0, 50.72], [52.0, 52.76], [54.0, 54.77], [56.0, 57.01], [58.0, 59.48], [60.0, 60.54], [62.0, 66.66], [68.0, 72.22], [73.0, 74.19], [75.0, 76.18], [77.0, 79.98], [83.0, 84.57], [87.0, 90.64], [92.0, 97.43], [98.0, 101.38], [102.0, 106.74], [107.0, 110.03], [112.0, 146.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.41, 36.03, 0.0, 0.0, 73.97, 0.0, 83.52, 48.23, 85.54, 51.5, 43.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["burping, eructation", 16.08], ["domestic animals, pets", 10.18], ["hum", 10.12]], null, null, null, null, null, [["hum", 47.0], ["mains hum", 28.83], ["speech", 6.35]], null, null, [["speech", 62.57], ["hum", 6.04], ["mains hum", 3.86]], null], "duration": [0.92, 0.26, 0.29, 2.03, 0.84, 0.05, 1.25, 1.36, 0.34, 1.06, 0.14, 0.86, 0.65, 1.98, 0.86, 0.02, 0.34, 0.91, 1.51, 0.02, 1.72, 0.76, 0.77, 1.01, 1.48, 0.54, 4.66, 4.22, 1.19, 1.18, 2.98, 1.57, 3.64, 5.43, 3.38, 4.74, 3.03, 34.74]}
annotations_filtered/-5Pku48YPFo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 8.4], [13.0, 17.25], [28.0, 31.53], [35.0, 40.85], [43.0, 93.6], [97.0, 102.05], [102.0, 102.78], [103.0, 104.14], [106.0, 109.41], [110.0, 118.64]], "keep_status": [false, true, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 34.91, 38.11, 30.81, 0.0, 32.26, 0.0, 0.0, 35.07, 75.72], "audiomae_on_audioset": [null, [["speech", 22.11], ["screaming", 17.24], ["thunk", 10.79]], [["whale vocalization", 19.7], ["dog", 10.82], ["music", 9.72]], [["music", 69.01], ["musical instrument", 4.65], ["domestic animals, pets", 2.95]], null, [["speech", 37.14], ["vehicle", 17.56], ["radio", 8.43]], null, null, [["speech", 51.87], ["vehicle", 15.02], ["hum", 3.86]], null], "duration": [0.4, 4.25, 3.53, 5.85, 50.6, 5.05, 0.78, 1.14, 3.41, 8.64]}
annotations_filtered/-5Rohhkg-7k_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 7.94], [8.0, 9.31], [10.0, 11.06], [12.0, 12.31], [14.0, 14.39], [15.0, 15.69], [16.0, 16.92], [19.0, 19.33], [20.0, 20.76], [24.0, 25.17], [27.0, 29.67], [33.0, 33.0], [37.0, 37.84], [39.0, 39.34], [40.0, 41.3], [42.0, 44.2], [46.0, 46.41], [49.0, 48.78], [51.0, 52.12], [53.0, 53.59], [56.0, 57.35], [59.0, 60.12], [61.0, 61.94], [62.0, 62.77], [64.0, 65.53], [67.0, 68.99], [72.0, 72.82], [75.0, 75.69], [77.0, 77.3], [79.0, 80.42], [84.0, 84.3], [85.0, 85.9], [87.0, 87.59], [89.0, 93.24], [95.0, 96.13], [97.0, 97.95], [100.0, 103.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 0.0, 0.0, 0.0, 0.0, 69.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 98.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 1.31, 1.06, 0.31, 0.39, 0.69, 0.92, 0.33, 0.76, 1.17, 2.67, 0.0, 0.84, 0.34, 1.3, 2.2, 0.41, -0.22, 1.12, 0.59, 1.35, 1.12, 0.94, 0.77, 1.53, 1.99, 0.82, 0.69, 0.3, 1.42, 0.3, 0.9, 0.59, 4.24, 1.13, 0.95, 3.76]}
annotations_filtered/-5be_UPkLRw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 4.06], [6.0, 6.29], [9.0, 12.5], [14.0, 16.61], [19.0, 20.55], [24.0, 30.74], [31.0, 32.48], [34.0, 33.76], [35.0, 35.63], [36.0, 40.47], [42.0, 44.19], [45.0, 46.9], [49.0, 49.62], [51.0, 52.59], [53.0, 55.44], [58.0, 58.31], [60.0, 60.81], [63.0, 63.42], [65.0, 65.94], [68.0, 68.39], [70.0, 70.63], [72.0, 72.94], [74.0, 75.36], [77.0, 77.63], [79.0, 79.93], [80.0, 83.71], [84.0, 87.1], [89.0, 89.45], [92.0, 91.83], [93.0, 102.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 0.0, 67.38, 99.99, 0.0, 99.62, 0.0, 0.0, 0.0, 100.0, 99.8, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 100.0, 0.0, 0.0, 99.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.06, 0.29, 3.5, 2.61, 1.55, 6.74, 1.48, -0.24, 0.63, 4.47, 2.19, 1.9, 0.62, 1.59, 2.44, 0.31, 0.81, 0.42, 0.94, 0.39, 0.63, 0.94, 1.36, 0.63, 0.93, 3.71, 3.1, 0.45, -0.17, 9.32]}
annotations_filtered/-5twCD8tAMc_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 23.65], [25.0, 25.08], [27.0, 28.24], [29.0, 30.91], [35.0, 35.61], [38.0, 42.33], [44.0, 75.29], [76.0, 76.72], [81.0, 89.38]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [33.09, 0.0, 0.0, 0.0, 0.0, 41.56, 0.0, 0.0, 30.12], "audiomae_on_audioset": [[["music", 83.83], ["theremin", 1.62], ["synthesizer", 1.3]], null, null, null, null, [["boat, water vehicle", 16.83], ["music", 14.4], ["vehicle", 11.07]], null, null, [["music", 72.52], ["musical instrument", 4.87], ["cacophony", 2.86]]], "duration": [15.65, 0.08, 1.24, 1.91, 0.61, 4.33, 31.29, 0.72, 8.38]}
annotations_filtered/-64q4HpZyaY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 10.61], [12.0, 12.16], [13.0, 79.49], [80.0, 109.46], [111.0, 112.77], [116.0, 117.36], [119.0, 124.24]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [31.4, 0.0, 0.0, 69.07, 0.0, 0.0, 63.96], "audiomae_on_audioset": [[["fly, housefly", 24.9], ["mains hum", 24.38], ["hum", 14.07]], null, null, null, null, null, null], "duration": [7.61, 0.16, 66.49, 29.46, 1.77, 1.36, 5.24]}
annotations_filtered/-6fuDrAmhNc_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[24.0, 26.13], [27.0, 28.88], [32.0, 32.17], [33.0, 38.03], [38.0, 40.19], [41.0, 44.02], [45.0, 46.45], [47.0, 47.63], [49.0, 49.91], [54.0, 54.67], [55.0, 56.32], [58.0, 58.46], [61.0, 61.74], [62.0, 63.98], [65.0, 65.4], [69.0, 69.99], [73.0, 73.89], [75.0, 76.54], [78.0, 84.0], [88.0, 97.07], [98.0, 98.78], [103.0, 155.43], [159.0, 179.0]], "keep_status": [false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [37.01, 0.0, 0.0, 43.45, 32.83, 35.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.32, 31.62, 0.0, 0.0, 34.35], "audiomae_on_audioset": [[["hum", 40.54], ["mains hum", 26.25], ["speech", 5.13]], null, null, [["hum", 22.65], ["mains hum", 17.99], ["music", 17.63]], [["music", 31.89], ["speech", 15.71], ["cattle, bovinae", 7.73]], [["music", 29.62], ["foghorn", 13.93], ["speech", 6.49]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.31], ["theremin", 11.38], ["hum", 2.41]], [["music", 53.67], ["brass instrument", 12.72], ["musical instrument", 8.37]], null, null, [["music", 40.6], ["didgeridoo", 12.31], ["gong", 10.97]]], "duration": [2.13, 1.88, 0.17, 5.03, 2.19, 3.02, 1.45, 0.63, 0.91, 0.67, 1.32, 0.46, 0.74, 1.98, 0.4, 0.99, 0.89, 1.54, 6.0, 9.07, 0.78, 52.43, 20.0]}
annotations_filtered/-7-2-088LnM_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[22.0, 22.2], [23.0, 22.92], [23.0, 25.52], [28.0, 30.13], [35.0, 36.71], [40.0, 42.08], [44.0, 45.2], [45.0, 46.09], [46.0, 48.91], [49.0, 49.25], [50.0, 50.72], [51.0, 52.47], [53.0, 57.54], [59.0, 67.63], [70.0, 72.08], [72.0, 74.56], [82.0, 82.93], [87.0, 99.28], [99.0, 99.5], [100.0, 100.01], [100.0, 100.45], [101.0, 109.46]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 39.47, 36.04, 0.0, 97.11, 0.0, 0.0, 66.63, 0.0, 0.0, 0.0, 71.14, 67.63, 98.99, 43.85, 0.0, 37.46, 0.0, 0.0, 0.0, 42.74], "audiomae_on_audioset": [null, null, [["whale vocalization", 16.24], ["boing", 16.19], ["moo", 10.98]], [["speech", 72.48], ["applause", 5.84], ["radio", 2.77]], null, null, null, null, null, null, null, null, null, null, null, [["music", 62.7], ["burping, eructation", 2.31], ["percussion", 1.49]], null, [["music", 60.25], ["groan", 6.88], ["grunt", 5.85]], null, null, null, [["gasp", 19.11], ["speech", 13.68], ["breaking", 11.58]]], "duration": [0.2, -0.08, 2.52, 2.13, 1.71, 2.08, 1.2, 1.09, 2.91, 0.25, 0.72, 1.47, 4.54, 8.63, 2.08, 2.56, 0.93, 12.28, 0.5, 0.01, 0.45, 8.46]}
annotations_filtered/-7-C6lSAfOs_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[30.0, 76.38], [77.0, 76.99], [79.0, 79.69], [80.0, 81.9], [83.0, 83.78], [85.0, 103.96], [107.0, 107.38], [112.0, 113.68]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.04, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 58.1], ["synthesizer", 6.42], ["musical instrument", 3.74]], null, null], "duration": [46.38, -0.01, 0.69, 1.9, 0.78, 18.96, 0.38, 1.68]}
annotations_filtered/-78FgmNwyD4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 1.0], [1.0, 1.16], [16.0, 16.8], [36.0, 36.1], [36.0, 37.08], [39.0, 41.34], [48.0, 48.9], [50.0, 50.38], [56.0, 56.52], [58.0, 58.78], [64.0, 64.3], [66.0, 66.85], [67.0, 76.86], [82.0, 82.63], [83.0, 83.62], [84.0, 84.59], [100.0, 101.29], [102.0, 102.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.14, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.84], ["groan", 22.6], ["screaming", 2.61]], null, null, null, null, null], "duration": [0.0, 0.16, 0.8, 0.1, 1.08, 2.34, 0.9, 0.38, 0.52, 0.78, 0.3, 0.85, 9.86, 0.63, 0.62, 0.59, 1.29, 0.12]}
annotations_filtered/-7Sow81yi24_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[32.0, 32.53], [33.0, 38.33], [40.0, 42.58], [44.0, 45.69], [47.0, 63.64], [64.0, 66.07], [67.0, 73.43], [75.0, 76.65], [77.0, 79.95], [81.0, 84.52], [86.0, 89.21], [94.0, 96.35], [100.0, 101.29], [102.0, 103.87], [107.0, 107.33], [109.0, 110.39], [114.0, 124.66]], "keep_status": [false, true, false, false, false, true, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 49.92, 54.9, 0.0, 47.94, 35.61, 38.42, 0.0, 43.15, 38.54, 36.11, 45.14, 0.0, 0.0, 0.0, 0.0, 28.26], "audiomae_on_audioset": [null, [["music", 25.69], ["hum", 11.38], ["speech", 11.19]], null, null, [["hum", 39.29], ["mains hum", 20.44], ["music", 15.13]], [["gong", 43.33], ["hum", 9.03], ["singing bowl", 6.05]], [["hum", 50.46], ["throbbing", 24.51], ["mains hum", 10.71]], null, [["music", 41.92], ["mains hum", 17.04], ["hum", 14.08]], [["music", 40.52], ["mains hum", 12.71], ["hum", 12.62]], [["hum", 25.29], ["music", 24.57], ["mains hum", 18.16]], [["music", 60.94], ["theremin", 7.71], ["musical instrument", 3.84]], null, null, null, null, [["music", 56.16], ["vehicle", 7.08], ["car", 4.84]]], "duration": [0.53, 5.33, 2.58, 1.69, 16.64, 2.07, 6.43, 1.65, 2.95, 3.52, 3.21, 2.35, 1.29, 1.87, 0.33, 1.39, 10.66]}
annotations_filtered/-7cV5cWQmxg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 6.34], [8.0, 8.5], [9.0, 9.83], [17.0, 18.98], [21.0, 21.37], [22.0, 23.33], [27.0, 28.56], [32.0, 33.91], [34.0, 38.38], [39.0, 40.36], [42.0, 61.25], [64.0, 66.39], [68.0, 73.47], [80.0, 79.89], [80.0, 80.2], [88.0, 94.09]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.01, 0.0, 41.98, 94.81, 37.09, 0.0, 0.0, 41.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 28.43], ["music", 28.37], ["synthesizer", 5.19]], null, [["mosquito", 27.65], ["fly, housefly", 20.31], ["insect", 8.7]], null, [["speech", 72.72], ["stomach rumble", 4.04], ["animal", 2.28]], null, null, [["speech", 19.75], ["music", 18.08], ["throbbing", 13.72]]], "duration": [0.34, 0.5, 0.83, 1.98, 0.37, 1.33, 1.56, 1.91, 4.38, 1.36, 19.25, 2.39, 5.47, -0.11, 0.2, 6.09]}
annotations_filtered/-7krYJUfFv4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 8.58], [9.0, 10.77], [11.0, 11.94], [13.0, 14.71], [15.0, 16.53], [18.0, 19.45], [20.0, 20.78], [31.0, 31.26], [34.0, 34.37], [41.0, 41.52], [42.0, 42.4], [43.0, 43.65], [45.0, 45.25], [47.0, 47.73], [49.0, 49.59], [50.0, 50.63], [53.0, 54.16], [56.0, 56.03], [62.0, 63.31], [65.0, 65.69], [68.0, 68.22], [81.0, 81.48], [92.0, 92.75], [106.0, 107.37], [109.0, 109.34], [110.0, 111.01], [112.0, 112.08], [113.0, 113.48], [114.0, 114.15], [119.0, 119.03], [124.0, 126.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.58, 1.77, 0.94, 1.71, 1.53, 1.45, 0.78, 0.26, 0.37, 0.52, 0.4, 0.65, 0.25, 0.73, 0.59, 0.63, 1.16, 0.03, 1.31, 0.69, 0.22, 0.48, 0.75, 1.37, 0.34, 1.01, 0.08, 0.48, 0.15, 0.03, 2.66]}
annotations_filtered/-7mzQx0ebqk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.64], [10.0, 10.27], [14.0, 14.88], [19.0, 20.17], [23.0, 23.01], [24.0, 28.61], [32.0, 34.43], [43.0, 43.29], [45.0, 45.52], [49.0, 49.55], [54.0, 54.06], [62.0, 63.85], [65.0, 72.45], [75.0, 79.84], [82.0, 82.54], [86.0, 89.4], [96.0, 97.44], [98.0, 100.3], [126.0, 125.73], [128.0, 127.7], [131.0, 132.16], [133.0, 133.22], [135.0, 136.95], [141.0, 141.61], [144.0, 143.95], [145.0, 148.66]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 48.27, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 61.67, 60.05, 0.0, 94.22, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7], "audiomae_on_audioset": [null, null, null, null, null, [["singing bowl", 23.82], ["music", 21.45], ["burping, eructation", 15.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.27, 0.88, 1.17, 0.01, 4.61, 2.43, 0.29, 0.52, 0.55, 0.06, 1.85, 7.45, 4.84, 0.54, 3.4, 1.44, 2.3, -0.27, -0.3, 1.16, 0.22, 1.95, 0.61, -0.05, 3.66]}
annotations_filtered/-85ubSkzSWg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 7.99], [15.0, 14.64], [16.0, 20.71], [22.0, 22.96], [23.0, 23.62], [24.0, 24.85], [25.0, 27.18], [28.0, 30.72], [32.0, 33.2], [33.0, 34.4], [36.0, 36.54], [38.0, 40.76], [42.0, 42.84], [44.0, 45.91], [48.0, 50.75], [56.0, 66.06]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 38.46, 0.0, 0.0, 0.0, 35.38, 34.84, 0.0, 0.0, 0.0, 33.42, 0.0, 0.0, 42.11, 33.01], "audiomae_on_audioset": [null, null, [["music", 56.86], ["musical instrument", 5.27], ["synthesizer", 3.65]], null, null, null, [["speech", 53.41], ["music", 20.83], ["radio", 4.67]], [["music", 21.99], ["mains hum", 19.4], ["hum", 13.14]], null, null, null, [["music", 32.01], ["speech", 25.74], ["radio", 9.71]], null, null, [["hum", 30.98], ["speech", 20.05], ["music", 8.82]], [["hum", 22.59], ["sidetone", 20.95], ["mains hum", 18.14]]], "duration": [1.99, -0.36, 4.71, 0.96, 0.62, 0.85, 2.18, 2.72, 1.2, 1.4, 0.54, 2.76, 0.84, 1.91, 2.75, 10.06]}
annotations_filtered/-8ajIeIeJpY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 0.89], [3.0, 5.76], [6.0, 6.86], [8.0, 8.73], [14.0, 15.4], [19.0, 19.99], [22.0, 23.03], [24.0, 24.53], [26.0, 26.33], [34.0, 33.86], [35.0, 35.43], [36.0, 36.31], [37.0, 37.89], [38.0, 39.29], [42.0, 43.29], [44.0, 44.58], [45.0, 45.4], [46.0, 46.4], [48.0, 48.32], [57.0, 57.15], [58.0, 59.56], [60.0, 61.32], [63.0, 63.66], [68.0, 68.47], [74.0, 76.0], [77.0, 78.85], [81.0, 85.8], [86.0, 86.41], [89.0, 90.75], [91.0, 91.93], [92.0, 92.62], [93.0, 93.85]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.92, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 34.69], ["radio", 21.67], ["croak", 11.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.11, 2.76, 0.86, 0.73, 1.4, 0.99, 1.03, 0.53, 0.33, -0.14, 0.43, 0.31, 0.89, 1.29, 1.29, 0.58, 0.4, 0.4, 0.32, 0.15, 1.56, 1.32, 0.66, 0.47, 2.0, 1.85, 4.8, 0.41, 1.75, 0.93, 0.62, 0.85]}
annotations_filtered/-98BSUhcZtY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[17.0, 16.95], [23.0, 24.24], [33.0, 34.2], [39.0, 41.27], [43.0, 44.42], [47.0, 47.7]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 47.69], ["mains hum", 18.88], ["throbbing", 10.53]], null, null], "duration": [-0.05, 1.24, 1.2, 2.27, 1.42, 0.7]}
annotations_filtered/-9DrPi3ki0g_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 20.28], [22.0, 45.76]], "keep_status": [false, true], "silence_prob": [34.74, 33.61], "audiomae_on_audioset": [[["music", 49.81], ["theremin", 33.23], ["vehicle", 1.7]], [["music", 44.88], ["brass instrument", 11.34], ["trombone", 7.67]]], "duration": [8.28, 23.76]}
annotations_filtered/-9IgLueodZA_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 4.73], [7.0, 9.44], [10.0, 11.7], [15.0, 15.26], [24.0, 24.09], [25.0, 27.26], [28.0, 33.27], [37.0, 37.32], [38.0, 39.36], [41.0, 47.78], [50.0, 53.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.28, 0.0, 0.0, 0.0, 65.44, 69.74, 0.0, 0.0, 100.0, 92.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 2.44, 1.7, 0.26, 0.09, 2.26, 5.27, 0.32, 1.36, 6.78, 3.38]}
annotations_filtered/-9P7Ge1KmTY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 4.02], [5.0, 4.7], [5.0, 5.78], [7.0, 8.72], [32.0, 33.22], [38.0, 39.5], [41.0, 42.06], [47.0, 48.24], [51.0, 50.75], [51.0, 52.86], [54.0, 54.65], [65.0, 65.82], [69.0, 68.99], [76.0, 76.65], [79.0, 78.98], [81.0, 80.94], [84.0, 85.06], [87.0, 89.92], [91.0, 91.72], [92.0, 93.43], [95.0, 97.58], [106.0, 107.76], [111.0, 111.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.32, 0.0, 0.0, 96.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 65.48], ["telephone", 13.06], ["hum", 5.47]], null, null, null, null, null], "duration": [0.02, -0.3, 0.78, 1.72, 1.22, 1.5, 1.06, 1.24, -0.25, 1.86, 0.65, 0.82, -0.01, 0.65, -0.02, -0.06, 1.06, 2.92, 0.72, 1.43, 2.58, 1.76, 0.35]}
annotations_filtered/-A-fBbIXbPo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 9.78], [13.0, 14.96], [16.0, 20.09], [22.0, 24.02], [25.0, 26.28], [28.0, 33.52], [36.0, 40.32], [41.0, 52.84], [54.0, 59.63], [61.0, 71.81], [73.0, 72.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.48, 0.0, 97.73, 100.0, 0.0, 99.99, 99.93, 96.42, 94.07, 74.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [5.78, 1.96, 4.09, 2.02, 1.28, 5.52, 4.32, 11.84, 5.63, 10.81, -0.21]}
annotations_filtered/-A9rFt7ITy4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[34.0, 33.86], [36.0, 36.41], [38.0, 39.02], [42.0, 43.14], [45.0, 45.82], [46.0, 47.26], [48.0, 48.44], [50.0, 50.4], [51.0, 51.24], [53.0, 52.89], [58.0, 58.35], [62.0, 62.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.14, 0.41, 1.02, 1.14, 0.82, 1.26, 0.44, 0.4, 0.24, -0.11, 0.35, 0.51]}