bpiyush commited on
Commit
9cb3c99
·
1 Parent(s): 919bb66
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. annotations_filtered/n-5bVE4K2Ls_filtered.json +1 -0
  2. annotations_filtered/n-mpifTiPV4_filtered.json +1 -0
  3. annotations_filtered/n-omBTsCIDE_filtered.json +1 -0
  4. annotations_filtered/n0Fz-ACCMHk_filtered.json +1 -0
  5. annotations_filtered/n0QO2xOuqp0_filtered.json +1 -0
  6. annotations_filtered/n13FhFrtu_8_filtered.json +1 -0
  7. annotations_filtered/n16wkJDq2VQ_filtered.json +1 -0
  8. annotations_filtered/n16wxs5pgvk_filtered.json +1 -0
  9. annotations_filtered/n1BXpNTsoB8_filtered.json +1 -0
  10. annotations_filtered/n1GlWng3oOQ_filtered.json +1 -0
  11. annotations_filtered/n1TqCGEBdLw_filtered.json +1 -0
  12. annotations_filtered/n1VEmXiaFY4_filtered.json +1 -0
  13. annotations_filtered/n1X2w0tinkg_filtered.json +1 -0
  14. annotations_filtered/n1lQR-GjWYw_filtered.json +1 -0
  15. annotations_filtered/n1lbpj6868o_filtered.json +1 -0
  16. annotations_filtered/n1pSObsJ_hk_filtered.json +1 -0
  17. annotations_filtered/n2A194yTWoQ_filtered.json +1 -0
  18. annotations_filtered/n2YCseaZK0Q_filtered.json +1 -0
  19. annotations_filtered/n2ZkOcq4vWU_filtered.json +1 -0
  20. annotations_filtered/n2lTpPptOWA_filtered.json +1 -0
  21. annotations_filtered/n3BgbwW6PXc_filtered.json +1 -0
  22. annotations_filtered/n3K6Fkd5ri8_filtered.json +1 -0
  23. annotations_filtered/n3L8UVTe6Ak_filtered.json +1 -0
  24. annotations_filtered/n3PGfjyctSQ_filtered.json +1 -0
  25. annotations_filtered/n3SrAOdy-tE_filtered.json +1 -0
  26. annotations_filtered/n3Y6B_UKam0_filtered.json +1 -0
  27. annotations_filtered/n3tXVrGw3kY_filtered.json +1 -0
  28. annotations_filtered/n44APWaJZ58_filtered.json +1 -0
  29. annotations_filtered/n4BJBz8GpzI_filtered.json +1 -0
  30. annotations_filtered/n4Mohc3SrHs_filtered.json +1 -0
  31. annotations_filtered/n4bsNkDyF2s_filtered.json +1 -0
  32. annotations_filtered/n4pUbyGBD18_filtered.json +1 -0
  33. annotations_filtered/n59mG9_X35Q_filtered.json +1 -0
  34. annotations_filtered/n5ArS3Got4U_filtered.json +1 -0
  35. annotations_filtered/n5HtgUGCM30_filtered.json +1 -0
  36. annotations_filtered/n5PnSNCFBYs_filtered.json +1 -0
  37. annotations_filtered/n5tMCxz-9uY_filtered.json +1 -0
  38. annotations_filtered/n6H7zga2Ks0_filtered.json +1 -0
  39. annotations_filtered/n75PgMSxAOw_filtered.json +1 -0
  40. annotations_filtered/n7KKfjFRw8w_filtered.json +1 -0
  41. annotations_filtered/n7W0yxKnuvs_filtered.json +1 -0
  42. annotations_filtered/n7cRx_7umjE_filtered.json +1 -0
  43. annotations_filtered/n7l2RLvI7Ss_filtered.json +1 -0
  44. annotations_filtered/n86CV7VKvfE_filtered.json +1 -0
  45. annotations_filtered/n8mK-A_0viA_filtered.json +1 -0
  46. annotations_filtered/n8yUoQP6Rwo_filtered.json +1 -0
  47. annotations_filtered/n9-Wk6ulBuA_filtered.json +1 -0
  48. annotations_filtered/n92XBsqbSF4_filtered.json +1 -0
  49. annotations_filtered/n94um7eDILg_filtered.json +1 -0
  50. annotations_filtered/n9L9jMlulXI_filtered.json +1 -0
annotations_filtered/n-5bVE4K2Ls_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 7.23], [9.0, 16.58], [19.0, 19.36], [25.0, 25.57], [26.0, 29.52], [30.0, 31.82], [32.0, 34.52], [35.0, 36.64], [40.0, 43.68], [44.0, 44.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 99.95, 0.0, 0.0, 99.97, 0.0, 87.74, 0.0, 99.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [3.23, 7.58, 0.36, 0.57, 3.52, 1.82, 2.52, 1.64, 3.68, 0.98]}
annotations_filtered/n-mpifTiPV4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[13.0, 13.96], [14.0, 16.41], [17.0, 18.1], [18.0, 19.52], [21.0, 25.05], [26.0, 26.59], [28.0, 28.07], [34.0, 34.79], [37.0, 37.27], [42.0, 44.0], [46.0, 46.14], [50.0, 52.25], [53.0, 53.57], [61.0, 61.3], [66.0, 66.04], [66.0, 66.5], [73.0, 74.83], [82.0, 82.34], [84.0, 84.08], [85.0, 87.61], [88.0, 88.53], [95.0, 95.3], [96.0, 96.42], [100.0, 100.18], [102.0, 102.3], [106.0, 106.54], [107.0, 107.35], [107.0, 107.76], [109.0, 108.95], [109.0, 111.42], [119.0, 121.76], [125.0, 125.47], [127.0, 127.3]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 35.26, 0.0, 0.0, 59.15, 0.0, 0.0, 0.0, 0.0, 76.86, 0.0, 31.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.94, 43.93, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 21.96], ["mains hum", 21.32], ["sidetone", 11.87]], null, null, null, null, null, null, null, null, null, [["speech", 21.04], ["chirp tone", 10.42], ["sneeze", 8.94]], null, null, null, null, null, null, null, [["speech", 30.16], ["animal", 21.5], ["dog", 6.3]], null, null, null, null, null, null, null, null, null, [["fly, housefly", 24.63], ["hum", 16.92], ["mains hum", 10.41]], [["speech", 47.12], ["hum", 8.4], ["throbbing", 3.93]], null, null], "duration": [0.96, 2.41, 1.1, 1.52, 4.05, 0.59, 0.07, 0.79, 0.27, 2.0, 0.14, 2.25, 0.57, 0.3, 0.04, 0.5, 1.83, 0.34, 0.08, 2.61, 0.53, 0.3, 0.42, 0.18, 0.3, 0.54, 0.35, 0.76, -0.05, 2.42, 2.76, 0.47, 0.3]}
annotations_filtered/n-omBTsCIDE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 9.83], [10.0, 10.61], [11.0, 11.47], [15.0, 15.16], [19.0, 23.18], [25.0, 25.08], [27.0, 27.13], [28.0, 29.91], [31.0, 31.11], [32.0, 37.4], [39.0, 39.06], [45.0, 45.12], [56.0, 59.68], [63.0, 63.19], [64.0, 64.91], [67.0, 67.07], [78.0, 78.93], [96.0, 96.69], [109.0, 109.98], [117.0, 119.33], [122.0, 122.98], [123.0, 123.97], [125.0, 125.41], [127.0, 128.68]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.61, 0.0, 0.0, 0.0, 44.43, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.17, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 13.01], ["hum", 11.37], ["bouncing", 7.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.83, 0.61, 0.47, 0.16, 4.18, 0.08, 0.13, 1.91, 0.11, 5.4, 0.06, 0.12, 3.68, 0.19, 0.91, 0.07, 0.93, 0.69, 0.98, 2.33, 0.98, 0.97, 0.41, 1.68]}
annotations_filtered/n0Fz-ACCMHk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[15.0, 15.01], [24.0, 24.33], [26.0, 28.31], [29.0, 29.49], [33.0, 33.32], [36.0, 36.19], [39.0, 39.66], [40.0, 41.34], [42.0, 42.28], [46.0, 47.44], [48.0, 49.87], [51.0, 60.72], [61.0, 62.61], [64.0, 66.77], [68.0, 69.52], [70.0, 71.51], [72.0, 74.6], [75.0, 76.25], [78.0, 78.7], [79.0, 79.88], [83.0, 84.23], [85.0, 85.53], [89.0, 91.98], [96.0, 99.12], [101.0, 101.85], [102.0, 107.15], [107.0, 109.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.8, 35.8, 0.0, 59.42, 69.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["clang", 15.67], ["boing", 13.66], ["arrow", 13.61]], null, null, null], "duration": [0.01, 0.33, 2.31, 0.49, 0.32, 0.19, 0.66, 1.34, 0.28, 1.44, 1.87, 9.72, 1.61, 2.77, 1.52, 1.51, 2.6, 1.25, 0.7, 0.88, 1.23, 0.53, 2.98, 3.12, 0.85, 5.15, 2.27]}
annotations_filtered/n0QO2xOuqp0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 5.09], [13.0, 23.8], [26.0, 25.84], [28.0, 28.54], [34.0, 34.97], [40.0, 42.36], [44.0, 49.52], [54.0, 57.87], [63.0, 79.02], [83.0, 93.51], [97.0, 98.81], [105.0, 105.21], [110.0, 115.16], [126.0, 132.81], [145.0, 147.56], [154.0, 157.3], [158.0, 158.16], [159.0, 160.88], [162.0, 167.81]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [30.79, 29.02, 0.0, 0.0, 0.0, 28.97, 28.98, 29.49, 28.84, 29.21, 0.0, 0.0, 28.9, 28.81, 29.18, 29.53, 0.0, 0.0, 28.78], "audiomae_on_audioset": [[["music", 60.94], ["throbbing", 9.68], ["sidetone", 2.85]], [["smash, crash", 44.44], ["whack, thwack", 22.46], ["music", 22.03]], null, null, null, [["music", 23.22], ["speech", 16.01], ["cattle, bovinae", 8.83]], [["speech", 39.6], ["vehicle", 12.86], ["music", 9.58]], [["music", 56.91], ["speech", 30.17], ["sidetone", 2.35]], [["music", 78.33], ["speech", 3.14], ["whip", 1.98]], [["music", 52.14], ["cacophony", 8.1], ["throbbing", 7.43]], null, null, [["music", 64.81], ["speech", 14.85], ["boing", 5.07]], [["music", 71.59], ["speech", 5.9], ["musical instrument", 1.61]], [["music", 36.66], ["speech", 27.72], ["electronic music", 7.16]], [["music", 46.65], ["throbbing", 28.08], ["hum", 7.3]], null, null, [["throbbing", 56.65], ["music", 15.17], ["hum", 14.51]]], "duration": [2.09, 10.8, -0.16, 0.54, 0.97, 2.36, 5.52, 3.87, 16.02, 10.51, 1.81, 0.21, 5.16, 6.81, 2.56, 3.3, 0.16, 1.88, 5.81]}
annotations_filtered/n13FhFrtu_8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 12.51], [14.0, 15.08], [15.0, 17.02], [19.0, 24.36], [26.0, 27.45], [30.0, 31.16], [33.0, 35.36], [39.0, 40.14], [43.0, 45.52], [50.0, 59.8], [63.0, 64.23], [66.0, 66.56], [68.0, 68.28], [70.0, 70.36], [72.0, 73.7], [79.0, 79.71], [80.0, 80.87], [82.0, 83.17], [85.0, 92.08], [96.0, 100.03], [101.0, 102.22], [107.0, 107.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.56, 47.78, 0.0, 0.0, 98.36, 0.0, 100.0, 64.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.31, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 56.64], ["sidetone", 12.66], ["telephone", 7.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 1.08, 2.02, 5.36, 1.45, 1.16, 2.36, 1.14, 2.52, 9.8, 1.23, 0.56, 0.28, 0.36, 1.7, 0.71, 0.87, 1.17, 7.08, 4.03, 1.22, 0.82]}
annotations_filtered/n16wkJDq2VQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 5.9], [11.0, 11.06], [23.0, 23.11], [24.0, 25.84], [26.0, 27.97], [31.0, 31.43], [36.0, 37.66], [38.0, 44.25], [45.0, 47.76], [48.0, 50.08], [51.0, 51.34], [53.0, 53.37], [54.0, 55.29], [58.0, 58.58], [63.0, 64.1], [68.0, 68.77], [70.0, 71.59], [76.0, 76.42], [77.0, 78.27], [81.0, 86.83], [91.0, 94.07], [97.0, 97.71], [99.0, 100.36], [101.0, 105.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 99.52, 76.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 37.93, 0.0, 0.0, 98.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 65.27], ["noise", 2.9], ["beatboxing", 2.48]], null, null, null], "duration": [-0.1, 0.06, 0.11, 1.84, 1.97, 0.43, 1.66, 6.25, 2.76, 2.08, 0.34, 0.37, 1.29, 0.58, 1.1, 0.77, 1.59, 0.42, 1.27, 5.83, 3.07, 0.71, 1.36, 4.54]}
annotations_filtered/n16wxs5pgvk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[19.0, 18.67], [42.0, 42.58], [43.0, 45.64], [69.0, 69.43], [77.0, 80.89], [94.0, 95.07], [97.0, 101.11], [118.0, 118.96]], "keep_status": [false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 45.75, 0.0, 31.95, 0.0, 31.16, 0.0], "audiomae_on_audioset": [null, null, [["fart", 32.51], ["speech", 12.62], ["noise", 7.27]], null, [["speech", 77.2], ["fart", 4.37], ["noise", 4.13]], null, [["music", 54.81], ["trombone", 8.35], ["brass instrument", 5.45]], null], "duration": [-0.33, 0.58, 2.64, 0.43, 3.89, 1.07, 4.11, 0.96]}
annotations_filtered/n1BXpNTsoB8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[29.0, 30.16], [31.0, 32.63], [40.0, 40.51], [41.0, 42.16], [47.0, 47.19], [48.0, 50.14], [51.0, 52.88], [55.0, 57.96], [59.0, 60.32], [63.0, 65.26], [68.0, 69.03], [71.0, 71.29], [74.0, 77.94], [79.0, 79.57], [80.0, 81.82], [83.0, 83.12], [86.0, 86.26], [87.0, 86.95], [87.0, 87.89], [89.0, 89.85], [90.0, 91.79], [93.0, 94.36], [95.0, 95.98], [97.0, 98.63], [99.0, 100.87], [105.0, 106.15], [109.0, 110.05], [110.0, 111.35], [113.0, 113.53], [118.0, 118.69], [121.0, 124.07], [125.0, 125.9], [127.0, 128.75]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.54, 0.0, 60.32, 0.0, 45.78, 0.0, 0.0, 43.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.66, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 63.7], ["sine wave", 7.09], ["music", 4.74]], null, null, null, [["speech", 36.9], ["sidetone", 19.63], ["busy signal", 6.28]], null, null, [["speech", 71.66], ["dial tone", 8.55], ["busy signal", 2.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 1.63, 0.51, 1.16, 0.19, 2.14, 1.88, 2.96, 1.32, 2.26, 1.03, 0.29, 3.94, 0.57, 1.82, 0.12, 0.26, -0.05, 0.89, 0.85, 1.79, 1.36, 0.98, 1.63, 1.87, 1.15, 1.05, 1.35, 0.53, 0.69, 3.07, 0.9, 1.75]}
annotations_filtered/n1GlWng3oOQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[56.0, 58.31], [59.0, 59.9], [60.0, 62.29], [63.0, 64.64], [66.0, 68.98], [70.0, 78.22], [79.0, 82.46], [84.0, 87.86], [89.0, 90.14], [91.0, 93.82], [95.0, 96.11], [97.0, 99.32], [100.0, 102.07], [103.0, 115.96], [116.0, 119.65], [120.0, 127.95], [131.0, 131.84], [133.0, 133.93], [135.0, 136.41], [138.0, 139.09], [140.0, 148.0], [149.0, 155.56], [156.0, 159.0], [160.0, 164.69], [165.0, 168.84], [170.0, 174.85], [176.0, 177.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [51.23, 0.0, 62.78, 0.0, 64.29, 58.38, 74.29, 85.9, 0.0, 98.36, 0.0, 92.97, 97.33, 58.47, 77.36, 62.99, 0.0, 0.0, 0.0, 0.0, 56.86, 56.86, 69.47, 73.67, 57.89, 53.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.31, 0.9, 2.29, 1.64, 2.98, 8.22, 3.46, 3.86, 1.14, 2.82, 1.11, 2.32, 2.07, 12.96, 3.65, 7.95, 0.84, 0.93, 1.41, 1.09, 8.0, 6.56, 3.0, 4.69, 3.84, 4.85, 1.96]}
annotations_filtered/n1TqCGEBdLw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[14.0, 54.99], [56.0, 70.29]], "keep_status": [false, false], "silence_prob": [0.0, 60.05], "audiomae_on_audioset": [null, null], "duration": [40.99, 14.29]}
annotations_filtered/n1VEmXiaFY4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[86.0, 107.08], [108.0, 110.08], [117.0, 120.04], [122.0, 127.04], [129.0, 135.14], [137.0, 143.31], [143.0, 147.72], [148.0, 149.45], [153.0, 155.78], [162.0, 162.5]], "keep_status": [false, true, false, false, false, true, false, false, false, false], "silence_prob": [31.51, 46.68, 64.63, 53.84, 61.37, 48.95, 40.92, 0.0, 99.44, 0.0], "audiomae_on_audioset": [[["music", 61.4], ["hum", 10.88], ["throbbing", 7.79]], [["speech", 26.03], ["music", 20.1], ["hum", 14.09]], null, null, null, [["music", 29.49], ["gong", 13.49], ["singing bowl", 9.7]], [["speech", 67.48], ["music", 19.33], ["sidetone", 2.92]], null, null, null], "duration": [21.08, 2.08, 3.04, 5.04, 6.14, 6.31, 4.72, 1.45, 2.78, 0.5]}
annotations_filtered/n1X2w0tinkg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 9.02], [14.0, 16.93], [22.0, 26.4], [29.0, 87.59], [90.0, 105.68], [106.0, 125.29]], "keep_status": [true, true, false, false, false, false], "silence_prob": [39.85, 43.58, 54.3, 0.0, 32.94, 37.35], "audiomae_on_audioset": [[["music", 57.55], ["didgeridoo", 8.15], ["synthesizer", 3.68]], [["music", 56.13], ["theremin", 8.61], ["musical instrument", 3.59]], null, null, [["music", 60.09], ["theremin", 14.39], ["ambient music", 6.25]], [["music", 70.8], ["foghorn", 7.37], ["didgeridoo", 4.55]]], "duration": [3.02, 2.93, 4.4, 58.59, 15.68, 19.29]}
annotations_filtered/n1lQR-GjWYw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[31.0, 64.84], [66.0, 67.85], [69.0, 81.4], [85.0, 101.36], [105.0, 111.99], [113.0, 119.79], [121.0, 125.17]], "keep_status": [false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 30.02, 30.19, 29.35, 30.89, 29.99], "audiomae_on_audioset": [null, null, [["music", 43.79], ["groan", 7.15], ["whack, thwack", 6.87]], [["music", 33.3], ["speech", 22.24], ["fart", 10.8]], [["music", 74.79], ["theremin", 3.69], ["whack, thwack", 2.87]], [["music", 51.94], ["smash, crash", 26.8], ["whack, thwack", 8.78]], [["moo", 23.6], ["livestock, farm animals, working animals", 22.8], ["cattle, bovinae", 19.08]]], "duration": [33.84, 1.85, 12.4, 16.36, 6.99, 6.79, 4.17]}
annotations_filtered/n1lbpj6868o_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[34.0, 39.41], [62.0, 62.51], [86.0, 87.47], [88.0, 88.72], [90.0, 90.86], [98.0, 100.75], [108.0, 109.81], [114.0, 115.52], [117.0, 118.89], [119.0, 119.74], [120.0, 121.44], [123.0, 126.28]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [66.27, 0.0, 0.0, 0.0, 0.0, 40.12, 0.0, 0.0, 0.0, 0.0, 0.0, 34.08], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 38.93], ["music", 19.81], ["sidetone", 10.94]], null, null, null, null, null, [["music", 36.53], ["speech", 32.84], ["whack, thwack", 2.31]]], "duration": [5.41, 0.51, 1.47, 0.72, 0.86, 2.75, 1.81, 1.52, 1.89, 0.74, 1.44, 3.28]}
annotations_filtered/n1pSObsJ_hk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 10.71], [18.0, 18.35], [24.0, 28.58], [29.0, 29.98], [31.0, 32.51], [35.0, 35.6], [36.0, 36.61], [37.0, 58.73], [63.0, 65.97], [67.0, 68.05], [76.0, 78.98], [82.0, 99.42], [113.0, 114.99], [115.0, 115.03], [119.0, 120.31], [120.0, 120.43], [120.0, 120.48], [121.0, 121.95], [126.0, 131.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 41.34, 74.6, 0.0, 36.57, 50.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 66.15], ["radio", 3.24], ["explosion", 2.35]], null, null, [["speech", 60.15], ["fireworks", 4.27], ["noise", 2.92]], null, null, null, null, null, null, null, null], "duration": [2.71, 0.35, 4.58, 0.98, 1.51, 0.6, 0.61, 21.73, 2.97, 1.05, 2.98, 17.42, 1.99, 0.03, 1.31, 0.43, 0.48, 0.95, 5.77]}
annotations_filtered/n2A194yTWoQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 5.02], [7.0, 7.42], [10.0, 11.5], [12.0, 12.97], [15.0, 15.65], [28.0, 27.94], [29.0, 29.66], [37.0, 37.57], [43.0, 43.26], [48.0, 48.25], [51.0, 52.15], [55.0, 56.61], [60.0, 60.56], [62.0, 62.68], [67.0, 68.74], [72.0, 73.03], [77.0, 79.84], [81.0, 81.18], [84.0, 84.13], [87.0, 87.39], [91.0, 98.78], [99.0, 100.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.31, 0.0, 0.0, 0.0, 44.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 91.7], ["speech", 1.99], ["mains hum", 1.15]], null, null, null, [["hum", 26.15], ["sidetone", 15.45], ["mains hum", 14.17]], null], "duration": [1.02, 0.42, 1.5, 0.97, 0.65, -0.06, 0.66, 0.57, 0.26, 0.25, 1.15, 1.61, 0.56, 0.68, 1.74, 1.03, 2.84, 0.18, 0.13, 0.39, 7.78, 1.8]}
annotations_filtered/n2YCseaZK0Q_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 5.12], [7.0, 8.04], [15.0, 16.02], [19.0, 20.48], [24.0, 27.72], [29.0, 34.13], [35.0, 36.37], [38.0, 38.67], [40.0, 41.84], [43.0, 52.78], [57.0, 61.59], [63.0, 64.13], [70.0, 72.27], [75.0, 75.69], [76.0, 92.6], [94.0, 97.02], [103.0, 109.02], [109.0, 121.85], [122.0, 124.92], [126.0, 127.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 58.98, 51.99, 0.0, 0.0, 0.0, 53.91, 57.97, 0.0, 53.65, 0.0, 48.74, 49.18, 48.87, 40.16, 44.63, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 24.62], ["hum", 20.8], ["throbbing", 13.72]], [["throbbing", 36.44], ["hum", 21.45], ["music", 17.25]], [["throbbing", 45.32], ["hum", 25.45], ["mains hum", 5.77]], [["hum", 45.11], ["throbbing", 17.55], ["mains hum", 14.93]], [["throbbing", 28.32], ["hum", 28.0], ["music", 22.52]], null], "duration": [1.12, 1.04, 1.02, 1.48, 3.72, 5.13, 1.37, 0.67, 1.84, 9.78, 4.59, 1.13, 2.27, 0.69, 16.6, 3.02, 6.02, 12.85, 2.92, 1.63]}
annotations_filtered/n2ZkOcq4vWU_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 4.55], [5.0, 5.48], [7.0, 8.02], [8.0, 9.44], [10.0, 12.66], [13.0, 14.15], [16.0, 18.05], [19.0, 20.75], [23.0, 24.54], [26.0, 26.6]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.31, 0.0, 46.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 40.18], ["hum", 33.12], ["speech", 7.17]], null, [["speech", 22.18], ["hum", 12.21], ["mains hum", 11.44]], null, null, null], "duration": [0.55, 0.48, 1.02, 1.44, 2.66, 1.15, 2.05, 1.75, 1.54, 0.6]}
annotations_filtered/n2lTpPptOWA_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[10.0, 18.99], [19.0, 19.23], [19.0, 28.8], [55.0, 55.36], [60.0, 62.21], [64.0, 69.74], [72.0, 77.16], [91.0, 92.3], [108.0, 107.96]], "keep_status": [false, false, true, false, false, true, false, false, false], "silence_prob": [44.52, 0.0, 37.57, 0.0, 99.93, 31.81, 32.05, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 39.75], ["snicker", 15.74], ["laughter", 14.79]], null, [["speech", 44.9], ["honk", 7.7], ["goose", 6.52]], null, null, [["screaming", 37.69], ["moo", 15.92], ["cattle, bovinae", 15.6]], [["speech", 66.57], ["fart", 20.57], ["noise", 3.33]], null, null], "duration": [8.99, 0.23, 9.8, 0.36, 2.21, 5.74, 5.16, 1.3, -0.04]}
annotations_filtered/n3BgbwW6PXc_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 10.34], [10.0, 11.92], [14.0, 14.4], [15.0, 16.85], [17.0, 20.75], [26.0, 26.84], [28.0, 34.13], [46.0, 46.38], [47.0, 47.93], [49.0, 50.18], [52.0, 51.7], [53.0, 57.21], [61.0, 61.67], [62.0, 63.69], [65.0, 66.43], [69.0, 69.03], [81.0, 81.72]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.4, 0.0, 0.0, 0.0, 59.86, 0.0, 62.27, 0.0, 0.0, 0.0, 0.0, 63.53, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 34.47], ["speech", 23.2], ["sidetone", 8.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.34, 1.92, 0.4, 1.85, 3.75, 0.84, 6.13, 0.38, 0.93, 1.18, -0.3, 4.21, 0.67, 1.69, 1.43, 0.03, 0.72]}
annotations_filtered/n3K6Fkd5ri8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[10.0, 9.9], [18.0, 18.23], [19.0, 19.36], [20.0, 20.19], [23.0, 23.72], [26.0, 26.25], [30.0, 30.0], [32.0, 32.58], [33.0, 33.64], [35.0, 35.02], [37.0, 37.03], [39.0, 40.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.1, 0.23, 0.36, 0.19, 0.72, 0.25, 0.0, 0.58, 0.64, 0.02, 0.03, 1.36]}
annotations_filtered/n3L8UVTe6Ak_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 4.29], [7.0, 8.5], [12.0, 13.09], [17.0, 17.86], [22.0, 22.98], [26.0, 26.16], [34.0, 36.02], [39.0, 39.88], [40.0, 40.41], [43.0, 45.22], [47.0, 49.65], [51.0, 52.41], [54.0, 54.95], [57.0, 59.17], [69.0, 69.25], [71.0, 71.47], [73.0, 73.99], [77.0, 77.62], [79.0, 80.22], [82.0, 83.07], [85.0, 88.74], [91.0, 147.46], [148.0, 149.37], [153.0, 154.31], [166.0, 167.04], [170.0, 170.65], [175.0, 179.25], [181.0, 196.23], [197.0, 198.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.86, 0.0, 0.0, 64.75, 86.09, 0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.39, 0.0, 0.0, 0.0, 0.0, 0.0, 49.87, 31.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.15], ["music", 14.2], ["croak", 7.45]], null, null, null, null, null, [["music", 31.26], ["hum", 10.83], ["speech", 7.24]], [["music", 46.67], ["speech", 16.5], ["hum", 8.78]], null], "duration": [0.29, 1.5, 1.09, 0.86, 0.98, 0.16, 2.02, 0.88, 0.41, 2.22, 2.65, 1.41, 0.95, 2.17, 0.25, 0.47, 0.99, 0.62, 1.22, 1.07, 3.74, 56.46, 1.37, 1.31, 1.04, 0.65, 4.25, 15.23, 1.78]}
annotations_filtered/n3PGfjyctSQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 8.01], [9.0, 9.63], [12.0, 13.05], [14.0, 15.7], [17.0, 17.34], [20.0, 22.49], [30.0, 31.24], [38.0, 39.36], [39.0, 39.46], [44.0, 44.69], [46.0, 46.65], [48.0, 48.59], [50.0, 50.85], [53.0, 53.22], [57.0, 57.35], [60.0, 60.78], [75.0, 75.9], [77.0, 79.49], [82.0, 83.73], [85.0, 88.48], [90.0, 90.69], [93.0, 94.19], [95.0, 98.56], [102.0, 104.04], [106.0, 106.79], [108.0, 107.94], [112.0, 114.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.26, 0.0, 81.71, 0.0, 0.0, 31.15, 30.82, 0.0, 0.0, 34.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 31.26], ["music", 25.38], ["chirp tone", 9.17]], null, null, null, null, [["music", 44.97], ["speech", 15.59], ["trombone", 8.78]], [["music", 19.32], ["boat, water vehicle", 9.54], ["vehicle", 6.13]], null, null, [["beatboxing", 37.81], ["boing", 26.27], ["fart", 15.53]]], "duration": [0.01, 0.63, 1.05, 1.7, 0.34, 2.49, 1.24, 1.36, 0.46, 0.69, 0.65, 0.59, 0.85, 0.22, 0.35, 0.78, 0.9, 2.49, 1.73, 3.48, 0.69, 1.19, 3.56, 2.04, 0.79, -0.06, 2.86]}
annotations_filtered/n3SrAOdy-tE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 6.72], [8.0, 9.66], [10.0, 12.01], [13.0, 15.04], [19.0, 19.2], [22.0, 23.33], [26.0, 27.43], [28.0, 29.47], [30.0, 33.13], [34.0, 37.72], [39.0, 40.32], [41.0, 48.2]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 43.98, 88.1, 0.0, 0.0, 0.0, 0.0, 51.88, 51.88, 0.0, 48.39], "audiomae_on_audioset": [null, null, [["speech", 48.87], ["sidetone", 8.73], ["chirp tone", 6.58]], null, null, null, null, null, null, null, null, [["speech", 23.47], ["cough", 15.93], ["music", 12.16]]], "duration": [1.72, 1.66, 2.01, 2.04, 0.2, 1.33, 1.43, 1.47, 3.13, 3.72, 1.32, 7.2]}
annotations_filtered/n3Y6B_UKam0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[10.0, 11.21], [16.0, 16.56], [21.0, 22.42], [25.0, 26.91], [28.0, 29.02], [36.0, 44.31], [49.0, 49.01], [50.0, 50.67], [55.0, 60.32], [63.0, 63.31], [64.0, 64.47], [73.0, 73.13], [75.0, 75.81], [79.0, 83.69], [84.0, 86.81], [88.0, 87.67], [89.0, 89.28], [95.0, 99.18], [99.0, 100.14], [104.0, 104.3], [106.0, 106.57], [109.0, 108.85], [112.0, 127.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 0.0, 61.87, 58.72, 0.0, 0.0, 68.8, 0.0, 0.0, 0.0, 0.0, 31.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.17], ["music", 6.99], ["buzz", 5.0]]], "duration": [1.21, 0.56, 1.42, 1.91, 1.02, 8.31, 0.01, 0.67, 5.32, 0.31, 0.47, 0.13, 0.81, 4.69, 2.81, -0.33, 0.28, 4.18, 1.14, 0.3, 0.57, -0.15, 15.03]}
annotations_filtered/n3tXVrGw3kY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 3.59], [9.0, 9.95], [12.0, 12.56], [21.0, 21.73], [25.0, 25.56], [30.0, 33.2], [39.0, 40.19], [50.0, 51.95], [54.0, 55.56], [62.0, 63.0], [83.0, 84.89], [87.0, 88.11], [91.0, 92.53], [97.0, 96.92], [101.0, 101.78], [118.0, 118.79], [127.0, 128.61]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.41, 0.0, 0.0, 0.0, 0.0, 33.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 36.88], ["fart", 13.92], ["whip", 12.62]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.59, 0.95, 0.56, 0.73, 0.56, 3.2, 1.19, 1.95, 1.56, 1.0, 1.89, 1.11, 1.53, -0.08, 0.78, 0.79, 1.61]}
annotations_filtered/n44APWaJZ58_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 5.61], [8.0, 7.87], [13.0, 14.66], [20.0, 21.15], [27.0, 28.17], [30.0, 30.4], [34.0, 36.51], [38.0, 38.03], [41.0, 41.17], [47.0, 48.63], [49.0, 49.65], [50.0, 53.06], [58.0, 92.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, -0.13, 1.66, 1.15, 1.17, 0.4, 2.51, 0.03, 0.17, 1.63, 0.65, 3.06, 34.75]}
annotations_filtered/n4BJBz8GpzI_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[18.0, 80.96], [81.0, 115.7], [116.0, 117.07], [117.0, 123.92]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.9], "audiomae_on_audioset": [null, null, null, [["music", 46.79], ["speech", 24.71], ["hum", 6.25]]], "duration": [62.96, 34.7, 1.07, 6.92]}
annotations_filtered/n4Mohc3SrHs_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 12.55], [16.0, 15.84], [16.0, 16.66], [20.0, 20.63], [22.0, 21.74], [25.0, 26.4], [27.0, 28.46], [42.0, 42.63], [44.0, 44.69]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.55, -0.16, 0.66, 0.63, -0.26, 1.4, 1.46, 0.63, 0.69]}
annotations_filtered/n4bsNkDyF2s_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[10.0, 10.2], [13.0, 20.39], [23.0, 41.74], [45.0, 60.98]], "keep_status": [false, true, false, true], "silence_prob": [0.0, 43.13, 28.4, 28.3], "audiomae_on_audioset": [null, [["hum", 28.06], ["music", 24.89], ["mains hum", 9.15]], [["music", 76.33], ["speech", 3.77], ["throbbing", 1.9]], [["music", 28.71], ["speech", 13.55], ["explosion", 7.93]]], "duration": [0.2, 7.39, 18.74, 15.98]}
annotations_filtered/n4pUbyGBD18_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 0.99], [2.0, 2.78], [5.0, 6.61], [8.0, 7.96], [10.0, 10.4], [12.0, 12.88], [19.0, 19.45], [28.0, 31.48], [33.0, 33.05], [34.0, 34.82], [42.0, 42.53], [43.0, 43.85], [46.0, 48.81], [51.0, 51.54], [53.0, 53.64], [55.0, 55.36], [56.0, 56.47], [57.0, 58.16], [59.0, 61.47], [64.0, 64.39], [65.0, 74.21], [77.0, 87.39], [88.0, 88.43], [89.0, 136.19], [139.0, 140.37], [142.0, 143.07]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.86, 0.0, 0.0, 0.0, 0.0, 42.79, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0, 30.85, 48.91, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["sidetone", 25.07], ["hum", 11.98], ["mains hum", 9.89]], null, null, null, null, [["fly, housefly", 46.56], ["bee, wasp, etc.", 17.51], ["insect", 13.29]], null, null, null, null, null, [["fly, housefly", 41.02], ["insect", 16.67], ["bee, wasp, etc.", 9.37]], null, [["music", 17.09], ["hum", 15.72], ["mains hum", 6.0]], [["music", 45.62], ["wind instrument, woodwind instrument", 6.03], ["hum", 5.13]], null, null, null, null], "duration": [-0.01, 0.78, 1.61, -0.04, 0.4, 0.88, 0.45, 3.48, 0.05, 0.82, 0.53, 0.85, 2.81, 0.54, 0.64, 0.36, 0.47, 1.16, 2.47, 0.39, 9.21, 10.39, 0.43, 47.19, 1.37, 1.07]}
annotations_filtered/n59mG9_X35Q_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.65], [7.0, 8.18], [14.0, 18.4], [20.0, 20.24], [21.0, 21.49], [28.0, 29.49], [35.0, 39.68], [41.0, 48.25], [52.0, 58.35], [58.0, 58.53], [59.0, 60.44], [62.0, 63.64], [73.0, 73.47], [74.0, 80.5], [86.0, 87.27], [89.0, 90.41], [95.0, 99.84]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.7, 0.0, 0.0, 0.0, 29.06, 30.0, 32.37, 0.0, 0.0, 0.0, 0.0, 36.39, 0.0, 0.0, 32.34], "audiomae_on_audioset": [null, null, [["music", 28.91], ["grunt", 18.4], ["speech", 13.9]], null, null, null, [["music", 39.54], ["throbbing", 19.77], ["hum", 14.23]], [["speech", 43.08], ["music", 34.74], ["throbbing", 2.89]], [["music", 53.7], ["theremin", 13.93], ["soundtrack music", 4.33]], null, null, null, null, [["music", 76.5], ["didgeridoo", 8.69], ["musical instrument", 3.55]], null, null, [["music", 48.87], ["grunt", 22.24], ["animal", 13.24]]], "duration": [0.65, 1.18, 4.4, 0.24, 0.49, 1.49, 4.68, 7.25, 6.35, 0.53, 1.44, 1.64, 0.47, 6.5, 1.27, 1.41, 4.84]}
annotations_filtered/n5ArS3Got4U_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 13.32], [14.0, 33.2], [34.0, 41.08], [55.0, 55.0], [56.0, 56.96], [59.0, 60.07], [65.0, 65.64], [67.0, 67.71], [69.0, 69.6], [82.0, 87.81], [88.0, 88.32], [89.0, 117.54], [118.0, 119.69], [120.0, 122.52], [124.0, 127.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 96.54, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 44.63, 0.0, 97.73, 95.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 81.75], ["didgeridoo", 2.53], ["cello", 1.57]], null, null, null], "duration": [8.32, 19.2, 7.08, 0.0, 0.96, 1.07, 0.64, 0.71, 0.6, 5.81, 0.32, 28.54, 1.69, 2.52, 3.55]}
annotations_filtered/n5HtgUGCM30_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 7.82], [11.0, 72.49], [75.0, 121.02]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.82, 61.49, 46.02]}
annotations_filtered/n5PnSNCFBYs_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 8.34], [10.0, 16.68], [21.0, 24.02], [26.0, 28.02], [29.0, 30.21], [38.0, 39.28], [56.0, 60.52], [68.0, 69.43]], "keep_status": [false, false, true, false, false, false, true, false], "silence_prob": [0.0, 38.37, 43.38, 81.35, 0.0, 0.0, 44.81, 0.0], "audiomae_on_audioset": [null, [["music", 46.62], ["speech", 19.26], ["throbbing", 8.49]], [["music", 24.81], ["hum", 12.89], ["synthesizer", 5.48]], null, null, null, [["speech", 40.22], ["radio", 17.38], ["frog", 4.3]], null], "duration": [0.34, 6.68, 3.02, 2.02, 1.21, 1.28, 4.52, 1.43]}
annotations_filtered/n5tMCxz-9uY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[17.0, 18.76], [26.0, 30.79], [44.0, 44.12], [50.0, 50.75], [53.0, 53.15], [55.0, 56.78], [58.0, 61.82], [68.0, 68.49], [78.0, 79.14], [93.0, 92.99], [102.0, 102.05], [104.0, 104.57], [111.0, 111.84], [121.0, 122.5], [125.0, 136.78], [140.0, 151.58], [157.0, 157.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 31.2, 0.0, 0.0, 0.0, 0.0, 30.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.32, 30.57, 0.0], "audiomae_on_audioset": [null, [["music", 78.77], ["quack", 2.23], ["boing", 1.9]], null, null, null, null, [["music", 95.33], ["musical instrument", 0.6], ["guitar", 0.44]], null, null, null, null, null, null, null, [["music", 49.87], ["boing", 15.09], ["speech", 4.89]], [["music", 83.62], ["reggae", 1.58], ["drum and bass", 1.27]], null], "duration": [1.76, 4.79, 0.12, 0.75, 0.15, 1.78, 3.82, 0.49, 1.14, -0.01, 0.05, 0.57, 0.84, 1.5, 11.78, 11.58, 0.76]}
annotations_filtered/n6H7zga2Ks0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 11.03], [12.0, 13.26], [16.0, 17.27], [21.0, 23.21], [24.0, 26.05], [28.0, 29.03], [31.0, 33.94], [34.0, 36.0], [38.0, 40.02], [46.0, 45.99], [48.0, 50.6], [55.0, 56.02], [57.0, 58.41], [59.0, 60.03], [62.0, 63.85], [65.0, 66.02], [67.0, 67.49], [69.0, 69.13], [76.0, 78.07], [84.0, 84.47], [85.0, 87.99], [90.0, 95.99], [96.0, 99.42], [102.0, 103.72], [104.0, 105.43], [107.0, 106.98], [108.0, 109.98], [111.0, 112.75], [114.0, 114.67], [115.0, 116.77], [119.0, 119.52], [123.0, 123.82], [124.0, 126.79], [128.0, 128.55], [130.0, 132.27], [133.0, 136.22], [137.0, 138.3], [139.0, 142.82], [143.0, 144.59], [146.0, 148.19]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 99.48, 86.82, 0.0, 100.0, 48.91, 83.7, 0.0, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 78.38, 99.95, 99.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 54.23], ["sidetone", 10.47], ["hum", 5.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.03, 1.26, 1.27, 2.21, 2.05, 1.03, 2.94, 2.0, 2.02, -0.01, 2.6, 1.02, 1.41, 1.03, 1.85, 1.02, 0.49, 0.13, 2.07, 0.47, 2.99, 5.99, 3.42, 1.72, 1.43, -0.02, 1.98, 1.75, 0.67, 1.77, 0.52, 0.82, 2.79, 0.55, 2.27, 3.22, 1.3, 3.82, 1.59, 2.19]}
annotations_filtered/n75PgMSxAOw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[11.0, 32.48], [34.0, 97.07], [100.0, 118.02], [121.0, 125.79]], "keep_status": [true, false, true, true], "silence_prob": [30.64, 0.0, 29.65, 32.05], "audiomae_on_audioset": [[["speech", 47.71], ["vehicle", 5.51], ["music", 5.09]], null, [["whack, thwack", 36.42], ["music", 16.08], ["thump, thud", 14.98]], [["vehicle", 9.01], ["fly, housefly", 8.22], ["throbbing", 6.91]]], "duration": [21.48, 63.07, 18.02, 4.79]}
annotations_filtered/n7KKfjFRw8w_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 8.77], [20.0, 24.65], [29.0, 32.86], [34.0, 35.04], [40.0, 81.82], [86.0, 86.04], [87.0, 87.12], [90.0, 89.7], [91.0, 91.08], [94.0, 93.6], [95.0, 110.34], [111.0, 111.27], [112.0, 114.52], [115.0, 118.22]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 33.96, 36.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.34, 0.0, 39.33, 51.99], "audiomae_on_audioset": [null, [["speech", 39.09], ["music", 22.37], ["synthesizer", 4.47]], [["music", 20.48], ["speech", 17.55], ["pulse", 7.72]], null, null, null, null, null, null, null, [["speech", 42.04], ["music", 24.03], ["sidetone", 11.79]], null, [["music", 53.32], ["musical instrument", 7.63], ["synthesizer", 7.21]], null], "duration": [0.77, 4.65, 3.86, 1.04, 41.82, 0.04, 0.12, -0.3, 0.08, -0.4, 15.34, 0.27, 2.52, 3.22]}
annotations_filtered/n7W0yxKnuvs_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[0.0, 0.68], [3.0, 4.72], [6.0, 9.71], [12.0, 13.71], [20.0, 20.28], [22.0, 23.19], [25.0, 27.03], [30.0, 31.21], [32.0, 33.44], [37.0, 37.39], [41.0, 45.71], [47.0, 47.82], [49.0, 49.74], [52.0, 52.86], [54.0, 54.85], [57.0, 62.77], [64.0, 66.19], [67.0, 67.61], [69.0, 70.26], [71.0, 71.49], [73.0, 73.35], [74.0, 78.27], [84.0, 85.5], [86.0, 87.42], [90.0, 90.32], [91.0, 92.35], [95.0, 96.42], [98.0, 98.76], [103.0, 102.93], [108.0, 108.45], [114.0, 114.76], [117.0, 117.71], [119.0, 121.96], [123.0, 123.53], [127.0, 129.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.76, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 89.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 1.72, 3.71, 1.71, 0.28, 1.19, 2.03, 1.21, 1.44, 0.39, 4.71, 0.82, 0.74, 0.86, 0.85, 5.77, 2.19, 0.61, 1.26, 0.49, 0.35, 4.27, 1.5, 1.42, 0.32, 1.35, 1.42, 0.76, -0.07, 0.45, 0.76, 0.71, 2.96, 0.53, 2.76]}
annotations_filtered/n7cRx_7umjE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 4.35], [5.0, 6.59], [11.0, 18.03], [20.0, 33.99], [35.0, 43.95], [52.0, 80.2], [81.0, 96.2]], "keep_status": [true, false, true, false, true, true, true], "silence_prob": [39.75, 0.0, 38.32, 35.15, 32.44, 31.2, 30.22], "audiomae_on_audioset": [[["vehicle", 15.68], ["music", 11.36], ["car", 4.49]], null, [["music", 28.88], ["speech", 24.04], ["throbbing", 11.25]], [["music", 42.59], ["speech", 21.05], ["throbbing", 10.78]], [["hum", 31.52], ["mains hum", 15.9], ["music", 9.08]], [["music", 34.24], ["speech", 9.09], ["hum", 9.0]], [["speech", 37.72], ["music", 26.4], ["fart", 4.95]]], "duration": [2.35, 1.59, 7.03, 13.99, 8.95, 28.2, 15.2]}
annotations_filtered/n7l2RLvI7Ss_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 2.05], [9.0, 9.14], [12.0, 12.7], [18.0, 22.33], [26.0, 26.74], [29.0, 28.78], [30.0, 30.74], [33.0, 33.1], [34.0, 34.97], [35.0, 35.56], [40.0, 40.1], [41.0, 41.07], [49.0, 49.33], [50.0, 50.89], [53.0, 54.21], [56.0, 56.88], [61.0, 61.77], [63.0, 65.94], [66.0, 67.26], [68.0, 68.17], [69.0, 69.18], [69.0, 70.02], [71.0, 71.27], [73.0, 73.8], [76.0, 77.6], [78.0, 78.92], [80.0, 80.0], [81.0, 81.6], [83.0, 82.88], [84.0, 83.91], [84.0, 85.41], [88.0, 88.64], [94.0, 94.09], [96.0, 96.97], [98.0, 98.0], [98.0, 100.14], [102.0, 104.13], [106.0, 107.13], [109.0, 109.41], [110.0, 111.94], [114.0, 114.07], [115.0, 115.45], [116.0, 115.96], [116.0, 117.21], [125.0, 125.02], [130.0, 130.22], [131.0, 130.98], [132.0, 132.22], [134.0, 133.64], [136.0, 136.78], [139.0, 140.17], [141.0, 141.61], [143.0, 143.83], [144.0, 144.88], [146.0, 146.5], [147.0, 147.68], [148.0, 148.46], [151.0, 151.5], [152.0, 152.19], [153.0, 153.39], [156.0, 156.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 97.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.05, 0.14, 0.7, 4.33, 0.74, -0.22, 0.74, 0.1, 0.97, 0.56, 0.1, 0.07, 0.33, 0.89, 1.21, 0.88, 0.77, 2.94, 1.26, 0.17, 0.18, 1.02, 0.27, 0.8, 1.6, 0.92, 0.0, 0.6, -0.12, -0.09, 1.41, 0.64, 0.09, 0.97, 0.0, 2.14, 2.13, 1.13, 0.41, 1.94, 0.07, 0.45, -0.04, 1.21, 0.02, 0.22, -0.02, 0.22, -0.36, 0.78, 1.17, 0.61, 0.83, 0.88, 0.5, 0.68, 0.46, 0.5, 0.19, 0.39, 0.79]}
annotations_filtered/n86CV7VKvfE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.81], [12.0, 13.56], [22.0, 22.23], [32.0, 32.56], [33.0, 33.3], [39.0, 40.0], [41.0, 40.74], [42.0, 42.75], [45.0, 45.45], [51.0, 51.22], [59.0, 59.68], [62.0, 62.11], [64.0, 64.39], [66.0, 66.68], [67.0, 67.56], [68.0, 68.86], [76.0, 76.98], [78.0, 79.71], [84.0, 84.97], [88.0, 88.11], [91.0, 92.03], [96.0, 96.57], [99.0, 99.72], [102.0, 102.44], [104.0, 103.64], [106.0, 106.37], [108.0, 108.77], [111.0, 111.94], [113.0, 113.26], [119.0, 119.89], [124.0, 124.21], [125.0, 126.25], [129.0, 129.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 1.56, 0.23, 0.56, 0.3, 1.0, -0.26, 0.75, 0.45, 0.22, 0.68, 0.11, 0.39, 0.68, 0.56, 0.86, 0.98, 1.71, 0.97, 0.11, 1.03, 0.57, 0.72, 0.44, -0.36, 0.37, 0.77, 0.94, 0.26, 0.89, 0.21, 1.25, 0.3]}
annotations_filtered/n8mK-A_0viA_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 13.12], [15.0, 19.08], [20.0, 21.37], [27.0, 30.11], [31.0, 33.45], [35.0, 102.39], [105.0, 106.0], [108.0, 109.09], [110.0, 110.51], [112.0, 119.6], [120.0, 130.54], [131.0, 131.28]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 62.27, 0.0, 49.22, 35.74, 0.0, 0.0, 0.0, 0.0, 31.7, 34.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 54.38], ["whale vocalization", 12.25], ["sine wave", 4.97]], [["music", 34.47], ["synthesizer", 9.94], ["didgeridoo", 6.63]], null, null, null, null, [["animal", 21.27], ["groan", 16.72], ["roar", 8.2]], [["speech", 48.26], ["sidetone", 30.47], ["music", 6.32]], null], "duration": [1.12, 4.08, 1.37, 3.11, 2.45, 67.39, 1.0, 1.09, 0.51, 7.6, 10.54, 0.28]}
annotations_filtered/n8yUoQP6Rwo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.89], [5.0, 5.61], [9.0, 16.66], [22.0, 30.91], [36.0, 41.44], [42.0, 42.62], [44.0, 52.37], [54.0, 56.2], [61.0, 62.14], [64.0, 82.86]], "keep_status": [false, false, false, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 49.59, 30.13, 28.67, 0.0, 29.12, 29.44, 0.0, 29.3], "audiomae_on_audioset": [null, null, [["whale vocalization", 64.52], ["music", 11.4], ["speech", 8.86]], [["whale vocalization", 25.82], ["animal", 11.63], ["buzz", 8.67]], [["animal", 13.18], ["speech", 11.35], ["livestock, farm animals, working animals", 8.82]], null, [["speech", 21.7], ["music", 14.65], ["roar", 8.73]], [["speech", 24.02], ["fly, housefly", 23.68], ["insect", 11.74]], null, [["music", 50.82], ["speech", 12.57], ["groan", 11.49]]], "duration": [0.89, 0.61, 7.66, 8.91, 5.44, 0.62, 8.37, 2.2, 1.14, 18.86]}
annotations_filtered/n9-Wk6ulBuA_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 12.58], [14.0, 14.08], [15.0, 18.64], [23.0, 28.0], [33.0, 33.89], [34.0, 41.5], [42.0, 47.26], [51.0, 51.34], [52.0, 54.01], [57.0, 65.91], [67.0, 68.76]], "keep_status": [false, false, true, false, false, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 32.28, 34.42, 0.0, 31.89, 32.56, 0.0, 33.0, 32.54, 0.0], "audiomae_on_audioset": [null, null, [["music", 31.24], ["speech", 16.7], ["knock", 10.39]], [["hum", 40.18], ["mains hum", 25.3], ["throbbing", 11.8]], null, [["sidetone", 24.85], ["throbbing", 24.43], ["speech", 14.35]], [["speech", 52.28], ["hum", 6.8], ["music", 6.3]], null, [["speech", 57.78], ["music", 4.16], ["speech synthesizer", 3.57]], [["whack, thwack", 40.9], ["throbbing", 8.13], ["music", 7.33]], null], "duration": [0.58, 0.08, 3.64, 5.0, 0.89, 7.5, 5.26, 0.34, 2.01, 8.91, 1.76]}
annotations_filtered/n92XBsqbSF4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[14.0, 18.55], [20.0, 178.68]], "keep_status": [false, false], "silence_prob": [43.82, 0.0], "audiomae_on_audioset": [[["speech", 32.41], ["music", 31.03], ["hum", 6.98]], null], "duration": [4.55, 158.68]}
annotations_filtered/n94um7eDILg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 6.47], [13.0, 13.46], [15.0, 14.99], [16.0, 19.23], [21.0, 21.25], [22.0, 22.69], [25.0, 25.24], [26.0, 26.5], [39.0, 39.51], [42.0, 47.55], [59.0, 59.0], [61.0, 62.01], [63.0, 63.26], [69.0, 69.58], [71.0, 71.42], [72.0, 72.76], [79.0, 81.23], [84.0, 85.19], [86.0, 87.44], [88.0, 88.96], [90.0, 111.91], [114.0, 114.62]], "keep_status": [true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [32.77, 0.0, 0.0, 32.45, 0.0, 0.0, 0.0, 0.0, 0.0, 36.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.79, 0.0, 0.0, 0.0, 32.73, 0.0], "audiomae_on_audioset": [[["thump, thud", 17.92], ["rumble", 8.86], ["speech", 7.21]], null, null, [["fly, housefly", 28.36], ["insect", 13.81], ["wail, moan", 7.59]], null, null, null, null, null, [["speech", 29.41], ["groan", 18.11], ["grunt", 4.91]], null, null, null, null, null, null, [["music", 9.36], ["cattle, bovinae", 8.58], ["animal", 7.68]], null, null, null, [["music", 17.52], ["fly, housefly", 13.64], ["groan", 8.42]], null], "duration": [2.47, 0.46, -0.01, 3.23, 0.25, 0.69, 0.24, 0.5, 0.51, 5.55, 0.0, 1.01, 0.26, 0.58, 0.42, 0.76, 2.23, 1.19, 1.44, 0.96, 21.91, 0.62]}
annotations_filtered/n9L9jMlulXI_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[16.0, 16.92], [22.0, 21.83], [24.0, 24.07], [25.0, 26.38], [27.0, 27.35], [28.0, 28.11], [28.0, 31.92], [32.0, 32.76], [37.0, 38.96], [41.0, 43.93], [46.0, 46.25], [46.0, 46.92], [50.0, 55.98], [58.0, 71.91], [79.0, 80.43], [88.0, 87.91], [89.0, 90.31], [100.0, 99.94], [104.0, 104.7]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.71, 0.0, 0.0, 38.75, 0.0, 0.0, 34.04, 31.04, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["animal", 9.18], ["electric shaver, electric razor", 9.0], ["hum", 8.06]], null, null, [["hum", 43.79], ["throbbing", 24.77], ["mains hum", 9.15]], null, null, [["animal", 11.92], ["speech", 7.3], ["fart", 5.5]], [["speech", 22.51], ["hum", 20.66], ["mains hum", 13.6]], null, null, null, null, null], "duration": [0.92, -0.17, 0.07, 1.38, 0.35, 0.11, 3.92, 0.76, 1.96, 2.93, 0.25, 0.92, 5.98, 13.91, 1.43, -0.09, 1.31, -0.06, 0.7]}