bpiyush commited on
Commit
b6c3fcf
·
1 Parent(s): 72d6257

WIP: Adding annotation files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. annotations_filtered/a-9990dlfvo_filtered.json +1 -0
  2. annotations_filtered/a-CS6CjnEw8_filtered.json +1 -0
  3. annotations_filtered/a-IU2mBY1_4_filtered.json +1 -0
  4. annotations_filtered/a-KQ5h6WmJg_filtered.json +1 -0
  5. annotations_filtered/a-SnsqKFHLY_filtered.json +1 -0
  6. annotations_filtered/a-VqYtkvmzw_filtered.json +1 -0
  7. annotations_filtered/a-Z66uN97Ds_filtered.json +1 -0
  8. annotations_filtered/a-h2glY0jyg_filtered.json +1 -0
  9. annotations_filtered/a1Bx9nyw35w_filtered.json +1 -0
  10. annotations_filtered/a1GeB9y9zzo_filtered.json +1 -0
  11. annotations_filtered/a1REfTIc5po_filtered.json +1 -0
  12. annotations_filtered/a1iQDKCkh6k_filtered.json +1 -0
  13. annotations_filtered/a2872XpfqKY_filtered.json +1 -0
  14. annotations_filtered/a2ZdXUZt3iw_filtered.json +1 -0
  15. annotations_filtered/a2_9fQ0U57w_filtered.json +1 -0
  16. annotations_filtered/a2gMY3TRx8s_filtered.json +1 -0
  17. annotations_filtered/a2lb_3-fYFc_filtered.json +1 -0
  18. annotations_filtered/a2qE4hG9XCk_filtered.json +1 -0
  19. annotations_filtered/a38HZFbhB-M_filtered.json +1 -0
  20. annotations_filtered/a3HOCIXroqQ_filtered.json +1 -0
  21. annotations_filtered/a3Xm0KpUYj4_filtered.json +1 -0
  22. annotations_filtered/a3bI7kbVBwM_filtered.json +1 -0
  23. annotations_filtered/a469ezsg86A_filtered.json +1 -0
  24. annotations_filtered/a46FsHMRPkc_filtered.json +1 -0
  25. annotations_filtered/a46m8g3grB8_filtered.json +1 -0
  26. annotations_filtered/a4EqbYUl7Rg_filtered.json +1 -0
  27. annotations_filtered/a4OWkIrQUJw_filtered.json +1 -0
  28. annotations_filtered/a4QlQy31HIk_filtered.json +1 -0
  29. annotations_filtered/a4Td_W5dc1w_filtered.json +1 -0
  30. annotations_filtered/a4wb-xmYM50_filtered.json +1 -0
  31. annotations_filtered/a51EYR5AeNk_filtered.json +1 -0
  32. annotations_filtered/a5BtDmdw708_filtered.json +1 -0
  33. annotations_filtered/a5PoLM_QBuo_filtered.json +1 -0
  34. annotations_filtered/a5QBuJla5do_filtered.json +1 -0
  35. annotations_filtered/a5WAyc-EaNc_filtered.json +1 -0
  36. annotations_filtered/a6--cEjo3bY_filtered.json +1 -0
  37. annotations_filtered/a66f39DMwtY_filtered.json +1 -0
  38. annotations_filtered/a6CsW4dCk_8_filtered.json +1 -0
  39. annotations_filtered/a6XtVMtUZI8_filtered.json +1 -0
  40. annotations_filtered/a6cUudbbHl0_filtered.json +1 -0
  41. annotations_filtered/a6mkbps0BmY_filtered.json +1 -0
  42. annotations_filtered/a6oC5iQB4u8_filtered.json +1 -0
  43. annotations_filtered/a72FDTElH9g_filtered.json +1 -0
  44. annotations_filtered/a7K1xgoi_c4_filtered.json +1 -0
  45. annotations_filtered/a7XZaIy4a9k_filtered.json +1 -0
  46. annotations_filtered/a7gZgEpgKiY_filtered.json +1 -0
  47. annotations_filtered/a7qRJ9T9TPg_filtered.json +1 -0
  48. annotations_filtered/a7vAR-7YBWE_filtered.json +1 -0
  49. annotations_filtered/a81pNygdAXw_filtered.json +1 -0
  50. annotations_filtered/a861J6gxqmg_filtered.json +1 -0
annotations_filtered/a-9990dlfvo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 8.94], [11.0, 10.61], [11.0, 11.87], [13.0, 16.95], [18.0, 22.4], [24.0, 33.08], [35.0, 37.17], [38.0, 89.46], [92.0, 92.28], [96.0, 96.38], [97.0, 97.48], [99.0, 99.6], [101.0, 103.76], [110.0, 110.24], [111.0, 111.2], [116.0, 116.87], [122.0, 122.61], [123.0, 123.58], [125.0, 124.97], [126.0, 126.6], [130.0, 130.76], [131.0, 138.55], [142.0, 142.01], [145.0, 148.96], [149.0, 150.15], [154.0, 154.97], [155.0, 156.32], [157.0, 159.51], [161.0, 165.47], [167.0, 167.04], [167.0, 167.1], [167.0, 173.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false, true], "silence_prob": [62.89, 0.0, 0.0, 58.13, 53.04, 56.18, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0, 31.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.13, 0.0, 32.35, 0.0, 0.0, 0.0, 33.09, 31.81, 0.0, 0.0, 31.14], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.65], ["speech", 4.74], ["meow", 4.68]], null, null, null, null, null, null, null, null, [["music", 36.25], ["livestock, farm animals, working animals", 9.95], ["hum", 6.28]], null, [["speech", 47.96], ["music", 22.24], ["musical instrument", 10.32]], null, null, null, [["music", 33.5], ["wind instrument, woodwind instrument", 8.27], ["musical instrument", 6.59]], [["music", 36.18], ["musical instrument", 16.14], ["shofar", 6.98]], null, null, [["speech", 53.16], ["music", 11.99], ["electric shaver, electric razor", 4.51]]], "duration": [2.94, -0.39, 0.87, 3.95, 4.4, 9.08, 2.17, 51.46, 0.28, 0.38, 0.48, 0.6, 2.76, 0.24, 0.2, 0.87, 0.61, 0.58, -0.03, 0.6, 0.76, 7.55, 0.01, 3.96, 1.15, 0.97, 1.32, 2.51, 4.47, 0.04, 0.1, 6.31]}
annotations_filtered/a-CS6CjnEw8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[9.0, 11.62], [23.0, 23.8], [25.0, 26.2], [27.0, 30.47], [35.0, 36.68], [38.0, 38.57], [40.0, 40.19], [41.0, 42.09], [43.0, 49.52], [51.0, 51.53], [52.0, 52.71], [53.0, 56.1], [58.0, 58.29], [59.0, 76.6], [78.0, 80.28], [82.0, 84.13], [87.0, 89.06], [98.0, 99.23], [101.0, 108.38], [109.0, 115.26], [116.0, 131.16], [132.0, 133.62], [135.0, 137.0], [142.0, 142.65], [143.0, 146.42]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 48.74, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 49.54, 0.0, 72.01, 96.54, 100.0, 94.81, 0.0, 100.0, 96.89, 99.93, 0.0, 97.54, 0.0, 88.28], "audiomae_on_audioset": [null, null, null, [["music", 25.28], ["didgeridoo", 11.68], ["guitar", 7.89]], null, null, null, null, null, null, null, [["sidetone", 50.03], ["busy signal", 18.45], ["speech", 16.24]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.62, 0.8, 1.2, 3.47, 1.68, 0.57, 0.19, 1.09, 6.52, 0.53, 0.71, 3.1, 0.29, 17.6, 2.28, 2.13, 2.06, 1.23, 7.38, 6.26, 15.16, 1.62, 2.0, 0.65, 3.42]}
annotations_filtered/a-IU2mBY1_4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[0.0, 0.94], [12.0, 26.69], [29.0, 47.36], [48.0, 52.79], [53.0, 56.42], [58.0, 67.27], [71.0, 70.87], [72.0, 74.95], [76.0, 79.0], [82.0, 85.99], [88.0, 91.0], [92.0, 95.89], [98.0, 106.78], [107.0, 110.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 76.53, 89.19, 99.99, 95.91, 97.73, 0.0, 99.68, 99.59, 54.7, 57.64, 66.27, 64.52, 44.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 22.05], ["hiccup", 12.11], ["theremin", 7.62]]], "duration": [0.94, 14.69, 18.36, 4.79, 3.42, 9.27, -0.13, 2.95, 3.0, 3.99, 3.0, 3.89, 8.78, 3.71]}
annotations_filtered/a-KQ5h6WmJg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 2.44], [5.0, 5.16], [6.0, 6.56], [8.0, 8.55], [9.0, 12.68], [13.0, 17.04], [18.0, 19.8], [22.0, 22.81], [25.0, 24.98], [27.0, 31.51], [32.0, 32.31], [34.0, 35.53], [36.0, 37.32], [40.0, 40.02], [42.0, 42.9], [49.0, 48.86], [51.0, 57.65], [61.0, 62.18], [65.0, 65.6], [68.0, 71.71], [80.0, 80.64], [81.0, 82.38], [83.0, 83.96], [91.0, 91.64], [93.0, 93.18], [98.0, 98.69], [102.0, 102.39], [104.0, 104.03], [106.0, 106.08], [111.0, 112.87], [115.0, 115.8], [117.0, 116.99], [121.0, 121.59], [124.0, 126.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 86.09, 51.28, 0.0, 0.0, 0.0, 54.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.44, 0.16, 0.56, 0.55, 3.68, 4.04, 1.8, 0.81, -0.02, 4.51, 0.31, 1.53, 1.32, 0.02, 0.9, -0.14, 6.65, 1.18, 0.6, 3.71, 0.64, 1.38, 0.96, 0.64, 0.18, 0.69, 0.39, 0.03, 0.08, 1.87, 0.8, -0.01, 0.59, 2.45]}
annotations_filtered/a-SnsqKFHLY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[13.0, 14.27], [21.0, 30.08], [31.0, 32.76], [33.0, 36.46], [46.0, 49.15], [57.0, 58.58], [60.0, 82.49], [85.0, 85.43], [87.0, 88.25], [89.0, 89.78], [92.0, 94.34], [96.0, 97.58], [102.0, 107.2], [109.0, 109.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 58.05, 0.0, 58.98, 67.51, 0.0, 62.37, 0.0, 0.0, 0.0, 98.19, 0.0, 57.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.27, 9.08, 1.76, 3.46, 3.15, 1.58, 22.49, 0.43, 1.25, 0.78, 2.34, 1.58, 5.2, 0.32]}
annotations_filtered/a-VqYtkvmzw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[31.0, 32.91], [35.0, 36.17], [38.0, 38.11], [39.0, 39.39], [41.0, 41.66], [44.0, 43.95], [45.0, 46.99], [52.0, 52.69], [64.0, 64.35], [66.0, 72.69]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["rumble", 48.11], ["hum", 13.72], ["mains hum", 3.13]]], "duration": [1.91, 1.17, 0.11, 0.39, 0.66, -0.05, 1.99, 0.69, 0.35, 6.69]}
annotations_filtered/a-Z66uN97Ds_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[51.0, 51.0], [58.0, 77.82], [82.0, 83.35], [88.0, 88.43], [90.0, 90.37], [92.0, 96.31], [102.0, 102.86], [104.0, 104.68]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 33.85, 0.0, 0.0, 0.0, 35.73, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 37.6], ["throbbing", 26.77], ["hum", 16.89]], null, null, null, [["fly, housefly", 22.33], ["insect", 18.13], ["music", 15.21]], null, null], "duration": [0.0, 19.82, 1.35, 0.43, 0.37, 4.31, 0.86, 0.68]}
annotations_filtered/a-h2glY0jyg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 3.0], [4.0, 5.49], [8.0, 8.6], [9.0, 10.86], [12.0, 12.8], [14.0, 15.21], [17.0, 18.4], [21.0, 23.08], [23.0, 29.29], [30.0, 32.22], [33.0, 35.28], [36.0, 36.75], [37.0, 38.53], [40.0, 41.55], [44.0, 45.18], [46.0, 46.85], [48.0, 49.23], [50.0, 58.14], [60.0, 60.4], [61.0, 62.13], [63.0, 63.49], [64.0, 64.49], [66.0, 66.75], [68.0, 69.01], [70.0, 71.29], [74.0, 73.89], [75.0, 75.44], [76.0, 76.91], [78.0, 78.98], [80.0, 81.45], [83.0, 84.11], [86.0, 86.05], [87.0, 89.18], [95.0, 95.44], [97.0, 98.22], [101.0, 101.02], [106.0, 109.19], [110.0, 113.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 86.27, 88.28, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 68.28, 98.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 1.49, 0.6, 1.86, 0.8, 1.21, 1.4, 2.08, 6.29, 2.22, 2.28, 0.75, 1.53, 1.55, 1.18, 0.85, 1.23, 8.14, 0.4, 1.13, 0.49, 0.49, 0.75, 1.01, 1.29, -0.11, 0.44, 0.91, 0.98, 1.45, 1.11, 0.05, 2.18, 0.44, 1.22, 0.02, 3.19, 3.27]}
annotations_filtered/a1Bx9nyw35w_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 24.34], [26.0, 32.93], [34.0, 34.55], [43.0, 45.5], [47.0, 46.9], [53.0, 86.19], [90.0, 100.9], [103.0, 103.79], [105.0, 127.36], [129.0, 132.8], [135.0, 185.3], [187.0, 188.03], [188.0, 192.18]], "keep_status": [true, true, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [34.11, 35.62, 0.0, 54.23, 0.0, 0.0, 35.39, 0.0, 30.76, 37.72, 0.0, 0.0, 46.43], "audiomae_on_audioset": [[["music", 23.3], ["noise", 10.22], ["whale vocalization", 8.51]], [["speech", 26.07], ["dog", 6.21], ["bouncing", 5.96]], null, null, null, null, [["music", 38.47], ["speech", 19.93], ["brass instrument", 6.6]], null, [["music", 33.67], ["mains hum", 14.46], ["hum", 13.77]], [["music", 46.82], ["hum", 9.03], ["didgeridoo", 3.25]], null, null, [["music", 72.37], ["musical instrument", 4.85], ["bowed string instrument", 2.66]]], "duration": [21.34, 6.93, 0.55, 2.5, -0.1, 33.19, 10.9, 0.79, 22.36, 3.8, 50.3, 1.03, 4.18]}
annotations_filtered/a1GeB9y9zzo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 111.92]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [106.92]}
annotations_filtered/a1REfTIc5po_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 13.78], [18.0, 18.69], [20.0, 20.75], [22.0, 25.07], [25.0, 26.47], [30.0, 30.48], [33.0, 34.35], [39.0, 40.86], [42.0, 42.99], [44.0, 45.06], [47.0, 64.83], [73.0, 74.87], [83.0, 82.83], [86.0, 86.63], [87.0, 90.21], [90.0, 90.95], [102.0, 102.17], [107.0, 108.08], [109.0, 112.14], [120.0, 120.75], [122.0, 122.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.2, 0.0, 0.0, 0.0, 32.08, 0.0, 0.0, 0.0, 39.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 43.3], ["throbbing", 11.73], ["hum", 10.69]], null, null, null, [["music", 50.04], ["speech", 13.67], ["electronic music", 1.64]], null, null, null, [["music", 52.07], ["didgeridoo", 12.94], ["hum", 5.72]], null, null], "duration": [7.78, 0.69, 0.75, 3.07, 1.47, 0.48, 1.35, 1.86, 0.99, 1.06, 17.83, 1.87, -0.17, 0.63, 3.21, 0.95, 0.17, 1.08, 3.14, 0.75, 0.12]}
annotations_filtered/a1iQDKCkh6k_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[17.0, 20.65], [21.0, 48.98], [49.0, 49.57], [52.0, 51.98], [53.0, 53.6], [54.0, 74.02], [77.0, 142.05], [144.0, 146.23], [150.0, 152.17], [153.0, 157.01]], "keep_status": [false, true, false, false, false, false, false, true, false, false], "silence_prob": [95.51, 30.38, 0.0, 0.0, 0.0, 30.37, 0.0, 35.79, 55.39, 37.73], "audiomae_on_audioset": [null, [["speech", 37.39], ["music", 15.48], ["boing", 5.38]], null, null, null, [["speech", 60.27], ["machine gun", 11.31], ["sidetone", 8.12]], null, [["music", 15.79], ["noise", 14.32], ["hum", 6.65]], null, [["sidetone", 61.57], ["speech", 18.95], ["explosion", 3.82]]], "duration": [3.65, 27.98, 0.57, -0.02, 0.6, 20.02, 65.05, 2.23, 2.17, 4.01]}
annotations_filtered/a2872XpfqKY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[108.0, 108.75]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.75]}
annotations_filtered/a2ZdXUZt3iw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[18.0, 39.45], [40.0, 43.63], [45.0, 47.29], [49.0, 52.35], [53.0, 54.14], [56.0, 56.29], [58.0, 58.26], [59.0, 60.34], [63.0, 64.5], [65.0, 67.56], [68.0, 67.61], [68.0, 96.58], [99.0, 105.02], [107.0, 107.49], [109.0, 111.32], [114.0, 115.69]], "keep_status": [true, true, true, true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [33.27, 45.92, 36.01, 41.42, 0.0, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0, 28.85, 34.88, 0.0, 76.7, 0.0], "audiomae_on_audioset": [[["speech", 47.4], ["explosion", 10.71], ["music", 7.53]], [["music", 27.49], ["didgeridoo", 20.73], ["speech", 14.26]], [["didgeridoo", 18.3], ["speech", 16.09], ["mains hum", 14.86]], [["fart", 28.8], ["speech", 11.53], ["dog", 10.47]], null, null, null, null, null, null, null, [["speech", 57.29], ["music", 17.27], ["hum", 5.81]], [["music", 33.04], ["hum", 23.44], ["mains hum", 9.14]], null, null, null], "duration": [21.45, 3.63, 2.29, 3.35, 1.14, 0.29, 0.26, 1.34, 1.5, 2.56, -0.39, 28.58, 6.02, 0.49, 2.32, 1.69]}
annotations_filtered/a2_9fQ0U57w_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 3.08], [4.0, 10.0], [11.0, 13.39], [14.0, 20.38], [22.0, 29.86], [30.0, 29.93], [30.0, 34.3], [35.0, 34.96], [36.0, 37.96], [38.0, 42.38], [45.0, 48.05], [49.0, 57.43], [59.0, 73.77], [74.0, 73.8], [74.0, 86.61], [87.0, 101.73], [102.0, 112.19], [113.0, 122.45], [124.0, 125.93], [127.0, 133.3], [135.0, 142.94], [143.0, 143.41], [148.0, 154.11], [156.0, 158.46], [165.0, 172.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.1, 99.56, 99.95, 99.93, 0.0, 99.97, 0.0, 0.0, 99.48, 99.99, 99.84, 90.08, 0.0, 99.97, 99.95, 100.0, 100.0, 0.0, 88.64, 59.07, 0.0, 54.56, 34.26, 33.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.12], ["ambient music", 23.31], ["synthesizer", 4.62]], [["music", 83.17], ["ambient music", 7.73], ["scary music", 1.93]]], "duration": [1.08, 6.0, 2.39, 6.38, 7.86, -0.07, 4.3, -0.04, 1.96, 4.38, 3.05, 8.43, 14.77, -0.2, 12.61, 14.73, 10.19, 9.45, 1.93, 6.3, 7.94, 0.41, 6.11, 2.46, 7.84]}
annotations_filtered/a2gMY3TRx8s_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 2.42], [4.0, 6.76], [9.0, 9.9], [11.0, 12.07], [13.0, 14.84], [16.0, 19.18], [22.0, 24.73], [27.0, 27.8], [29.0, 30.28], [32.0, 33.05], [35.0, 36.12], [38.0, 39.66], [41.0, 41.88], [43.0, 45.87], [47.0, 48.76], [51.0, 53.15], [54.0, 57.69], [58.0, 58.72], [60.0, 60.03], [63.0, 64.1], [66.0, 68.42], [69.0, 79.03], [81.0, 82.71], [84.0, 89.18], [91.0, 92.45], [94.0, 97.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 52.86, 0.0, 0.0, 0.0, 85.54, 59.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.63, 0.0, 96.77, 70.16, 0.0, 0.0, 0.0, 94.95, 39.4, 0.0, 79.24, 0.0, 45.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 23.73], ["speech", 18.38], ["dog", 17.71]], null, null, null, [["music", 43.2], ["theremin", 8.45], ["synthesizer", 7.36]]], "duration": [1.42, 2.76, 0.9, 1.07, 1.84, 3.18, 2.73, 0.8, 1.28, 1.05, 1.12, 1.66, 0.88, 2.87, 1.76, 2.15, 3.69, 0.72, 0.03, 1.1, 2.42, 10.03, 1.71, 5.18, 1.45, 3.53]}
annotations_filtered/a2lb_3-fYFc_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 7.13], [9.0, 9.78], [12.0, 13.12], [13.0, 13.51], [18.0, 18.57], [20.0, 20.71], [22.0, 23.06], [25.0, 26.96], [30.0, 30.43], [34.0, 34.11], [38.0, 38.01], [41.0, 41.45], [43.0, 43.48], [45.0, 45.01], [46.0, 47.09], [54.0, 58.41], [61.0, 61.48], [70.0, 70.77], [76.0, 76.06], [80.0, 80.87], [84.0, 85.5], [88.0, 88.05], [89.0, 92.55], [95.0, 97.26], [99.0, 100.06], [101.0, 100.94], [101.0, 101.88], [103.0, 107.3], [108.0, 109.85], [110.0, 111.0], [112.0, 112.53], [116.0, 116.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.53, 58.22, 0.0, 0.0, 0.0, 39.18, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.1], ["radio", 11.16], ["animal", 10.19]], null, null, null, null, null, null, [["sidetone", 60.73], ["music", 8.81], ["speech", 4.22]], null, null, null, null, [["fly, housefly", 25.32], ["insect", 20.5], ["hum", 9.34]], null, null, null, null], "duration": [0.13, 0.78, 1.12, 0.51, 0.57, 0.71, 1.06, 1.96, 0.43, 0.11, 0.01, 0.45, 0.48, 0.01, 1.09, 4.41, 0.48, 0.77, 0.06, 0.87, 1.5, 0.05, 3.55, 2.26, 1.06, -0.06, 0.88, 4.3, 1.85, 1.0, 0.53, 0.11]}
annotations_filtered/a2qE4hG9XCk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[6.0, 6.51], [7.0, 16.28], [17.0, 44.27], [44.0, 48.25], [49.0, 49.55], [51.0, 62.7], [66.0, 68.79], [75.0, 78.66], [82.0, 87.18], [93.0, 93.24], [95.0, 98.24], [99.0, 101.66], [103.0, 103.11], [109.0, 109.53], [113.0, 121.42], [125.0, 140.16]], "keep_status": [false, true, true, true, false, false, true, true, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 34.06, 31.04, 31.35, 0.0, 35.1, 37.56, 30.82, 30.25, 0.0, 32.35, 30.67, 0.0, 0.0, 30.43, 30.69], "audiomae_on_audioset": [null, [["hum", 23.84], ["music", 23.15], ["speech", 15.4]], [["music", 43.75], ["speech", 17.57], ["motorcycle", 6.65]], [["music", 46.49], ["throbbing", 9.02], ["hum", 6.22]], null, [["music", 42.89], ["whale vocalization", 15.88], ["speech", 15.0]], [["whale vocalization", 24.0], ["speech", 18.08], ["noise", 10.59]], [["music", 31.6], ["throbbing", 17.26], ["hum", 10.33]], [["music", 61.56], ["throbbing", 4.44], ["hum", 4.18]], null, [["music", 54.62], ["throbbing", 15.17], ["hum", 7.45]], [["music", 46.12], ["hum", 9.91], ["mains hum", 8.59]], null, null, [["speech", 23.11], ["buzz", 19.19], ["fly, housefly", 11.27]], [["music", 52.58], ["speech", 15.87], ["throbbing", 2.57]]], "duration": [0.51, 9.28, 27.27, 4.25, 0.55, 11.7, 2.79, 3.66, 5.18, 0.24, 3.24, 2.66, 0.11, 0.53, 8.42, 15.16]}
annotations_filtered/a38HZFbhB-M_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 2.51], [5.0, 5.93], [8.0, 8.23], [10.0, 9.75], [11.0, 11.5], [13.0, 13.46], [14.0, 16.65], [17.0, 18.1], [26.0, 26.05], [28.0, 35.18], [38.0, 43.17], [51.0, 51.7], [55.0, 56.25], [57.0, 57.59], [59.0, 60.15], [61.0, 61.18], [62.0, 79.42], [83.0, 83.39], [89.0, 88.99], [92.0, 96.6], [100.0, 101.65], [104.0, 105.56], [107.0, 107.3], [110.0, 114.22], [116.0, 119.01], [121.0, 121.19], [125.0, 125.73]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 0.0, 0.0, 34.11, 55.25, 0.0, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 0.0, 98.59, 0.0, 0.0, 0.0, 99.48, 61.57, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 17.82], ["moo", 15.05], ["grunt", 9.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 0.93, 0.23, -0.25, 0.5, 0.46, 2.65, 1.1, 0.05, 7.18, 5.17, 0.7, 1.25, 0.59, 1.15, 0.18, 17.42, 0.39, -0.01, 4.6, 1.65, 1.56, 0.3, 4.22, 3.01, 0.19, 0.73]}
annotations_filtered/a3HOCIXroqQ_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 10.08], [13.0, 14.2], [19.0, 23.7], [27.0, 27.04], [34.0, 34.69], [37.0, 39.28], [40.0, 63.29], [65.0, 64.94], [65.0, 65.52], [67.0, 126.54]], "keep_status": [false, false, true, false, false, true, true, false, false, false], "silence_prob": [32.05, 0.0, 34.24, 0.0, 0.0, 29.76, 29.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 29.22], ["music", 21.11], ["hum", 19.91]], null, [["music", 20.85], ["speech", 18.62], ["throbbing", 17.01]], null, null, [["noise", 20.23], ["hum", 16.92], ["mains hum", 11.09]], [["vehicle", 21.13], ["music", 11.74], ["buzz", 11.25]], null, null, null], "duration": [2.08, 1.2, 4.7, 0.04, 0.69, 2.28, 23.29, -0.06, 0.52, 59.54]}
annotations_filtered/a3Xm0KpUYj4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 3.4], [11.0, 11.6], [14.0, 29.15], [31.0, 33.18], [36.0, 38.64], [40.0, 45.66], [47.0, 47.02], [48.0, 49.33], [50.0, 52.83]], "keep_status": [false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 28.51, 33.06, 32.56, 39.5, 0.0, 0.0, 36.1], "audiomae_on_audioset": [null, null, [["music", 35.34], ["hum", 24.56], ["throbbing", 24.16]], [["music", 29.16], ["synthesizer", 10.57], ["hum", 7.12]], [["music", 48.31], ["hum", 11.81], ["mains hum", 5.86]], [["speech", 55.42], ["hum", 20.14], ["mains hum", 7.45]], null, null, [["music", 65.82], ["bass guitar", 3.45], ["didgeridoo", 3.32]]], "duration": [0.4, 0.6, 15.15, 2.18, 2.64, 5.66, 0.02, 1.33, 2.83]}
annotations_filtered/a3bI7kbVBwM_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 12.06], [14.0, 15.2], [17.0, 17.78], [18.0, 22.47], [24.0, 29.62], [30.0, 31.94], [33.0, 35.24], [37.0, 44.58], [46.0, 47.34], [50.0, 64.47], [65.0, 70.48], [74.0, 75.56], [82.0, 94.19], [97.0, 100.57], [101.0, 118.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [30.36, 0.0, 0.0, 30.17, 29.78, 0.0, 29.83, 30.65, 0.0, 30.3, 31.21, 0.0, 29.97, 29.93, 30.22], "audiomae_on_audioset": [[["music", 64.4], ["throbbing", 7.64], ["electronic music", 4.49]], null, null, [["music", 79.91], ["throbbing", 4.67], ["electronic music", 3.1]], [["music", 77.63], ["electronic music", 3.75], ["techno", 2.7]], null, [["music", 73.6], ["sampler", 2.59], ["electronic music", 2.54]], [["music", 64.57], ["hum", 5.2], ["drum and bass", 3.68]], null, [["music", 92.31], ["funny music", 1.14], ["throbbing", 0.69]], [["music", 37.47], ["didgeridoo", 7.61], ["musical instrument", 4.85]], null, [["music", 85.85], ["roll", 2.42], ["rock and roll", 2.05]], [["music", 78.76], ["buzz", 1.91], ["electronic music", 1.58]], [["music", 94.63], ["psychedelic rock", 0.83], ["rock music", 0.67]]], "duration": [4.06, 1.2, 0.78, 4.47, 5.62, 1.94, 2.24, 7.58, 1.34, 14.47, 5.48, 1.56, 12.19, 3.57, 17.32]}
annotations_filtered/a469ezsg86A_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[8.0, 8.82], [9.0, 8.88], [11.0, 12.83], [15.0, 15.8], [19.0, 19.97], [21.0, 26.54], [37.0, 50.43], [55.0, 55.63], [56.0, 57.37], [59.0, 60.0], [61.0, 61.11], [68.0, 68.05], [73.0, 72.99], [74.0, 74.49], [76.0, 76.44], [77.0, 86.58], [91.0, 93.39], [96.0, 96.04], [96.0, 105.07], [107.0, 109.0], [112.0, 119.21], [120.0, 121.61], [123.0, 140.16], [150.0, 150.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.89, 100.0, 0.0, 59.33, 83.52, 65.67, 0.0, 32.26, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.23], ["throbbing", 28.2], ["mains hum", 13.9]], null], "duration": [0.82, -0.12, 1.83, 0.8, 0.97, 5.54, 13.43, 0.63, 1.37, 1.0, 0.11, 0.05, -0.01, 0.49, 0.44, 9.58, 2.39, 0.04, 9.07, 2.0, 7.21, 1.61, 17.16, 0.18]}
annotations_filtered/a46FsHMRPkc_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 22.11], [23.0, 31.28], [36.0, 47.48], [52.0, 54.92], [59.0, 77.94], [79.0, 83.32], [84.0, 85.14], [96.0, 96.26], [100.0, 102.32], [113.0, 117.24], [118.0, 124.04]], "keep_status": [false, false, false, false, true, true, false, false, true, true, true], "silence_prob": [34.0, 33.64, 32.79, 33.0, 35.28, 30.13, 0.0, 0.0, 33.55, 30.4, 31.63], "audiomae_on_audioset": [[["music", 48.43], ["speech", 34.15], ["throbbing", 3.22]], [["throbbing", 40.2], ["hum", 36.72], ["music", 10.94]], [["music", 47.04], ["speech", 25.06], ["didgeridoo", 3.92]], [["speech", 46.67], ["music", 18.29], ["throbbing", 9.59]], [["music", 51.13], ["throbbing", 7.87], ["didgeridoo", 5.32]], [["hum", 22.39], ["mains hum", 22.38], ["music", 15.76]], null, null, [["music", 51.17], ["speech", 12.01], ["musical instrument", 2.31]], [["music", 38.96], ["hum", 9.61], ["throbbing", 9.46]], [["hum", 25.69], ["music", 16.72], ["throbbing", 13.49]]], "duration": [18.11, 8.28, 11.48, 2.92, 18.94, 4.32, 1.14, 0.26, 2.32, 4.24, 6.04]}
annotations_filtered/a46m8g3grB8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[25.0, 46.68], [51.0, 64.29], [65.0, 65.45], [66.0, 66.9], [79.0, 79.08], [80.0, 80.35], [81.0, 84.5], [85.0, 85.94], [86.0, 88.89], [93.0, 93.01], [95.0, 95.49], [100.0, 100.21], [102.0, 103.0], [105.0, 105.81], [106.0, 107.16], [108.0, 109.11], [114.0, 115.15], [116.0, 116.41], [117.0, 118.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.45, 52.74, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.83], ["fly, housefly", 3.57], ["livestock, farm animals, working animals", 3.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [21.68, 13.29, 0.45, 0.9, 0.08, 0.35, 3.5, 0.94, 2.89, 0.01, 0.49, 0.21, 1.0, 0.81, 1.16, 1.11, 1.15, 0.41, 1.98]}
annotations_filtered/a4EqbYUl7Rg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []}
annotations_filtered/a4OWkIrQUJw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 5.21], [7.0, 8.19], [9.0, 10.81], [13.0, 13.39], [14.0, 18.33], [25.0, 25.59], [33.0, 36.09], [40.0, 39.77], [40.0, 42.6], [44.0, 50.67], [52.0, 55.78], [57.0, 59.39], [63.0, 64.02], [64.0, 64.1], [64.0, 64.13], [65.0, 65.25], [66.0, 67.24], [68.0, 83.54], [85.0, 85.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.51, 0.0, 0.0, 0.0, 99.44, 0.0, 98.59, 0.0, 72.31, 91.81, 99.31, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.25, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.21, 1.19, 1.81, 0.39, 4.33, 0.59, 3.09, -0.23, 2.6, 6.67, 3.78, 2.39, 1.02, 0.1, 0.13, 0.25, 1.24, 15.54, 0.04]}
annotations_filtered/a4QlQy31HIk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 7.28], [8.0, 14.93], [18.0, 28.48], [30.0, 31.97], [33.0, 63.54], [66.0, 96.26], [98.0, 101.12], [103.0, 128.22]], "keep_status": [false, true, true, false, false, false, true, true], "silence_prob": [0.0, 30.27, 30.07, 0.0, 0.0, 0.0, 39.55, 42.44], "audiomae_on_audioset": [null, [["speech", 27.5], ["music", 24.35], ["hum", 9.27]], [["music", 19.56], ["speech", 15.0], ["hum", 12.25]], null, null, null, [["hum", 24.97], ["mains hum", 22.91], ["music", 20.21]], [["noise", 24.48], ["hum", 16.54], ["music", 14.5]]], "duration": [0.28, 6.93, 10.48, 1.97, 30.54, 30.26, 3.12, 25.22]}
annotations_filtered/a4Td_W5dc1w_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 6.2], [8.0, 8.36], [10.0, 11.38], [19.0, 19.4], [23.0, 24.04], [24.0, 24.93], [26.0, 26.77], [31.0, 31.62], [35.0, 34.87], [35.0, 35.73], [36.0, 36.63], [37.0, 37.86], [41.0, 41.93], [44.0, 44.39], [51.0, 56.3], [58.0, 58.5], [59.0, 60.93], [62.0, 82.36], [86.0, 87.0], [91.0, 91.03], [93.0, 97.14], [100.0, 100.31], [108.0, 146.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 32.04, 0.0, 0.0, 30.99, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.3], ["hum", 15.38], ["mains hum", 7.65]], null, null, [["music", 38.63], ["explosion", 10.49], ["burst, pop", 6.94]], null, null], "duration": [1.2, 0.36, 1.38, 0.4, 1.04, 0.93, 0.77, 0.62, -0.13, 0.73, 0.63, 0.86, 0.93, 0.39, 5.3, 0.5, 1.93, 20.36, 1.0, 0.03, 4.14, 0.31, 38.69]}
annotations_filtered/a4wb-xmYM50_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 3.47], [9.0, 11.67], [15.0, 22.13], [23.0, 23.46], [26.0, 34.11], [38.0, 44.25], [45.0, 46.06], [49.0, 59.48], [63.0, 69.08]], "keep_status": [false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 40.73, 35.24, 0.0, 36.3, 37.27, 0.0, 35.08, 40.88], "audiomae_on_audioset": [null, [["buzz", 56.53], ["hum", 12.33], ["mains hum", 6.05]], [["hum", 42.75], ["mains hum", 30.32], ["throbbing", 8.57]], null, [["hum", 35.12], ["speech", 17.07], ["throbbing", 14.89]], [["hum", 48.86], ["throbbing", 35.08], ["mains hum", 4.19]], null, [["hum", 30.38], ["throbbing", 23.71], ["speech", 10.64]], [["music", 77.9], ["buzz", 2.24], ["guitar", 2.01]]], "duration": [1.47, 2.67, 7.13, 0.46, 8.11, 6.25, 1.06, 10.48, 6.08]}
annotations_filtered/a51EYR5AeNk_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[31.0, 43.12], [46.0, 68.45], [71.0, 71.14], [71.0, 78.63], [83.0, 84.86], [86.0, 101.33], [102.0, 103.42], [112.0, 113.43], [116.0, 116.58], [120.0, 120.93], [131.0, 133.64], [135.0, 136.41], [140.0, 142.33], [145.0, 149.47], [151.0, 152.95], [154.0, 154.06], [158.0, 159.19]], "keep_status": [true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.93, 31.81, 0.0, 29.17, 0.0, 31.4, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 84.07, 53.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.23], ["smash, crash", 11.94], ["buzz", 5.32]], [["music", 33.2], ["hum", 20.68], ["throbbing", 16.77]], null, [["hum", 17.99], ["music", 17.76], ["mains hum", 12.42]], null, [["speech", 29.18], ["music", 25.38], ["hum", 8.18]], null, null, null, null, null, null, null, null, null, null, null], "duration": [12.12, 22.45, 0.14, 7.63, 1.86, 15.33, 1.42, 1.43, 0.58, 0.93, 2.64, 1.41, 2.33, 4.47, 1.95, 0.06, 1.19]}
annotations_filtered/a5BtDmdw708_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 3.08], [4.0, 7.11], [8.0, 9.12], [11.0, 11.87], [21.0, 21.17], [24.0, 25.41], [26.0, 32.53], [40.0, 43.88], [44.0, 46.33], [47.0, 53.97], [54.0, 58.16]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [97.0, 99.94, 0.0, 0.0, 0.0, 0.0, 98.44, 86.27, 99.44, 38.78, 39.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 21.24], ["music", 14.23], ["fly, housefly", 7.52]], [["speech", 35.39], ["vehicle", 5.83], ["electric shaver, electric razor", 5.71]]], "duration": [2.08, 3.11, 1.12, 0.87, 0.17, 1.41, 6.53, 3.88, 2.33, 6.97, 4.16]}
annotations_filtered/a5PoLM_QBuo_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[4.0, 5.9], [8.0, 10.64], [13.0, 27.92], [31.0, 30.94], [35.0, 36.42], [38.0, 38.37], [39.0, 40.32], [41.0, 43.44], [45.0, 46.97], [47.0, 48.83], [49.0, 70.58], [73.0, 73.41], [74.0, 75.95], [77.0, 80.7], [81.0, 82.05], [84.0, 84.4], [85.0, 106.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 42.81, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 51.77, 0.0, 0.0, 50.71, 0.0, 0.0, 65.44], "audiomae_on_audioset": [null, null, [["speech", 61.24], ["firecracker", 16.51], ["explosion", 3.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.9, 2.64, 14.92, -0.06, 1.42, 0.37, 1.32, 2.44, 1.97, 1.83, 21.58, 0.41, 1.95, 3.7, 1.05, 0.4, 21.64]}
annotations_filtered/a5QBuJla5do_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 6.3], [8.0, 21.41], [23.0, 26.11], [27.0, 29.39], [35.0, 38.53], [46.0, 46.55], [48.0, 50.57], [53.0, 58.63], [60.0, 64.23], [69.0, 69.97], [78.0, 86.58], [93.0, 92.89], [94.0, 99.27], [101.0, 100.95], [108.0, 112.95], [115.0, 120.75]], "keep_status": [false, true, false, false, true, false, true, false, true, false, false, false, false, false, true, true], "silence_prob": [54.5, 34.44, 34.38, 35.29, 33.27, 0.0, 37.88, 31.02, 35.54, 0.0, 33.09, 0.0, 30.71, 0.0, 30.46, 30.68], "audiomae_on_audioset": [null, [["hum", 25.05], ["whale vocalization", 24.84], ["mains hum", 11.16]], [["music", 62.95], ["synthesizer", 9.03], ["musical instrument", 7.64]], [["music", 67.34], ["musical instrument", 6.02], ["synthesizer", 4.92]], [["music", 43.61], ["speech", 12.42], ["boing", 3.03]], null, [["speech", 24.78], ["music", 24.15], ["moo", 8.08]], [["music", 64.75], ["theremin", 8.05], ["musical instrument", 5.76]], [["music", 24.1], ["shofar", 21.51], ["speech", 8.52]], null, [["music", 53.68], ["speech", 21.59], ["sidetone", 8.85]], null, [["music", 66.88], ["synthesizer", 6.28], ["musical instrument", 4.34]], null, [["music", 29.66], ["speech", 24.47], ["theremin", 12.86]], [["music", 37.47], ["speech", 18.05], ["hum", 4.14]]], "duration": [3.3, 13.41, 3.11, 2.39, 3.53, 0.55, 2.57, 5.63, 4.23, 0.97, 8.58, -0.11, 5.27, -0.05, 4.95, 5.75]}
annotations_filtered/a5WAyc-EaNc_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 11.21], [12.0, 12.14], [12.0, 20.33], [21.0, 22.77], [23.0, 25.0], [26.0, 28.02], [30.0, 30.64], [32.0, 33.71], [35.0, 37.45], [41.0, 43.16], [44.0, 49.57], [52.0, 54.13], [56.0, 58.72], [60.0, 61.74], [62.0, 63.42], [67.0, 68.76], [70.0, 73.08]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.97, 0.0, 39.33, 0.0, 39.14, 66.76, 0.0, 0.0, 69.74, 67.0, 59.86, 76.37, 39.18, 0.0, 0.0, 0.0, 80.46], "audiomae_on_audioset": [[["music", 49.36], ["theremin", 32.05], ["ambient music", 5.47]], null, [["music", 29.12], ["hum", 14.07], ["theremin", 9.74]], null, [["speech", 49.92], ["music", 11.27], ["hum", 4.7]], null, null, null, null, null, null, null, [["speech", 58.33], ["sidetone", 22.12], ["busy signal", 6.91]], null, null, null, null], "duration": [8.21, 0.14, 8.33, 1.77, 2.0, 2.02, 0.64, 1.71, 2.45, 2.16, 5.57, 2.13, 2.72, 1.74, 1.42, 1.76, 3.08]}
annotations_filtered/a6--cEjo3bY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[5.0, 6.78], [9.0, 8.77], [13.0, 15.97], [19.0, 20.11], [21.0, 21.59], [32.0, 32.14], [36.0, 36.42], [37.0, 37.96], [41.0, 44.52], [48.0, 48.9], [58.0, 63.95], [66.0, 67.51], [69.0, 71.05], [73.0, 73.26], [73.0, 74.24], [76.0, 76.91], [77.0, 80.38], [82.0, 83.54], [85.0, 87.17], [88.0, 89.13], [90.0, 92.23], [95.0, 96.92], [102.0, 111.75], [115.0, 115.4], [116.0, 117.19], [118.0, 123.5], [124.0, 123.57], [124.0, 124.78], [130.0, 132.22], [135.0, 147.31], [147.0, 173.84], [174.0, 175.58], [176.0, 177.69]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 42.44, 0.0, 0.0, 0.0, 0.0, 0.0, 53.16, 0.0, 88.28, 0.0, 73.06, 0.0, 0.0, 0.0, 42.28, 0.0, 48.1, 0.0, 91.13, 0.0, 38.12, 0.0, 0.0, 36.09, 0.0, 0.0, 98.19, 35.94, 31.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 26.2], ["livestock, farm animals, working animals", 18.55], ["moo", 13.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["creak", 31.23], ["noise", 11.59], ["mosquito", 7.08]], null, [["speech", 36.9], ["insect", 8.79], ["fly, housefly", 8.46]], null, null, null, [["throbbing", 16.94], ["noise", 16.05], ["whack, thwack", 10.06]], null, null, [["speech", 57.84], ["noise", 3.97], ["hum", 3.65]], null, null, null, [["speech", 47.81], ["sidetone", 7.89], ["fart", 7.02]], [["speech", 38.55], ["whack, thwack", 9.09], ["animal", 6.55]], null, null], "duration": [1.78, -0.23, 2.97, 1.11, 0.59, 0.14, 0.42, 0.96, 3.52, 0.9, 5.95, 1.51, 2.05, 0.26, 1.24, 0.91, 3.38, 1.54, 2.17, 1.13, 2.23, 1.92, 9.75, 0.4, 1.19, 5.5, -0.43, 0.78, 2.22, 12.31, 26.84, 1.58, 1.69]}
annotations_filtered/a66f39DMwtY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[27.0, 30.94], [39.0, 43.6], [46.0, 46.23], [47.0, 47.85], [51.0, 51.19], [54.0, 54.7], [63.0, 73.25], [75.0, 75.63], [81.0, 81.21]], "keep_status": [false, true, false, false, false, false, true, false, false], "silence_prob": [38.04, 46.47, 0.0, 0.0, 0.0, 0.0, 40.92, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 43.9], ["music", 25.11], ["theremin", 3.47]], [["speech", 51.46], ["music", 10.16], ["sidetone", 7.42]], null, null, null, null, [["hum", 20.51], ["speech", 20.33], ["mains hum", 13.79]], null, null], "duration": [3.94, 4.6, 0.23, 0.85, 0.19, 0.7, 10.25, 0.63, 0.21]}
annotations_filtered/a6CsW4dCk_8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 5.56], [7.0, 7.03], [8.0, 10.0], [16.0, 16.21], [18.0, 18.72], [19.0, 20.75], [30.0, 30.69], [36.0, 35.94], [37.0, 40.19], [42.0, 61.75], [74.0, 74.6], [75.0, 76.27], [82.0, 84.91], [95.0, 101.58], [107.0, 107.0], [112.0, 141.22], [142.0, 145.91]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [80.64, 0.0, 91.98, 0.0, 0.0, 0.0, 0.0, 0.0, 31.46, 40.34, 0.0, 0.0, 30.19, 30.15, 0.0, 32.56, 92.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["ocean", 8.95], ["speech", 8.36], ["cattle, bovinae", 7.04]], [["music", 66.06], ["mains hum", 5.13], ["noise", 3.89]], null, null, [["music", 59.54], ["speech", 12.16], ["didgeridoo", 4.02]], [["music", 70.03], ["whale vocalization", 4.46], ["foghorn", 2.93]], null, [["speech", 77.42], ["vehicle", 3.96], ["boat, water vehicle", 2.4]], null], "duration": [3.56, 0.03, 2.0, 0.21, 0.72, 1.75, 0.69, -0.06, 3.19, 19.75, 0.6, 1.27, 2.91, 6.58, 0.0, 29.22, 3.91]}
annotations_filtered/a6XtVMtUZI8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[42.0, 46.57], [47.0, 47.43], [51.0, 51.9], [53.0, 53.77], [55.0, 59.09], [61.0, 62.43], [63.0, 66.53], [67.0, 74.46], [75.0, 77.92], [79.0, 80.57], [81.0, 83.24], [86.0, 111.27], [112.0, 118.86], [120.0, 120.53], [122.0, 127.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 65.09, 86.09, 0.0, 96.04, 99.48, 100.0, 0.0, 97.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.57, 0.43, 0.9, 0.77, 4.09, 1.43, 3.53, 7.46, 2.92, 1.57, 2.24, 25.27, 6.86, 0.53, 5.16]}
annotations_filtered/a6cUudbbHl0_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[2.0, 4.43], [6.0, 8.16], [10.0, 13.42], [14.0, 18.96], [20.0, 21.91], [24.0, 26.52], [32.0, 35.9], [40.0, 40.49], [42.0, 42.77], [44.0, 49.82], [54.0, 57.21], [59.0, 60.22], [61.0, 62.61], [65.0, 68.84], [69.0, 69.45], [69.0, 69.5], [70.0, 70.7], [76.0, 76.25], [79.0, 81.67], [84.0, 85.08], [94.0, 94.95], [97.0, 97.75], [99.0, 100.33], [103.0, 107.72], [108.0, 114.07], [115.0, 117.91], [119.0, 120.95], [123.0, 124.09], [125.0, 127.62], [130.0, 131.46], [132.0, 134.47], [136.0, 137.69], [140.0, 140.83], [142.0, 143.43], [148.0, 150.13], [151.0, 153.54], [157.0, 158.13], [159.0, 160.1], [161.0, 162.23], [165.0, 165.67], [167.0, 168.1]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.22, 44.07, 60.32, 42.58, 0.0, 52.33, 54.63, 0.0, 0.0, 55.46, 36.52, 0.0, 0.0, 31.99, 0.0, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 0.0, 0.0, 61.57, 40.7, 31.77, 0.0, 0.0, 36.44, 0.0, 38.95, 0.0, 0.0, 0.0, 43.4, 46.54, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.35], ["electronic music", 9.73], ["synthesizer", 7.52]], [["music", 53.53], ["singing bowl", 26.36], ["ambient music", 5.01]], null, [["singing bowl", 28.24], ["music", 27.15], ["speech", 21.3]], null, null, null, null, null, null, [["sine wave", 39.03], ["chirp tone", 13.69], ["fire", 4.75]], null, null, [["music", 18.64], ["hum", 14.18], ["speech", 14.15]], null, null, null, null, null, null, null, null, null, null, [["music", 36.79], ["singing bowl", 33.59], ["speech", 6.61]], [["speech", 22.16], ["music", 10.02], ["thump, thud", 6.55]], null, null, [["music", 70.79], ["hum", 5.79], ["electronic music", 3.78]], null, [["music", 27.48], ["sine wave", 23.14], ["gong", 15.43]], null, null, null, [["music", 47.25], ["singing bowl", 21.38], ["ambient music", 4.26]], [["music", 62.75], ["musical instrument", 7.93], ["synthesizer", 4.96]], null, null, null, null, null], "duration": [2.43, 2.16, 3.42, 4.96, 1.91, 2.52, 3.9, 0.49, 0.77, 5.82, 3.21, 1.22, 1.61, 3.84, 0.45, 0.5, 0.7, 0.25, 2.67, 1.08, 0.95, 0.75, 1.33, 4.72, 6.07, 2.91, 1.95, 1.09, 2.62, 1.46, 2.47, 1.69, 0.83, 1.43, 2.13, 2.54, 1.13, 1.1, 1.23, 0.67, 1.1]}
annotations_filtered/a6mkbps0BmY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[7.0, 8.77], [51.0, 51.6], [53.0, 54.11], [60.0, 60.44], [67.0, 68.27], [71.0, 72.81], [77.0, 77.58], [86.0, 86.09], [88.0, 89.21], [90.0, 90.75], [93.0, 93.09], [121.0, 121.22], [122.0, 123.09], [130.0, 129.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.77, 0.6, 1.11, 0.44, 1.27, 1.81, 0.58, 0.09, 1.21, 0.75, 0.09, 0.22, 1.09, -0.16]}
annotations_filtered/a6oC5iQB4u8_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[34.0, 37.44], [41.0, 43.04], [45.0, 46.92], [47.0, 59.53], [60.0, 62.06], [63.0, 64.72], [67.0, 70.77], [72.0, 72.66], [75.0, 76.08], [77.0, 86.34], [96.0, 96.72], [97.0, 110.73], [113.0, 115.18], [116.0, 117.31], [119.0, 124.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.26, 96.17, 0.0, 99.73, 88.1, 0.0, 88.64, 0.0, 0.0, 82.97, 0.0, 99.84, 86.82, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.44, 2.04, 1.92, 12.53, 2.06, 1.72, 3.77, 0.66, 1.08, 9.34, 0.72, 13.73, 2.18, 1.31, 5.93]}
annotations_filtered/a72FDTElH9g_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[1.0, 2.83], [7.0, 9.14], [11.0, 11.42], [14.0, 15.33], [16.0, 18.6], [20.0, 21.29], [24.0, 24.38], [26.0, 26.28], [30.0, 30.18], [31.0, 32.12], [33.0, 33.61], [35.0, 34.91], [36.0, 37.93], [39.0, 44.47], [50.0, 51.71], [52.0, 136.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.8, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.83, 2.14, 0.42, 1.33, 2.6, 1.29, 0.38, 0.28, 0.18, 1.12, 0.61, -0.09, 1.93, 5.47, 1.71, 84.34]}
annotations_filtered/a7K1xgoi_c4_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[12.0, 15.72], [17.0, 23.55], [26.0, 32.29], [37.0, 55.34], [58.0, 58.97], [62.0, 62.6], [64.0, 65.67], [72.0, 72.45]], "keep_status": [true, true, true, false, false, false, false, false], "silence_prob": [31.74, 33.25, 34.38, 32.68, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 32.88], ["eruption", 13.01], ["explosion", 5.35]], [["whale vocalization", 24.86], ["ocean", 6.15], ["boat, water vehicle", 5.71]], [["whale vocalization", 44.44], ["gurgling", 10.8], ["stomach rumble", 7.38]], [["whale vocalization", 85.03], ["music", 2.88], ["speech", 2.77]], null, null, null, null], "duration": [3.72, 6.55, 6.29, 18.34, 0.97, 0.6, 1.67, 0.45]}
annotations_filtered/a7XZaIy4a9k_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 4.23], [7.0, 8.18], [12.0, 12.66], [15.0, 16.58], [18.0, 18.15], [18.0, 27.19], [28.0, 29.71], [31.0, 31.65], [33.0, 35.41], [38.0, 39.07], [40.0, 40.34], [41.0, 42.04], [43.0, 44.15], [48.0, 48.69], [50.0, 50.79], [51.0, 55.97], [57.0, 58.18], [59.0, 61.25], [62.0, 63.12], [66.0, 68.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 83.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.97, 0.0, 66.76, 0.0, 74.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 1.18, 0.66, 1.58, 0.15, 9.19, 1.71, 0.65, 2.41, 1.07, 0.34, 1.04, 1.15, 0.69, 0.79, 4.97, 1.18, 2.25, 1.12, 2.69]}
annotations_filtered/a7gZgEpgKiY_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[3.0, 2.88], [4.0, 4.78], [8.0, 8.78], [12.0, 23.6], [25.0, 26.11], [26.0, 28.24], [30.0, 29.79], [31.0, 35.06], [36.0, 62.5], [64.0, 67.8], [69.0, 73.23], [75.0, 79.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.54, 0.0, 65.32, 0.0, 96.66, 69.47, 92.48, 94.52, 53.4], "audiomae_on_audioset": [null, null, null, [["music", 54.8], ["speech", 10.19], ["fart", 6.48]], null, null, null, null, null, null, null, null], "duration": [-0.12, 0.78, 0.78, 11.6, 1.11, 2.24, -0.21, 4.06, 26.5, 3.8, 4.23, 4.14]}
annotations_filtered/a7qRJ9T9TPg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[10.0, 24.11], [28.0, 31.5], [35.0, 36.29], [37.0, 39.31], [42.0, 42.62], [44.0, 47.12], [51.0, 55.39], [59.0, 81.24], [93.0, 96.7], [104.0, 104.55], [113.0, 112.99], [118.0, 118.81], [119.0, 120.24]], "keep_status": [true, true, false, true, false, false, false, true, true, false, false, false, false], "silence_prob": [31.8, 33.24, 0.0, 33.83, 0.0, 33.18, 33.78, 32.2, 31.27, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.55], ["synthesizer", 9.81], ["speech", 9.02]], [["speech", 22.7], ["music", 20.68], ["vehicle", 4.96]], null, [["music", 62.8], ["foghorn", 2.4], ["musical instrument", 2.38]], null, [["music", 85.52], ["musical instrument", 1.75], ["hum", 1.75]], [["music", 55.28], ["synthesizer", 13.07], ["musical instrument", 4.61]], [["music", 21.48], ["theremin", 12.47], ["civil defense siren", 12.02]], [["music", 21.0], ["speech", 18.21], ["dog", 10.71]], null, null, null, null], "duration": [14.11, 3.5, 1.29, 2.31, 0.62, 3.12, 4.39, 22.24, 3.7, 0.55, -0.01, 0.81, 1.24]}
annotations_filtered/a7vAR-7YBWE_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[19.0, 19.67], [21.0, 22.3], [23.0, 23.62], [25.0, 25.79], [27.0, 29.39], [32.0, 35.19], [36.0, 35.85], [36.0, 40.36], [49.0, 49.57], [57.0, 57.77], [59.0, 63.15], [67.0, 67.83], [71.0, 72.74], [75.0, 81.87], [93.0, 93.06], [95.0, 96.38], [98.0, 104.58], [115.0, 115.87], [128.0, 129.05]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 64.86, 83.34, 0.0, 44.29, 0.0, 0.0, 55.18, 0.0, 0.0, 40.62, 0.0, 0.0, 36.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 27.72], ["music", 13.7], ["fly, housefly", 6.73]], null, null, null, null, null, [["music", 32.41], ["singing bowl", 11.96], ["synthesizer", 7.81]], null, null, [["speech", 31.39], ["mains hum", 14.2], ["music", 10.77]], null, null], "duration": [0.67, 1.3, 0.62, 0.79, 2.39, 3.19, -0.15, 4.36, 0.57, 0.77, 4.15, 0.83, 1.74, 6.87, 0.06, 1.38, 6.58, 0.87, 1.05]}
annotations_filtered/a81pNygdAXw_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[9.0, 12.95], [13.0, 14.17], [15.0, 18.67], [20.0, 20.43], [23.0, 23.65], [27.0, 27.89], [29.0, 30.08], [32.0, 32.1], [33.0, 37.05], [40.0, 41.82], [44.0, 45.62], [48.0, 48.63], [52.0, 52.89], [56.0, 57.25], [62.0, 63.68], [65.0, 73.41], [75.0, 75.86], [77.0, 79.02], [82.0, 82.78], [84.0, 85.23], [86.0, 88.08], [91.0, 93.28], [95.0, 97.23], [99.0, 101.73], [103.0, 103.67], [105.0, 106.08], [109.0, 112.58]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.6, 0.0, 47.23, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 99.8, 79.07, 95.91, 99.68, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, [["cat", 7.72], ["hum", 6.7], ["inside, small room", 6.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.95, 1.17, 3.67, 0.43, 0.65, 0.89, 1.08, 0.1, 4.05, 1.82, 1.62, 0.63, 0.89, 1.25, 1.68, 8.41, 0.86, 2.02, 0.78, 1.23, 2.08, 2.28, 2.23, 2.73, 0.67, 1.08, 3.58]}
annotations_filtered/a861J6gxqmg_filtered.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"non_speech_segments": [[39.0, 47.41], [48.0, 49.42], [53.0, 57.6], [60.0, 63.56], [65.0, 80.57], [88.0, 88.15], [89.0, 88.99], [91.0, 92.31], [94.0, 94.88], [97.0, 97.01], [101.0, 102.44], [103.0, 103.33], [105.0, 107.38], [111.0, 113.98], [115.0, 125.37]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.43, 0.0, 31.27, 88.28, 34.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.53, 100.0, 100.0], "audiomae_on_audioset": [[["music", 21.72], ["speech", 18.46], ["hum", 12.25]], null, [["music", 38.73], ["breaking", 13.78], ["hum", 9.81]], null, [["music", 41.94], ["didgeridoo", 39.46], ["gong", 2.77]], null, null, null, null, null, null, null, null, null, null], "duration": [8.41, 1.42, 4.6, 3.56, 15.57, 0.15, -0.01, 1.31, 0.88, 0.01, 1.44, 0.33, 2.38, 2.98, 10.37]}