{"segments": [[13.0, 18.0], [19.0, 20.43], [22.0, 24.17], [57.0, 62.0], [66.0, 68.44], [99.0, 100.2], [121.0, 122.76], [123.0, 125.02]], "p_music": [0.0, 0.0, 0.0, 15.92, 0.0, 0.0, 16.49, 0.0], "p_speech": [0.0, 25.32, 20.79, 14.5, 17.8, 48.19, 18.28, 18.18], "labels": ["P(~Music) = 0.0 | P(~Speech) = 0.0", "P(~Music) = 0.0 | P(~Speech) = 25.32", "P(~Music) = 0.0 | P(~Speech) = 20.79", "P(~Music) = 15.92 | P(~Speech) = 14.5", "P(~Music) = 0.0 | P(~Speech) = 17.8", "P(~Music) = 0.0 | P(~Speech) = 48.19", "P(~Music) = 16.49 | P(~Speech) = 18.28", "P(~Music) = 0.0 | P(~Speech) = 18.18"]}