File size: 3,277 Bytes
c3e6538
 
 
bb86e76
c3e6538
761cc63
e51a96f
 
 
 
 
2db1d26
17e3ef6
c3e6538
 
761cc63
 
 
 
 
17e3ef6
761cc63
c3e6538
 
 
 
761cc63
c3e6538
4817b42
 
b66c175
144c7ec
6e44725
 
 
31adb1a
6e44725
 
b66c175
c3e6538
 
0b97e6d
c3e6538
6e44725
 
c3e6538
 
 
 
6e44725
761cc63
6e44725
 
 
 
 
 
8ea3af8
6e44725
a6f8f50
6e44725
 
dc801d7
6e44725
 
5580065
0b97e6d
6e44725
 
 
 
 
4341bec
6e44725
 
c3e6538
6e44725
c3e6538
4817b42
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
import torch
from speechscore import SpeechScore 
import gradio as gr
import pprint

def score_file(test_file, ref_file, score_list_nis, score_list_is):
    score_list = []
    if score_list_nis is not None:
        score_list += score_list_nis
    if score_list_is is not None:
        score_list += score_list_is        
    mySpeechScore = SpeechScore(score_list)  
    scores = mySpeechScore(test_path=test_file, reference_path=ref_file, window=None, score_rate=16000, return_mean=False, round_digits=2)
    return scores

def score_mic(test_file, score_list_nis):
    score_list = []
    if score_list_nis is not None:
        score_list += score_list_nis       
    mySpeechScore = SpeechScore(score_list)  
    scores = mySpeechScore(test_path=test_file, reference_path=None, window=None, score_rate=16000, return_mean=False, round_digits=2)
    return scores

demo = gr.Blocks()

file_score = gr.Interface(
    fn=score_file,
    inputs=[
        gr.Audio(sources=["upload"], label="test file", type="filepath"),
        gr.Audio(sources=["upload"], label="reference file", type="filepath"),
        gr.Dropdown(
            ["DNSMOS", "SRMR"], value=["DNSMOS"], multiselect=True, label="Non-Intrusive Scores", info="Choose scores to include, reference audio is not required."
        ),
        gr.Dropdown(
            ["PESQ", 'NB_PESQ', 'STOI', 'SISDR',
        'FWSEGSNR', 'LSD', 'BSSEval',
        'SNR', 'SSNR', 'LLR', 'CSIG', 'CBAK',
        'COVL', 'MCD'], value=["PESQ", "STOI"], multiselect=True, label="Intrusive Scores", info="Choose scores to include, reference audio is required."
        ),
    ],
    outputs="text",
    title="Test your speech quality using <a href='https://github.com/modelscope/ClearerVoice-Studio/tree/main/speechscore' target='_blank'>speechscore</a></p>",
    description=(
        "Score speech quality with the click of a button! Demo includes the"
        " commonly used speech quality assessments for the audio file"
        " of arbitrary length."
    ),
)

mic_score = gr.Interface(
    fn=score_mic,
    inputs=[
        gr.Audio(sources=["microphone"],
                waveform_options=gr.WaveformOptions(
                waveform_color="#01C6FF",
                waveform_progress_color="#0066B4",
                skip_length=2,
                show_controls=False,                
                ),
                type='numpy',
            ),
        gr.Dropdown(
            ["DNSMOS", "SRMR"], value=["DNSMOS"], multiselect=True, label="Non-Intrusive Scores", info="Choose scores to include, no reference audio is required."
        ),
    ],
    outputs="text",
    title="Test your microphone quality using <a href='https://github.com/modelscope/ClearerVoice-Studio/tree/main/speechscore' target='_blank'>speechscore</a></p>",
    description=(
        "Score your microphone quality with the click of a button!"
        " Uses the most popular method to test your microphone quality"
        " with a short speech clip."
    ),
    #article = ("<a href='https://github.com/modelscope/ClearerVoice-Studio/tree/main/speechscore' target='_blank'>Github Repo</a></p> for SpeechScore")
)

with demo:
    gr.TabbedInterface([mic_score, file_score], ["Score Microphone Quality", "Score Speech Quality"])

demo.launch()