# File size: 1,696 Bytes
# Revisions: da3e61e, e22d140
import gradio as gr
import os
from acrcloud.recognizer import ACRCloudRecognizer

# ACRCloud credentials and endpoint are read from the environment; only the
# host has a fallback value.
acr_access_key = os.getenv('ACR_ACCESS_KEY')
acr_access_secret = os.getenv('ACR_ACCESS_SECRET')
acr_host = os.getenv('ACR_HOST', 'eu-west-1.api.acrcloud.com')

# Settings handed to the recognizer; the timeout is expressed in seconds.
config = dict(
    host=acr_host,
    access_key=acr_access_key,
    access_secret=acr_access_secret,
    timeout=10,
)

# Single recognizer instance built from the settings above.
acr = ACRCloudRecognizer(config)

def identify_audio(file):
    """Identify an uploaded audio file with the module-level ACRCloud recognizer.

    Three kinds of recognition calls are made against ``acr``:

    * one ``recognize_by_file`` call per 10-second offset across the file,
    * one ``recognize_by_file`` call starting at offset 0 that leaves the
      recognition length at the recognizer's default,
    * one ``recognize_by_filebuffer`` call on the raw bytes of the file.

    Args:
        file: Value supplied by the ``gr.File`` input. Either a filesystem
            path (``str`` / ``os.PathLike``) or an object exposing the path
            of the already-stored upload as ``.name``. ``None`` when nothing
            was uploaded.

    Returns:
        dict: ``"Partial Results"`` (list of ``"Time <offset>s: <response>"``
        strings), ``"Full Result"`` and ``"Buffer Result"`` (recognizer
        responses, returned unmodified). When no file was uploaded, a dict
        with a single ``"Error"`` key is returned instead.
    """
    if file is None:
        return {"Error": "No audio file provided."}

    # The upload is already on disk, so there is nothing to save; we only
    # need its path. Accept both a plain path and a wrapper with `.name`.
    if isinstance(file, (str, os.PathLike)):
        file_path = os.fspath(file)
    else:
        file_path = file.name

    # Step between offsets and length of each recognized segment, in seconds.
    chunk_seconds = 10

    # Duration is reported in milliseconds; offsets below are whole seconds.
    duration_ms = int(acr.get_duration_ms_by_file(file_path))

    results = []
    for offset in range(0, duration_ms // 1000, chunk_seconds):
        res = acr.recognize_by_file(file_path, offset, chunk_seconds)
        results.append(f"Time {offset}s: {res.strip()}")

    # Recognition starting at the beginning of the file.
    full_result = acr.recognize_by_file(file_path, 0)

    # Read the bytes first so the file handle is closed before the
    # (potentially slow) recognition request is made.
    with open(file_path, 'rb') as f:
        buf = f.read()
    buffer_result = acr.recognize_by_filebuffer(buf, 0)

    return {
        "Partial Results": results,
        "Full Result": full_result,
        "Buffer Result": buffer_result
    }

# Gradio components: a file upload as input, a JSON viewer as output.
audio_input = gr.File(label="Upload Audio File")
metadata_output = gr.JSON(label="Audio Metadata")

# Wire the components to the recognition handler.
iface = gr.Interface(
    fn=identify_audio,
    inputs=audio_input,
    outputs=metadata_output,
    title="Audio Search by File",
    description="Upload an audio file to identify it using ACRCloud.",
)

# Start serving the app.
iface.launch()