Add url support to API

- server/main.py +9 -16
- server/preprocess.py +21 -1
server/main.py CHANGED

@@ -4,14 +4,12 @@ sys.path.append('..')
 
 import os
 from fastapi import FastAPI
-from pydantic import BaseModel
-import wget
 
 # torch
 import torch
 
 # utils
-from preprocess import process_from_filename, process_raw_wav
+from preprocess import process_from_filename, process_from_url, process_raw_wav
 from cnn import CNNetwork
 
 # load model
@@ -21,11 +19,6 @@ model.load_state_dict(state_dict)
 
 print(f"Model loaded! \n {model}")
 
-# /predict input
-# class Data(BaseModel):
-#     wav:
-
-
 app = FastAPI()
 
 @app.get("/")
@@ -34,12 +27,13 @@ async def root():
 
 @app.get("/urlpredict")
 def url_predict(url: str):
-
-    wav = process_from_filename(filename)
-    print(f"\ntest {wav.shape}\n")
+    wav = process_from_url(url)
 
     model_prediction = model_predict(wav)
-    return
+    return {
+        "message": "Voice Identified!",
+        "data": model_prediction,
+    }
 
 @app.put("/predict")
 def predict(wav):
@@ -49,16 +43,15 @@ def predict(wav):
     model_prediction = model_predict(wav)
 
     return {
-        "message": "
+        "message": "Voice Identified!",
         "data": model_prediction,
     }
 
 def model_predict(wav):
     model_input = wav.unsqueeze(0)
     output = model(model_input)
-
+    prediction_index = torch.argmax(output, 1).item()
 
     return {
-        "
-        "prediction_index": prediction,
+        "prediction_index": prediction_index,
     }
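In `model_predict`, the added `torch.argmax(output, 1).item()` takes the index of the largest logit along the class dimension and converts the resulting zero-dimensional tensor to a plain Python int, which is what ends up in the JSON response. As a usage sketch (not part of the commit), the new endpoint could be exercised from a Python client like this; the base URL and the audio URL are hypothetical placeholders:

```python
# Hypothetical client call against a locally running instance of the API.
# The base URL and the sample audio URL are placeholders, not from the commit.
import requests

resp = requests.get(
    "http://localhost:8000/urlpredict",
    params={"url": "https://example.com/sample.wav"},  # placeholder audio URL
)

# Per the handler above, the response should look like:
# {"message": "Voice Identified!", "data": {"prediction_index": <int>}}
print(resp.json())
```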
server/preprocess.py CHANGED

@@ -1,11 +1,31 @@
 """
 Util functions to process any incoming audio data to be processable by the model
 """
+import os
+import librosa
 import torch
 import torchaudio
+from scipy.io import wavfile
+import wget
 
 DEFAULT_SAMPLE_RATE=48000
 
+def process_from_url(url):
+    # download UI audio
+    filename = wget.download(url)
+    audio, sr = librosa.load(filename)
+    wavfile.write('temp.wav', DEFAULT_SAMPLE_RATE, audio)
+
+    # remove wget file
+    os.remove(filename)
+
+    # spec
+    spec = process_from_filename('temp.wav')
+
+    os.remove('temp.wav')
+    return spec
+
+
 def process_from_filename(filename, target_sample_rate=DEFAULT_SAMPLE_RATE, wav_length=5):
     wav, sample_rate = torchaudio.load(filename)
 
@@ -58,6 +78,6 @@ def _pad(wav, num_samples):
     if wav.shape[1] < num_samples:
         missing_samples = num_samples - wav.shape[1]
         pad = (0, missing_samples)
-        wav = torch.nn.
+        wav = torch.nn.functional.pad(wav, pad)
 
     return wav
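One caveat on `process_from_url`: `librosa.load` resamples to 22050 Hz by default, while `temp.wav` is written with `DEFAULT_SAMPLE_RATE` (48000) in its header, so the header and the data can disagree; passing `sr=DEFAULT_SAMPLE_RATE` to `librosa.load` would keep the two consistent. To sanity-check the `_pad` fix itself, here is a minimal standalone sketch (shapes are illustrative) showing that `torch.nn.functional.pad` with a `(0, missing_samples)` tuple zero-pads the last dimension on the right:

```python
# Minimal sketch of the right-padding used in _pad; shapes are illustrative.
import torch

wav = torch.randn(1, 3)  # (channels, samples), shorter than the target
num_samples = 5
missing_samples = num_samples - wav.shape[1]
pad = (0, missing_samples)  # (left, right) padding for the last dimension
padded = torch.nn.functional.pad(wav, pad)  # constant zero-padding by default

assert padded.shape == (1, num_samples)
assert torch.all(padded[:, wav.shape[1]:] == 0)  # appended samples are zeros
```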