Update app.py
app.py CHANGED
@@ -21,8 +21,7 @@ pipe = pipeline(
     "automatic-speech-recognition",
     model=model,
     tokenizer=processor.tokenizer,
-    feature_extractor=processor.feature_extractor
-    generate_kwargs = {"task":"transcribe", "language":"<|ar|>"}
+    feature_extractor=processor.feature_extractor
 )
 
 
@@ -33,15 +32,17 @@ async def transcribe_audio(request: Request):
     audio_data = await request.body()
     # Convert binary data to a file-like object
     audio_file = io.BytesIO(audio_data)
-    # Load the audio file using pydub
-    audio_array, sampling_rate = librosa.load(audio_file, sr=16000)
-    # Process the audio array
-    input_features = processor(audio_array, sampling_rate=sampling_rate, return_tensors="pt").input_features
-    # Generate token ids
-    predicted_ids = model.generate(input_features)
-    # Decode token ids to text
-    transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
+    # # Load the audio file using pydub
+    # audio_array, sampling_rate = librosa.load(audio_file, sr=16000)
+    # # Process the audio array
+    # input_features = processor(audio_array, sampling_rate=sampling_rate, return_tensors="pt").input_features
+    # # Generate token ids
+    # predicted_ids = model.generate(input_features)
+    # # Decode token ids to text
+    # transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
+    transcription = pipe(audio_file, generate_kwargs = {"task":"transcribe", "language":"<|ar|>"})
     # Print the transcription
+    print(transcription)
     print(transcription[0]) # Display the transcriptiontry:
     return {"transcription": transcription[0]}
 except Exception as e:
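For context, a minimal sketch of what app.py looks like after this change: the task and language are now passed per call through generate_kwargs rather than at pipeline construction time, and the manual librosa/processor/model.generate path is commented out in favour of a single pipe(...) call. Everything outside the diff (the checkpoint name, the FastAPI app object, the route path, and the error handling) is an assumption for illustration, not taken from this commit; note also that the transformers ASR pipeline accepts raw bytes or a NumPy array as input and returns a dict whose "text" key holds the transcription.

from fastapi import FastAPI, Request
from transformers import WhisperForConditionalGeneration, WhisperProcessor, pipeline

# Assumed checkpoint and setup; the commit itself only shows the pipeline arguments.
processor = WhisperProcessor.from_pretrained("openai/whisper-small")
model = WhisperForConditionalGeneration.from_pretrained("openai/whisper-small")

pipe = pipeline(
    "automatic-speech-recognition",
    model=model,
    tokenizer=processor.tokenizer,
    feature_extractor=processor.feature_extractor,
)

app = FastAPI()

@app.post("/transcribe")  # route path is an assumption
async def transcribe_audio(request: Request):
    audio_data = await request.body()  # raw audio bytes from the request body
    try:
        # Task and language are supplied per call, as in this commit.
        result = pipe(audio_data, generate_kwargs={"task": "transcribe", "language": "<|ar|>"})
        return {"transcription": result["text"]}
    except Exception as e:
        return {"error": str(e)}

Passing generate_kwargs at call time keeps the same pipe object reusable for other languages or tasks, which is presumably why it was removed from the pipeline(...) constructor in the first hunk.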