Spaces:

NLPV
/

ReadabilityTest

Sleeping

App Files Files Community

NLPV committed on Apr 27

Commit

f5d520a

verified ·

1 Parent(s): 2cf982a

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -13

app.py CHANGED Viewed

@@ -5,6 +5,7 @@ import difflib
 import tempfile
 import os
 import speech_recognition as sr
 # Function to play the text (optional)
 def play_text(text):
@@ -14,24 +15,26 @@ def play_text(text):
     os.system(f"start {temp_file.name}")  # Windows
     return "✅ Text is being read out. Please listen and read it yourself."
 def transcribe_audio(audio, original_text):
-    recognizer = sr.Recognizer()
     try:
-        with sr.AudioFile(audio) as source:
-            audio_data = recognizer.record(source)
-        # Try chunking if needed
-        transcription = recognizer.recognize_google(audio_data, language="hi-IN")
-        # Clean and split the text better (remove punctuations etc.)
         import re
         original_words = re.findall(r'\w+', original_text.strip())
         transcribed_words = re.findall(r'\w+', transcription.strip())
         matcher = difflib.SequenceMatcher(None, original_words, transcribed_words)
         accuracy = round(matcher.ratio() * 100, 2)
-        speed = round(len(transcribed_words) / (len(audio_data.frame_data) / audio_data.sample_rate), 2)
         result = {
             "📝 Transcribed Text": transcription,
@@ -39,10 +42,6 @@ def transcribe_audio(audio, original_text):
             "⏱️ Speaking Speed (words/sec)": speed
         }
         return result
-    except sr.UnknownValueError:
-        return {"error": "Could not understand audio"}
-    except sr.RequestError as e:
-        return {"error": f"Request error: {e}"}
     except Exception as e:
         return {"error": str(e)}

 import tempfile
 import os
 import speech_recognition as sr
+from faster_whisper import WhisperModel
 # Function to play the text (optional)
 def play_text(text):
     os.system(f"start {temp_file.name}")  # Windows
     return "✅ Text is being read out. Please listen and read it yourself."
+# Load model once (outside function for efficiency)
+model = WhisperModel("small", compute_type="float32")  # Or "medium" for better accuracy
 def transcribe_audio(audio, original_text):
     try:
+        # Run inference
+        segments, info = model.transcribe(audio, language='hi')
+        transcription = " ".join([segment.text for segment in segments])
+        # Clean and split the text better
         import re
         original_words = re.findall(r'\w+', original_text.strip())
         transcribed_words = re.findall(r'\w+', transcription.strip())
         matcher = difflib.SequenceMatcher(None, original_words, transcribed_words)
         accuracy = round(matcher.ratio() * 100, 2)
+        # Speaking speed (approximate)
+        speed = round(len(transcribed_words) / info.duration, 2)
         result = {
             "📝 Transcribed Text": transcription,
             "⏱️ Speaking Speed (words/sec)": speed
         }
         return result
     except Exception as e:
         return {"error": str(e)}