Spaces:

aletrn
/

ai-pronunciation-trainer

Running

App Files Community

alessandro trinca tornidor committed on Feb 25

Commit

2f5403b

1 Parent(s): 9c11a5e

feat: support python 3.10, update test cases

Browse files

Files changed (3) hide show

lambdaSpeechToScore.py +10 -6
tests/events/expected_get_speech_to_score_tuple_ok_de.json +1 -1
tests/events/expected_get_speech_to_score_tuple_ok_en.json +1 -15

lambdaSpeechToScore.py CHANGED Viewed

@@ -1,10 +1,13 @@
 import base64
 import json
-import os
 from pathlib import Path
 import tempfile
 import time
-from typing import Dict, Any, LiteralString
 import audioread
 import numpy as np
@@ -51,7 +54,8 @@ def lambda_handler(event: Dict[str, Any], context: Any) -> Dict[str, Any]:
     output = get_speech_to_score_dict(
         real_text=real_text, file_bytes_or_audiotmpfile=file_bytes_or_audiotmpfile, language=language, use_dtw=use_dtw
     )
-    output["pronunciation_accuracy"] = f"{int(output["pronunciation_accuracy"])}"
     output = json.dumps(output)
     app_logger.debug(f"output: {output} ...")
     return output
@@ -59,7 +63,7 @@ def lambda_handler(event: Dict[str, Any], context: Any) -> Dict[str, Any]:
 def get_speech_to_score_dict(
         real_text: str, file_bytes_or_audiotmpfile: str | bytes | dict, language: str = "en", extension: str = tmp_audio_extension, use_dtw: bool = False
-    ) -> Dict[str | Any, float | LiteralString | str | Any]:
     """
     Process the audio file and return a dictionary with speech-to-score results.
@@ -197,8 +201,8 @@ def get_speech_to_score_tuple(real_text: str, file_bytes_or_audiotmpfile: str |
     del output["random_file_name"]
     real_transcripts = output['real_transcripts']
     is_letter_correct_all_words = output['is_letter_correct_all_words']
-    pronunciation_accuracy = f"{output["pronunciation_accuracy"]:.2f}"
-    output["pronunciation_accuracy"] = pronunciation_accuracy
     ipa_transcript = output['ipa_transcript']
     real_transcripts_ipa = output['real_transcripts_ipa']
     end_time = [float(x) for x in output['end_time'].split(" ")]

 import base64
 import json
 from pathlib import Path
 import tempfile
 import time
+from typing import Dict, Any
+try:
+    from typing import LiteralString
+except ImportError:
+    from typing_extensions import LiteralString
 import audioread
 import numpy as np
     output = get_speech_to_score_dict(
         real_text=real_text, file_bytes_or_audiotmpfile=file_bytes_or_audiotmpfile, language=language, use_dtw=use_dtw
     )
+    pronunciation_accuracy = int(output["pronunciation_accuracy"])
+    output["pronunciation_accuracy"] = f"{pronunciation_accuracy}"
     output = json.dumps(output)
     app_logger.debug(f"output: {output} ...")
     return output
 def get_speech_to_score_dict(
         real_text: str, file_bytes_or_audiotmpfile: str | bytes | dict, language: str = "en", extension: str = tmp_audio_extension, use_dtw: bool = False
+) -> Dict[str | Any, float | LiteralString | str | Any]:
     """
     Process the audio file and return a dictionary with speech-to-score results.
     del output["random_file_name"]
     real_transcripts = output['real_transcripts']
     is_letter_correct_all_words = output['is_letter_correct_all_words']
+    pronunciation_accuracy = output['pronunciation_accuracy']
+    output["pronunciation_accuracy"] = f"{pronunciation_accuracy:.2f}"
     ipa_transcript = output['ipa_transcript']
     real_transcripts_ipa = output['real_transcripts_ipa']
     end_time = [float(x) for x in output['end_time'].split(" ")]

tests/events/expected_get_speech_to_score_tuple_ok_de.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "real_transcripts": "Hallo, wie geht es dir?",
   "is_letter_correct_all_words": "111111 111 1111 11 1111 ",
-  "pronunciation_accuracy": "100.00",
   "ipa_transcript": " halo\u02d0, vi\u02d0 \u0261e\u02d0t \u025b\u02d0s di\u02d0r?",
   "real_transcripts_ipa": "halo\u02d0, vi\u02d0 \u0261e\u02d0t \u025b\u02d0s di\u02d0r?",
   "num_words": 5,

 {
   "real_transcripts": "Hallo, wie geht es dir?",
   "is_letter_correct_all_words": "111111 111 1111 11 1111 ",
+  "pronunciation_accuracy": 100.0,
   "ipa_transcript": " halo\u02d0, vi\u02d0 \u0261e\u02d0t \u025b\u02d0s di\u02d0r?",
   "real_transcripts_ipa": "halo\u02d0, vi\u02d0 \u0261e\u02d0t \u025b\u02d0s di\u02d0r?",
   "num_words": 5,

tests/events/expected_get_speech_to_score_tuple_ok_en.json CHANGED Viewed

@@ -1,25 +1,11 @@
 {
   "real_transcripts": "Hi there, how are you?",
   "is_letter_correct_all_words": "11 111111 111 111 1111 ",
-  "pronunciation_accuracy": "100.00",
   "ipa_transcript": "ha\u026a \u00f0\u025br, ha\u028a \u0259r ju?",
   "real_transcripts_ipa": "ha\u026a \u00f0\u025br, ha\u028a \u0259r ju?",
   "num_words": 5,
   "dumped": {
-    "audio_files": [
-      "test2_en_easy__part0_start0.0_end0.19..wav",
-      "test2_en_easy__part1_start0.09_end0.35..wav",
-      "test2_en_easy__part2_start0.41_end0.63..wav",
-      "test2_en_easy__part3_start0.53_end0.75..wav",
-      "test2_en_easy__part4_start0.65_end0.91..wav"
-    ],
-    "audio_durations": [
-      0.19,
-      0.26,
-      0.22000000000000003,
-      0.21999999999999997,
-      0.26
-    ],
     "real_transcript": " Hi there, how are you?",
     "ipa_transcript": "ha\u026a \u00f0\u025br, ha\u028a \u0259r ju?",
     "pronunciation_accuracy": "100.00",

 {
   "real_transcripts": "Hi there, how are you?",
   "is_letter_correct_all_words": "11 111111 111 111 1111 ",
+  "pronunciation_accuracy": 100.0,
   "ipa_transcript": "ha\u026a \u00f0\u025br, ha\u028a \u0259r ju?",
   "real_transcripts_ipa": "ha\u026a \u00f0\u025br, ha\u028a \u0259r ju?",
   "num_words": 5,
   "dumped": {
     "real_transcript": " Hi there, how are you?",
     "ipa_transcript": "ha\u026a \u00f0\u025br, ha\u028a \u0259r ju?",
     "pronunciation_accuracy": "100.00",