Spaces:

Mihaj
/

Wav2Vec2RhytmAnalyzer

Sleeping

App Files Files Community

Mihaj committed on Apr 19, 2024

Commit

bc54321

verified ·

1 Parent(s): 40e6055

Update app.py

Browse files

Files changed (1) hide show

app.py +38 -2

app.py CHANGED Viewed

@@ -135,6 +135,42 @@ def percent_V(vowels, total_wo_pauses):
   return pV
 def transcribe(audio):
     y, sr = sf.read(audio)
@@ -163,7 +199,7 @@ def transcribe(audio):
     dC = delta_C(cons_clusters)
     pV = percent_V(vowels_duration, duration_without_pauses)
-    transcription = processor.decode(predicted_ids[0]).lower()
     text = {"transcription": transcription}
@@ -178,7 +214,7 @@ iface = gr.Interface(
     inputs=gr.Audio(type="filepath"),
     outputs="text",
     title="Mihaj/Wav2Vec2RhytmAnalyzer",
-    description="Демо анализатор ритма на основе модели Wav2Vec large от bond005. Максимум обрабатываемой длительности записи - 10 секунд.",
 )
 iface.launch()

   return pV
+# point_1 = np.array((0, 0, 0))
+# point_2 = np.array((3, 3, 3))
+def count_eucl(point_1, point_2):
+    """Return the Euclidean distance between two points.
+
+    Args:
+        point_1: Coordinates of the first point (NumPy array or array-like).
+        point_2: Coordinates of the second point; its shape must broadcast
+            against ``point_1``.
+
+    Returns:
+        The square root of the sum of squared coordinate differences.
+    """
+    # np.asarray lets plain tuples/lists be subtracted element-wise as well;
+    # inputs that are already ndarrays are used unchanged.
+    difference = np.asarray(point_1) - np.asarray(point_2)
+    return np.sqrt(np.sum(np.square(difference)))
+# Reference points, stored as (dC, pV) pairs, that classify_rhytm measures
+# the distance to.
+ex_dict = {
+    "eng": np.array((0.0535, 0.401)),
+    "kat": np.array((0.0452, 0.456)),
+    "jap": np.array((0.0356, 0.531)),
+}
+def classify_rhytm(dC, pV):
+    """Describe which reference rhythm class a (dC, pV) measurement is nearest to.
+
+    Args:
+        dC: The delta-C value of the recording (as produced by ``delta_C``).
+        pV: The percent-V value of the recording (as produced by ``percent_V``).
+
+    Returns:
+        A user-facing sentence (in Russian): a dedicated message when the
+        pair falls into one of the two outlier regions, otherwise the message
+        for the ``ex_dict`` entry with the smallest Euclidean distance to
+        ``(dC, pV)``.
+
+    Raises:
+        KeyError: If the nearest ``ex_dict`` key has no message defined here.
+    """
+    # NOTE(review): the second outlier bound is pV < 0.04, while the reference
+    # pV values in ex_dict are 0.4-0.53; possibly 0.4 was meant -- confirm.
+    if (dC > 0.08 and pV > 0.45) or (dC < 0.03 and pV < 0.04):
+        return "Вы не укладываетесь ни в какие рамки и прекрасны в этом!"
+    messages = {
+        "eng": "По типу ритма ваша речь близка к тактосчитающим языкам (английский).",
+        "kat": "По типу ритма ваша речь близка к слогосчитающим языкам (испанский).",
+        "jap": "По типу ритма ваша речь близка к моросчитающим языкам (японский).",
+    }
+    our = np.array((dC, pV))
+    # Dict views cannot be indexed in Python 3 (``d.keys()[0]`` raises
+    # TypeError), so select the closest reference directly; on ties ``min``
+    # keeps the first key in ex_dict order, like a stable sort would.
+    nearest = min(ex_dict, key=lambda name: count_eucl(our, ex_dict[name]))
+    return messages[nearest]
 def transcribe(audio):
     y, sr = sf.read(audio)
     dC = delta_C(cons_clusters)
     pV = percent_V(vowels_duration, duration_without_pauses)
+    transcription = processor.decode(predicted_ids).lower()
     text = {"transcription": transcription}
     inputs=gr.Audio(type="filepath"),
     outputs="text",
     title="Mihaj/Wav2Vec2RhytmAnalyzer",
+    description="Демо анализатор ритма на основе модели Wav2Vec large от bond005.",
 )
 iface.launch()