MMS_1_10

Sleeping

bomolopuu committed on Oct 1, 2024

Commit

78b8142

1 Parent(s): 9cdd87f

tokenizeR

Files changed (1) hide show

asr.py CHANGED Viewed

@@ -131,7 +131,7 @@ def transcribe(model, audio_data=None, lang="eng (English)", user_transcription=
 def fine_tune_model(model, processor, user_transcription, audio_samples, lang_code):
     # Convert the user-provided transcription to a tensor
-    transcription_tensor = processor.tokenize(user_transcription, return_tensors="pt")
     # Create a new dataset with the user-provided transcription and audio samples
     dataset = [(audio_samples, transcription_tensor)]

 def fine_tune_model(model, processor, user_transcription, audio_samples, lang_code):
     # Convert the user-provided transcription to a tensor
+    transcription_tensor = processor.tokenizer(user_transcription, return_tensors="pt")
     # Create a new dataset with the user-provided transcription and audio samples
     dataset = [(audio_samples, transcription_tensor)]