Podcastking2

Running

App Files Files Community

gnosticdev committed 20 days ago

Commit

3b3add5

verified ·

1 Parent(s): 049c2dc

Update conver.py

Browse files

Files changed (1) hide show

conver.py +21 -15

conver.py CHANGED Viewed

@@ -65,7 +65,7 @@ class URLToAudioConverter:
             prompt = self.config.custom_prompt_template.format(text=text) if self.config.custom_prompt_template else (
                 f"{text}\nConvierte el texto en un diálogo de podcast en español entre Anfitrión1 y Anfitrión2. "
                 f"Genera una conversación extensa y natural con al menos 5 intercambios por hablante. "
-                f"Devuelve SOLO un objeto JSON: "
                 f'{{"conversation": [{{"speaker": "Anfitrión1", "text": "..."}}, {{"speaker": "Anfitrión2", "text": "..."}}]}}'
             )
             response = self.llm_client.chat.completions.create(
@@ -74,27 +74,33 @@ class URLToAudioConverter:
                 response_format={"type": "json_object"}
             )
             response_content = response.choices[0].message.content
-            # Clean response to ensure valid JSON
             response_content = response_content.strip()
-            # Extract valid JSON using regex
-            json_match = re.search(r'\{.*?\}\s*$', response_content, re.DOTALL)
-            if not json_match:
                 raise ValueError("No valid JSON object found in response")
-            json_str = json_match.group(0)
-            # Clean problematic characters and fix common JSON issues
             json_str = re.sub(r',\s*([\]}])', r'\1', json_str)  # Remove trailing commas
             json_str = re.sub(r'\s+', ' ', json_str)  # Replace multiple spaces
             json_str = json_str.replace('\\"', '"').replace('"{', '{').replace('}"', '}')
             try:
                 dialogue = json.loads(json_str)
             except json.JSONDecodeError as e:
-                # Attempt to fix JSON by truncating at last valid object
-                last_valid = json_str[:json_str.rfind('}')+1]
-                try:
-                    dialogue = json.loads(last_valid)
-                except json.JSONDecodeError as e2:
-                    raise ValueError(f"JSON parsing failed: {str(e2)}")
-            if not dialogue.get("conversation"):
                 raise ValueError("No valid conversation generated")
             return dialogue
         except Exception as e:
@@ -202,7 +208,7 @@ class URLToAudioConverter:
         voice_2: str,
         custom_music_path: str = None
     ) -> Tuple[str, str]:
-        audio_files, folder_name = await self.text_to_speech(conversation, voice_1, voice_2)
         combined = self.combine_audio_files(audio_files)
         final_audio = self.add_background_music_and_tags(
             combined,

             prompt = self.config.custom_prompt_template.format(text=text) if self.config.custom_prompt_template else (
                 f"{text}\nConvierte el texto en un diálogo de podcast en español entre Anfitrión1 y Anfitrión2. "
                 f"Genera una conversación extensa y natural con al menos 5 intercambios por hablante. "
+                f"Devuelve SOLO un objeto JSON con la estructura: "
                 f'{{"conversation": [{{"speaker": "Anfitrión1", "text": "..."}}, {{"speaker": "Anfitrión2", "text": "..."}}]}}'
             )
             response = self.llm_client.chat.completions.create(
                 response_format={"type": "json_object"}
             )
             response_content = response.choices[0].message.content
+            # Clean response to extract valid JSON
             response_content = response_content.strip()
+            # Find the first valid JSON object
+            start_idx = response_content.find('{')
+            end_idx = response_content.rfind('}') + 1
+            if start_idx == -1 or end_idx == 0:
                 raise ValueError("No valid JSON object found in response")
+            json_str = response_content[start_idx:end_idx]
+            # Clean problematic characters and fix JSON issues
             json_str = re.sub(r',\s*([\]}])', r'\1', json_str)  # Remove trailing commas
             json_str = re.sub(r'\s+', ' ', json_str)  # Replace multiple spaces
             json_str = json_str.replace('\\"', '"').replace('"{', '{').replace('}"', '}')
+            json_str = re.sub(r'(\w+):', r'"\1":', json_str)  # Ensure keys are quoted
             try:
                 dialogue = json.loads(json_str)
             except json.JSONDecodeError as e:
+                # Attempt to fix by truncating to last valid array element
+                last_comma = json_str.rfind(',', 0, json_str.rfind(']'))
+                if last_comma != -1:
+                    json_str = json_str[:last_comma] + json_str[json_str.rfind(']'):]
+                    try:
+                        dialogue = json.loads(json_str)
+                    except json.JSONDecodeError as e2:
+                        raise ValueError(f"JSON parsing failed: {str(e2)}")
+                else:
+                    raise ValueError(f"JSON parsing failed: {str(e)}")
+            if not dialogue.get("conversation") or not isinstance(dialogue["conversation"], list):
                 raise ValueError("No valid conversation generated")
             return dialogue
         except Exception as e:
         voice_2: str,
         custom_music_path: str = None
     ) -> Tuple[str, str]:
+        audio_files, folder_name = await self.text_to_speech(conversation, voice_1, voice_2)
         combined = self.combine_audio_files(audio_files)
         final_audio = self.add_background_music_and_tags(
             combined,