convert_test

Sleeping

Bentham committed on Dec 20, 2024

Commit

b1c0fa5

verified ·

1 Parent(s): 4777466

ajout ppt

Files changed (1) hide show

main.py CHANGED Viewed

@@ -779,14 +779,20 @@ async def convert_file_to_txt(
                 raise HTTPException(status_code=500, detail="Erreur lors du nettoyage du fichier HTML.")
             input_filename = cleaned_input_filename
-        # Conversion en HTML via pandoc si nécessaire
         if ext == '.pdf':
             html_content = pdf_to_html(input_filename)
         elif ext == '.pptx':
             html_content = convert_pptx_to_html(input_filename)
-        elif ext in ['.ppt']:
-            text = convert_ppt_to_text(input_filename)
-            html_content = text_to_html(text)
         elif ext == '.doc':
             text = convert_doc_to_text(input_filename)
             html_content = text_to_html(text)

                 raise HTTPException(status_code=500, detail="Erreur lors du nettoyage du fichier HTML.")
             input_filename = cleaned_input_filename
+        # Conversion en HTML via appropriate methods
         if ext == '.pdf':
             html_content = pdf_to_html(input_filename)
         elif ext == '.pptx':
             html_content = convert_pptx_to_html(input_filename)
+        elif ext == '.ppt':
+            try:
+                text = convert_doc_to_text(input_filename)  # Reuse convert_doc_to_text which uses textract
+                html_content = text_to_html(text)
+            except HTTPException as e:
+                raise e
+            except Exception as e:
+                logging.error(f"Erreur lors de la conversion de .ppt avec textract: {e}")
+                raise HTTPException(status_code=500, detail=f"Erreur lors de la conversion du fichier .ppt: {e}")
         elif ext == '.doc':
             text = convert_doc_to_text(input_filename)
             html_content = text_to_html(text)