Spaces:

amendolajine
/

OPIT

Running

amendolajine committed on Dec 1, 2023

Commit

41dd0e4

1 Parent(s): 674f46b

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -24,17 +24,9 @@ def extract_abstract(pdf_bytes):
 # Function to process text (summarize and convert to speech)
 def process_text(uploaded_file):
-    # Debugging: Check the type and content of the uploaded file
-    file_info = f"File type: {type(uploaded_file)}, File keys: {list(uploaded_file.keys())}"
-    # Check if 'data' key exists
-    if 'data' in uploaded_file:
-        file_info += f", Data type: {type(uploaded_file['data'])}, Data length: {len(uploaded_file['data'])}"
-    else:
-        file_info += ", 'data' key not found"
-    # For debugging, return the file info instead of processing the file
-    return file_info, "temp_output.wav"
 # Function to process text (summarize and convert to speech)
@@ -48,8 +40,6 @@ def process_text(uploaded_file):
-    abstract_text = extract_abstract(pdf_bytes)
     # Generate summary
     inputs = tokenizer([abstract_text], max_length=1024, return_tensors='pt', truncation=True)
     summary_ids = model.generate(inputs['input_ids'], num_beams=4, max_length=40, min_length=10, length_penalty=2.0, early_stopping=True, no_repeat_ngram_size=2)

 # Function to process text (summarize and convert to speech)
 def process_text(uploaded_file):
+    # Extract the file data (byte content) from the uploaded file
+    pdf_bytes = uploaded_file["data"]
+    abstract_text = extract_abstract(pdf_bytes)
 # Function to process text (summarize and convert to speech)
     # Generate summary
     inputs = tokenizer([abstract_text], max_length=1024, return_tensors='pt', truncation=True)
     summary_ids = model.generate(inputs['input_ids'], num_beams=4, max_length=40, min_length=10, length_penalty=2.0, early_stopping=True, no_repeat_ngram_size=2)