Spaces:

histlearn
/

BoletimSed

Sleeping

App Files Files Community

histlearn committed on Oct 28, 2024

Commit

75c163e

verified ·

1 Parent(s): b0f7407

Update app.py

Browse files

Files changed (1) hide show

app.py +70 -1

app.py CHANGED Viewed

@@ -71,6 +71,75 @@ class PDFReport(FPDF):
                  'Este relatório é uma análise automática e deve ser validado junto à secretaria da escola.',
                  0, new_x=XPos.LMARGIN, new_y=YPos.NEXT, align='C')
 # Funções de plotagem
 def plotar_evolucao_bimestres(disciplinas_dados: List[Dict], temp_dir: str,
                              titulo: Optional[str] = None,
@@ -193,7 +262,7 @@ def gerar_relatorio_pdf(df: pd.DataFrame, disciplinas_dados: List[Dict],
              0, new_x=XPos.LMARGIN, new_y=YPos.NEXT, align='L')
     pdf.ln(10)
-# Pontos de atenção
     pdf.set_font('Helvetica', 'B', 12)
     pdf.cell(0, 10, 'Pontos de Atenção:',
              0, new_x=XPos.LMARGIN, new_y=YPos.NEXT, align='L')

                  'Este relatório é uma análise automática e deve ser validado junto à secretaria da escola.',
                  0, new_x=XPos.LMARGIN, new_y=YPos.NEXT, align='C')
+# Função de extração de tabelas do PDF
+def extrair_tabelas_pdf(pdf_path: str) -> pd.DataFrame:
+    """Extrai tabelas do PDF usando stream para o nome e lattice para notas."""
+    try:
+        # Extrair nome do aluno usando stream
+        tables_header = camelot.read_pdf(
+            pdf_path,
+            pages='1',
+            flavor='stream',
+            edge_tol=500
+        )
+        info_aluno = {}
+        # Procurar nome do aluno
+        for table in tables_header:
+            df = table.df
+            for i in range(len(df)):
+                for j in range(len(df.columns)):
+                    texto = str(df.iloc[i,j]).strip()
+                    if 'Nome do Aluno' in texto:
+                        try:
+                            if j + 1 < len(df.columns):
+                                nome = str(df.iloc[i,j+1]).strip()
+                            elif i + 1 < len(df):
+                                nome = str(df.iloc[i+1,j]).strip()
+                            if nome and nome != 'Nome do Aluno:':
+                                info_aluno['nome'] = nome
+                                break
+                        except:
+                            continue
+        # Extrair tabela de notas usando lattice
+        tables_notas = camelot.read_pdf(
+            pdf_path,
+            pages='all',
+            flavor='lattice'
+        )
+        # Encontrar tabela de notas
+        df_notas = None
+        max_rows = 0
+        for table in tables_notas:
+            df_temp = table.df
+            if len(df_temp) > max_rows and 'Disciplina' in str(df_temp.iloc[0,0]):
+                max_rows = len(df_temp)
+                df_notas = df_temp.copy()
+                df_notas = df_notas.rename(columns={
+                    0: 'Disciplina',
+                    1: 'Nota B1', 2: 'Freq B1', 3: '%Freq B1', 4: 'AC B1',
+                    5: 'Nota B2', 6: 'Freq B2', 7: '%Freq B2', 8: 'AC B2',
+                    9: 'Nota B3', 10: 'Freq B3', 11: '%Freq B3', 12: 'AC B3',
+                    13: 'Nota B4', 14: 'Freq B4', 15: '%Freq B4', 16: 'AC B4',
+                    17: 'CF', 18: 'Nota Final', 19: 'Freq Final', 20: 'AC Final'
+                })
+        if df_notas is None:
+            raise ValueError("Tabela de notas não encontrada")
+        # Adicionar informações do aluno ao DataFrame
+        df_notas.attrs['nome'] = info_aluno.get('nome', 'Nome não encontrado')
+        return df_notas
+    except Exception as e:
+        logger.error(f"Erro na extração das tabelas: {str(e)}")
+        raise
 # Funções de plotagem
 def plotar_evolucao_bimestres(disciplinas_dados: List[Dict], temp_dir: str,
                              titulo: Optional[str] = None,
              0, new_x=XPos.LMARGIN, new_y=YPos.NEXT, align='L')
     pdf.ln(10)
+    # Pontos de atenção
     pdf.set_font('Helvetica', 'B', 12)
     pdf.cell(0, 10, 'Pontos de Atenção:',
              0, new_x=XPos.LMARGIN, new_y=YPos.NEXT, align='L')