Spaces:

GABRIELSZK
/

EXAMES

Sleeping

GABRIELSZK committed on Apr 27

Commit

f3bf590

verified ·

1 Parent(s): 150311e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -28,7 +28,6 @@ faixas = {
     "TROPONINA": (0, 0.5)
 }
 def classificar(nome, valor):
     try:
         v = float(valor.replace(">", "").replace("<", "").strip())
@@ -63,7 +62,7 @@ def extrair_texto_pdf(pdf_input):
             texto_nativo.append(page.get_text())
             pix = page.get_pixmap(dpi=300)
             img = Image.open(io.BytesIO(pix.tobytes("png")))
-            ocr_imgs.append(melhor_imagem(img))
     tn = re.sub(r"\s+", " ", "".join(texto_nativo))
     tocr = re.sub(r"\s+", " ", " ".join(pytesseract.image_to_string(im) for im in ocr_imgs))
     return tn, tocr
@@ -127,7 +126,6 @@ ordem = [
     "PROTEINA UR","GLI UR","CETONAS UR","SANGUE UR","LEUC ESTERASE","NITRITO UR","LEUCO EAS","HEMA EAS","BACTERIAS UR"
 ]
 def extrair_exames_formatado(pdf_file):
     if not pdf_file:
         return "Nenhum arquivo enviado.", None
@@ -150,7 +148,7 @@ def extrair_exames_formatado(pdf_file):
     line_main = ' / '.join(main_fields)
     final = '\n'.join([l for l in (line_eas, line_main) if l])
-    # Gera CSV
     df = pd.DataFrame([[k, resultados[k]] for k in resultados], columns=["Exame", "Valor"])
     tmp = tempfile.NamedTemporaryFile(delete=False, suffix=".csv")
     df.to_csv(tmp.name, index=False)
@@ -166,4 +164,4 @@ with gr.Blocks() as demo:
     btn.click(extrair_exames_formatado, inputs=pdf_input, outputs=[out_txt, dl])
 if __name__ == "__main__":
-    demo.launch()

     "TROPONINA": (0, 0.5)
 }
 def classificar(nome, valor):
     try:
         v = float(valor.replace(">", "").replace("<", "").strip())
             texto_nativo.append(page.get_text())
             pix = page.get_pixmap(dpi=300)
             img = Image.open(io.BytesIO(pix.tobytes("png")))
+            ocr_imgs.append(melhorar_imagem(img))
     tn = re.sub(r"\s+", " ", "".join(texto_nativo))
     tocr = re.sub(r"\s+", " ", " ".join(pytesseract.image_to_string(im) for im in ocr_imgs))
     return tn, tocr
     "PROTEINA UR","GLI UR","CETONAS UR","SANGUE UR","LEUC ESTERASE","NITRITO UR","LEUCO EAS","HEMA EAS","BACTERIAS UR"
 ]
 def extrair_exames_formatado(pdf_file):
     if not pdf_file:
         return "Nenhum arquivo enviado.", None
     line_main = ' / '.join(main_fields)
     final = '\n'.join([l for l in (line_eas, line_main) if l])
+# Gera CSV
     df = pd.DataFrame([[k, resultados[k]] for k in resultados], columns=["Exame", "Valor"])
     tmp = tempfile.NamedTemporaryFile(delete=False, suffix=".csv")
     df.to_csv(tmp.name, index=False)
     btn.click(extrair_exames_formatado, inputs=pdf_input, outputs=[out_txt, dl])
 if __name__ == "__main__":
+    demo.launch(share=False)