Spaces:

xiaoyao9184
/

marker

Running

App Files Files Community

xiaoyao9184 committed 16 days ago

Commit

80e784c

verified ·

1 Parent(s): 9d98688

Synced repo using 'sync_with_huggingface' GitHub Action

Browse files

original:
- remote: "https://github.com/xiaoyao9184/docker-marker"
- commit: "386ea4e94940750ee5f6d60aca9f504e4a1c7539"
sync_with_huggingface:
- repository: ""
- ref: ""

Files changed (1) hide show

gradio_app.py +2 -6

gradio_app.py CHANGED Viewed

@@ -128,7 +128,6 @@ with gr.Blocks(title="Marker") as demo:
             show_blocks_ckb = gr.Checkbox(label="Show Blocks", info="Display detected blocks, only when output is JSON", value=False, interactive=False)
             debug_ckb = gr.Checkbox(label="Debug", value=False, info="Show debug information")
             strip_existing_ocr_ckb = gr.Checkbox(label="Strip existing OCR", value=False, info="Strip existing OCR text from the PDF and re-OCR.")
-            format_lines_ckb = gr.Checkbox(label="Format lines", value=False, info="Format lines in the document with OCR model")
             disable_ocr_math_ckb = gr.Checkbox(label="Disable math", value=False, info="Disable math in OCR output - no inline math")
             run_marker_btn = gr.Button("Run Marker", interactive=False)
         with gr.Column():
@@ -197,7 +196,7 @@ with gr.Blocks(title="Marker") as demo:
         )
         # Run Marker
-        def run_marker_img(filename, page_range, force_ocr, output_format, show_blocks, debug, use_llm, strip_existing_ocr, format_lines, disable_ocr_math):
             """
             Run marker on the given PDF file and return processed results in multiple formats.
@@ -215,8 +214,6 @@ with gr.Blocks(title="Marker") as demo:
                     Defaults to False.
                 strip_existing_ocr (bool, optional): If True, strip embedded OCR text and re-run OCR.
                     Defaults to False.
-                format_lines (bool, optional): If True, format lines in the document with OCR model.
-                    Defaults to False.
                 disable_ocr_math (bool, optional): If True, disable math in OCR output - no inline math.
                     Defaults to False.
             Returns:
@@ -240,7 +237,6 @@ with gr.Blocks(title="Marker") as demo:
                 "output_dir": settings.DEBUG_DATA_FOLDER if debug else None,
                 "use_llm": use_llm,
                 "strip_existing_ocr": strip_existing_ocr,
-                "format_lines": format_lines,
                 "disable_ocr_math": disable_ocr_math,
             }
             config_parser = ConfigParser(cli_options)
@@ -362,7 +358,7 @@ with gr.Blocks(title="Marker") as demo:
         run_marker_btn.click(
             fn=run_marker_img,
-            inputs=[in_file, page_range_txt, force_ocr_ckb, output_format_dd, show_blocks_ckb, debug_ckb, use_llm_ckb, strip_existing_ocr_ckb, format_lines_ckb, disable_ocr_math_ckb],
             outputs=[result_md, result_json, result_html, debug_img_pdf, debug_img_layout, in_img]
         )

             show_blocks_ckb = gr.Checkbox(label="Show Blocks", info="Display detected blocks, only when output is JSON", value=False, interactive=False)
             debug_ckb = gr.Checkbox(label="Debug", value=False, info="Show debug information")
             strip_existing_ocr_ckb = gr.Checkbox(label="Strip existing OCR", value=False, info="Strip existing OCR text from the PDF and re-OCR.")
             disable_ocr_math_ckb = gr.Checkbox(label="Disable math", value=False, info="Disable math in OCR output - no inline math")
             run_marker_btn = gr.Button("Run Marker", interactive=False)
         with gr.Column():
         )
         # Run Marker
+        def run_marker_img(filename, page_range, force_ocr, output_format, show_blocks, debug, use_llm, strip_existing_ocr, disable_ocr_math):
             """
             Run marker on the given PDF file and return processed results in multiple formats.
                     Defaults to False.
                 strip_existing_ocr (bool, optional): If True, strip embedded OCR text and re-run OCR.
                     Defaults to False.
                 disable_ocr_math (bool, optional): If True, disable math in OCR output - no inline math.
                     Defaults to False.
             Returns:
                 "output_dir": settings.DEBUG_DATA_FOLDER if debug else None,
                 "use_llm": use_llm,
                 "strip_existing_ocr": strip_existing_ocr,
                 "disable_ocr_math": disable_ocr_math,
             }
             config_parser = ConfigParser(cli_options)
         run_marker_btn.click(
             fn=run_marker_img,
+            inputs=[in_file, page_range_txt, force_ocr_ckb, output_format_dd, show_blocks_ckb, debug_ckb, use_llm_ckb, strip_existing_ocr_ckb, disable_ocr_math_ckb],
             outputs=[result_md, result_json, result_html, debug_img_pdf, debug_img_layout, in_img]
         )