Commit
·
5f63988
1
Parent(s):
febfebc
refactor app.py
Browse files
app.py
CHANGED
@@ -204,7 +204,7 @@ button {
|
|
204 |
font-size: 25px !important;
|
205 |
}
|
206 |
.tight-spacing {
|
207 |
-
margin-bottom: -
|
208 |
}
|
209 |
.tight-spacing-as {
|
210 |
margin-top: 0px !important;
|
@@ -236,16 +236,16 @@ EXAMPLES_TEST = [
|
|
236 |
|
237 |
DESC_DICT = {
|
238 |
"concatenate_pages": "Whether to merge pages",
|
239 |
-
"use_formula_recognition": "Whether to use formula recognition subpipeline. If used, the formula can be converted into Latex code.
|
240 |
"use_chart_recognition": "Use the PP-Chart2Table model to parse and convert the charts in the document into tables.",
|
241 |
"use_doc_orientation_classify": "Whether to use the document image orientation classification module. After use, you can correct distorted images, such as wrinkles, tilts, etc.",
|
242 |
"use_doc_unwarping": "Whether to use the document unwarping module. After use, you can correct distorted images, such as wrinkles, tilts, etc.",
|
243 |
"use_textline_orientation": "Whether to use the text line orientation classification module to support the distinction and correction of text lines of 0 degrees and 180 degrees.",
|
244 |
"use_region_detection": "Whether to use the layout region detection. After using it, it can handle complex layouts such as newspapers and magazines.",
|
245 |
-
"use_seal_recognition": "Whether to seal text recognition subpipeline. After use, the seal text content in the document can be extracted.",
|
246 |
-
"use_table_recognition": "Whether to table recognition subpipeline. If used, the table can be identified as a structured format (such as HTML
|
247 |
"layout_threshold_nb": "The threshold used to filter out low confidence prediction results for the layout region, ranging from 0 to 1. If there are missed regions, this value can be appropriately lowered.",
|
248 |
-
"layout_nms": "Whether
|
249 |
"layout_unclip_ratio_nb": "Use this method to expand each region of the layout. The larger the value, the larger the expanded region.",
|
250 |
"text_det_limit_type": "[Short side] means to ensure that the shortest side of the image is not less than [Image side length limit for text detection], and [Long side] means to ensure that the longest side of the image is not greater than [Image side length limit for text detection].",
|
251 |
"text_det_limit_side_len_nb": "For the side length limit of the text detection input image, for large images with dense text, if you want more accurate recognition, you should choose a larger size. This parameter is used in conjunction with the [Image side length limit type for text detection]. Generally, the maximum [Long side] is suitable for scenes with large images and text, and the minimum [Short side] is suitable for document scenes with small and dense images.",
|
|
|
204 |
font-size: 25px !important;
|
205 |
}
|
206 |
.tight-spacing {
|
207 |
+
margin-bottom: -5px !important;
|
208 |
}
|
209 |
.tight-spacing-as {
|
210 |
margin-top: 0px !important;
|
|
|
236 |
|
237 |
DESC_DICT = {
|
238 |
"concatenate_pages": "Whether to merge pages",
|
239 |
+
"use_formula_recognition": "Whether to use formula recognition subpipeline. If used, the formula can be converted into Latex code. Otherwise, the formula part is the text recognition result.",
|
240 |
"use_chart_recognition": "Use the PP-Chart2Table model to parse and convert the charts in the document into tables.",
|
241 |
"use_doc_orientation_classify": "Whether to use the document image orientation classification module. After use, you can correct distorted images, such as wrinkles, tilts, etc.",
|
242 |
"use_doc_unwarping": "Whether to use the document unwarping module. After use, you can correct distorted images, such as wrinkles, tilts, etc.",
|
243 |
"use_textline_orientation": "Whether to use the text line orientation classification module to support the distinction and correction of text lines of 0 degrees and 180 degrees.",
|
244 |
"use_region_detection": "Whether to use the layout region detection. After using it, it can handle complex layouts such as newspapers and magazines.",
|
245 |
+
"use_seal_recognition": "Whether to use seal text recognition subpipeline. After use, the seal text content in the document can be extracted.",
|
246 |
+
"use_table_recognition": "Whether to use table recognition subpipeline. If used, the table can be identified as a structured format (such as HTML). Otherwise, the table will be regarded as figure.",
|
247 |
"layout_threshold_nb": "The threshold used to filter out low confidence prediction results for the layout region, ranging from 0 to 1. If there are missed regions, this value can be appropriately lowered.",
|
248 |
+
"layout_nms": "Whether to use layout region detection model uses NMS post-processing. After using it, nested boxes or those with large intersections can be removed.",
|
249 |
"layout_unclip_ratio_nb": "Use this method to expand each region of the layout. The larger the value, the larger the expanded region.",
|
250 |
"text_det_limit_type": "[Short side] means to ensure that the shortest side of the image is not less than [Image side length limit for text detection], and [Long side] means to ensure that the longest side of the image is not greater than [Image side length limit for text detection].",
|
251 |
"text_det_limit_side_len_nb": "For the side length limit of the text detection input image, for large images with dense text, if you want more accurate recognition, you should choose a larger size. This parameter is used in conjunction with the [Image side length limit type for text detection]. Generally, the maximum [Long side] is suitable for scenes with large images and text, and the minimum [Short side] is suitable for document scenes with small and dense images.",
|