guoshengjian committed on
Commit
5f63988
·
1 Parent(s): febfebc

refactor app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -5
app.py CHANGED
@@ -204,7 +204,7 @@ button {
204
  font-size: 25px !important;
205
  }
206
  .tight-spacing {
207
- margin-bottom: -20px !important;
208
  }
209
  .tight-spacing-as {
210
  margin-top: 0px !important;
@@ -236,16 +236,16 @@ EXAMPLES_TEST = [
236
 
237
  DESC_DICT = {
238
  "concatenate_pages": "Whether to merge pages",
239
- "use_formula_recognition": "Whether to use formula recognition subpipeline. If used, the formula can be converted into Latex code. If not used, the formula part is the text recognition result.",
240
  "use_chart_recognition": "Use the PP-Chart2Table model to parse and convert the charts in the document into tables.",
241
  "use_doc_orientation_classify": "Whether to use the document image orientation classification module. After use, you can correct distorted images, such as wrinkles, tilts, etc.",
242
  "use_doc_unwarping": "Whether to use the document unwarping module. After use, you can correct distorted images, such as wrinkles, tilts, etc.",
243
  "use_textline_orientation": "Whether to use the text line orientation classification module to support the distinction and correction of text lines of 0 degrees and 180 degrees.",
244
  "use_region_detection": "Whether to use the layout region detection. After using it, it can handle complex layouts such as newspapers and magazines.",
245
- "use_seal_recognition": "Whether to seal text recognition subpipeline. After use, the seal text content in the document can be extracted.",
246
- "use_table_recognition": "Whether to table recognition subpipeline. If used, the table can be identified as a structured format (such as HTML, Markdown, etc.). If not used, the table part will be in the form of an image.",
247
  "layout_threshold_nb": "The threshold used to filter out low confidence prediction results for the layout region, ranging from 0 to 1. If there are missed regions, this value can be appropriately lowered.",
248
- "layout_nms": "Whether the layout region detection model uses NMS post-processing. After using it, nested boxes or those with large intersections can be removed.",
249
  "layout_unclip_ratio_nb": "Use this method to expand each region of ​​the layout. The larger the value, the larger the expanded region.",
250
  "text_det_limit_type": "[Short side] means to ensure that the shortest side of the image is not less than [Image side length limit for text detection], and [Long side] means to ensure that the longest side of the image is not greater than [Image side length limit for text detection].",
251
  "text_det_limit_side_len_nb": "For the side length limit of the text detection input image, for large images with dense text, if you want more accurate recognition, you should choose a larger size. This parameter is used in conjunction with the [Image side length limit type for text detection]. Generally, the maximum [Long side] is suitable for scenes with large images and text, and the minimum [Short side] is suitable for document scenes with small and dense images.",
 
204
  font-size: 25px !important;
205
  }
206
  .tight-spacing {
207
+ margin-bottom: -5px !important;
208
  }
209
  .tight-spacing-as {
210
  margin-top: 0px !important;
 
236
 
237
  DESC_DICT = {
238
  "concatenate_pages": "Whether to merge pages",
239
+ "use_formula_recognition": "Whether to use formula recognition subpipeline. If used, the formula can be converted into Latex code. Otherwise, the formula part is the text recognition result.",
240
  "use_chart_recognition": "Use the PP-Chart2Table model to parse and convert the charts in the document into tables.",
241
  "use_doc_orientation_classify": "Whether to use the document image orientation classification module. After use, you can correct distorted images, such as wrinkles, tilts, etc.",
242
  "use_doc_unwarping": "Whether to use the document unwarping module. After use, you can correct distorted images, such as wrinkles, tilts, etc.",
243
  "use_textline_orientation": "Whether to use the text line orientation classification module to support the distinction and correction of text lines of 0 degrees and 180 degrees.",
244
  "use_region_detection": "Whether to use the layout region detection. After using it, it can handle complex layouts such as newspapers and magazines.",
245
+ "use_seal_recognition": "Whether to use seal text recognition subpipeline. After use, the seal text content in the document can be extracted.",
246
+ "use_table_recognition": "Whether to use table recognition subpipeline. If used, the table can be identified as a structured format (such as HTML). Otherwise, the table will be regarded as figure.",
247
  "layout_threshold_nb": "The threshold used to filter out low confidence prediction results for the layout region, ranging from 0 to 1. If there are missed regions, this value can be appropriately lowered.",
248
+ "layout_nms": "Whether to use layout region detection model uses NMS post-processing. After using it, nested boxes or those with large intersections can be removed.",
249
  "layout_unclip_ratio_nb": "Use this method to expand each region of ​​the layout. The larger the value, the larger the expanded region.",
250
  "text_det_limit_type": "[Short side] means to ensure that the shortest side of the image is not less than [Image side length limit for text detection], and [Long side] means to ensure that the longest side of the image is not greater than [Image side length limit for text detection].",
251
  "text_det_limit_side_len_nb": "For the side length limit of the text detection input image, for large images with dense text, if you want more accurate recognition, you should choose a larger size. This parameter is used in conjunction with the [Image side length limit type for text detection]. Generally, the maximum [Long side] is suitable for scenes with large images and text, and the minimum [Short side] is suitable for document scenes with small and dense images.",