Nymbo commited on
Commit
8206fd5
·
verified ·
1 Parent(s): 0d8532e

adding comments and debug logs

Browse files
Files changed (1) hide show
  1. app.py +36 -18
app.py CHANGED
@@ -9,42 +9,53 @@ from transformers import pipeline
9
 
10
  # Function to render markdown to HTML with extensions
11
  def render_markdown(md_text):
12
- return markdown.markdown(
 
 
13
  md_text,
14
  extensions=[
15
- TableExtension(),
16
- FencedCodeExtension(),
17
- TocExtension(baselevel=2),
18
- AttrListExtension(),
19
- CodeHiliteExtension(linenums=False, css_class="highlight"),
20
  ],
21
  )
 
 
22
 
23
  # Load the JinaAI ReaderLM-v2 model
24
  model_name = "jinaai/ReaderLM-v2"
25
- html_converter = pipeline("text-generation", model=model_name)
 
26
 
27
  # Function to convert HTML to Markdown or JSON
28
  def convert_html(html_input, output_format):
29
- # Prepare the prompt for the model
 
30
  prompt = f"Convert the following HTML into {output_format}:\n\n{html_input}"
 
31
 
32
- # Generate the output using the model
33
- response = html_converter(prompt, max_length=999999, num_return_sequences=1)
34
- converted_output = response[0]['generated_text']
 
35
 
36
- # Extract the relevant part of the output (remove the prompt)
37
  converted_output = converted_output.replace(prompt, "").strip()
 
38
  return converted_output
39
 
40
  # Creating the Gradio Interface
41
  with gr.Blocks(theme="Nymbo/Nymbo_Theme") as demo:
42
 
 
43
  with gr.Tab("Live Preview"):
44
- gr.Markdown("# Markdown Suite")
45
 
46
  with gr.Row():
47
  with gr.Column():
 
48
  md_input = gr.Textbox(
49
  lines=20,
50
  placeholder="Write your markdown here...",
@@ -52,37 +63,44 @@ with gr.Blocks(theme="Nymbo/Nymbo_Theme") as demo:
52
  elem_classes=["gr-textbox"]
53
  )
54
  with gr.Column():
 
55
  md_output = gr.HTML(label="Rendered Output", elem_classes=["gr-html"])
56
 
 
57
  md_input.change(render_markdown, inputs=md_input, outputs=md_output)
58
 
 
59
  with gr.Tab("HTML to Markdown/JSON"):
60
- gr.Markdown("# HTML to Markdown/JSON Converter")
61
 
62
  with gr.Row():
 
63
  html_input = gr.Textbox(
64
  lines=10,
65
  placeholder="Paste your raw HTML here...",
66
  label="Raw HTML Input"
67
  )
68
 
 
69
  output_format = gr.Radio([
70
  "Markdown",
71
  "JSON"
72
  ], label="Output Format", value="Markdown")
73
 
 
74
  converted_output = gr.Textbox(
75
  lines=10,
76
  label="Converted Output"
77
  )
78
 
79
- # Define interaction
80
  convert_button = gr.Button("Convert")
81
  convert_button.click(
82
- convert_html,
83
- inputs=[html_input, output_format],
84
- outputs=converted_output
85
  )
86
 
87
  # Launch the app
 
88
  demo.launch()
 
9
 
10
  # Function to render markdown to HTML with extensions
11
  def render_markdown(md_text):
12
+ print("[DEBUG] render_markdown called with input:", md_text) # Debug log for input
13
+ # Convert the input markdown text to HTML using various extensions for additional functionality
14
+ rendered_html = markdown.markdown(
15
  md_text,
16
  extensions=[
17
+ TableExtension(), # Enables rendering of tables in markdown
18
+ FencedCodeExtension(), # Supports fenced code blocks
19
+ TocExtension(baselevel=2), # Generates a table of contents starting at level 2
20
+ AttrListExtension(), # Allows adding attributes to markdown elements
21
+ CodeHiliteExtension(linenums=False, css_class="highlight"), # Syntax highlighting for code blocks
22
  ],
23
  )
24
+ print("[DEBUG] Rendered HTML output:", rendered_html) # Debug log for output
25
+ return rendered_html
26
 
27
  # Load the JinaAI ReaderLM-v2 model
28
  model_name = "jinaai/ReaderLM-v2"
29
+ print("[DEBUG] Loading model:", model_name) # Debug log for model loading
30
+ html_converter = pipeline("text-generation", model=model_name) # Initialize the text-generation pipeline with the specified model
31
 
32
  # Function to convert HTML to Markdown or JSON
33
  def convert_html(html_input, output_format):
34
+ print("[DEBUG] convert_html called with inputs:", html_input, output_format) # Debug log for inputs
35
+ # Prepare the prompt for the model, specifying the desired output format (Markdown or JSON)
36
  prompt = f"Convert the following HTML into {output_format}:\n\n{html_input}"
37
+ print("[DEBUG] Generated prompt:", prompt) # Debug log for the prompt
38
 
39
+ # Use the model to generate the conversion output
40
+ response = html_converter(prompt, max_length=500, num_return_sequences=1)
41
+ print("[DEBUG] Model response:", response) # Debug log for model response
42
+ converted_output = response[0]['generated_text'] # Extract the generated text from the model response
43
 
44
+ # Remove the prompt text from the generated output and clean up the result
45
  converted_output = converted_output.replace(prompt, "").strip()
46
+ print("[DEBUG] Converted output:", converted_output) # Debug log for the final output
47
  return converted_output
48
 
49
  # Creating the Gradio Interface
50
  with gr.Blocks(theme="Nymbo/Nymbo_Theme") as demo:
51
 
52
+ # Tab for the Markdown live preview feature
53
  with gr.Tab("Live Preview"):
54
+ gr.Markdown("# Markdown Suite") # Header for the tab
55
 
56
  with gr.Row():
57
  with gr.Column():
58
+ # Input textbox for entering Markdown text
59
  md_input = gr.Textbox(
60
  lines=20,
61
  placeholder="Write your markdown here...",
 
63
  elem_classes=["gr-textbox"]
64
  )
65
  with gr.Column():
66
+ # Output area to display the rendered HTML from the Markdown input
67
  md_output = gr.HTML(label="Rendered Output", elem_classes=["gr-html"])
68
 
69
+ # Define the interaction: Update the HTML preview whenever the Markdown input changes
70
  md_input.change(render_markdown, inputs=md_input, outputs=md_output)
71
 
72
+ # Tab for HTML to Markdown/JSON conversion feature
73
  with gr.Tab("HTML to Markdown/JSON"):
74
+ gr.Markdown("# HTML to Markdown/JSON Converter") # Header for the tab
75
 
76
  with gr.Row():
77
+ # Input textbox for raw HTML input
78
  html_input = gr.Textbox(
79
  lines=10,
80
  placeholder="Paste your raw HTML here...",
81
  label="Raw HTML Input"
82
  )
83
 
84
+ # Radio buttons to select the output format (Markdown or JSON)
85
  output_format = gr.Radio([
86
  "Markdown",
87
  "JSON"
88
  ], label="Output Format", value="Markdown")
89
 
90
+ # Output textbox to display the converted Markdown or JSON
91
  converted_output = gr.Textbox(
92
  lines=10,
93
  label="Converted Output"
94
  )
95
 
96
+ # Define the interaction: Convert HTML when the "Convert" button is clicked
97
  convert_button = gr.Button("Convert")
98
  convert_button.click(
99
+ convert_html, # Function to handle conversion
100
+ inputs=[html_input, output_format], # Inputs: Raw HTML and desired output format
101
+ outputs=converted_output # Output: Converted text
102
  )
103
 
104
  # Launch the app
105
+ print("[DEBUG] Launching the app") # Debug log for app launch
106
  demo.launch()