Spaces:
Paused
Paused
adding comments and debug logs
Browse files
app.py
CHANGED
@@ -9,42 +9,53 @@ from transformers import pipeline
|
|
9 |
|
10 |
# Function to render markdown to HTML with extensions
|
11 |
def render_markdown(md_text):
|
12 |
-
|
|
|
|
|
13 |
md_text,
|
14 |
extensions=[
|
15 |
-
TableExtension(),
|
16 |
-
FencedCodeExtension(),
|
17 |
-
TocExtension(baselevel=2),
|
18 |
-
AttrListExtension(),
|
19 |
-
CodeHiliteExtension(linenums=False, css_class="highlight"),
|
20 |
],
|
21 |
)
|
|
|
|
|
22 |
|
23 |
# Load the JinaAI ReaderLM-v2 model
|
24 |
model_name = "jinaai/ReaderLM-v2"
|
25 |
-
|
|
|
26 |
|
27 |
# Function to convert HTML to Markdown or JSON
|
28 |
def convert_html(html_input, output_format):
|
29 |
-
#
|
|
|
30 |
prompt = f"Convert the following HTML into {output_format}:\n\n{html_input}"
|
|
|
31 |
|
32 |
-
#
|
33 |
-
response = html_converter(prompt, max_length=
|
34 |
-
|
|
|
35 |
|
36 |
-
#
|
37 |
converted_output = converted_output.replace(prompt, "").strip()
|
|
|
38 |
return converted_output
|
39 |
|
40 |
# Creating the Gradio Interface
|
41 |
with gr.Blocks(theme="Nymbo/Nymbo_Theme") as demo:
|
42 |
|
|
|
43 |
with gr.Tab("Live Preview"):
|
44 |
-
gr.Markdown("# Markdown Suite")
|
45 |
|
46 |
with gr.Row():
|
47 |
with gr.Column():
|
|
|
48 |
md_input = gr.Textbox(
|
49 |
lines=20,
|
50 |
placeholder="Write your markdown here...",
|
@@ -52,37 +63,44 @@ with gr.Blocks(theme="Nymbo/Nymbo_Theme") as demo:
|
|
52 |
elem_classes=["gr-textbox"]
|
53 |
)
|
54 |
with gr.Column():
|
|
|
55 |
md_output = gr.HTML(label="Rendered Output", elem_classes=["gr-html"])
|
56 |
|
|
|
57 |
md_input.change(render_markdown, inputs=md_input, outputs=md_output)
|
58 |
|
|
|
59 |
with gr.Tab("HTML to Markdown/JSON"):
|
60 |
-
gr.Markdown("# HTML to Markdown/JSON Converter")
|
61 |
|
62 |
with gr.Row():
|
|
|
63 |
html_input = gr.Textbox(
|
64 |
lines=10,
|
65 |
placeholder="Paste your raw HTML here...",
|
66 |
label="Raw HTML Input"
|
67 |
)
|
68 |
|
|
|
69 |
output_format = gr.Radio([
|
70 |
"Markdown",
|
71 |
"JSON"
|
72 |
], label="Output Format", value="Markdown")
|
73 |
|
|
|
74 |
converted_output = gr.Textbox(
|
75 |
lines=10,
|
76 |
label="Converted Output"
|
77 |
)
|
78 |
|
79 |
-
# Define interaction
|
80 |
convert_button = gr.Button("Convert")
|
81 |
convert_button.click(
|
82 |
-
convert_html,
|
83 |
-
inputs=[html_input, output_format],
|
84 |
-
outputs=converted_output
|
85 |
)
|
86 |
|
87 |
# Launch the app
|
|
|
88 |
demo.launch()
|
|
|
9 |
|
10 |
# Function to render markdown to HTML with extensions
|
11 |
def render_markdown(md_text):
|
12 |
+
print("[DEBUG] render_markdown called with input:", md_text) # Debug log for input
|
13 |
+
# Convert the input markdown text to HTML using various extensions for additional functionality
|
14 |
+
rendered_html = markdown.markdown(
|
15 |
md_text,
|
16 |
extensions=[
|
17 |
+
TableExtension(), # Enables rendering of tables in markdown
|
18 |
+
FencedCodeExtension(), # Supports fenced code blocks
|
19 |
+
TocExtension(baselevel=2), # Generates a table of contents starting at level 2
|
20 |
+
AttrListExtension(), # Allows adding attributes to markdown elements
|
21 |
+
CodeHiliteExtension(linenums=False, css_class="highlight"), # Syntax highlighting for code blocks
|
22 |
],
|
23 |
)
|
24 |
+
print("[DEBUG] Rendered HTML output:", rendered_html) # Debug log for output
|
25 |
+
return rendered_html
|
26 |
|
27 |
# Load the JinaAI ReaderLM-v2 model
|
28 |
model_name = "jinaai/ReaderLM-v2"
|
29 |
+
print("[DEBUG] Loading model:", model_name) # Debug log for model loading
|
30 |
+
html_converter = pipeline("text-generation", model=model_name) # Initialize the text-generation pipeline with the specified model
|
31 |
|
32 |
# Function to convert HTML to Markdown or JSON
|
33 |
def convert_html(html_input, output_format):
|
34 |
+
print("[DEBUG] convert_html called with inputs:", html_input, output_format) # Debug log for inputs
|
35 |
+
# Prepare the prompt for the model, specifying the desired output format (Markdown or JSON)
|
36 |
prompt = f"Convert the following HTML into {output_format}:\n\n{html_input}"
|
37 |
+
print("[DEBUG] Generated prompt:", prompt) # Debug log for the prompt
|
38 |
|
39 |
+
# Use the model to generate the conversion output
|
40 |
+
response = html_converter(prompt, max_length=500, num_return_sequences=1)
|
41 |
+
print("[DEBUG] Model response:", response) # Debug log for model response
|
42 |
+
converted_output = response[0]['generated_text'] # Extract the generated text from the model response
|
43 |
|
44 |
+
# Remove the prompt text from the generated output and clean up the result
|
45 |
converted_output = converted_output.replace(prompt, "").strip()
|
46 |
+
print("[DEBUG] Converted output:", converted_output) # Debug log for the final output
|
47 |
return converted_output
|
48 |
|
49 |
# Creating the Gradio Interface
|
50 |
with gr.Blocks(theme="Nymbo/Nymbo_Theme") as demo:
|
51 |
|
52 |
+
# Tab for the Markdown live preview feature
|
53 |
with gr.Tab("Live Preview"):
|
54 |
+
gr.Markdown("# Markdown Suite") # Header for the tab
|
55 |
|
56 |
with gr.Row():
|
57 |
with gr.Column():
|
58 |
+
# Input textbox for entering Markdown text
|
59 |
md_input = gr.Textbox(
|
60 |
lines=20,
|
61 |
placeholder="Write your markdown here...",
|
|
|
63 |
elem_classes=["gr-textbox"]
|
64 |
)
|
65 |
with gr.Column():
|
66 |
+
# Output area to display the rendered HTML from the Markdown input
|
67 |
md_output = gr.HTML(label="Rendered Output", elem_classes=["gr-html"])
|
68 |
|
69 |
+
# Define the interaction: Update the HTML preview whenever the Markdown input changes
|
70 |
md_input.change(render_markdown, inputs=md_input, outputs=md_output)
|
71 |
|
72 |
+
# Tab for HTML to Markdown/JSON conversion feature
|
73 |
with gr.Tab("HTML to Markdown/JSON"):
|
74 |
+
gr.Markdown("# HTML to Markdown/JSON Converter") # Header for the tab
|
75 |
|
76 |
with gr.Row():
|
77 |
+
# Input textbox for raw HTML input
|
78 |
html_input = gr.Textbox(
|
79 |
lines=10,
|
80 |
placeholder="Paste your raw HTML here...",
|
81 |
label="Raw HTML Input"
|
82 |
)
|
83 |
|
84 |
+
# Radio buttons to select the output format (Markdown or JSON)
|
85 |
output_format = gr.Radio([
|
86 |
"Markdown",
|
87 |
"JSON"
|
88 |
], label="Output Format", value="Markdown")
|
89 |
|
90 |
+
# Output textbox to display the converted Markdown or JSON
|
91 |
converted_output = gr.Textbox(
|
92 |
lines=10,
|
93 |
label="Converted Output"
|
94 |
)
|
95 |
|
96 |
+
# Define the interaction: Convert HTML when the "Convert" button is clicked
|
97 |
convert_button = gr.Button("Convert")
|
98 |
convert_button.click(
|
99 |
+
convert_html, # Function to handle conversion
|
100 |
+
inputs=[html_input, output_format], # Inputs: Raw HTML and desired output format
|
101 |
+
outputs=converted_output # Output: Converted text
|
102 |
)
|
103 |
|
104 |
# Launch the app
|
105 |
+
print("[DEBUG] Launching the app") # Debug log for app launch
|
106 |
demo.launch()
|