Spaces:

KushwanthK
/

vedic_scriptures

Running

App Files Community

KushwanthK committed on May 19, 2024

Commit

a5d883c

verified ·

1 Parent(s): 510f31f

Upload app.py

Browse files

Files changed (1) hide show

app.py +167 -167

app.py CHANGED Viewed

@@ -525,52 +525,52 @@ display_highlighted_pdf()
 #     print(f"An error occurred: {e}")
-import streamlit as st
-import requests
-from bs4 import BeautifulSoup
-def fetch_html(url):
-    # Fetch the webpage content
-    response = requests.get(url)
-    if response.status_code == 200:
-        return response.content
-    else:
-        st.error(f"Failed to fetch webpage. Status code: {response.status_code}")
-def scrape_data(html_content):
-    # Parse HTML content
-    soup = BeautifulSoup(html_content, "html.parser")
-    # Scrape data (replace this with your specific scraping logic)
-    data = soup.find_all(class_="container first-container")
-    return data
-def main(url):
-    st.title("Webpage Scraper")
-    # User input for webpage URL
-    url = st.text_input("Enter the URL of the webpage:", value=url)
-    # Convert webpage to HTML and scrape data
-    if st.button("Scrape Data"):
-        if url:
-            html_content = fetch_html(url)
-            str_content = """ """
-            if html_content:
-                data = scrape_data(html_content)
-                # st.title("HTML Page Display")
-                # st.components.v1.html(html_content, height=1600, width=800)
-                # Display scraped data in a new tab
-                with st.expander("Scraped Data", expanded=True):
-                    for item in data:
-                        # Convert item to string and display
-                        str_content += str(item)
-                        # st.write(str(item))
-                        # st.title("HTML Page Display")
-                        # st.components.v1.html(data, height=1600, width=800)
-                    # st.title("HTML Page Display")
-                    st.components.v1.html(str_content, height=1600, width=680)
 # main()
@@ -602,180 +602,180 @@ def main(url):
-import requests
-from bs4 import BeautifulSoup
-# URL of the webpage
-baseurl = "https://vedabase.io/en/library/bg/"
-# Fetch the webpage content
-response = requests.get(baseurl)
-if response.status_code == 200:
-    html_content = response.content
-    # Parse HTML content
-    soup = BeautifulSoup(html_content, "html.parser")
-    # Find all direct child div elements with class="r-chapter"
-    direct_child_div_elements = soup.select("div.col-12 > div.r-chapter")
-    # List to store the extracted text
-    output = []
-    # Iterate over each direct child div element
-    for div in direct_child_div_elements:
-        # Find the <a> tag within the div
-        a_tag = div.find("a")
-        if a_tag:
-            # Extract the text from the <a> tag and append it to the output list
-            output.append(a_tag.text.strip())
-    # Print the output list
-    # print(output)
-    # print(len(output))
-### Link to all chapters
-import re
-# Sample text
-chapter = output[4]
-text_to_number = {
-    "One": "1",
-    "Two": "2",
-    "Three": "3",
-    "Four": "4",
-    "Five": "5",
-    "Six": "6",
-    "Seven": "7",
-    "Eight": "8",
-    "Nine": "9",
-    "Ten": "10",
-    # Add more numbers if needed
-}
-# Split the text by spaces
-words = chapter.split()
-# Find the text representing the number
-number_text = words[1].strip(":")  # Assuming the number text is the second word
-# Extract the numeric part
-chapter_number = text_to_number[number_text]
-# Print the chapter number
-# print(chapter_number)
-url = baseurl + chapter_number
-# print(url)
-### all Texts in each chapter
-response = requests.get(url)
-if response.status_code == 200:
-    html_content = response.content
-    # Parse HTML content
-    text = BeautifulSoup(html_content, "html.parser")
-    # print(text)
-    # Find all direct child div elements with class="r-chapter"
-    direct_child_div_elements = text.select("div.col-12 > dl.r.r-verse")
-    # print(direct_child_div_elements)
-    # List to store the extracted text
-    text_number = []
-    # Iterate over each direct child div element
-    for div in direct_child_div_elements:
-        # Find the <a> tag within the div
-        a_tag = div.find("a")
-        if a_tag:
-            # Extract the text from the <a> tag and append it to the output list
-            text_number.append(a_tag.text.strip())
-    # Print the output list
-    # print(text_number)
-    # print(len(text_number))
-### link to each Text in each chapter
-text_page = text_number[0]
-# Split the text by spaces
-words = text_page.split()
-# Find the text representing the number
-text_number = words[1].strip(":")  # Assuming the number text is the second word
-# print(f"chapter_number - {chapter_number} : text_number - {text_number}")
-texturl = baseurl + chapter_number + "/" + text_number
-# print(texturl)
-main(url=texturl)
-st.title("Display HTML File in Streamlit")
-# Path to the HTML file
-html_file_path = "../Transformers/Bg. 1.1.html"
-try:
-    # Read the HTML file
-    with open(html_file_path, "r", encoding="utf-8") as file:
-        html_content = file.read()
-    # Display the HTML content using the 'st.components.v1.html' component
-    expanded = st.checkbox("Expand HTML page")
-    if expanded:
-        st.components.v1.html(html_content, height=1600, width=680)
-    else:
-        st.components.v1.html(html_content, height=600)
-except FileNotFoundError:
-    st.error(f"HTML file '{html_file_path}' not found!")
-import streamlit as st
-st.title("Streamlit Tabs Example")
-# Add tabs to the sidebar
-tabs = st.sidebar.radio("Navigation", ["Home", "About", "Settings"])
-# Display different content based on the selected tab
-if tabs == "Home":
-    st.header("Home Page")
-    st.write("Welcome to the Home page!")
-elif tabs == "About":
-    st.header("About Page")
-    st.write("This is the About page.")
-elif tabs == "Settings":
-    st.header("Settings Page")
-    st.write("Here you can configure your settings.")
-st.title("Netflix-like Grid Display")
-import streamlit as st
-import os
-import streamlit.components.v1 as components
-# Define movie data
-movies = [
-    {"title": "Movie 1", "poster_path": "../Transformers/Bg. 1.1.html"},
-    {"title": "Movie 2", "poster_url": "https://via.placeholder.com/150"},
-    {"title": "Movie 3", "poster_url": "https://via.placeholder.com/150"},
-    {"title": "Movie 4", "poster_url": "https://via.placeholder.com/150"},
-    {"title": "Movie 5", "poster_url": "https://via.placeholder.com/150"},
-    {"title": "Movie 6", "poster_url": "https://via.placeholder.com/150"},
-    {"title": "Movie 7", "poster_url": "https://via.placeholder.com/150"},
-    {"title": "Movie 8", "poster_url": "https://via.placeholder.com/150"},
-]
 # Display movies in a grid
 # num_columns = 4

 #     print(f"An error occurred: {e}")
+# import streamlit as st
+# import requests
+# from bs4 import BeautifulSoup
+# def fetch_html(url):
+#     # Fetch the webpage content
+#     response = requests.get(url)
+#     if response.status_code == 200:
+#         return response.content
+#     else:
+#         st.error(f"Failed to fetch webpage. Status code: {response.status_code}")
+# def scrape_data(html_content):
+#     # Parse HTML content
+#     soup = BeautifulSoup(html_content, "html.parser")
+#     # Scrape data (replace this with your specific scraping logic)
+#     data = soup.find_all(class_="container first-container")
+#     return data
+# def main(url):
+#     st.title("Webpage Scraper")
+#     # User input for webpage URL
+#     url = st.text_input("Enter the URL of the webpage:", value=url)
+#     # Convert webpage to HTML and scrape data
+#     if st.button("Scrape Data"):
+#         if url:
+#             html_content = fetch_html(url)
+#             str_content = """ """
+#             if html_content:
+#                 data = scrape_data(html_content)
+#                 # st.title("HTML Page Display")
+#                 # st.components.v1.html(html_content, height=1600, width=800)
+#                 # Display scraped data in a new tab
+#                 with st.expander("Scraped Data", expanded=True):
+#                     for item in data:
+#                         # Convert item to string and display
+#                         str_content += str(item)
+#                         # st.write(str(item))
+#                         # st.title("HTML Page Display")
+#                         # st.components.v1.html(data, height=1600, width=800)
+#                     # st.title("HTML Page Display")
+#                     st.components.v1.html(str_content, height=1600, width=680)
 # main()
+# import requests
+# from bs4 import BeautifulSoup
+# # URL of the webpage
+# baseurl = "https://vedabase.io/en/library/bg/"
+# # Fetch the webpage content
+# response = requests.get(baseurl)
+# if response.status_code == 200:
+#     html_content = response.content
+#     # Parse HTML content
+#     soup = BeautifulSoup(html_content, "html.parser")
+#     # Find all direct child div elements with class="r-chapter"
+#     direct_child_div_elements = soup.select("div.col-12 > div.r-chapter")
+#     # List to store the extracted text
+#     output = []
+#     # Iterate over each direct child div element
+#     for div in direct_child_div_elements:
+#         # Find the <a> tag within the div
+#         a_tag = div.find("a")
+#         if a_tag:
+#             # Extract the text from the <a> tag and append it to the output list
+#             output.append(a_tag.text.strip())
+#     # Print the output list
+#     # print(output)
+#     # print(len(output))
+# ### Link to all chapters
+# import re
+# # Sample text
+# chapter = output[4]
+# text_to_number = {
+#     "One": "1",
+#     "Two": "2",
+#     "Three": "3",
+#     "Four": "4",
+#     "Five": "5",
+#     "Six": "6",
+#     "Seven": "7",
+#     "Eight": "8",
+#     "Nine": "9",
+#     "Ten": "10",
+#     # Add more numbers if needed
+# }
+# # Split the text by spaces
+# words = chapter.split()
+# # Find the text representing the number
+# number_text = words[1].strip(":")  # Assuming the number text is the second word
+# # Extract the numeric part
+# chapter_number = text_to_number[number_text]
+# # Print the chapter number
+# # print(chapter_number)
+# url = baseurl + chapter_number
+# # print(url)
+# ### all Texts in each chapter
+# response = requests.get(url)
+# if response.status_code == 200:
+#     html_content = response.content
+#     # Parse HTML content
+#     text = BeautifulSoup(html_content, "html.parser")
+#     # print(text)
+#     # Find all direct child div elements with class="r-chapter"
+#     direct_child_div_elements = text.select("div.col-12 > dl.r.r-verse")
+#     # print(direct_child_div_elements)
+#     # List to store the extracted text
+#     text_number = []
+#     # Iterate over each direct child div element
+#     for div in direct_child_div_elements:
+#         # Find the <a> tag within the div
+#         a_tag = div.find("a")
+#         if a_tag:
+#             # Extract the text from the <a> tag and append it to the output list
+#             text_number.append(a_tag.text.strip())
+#     # Print the output list
+#     # print(text_number)
+#     # print(len(text_number))
+# ### link to each Text in each chapter
+# text_page = text_number[0]
+# # Split the text by spaces
+# words = text_page.split()
+# # Find the text representing the number
+# text_number = words[1].strip(":")  # Assuming the number text is the second word
+# # print(f"chapter_number - {chapter_number} : text_number - {text_number}")
+# texturl = baseurl + chapter_number + "/" + text_number
+# # print(texturl)
+# main(url=texturl)
+# st.title("Display HTML File in Streamlit")
+# # Path to the HTML file
+# html_file_path = "../Transformers/Bg. 1.1.html"
+# try:
+#     # Read the HTML file
+#     with open(html_file_path, "r", encoding="utf-8") as file:
+#         html_content = file.read()
+#     # Display the HTML content using the 'st.components.v1.html' component
+#     expanded = st.checkbox("Expand HTML page")
+#     if expanded:
+#         st.components.v1.html(html_content, height=1600, width=680)
+#     else:
+#         st.components.v1.html(html_content, height=600)
+# except FileNotFoundError:
+#     st.error(f"HTML file '{html_file_path}' not found!")
+# import streamlit as st
+# st.title("Streamlit Tabs Example")
+# # Add tabs to the sidebar
+# tabs = st.sidebar.radio("Navigation", ["Home", "About", "Settings"])
+# # Display different content based on the selected tab
+# if tabs == "Home":
+#     st.header("Home Page")
+#     st.write("Welcome to the Home page!")
+# elif tabs == "About":
+#     st.header("About Page")
+#     st.write("This is the About page.")
+# elif tabs == "Settings":
+#     st.header("Settings Page")
+#     st.write("Here you can configure your settings.")
+# st.title("Netflix-like Grid Display")
+# import streamlit as st
+# import os
+# import streamlit.components.v1 as components
+# # Define movie data
+# movies = [
+#     {"title": "Movie 1", "poster_path": "../Transformers/Bg. 1.1.html"},
+#     {"title": "Movie 2", "poster_url": "https://via.placeholder.com/150"},
+#     {"title": "Movie 3", "poster_url": "https://via.placeholder.com/150"},
+#     {"title": "Movie 4", "poster_url": "https://via.placeholder.com/150"},
+#     {"title": "Movie 5", "poster_url": "https://via.placeholder.com/150"},
+#     {"title": "Movie 6", "poster_url": "https://via.placeholder.com/150"},
+#     {"title": "Movie 7", "poster_url": "https://via.placeholder.com/150"},
+#     {"title": "Movie 8", "poster_url": "https://via.placeholder.com/150"},
+# ]
 # Display movies in a grid
 # num_columns = 4