Spaces:
Sleeping
Sleeping
Upload app.py
Browse files
app.py
CHANGED
@@ -525,52 +525,52 @@ display_highlighted_pdf()
|
|
525 |
# print(f"An error occurred: {e}")
|
526 |
|
527 |
|
528 |
-
import streamlit as st
|
529 |
-
import requests
|
530 |
-
from bs4 import BeautifulSoup
|
531 |
|
532 |
-
def fetch_html(url):
|
533 |
-
|
534 |
-
|
535 |
-
|
536 |
-
|
537 |
-
|
538 |
-
|
539 |
|
540 |
-
def scrape_data(html_content):
|
541 |
-
|
542 |
-
|
543 |
|
544 |
-
|
545 |
-
|
546 |
|
547 |
-
|
548 |
|
549 |
-
def main(url):
|
550 |
-
|
551 |
|
552 |
-
|
553 |
-
|
554 |
|
555 |
-
|
556 |
-
|
557 |
-
|
558 |
-
|
559 |
-
|
560 |
-
|
561 |
-
|
562 |
-
|
563 |
-
|
564 |
-
|
565 |
-
|
566 |
-
|
567 |
-
|
568 |
-
|
569 |
-
|
570 |
-
|
571 |
-
|
572 |
-
|
573 |
-
|
574 |
# main()
|
575 |
|
576 |
|
@@ -602,180 +602,180 @@ def main(url):
|
|
602 |
|
603 |
|
604 |
|
605 |
-
import requests
|
606 |
-
from bs4 import BeautifulSoup
|
607 |
|
608 |
-
# URL of the webpage
|
609 |
-
baseurl = "https://vedabase.io/en/library/bg/"
|
610 |
|
611 |
-
# Fetch the webpage content
|
612 |
-
response = requests.get(baseurl)
|
613 |
-
if response.status_code == 200:
|
614 |
-
|
615 |
|
616 |
-
|
617 |
-
|
618 |
|
619 |
-
|
620 |
-
|
621 |
|
622 |
-
|
623 |
-
|
624 |
|
625 |
-
|
626 |
-
|
627 |
-
|
628 |
-
|
629 |
-
|
630 |
-
|
631 |
-
|
632 |
|
633 |
-
|
634 |
-
|
635 |
-
|
636 |
|
637 |
-
### Link to all chapters
|
638 |
-
import re
|
639 |
|
640 |
-
# Sample text
|
641 |
-
chapter = output[4]
|
642 |
|
643 |
-
text_to_number = {
|
644 |
-
|
645 |
-
|
646 |
-
|
647 |
-
|
648 |
-
|
649 |
-
|
650 |
-
|
651 |
-
|
652 |
-
|
653 |
-
|
654 |
-
|
655 |
-
}
|
656 |
|
657 |
-
# Split the text by spaces
|
658 |
-
words = chapter.split()
|
659 |
|
660 |
-
# Find the text representing the number
|
661 |
-
number_text = words[1].strip(":") # Assuming the number text is the second word
|
662 |
|
663 |
-
# Extract the numeric part
|
664 |
-
chapter_number = text_to_number[number_text]
|
665 |
|
666 |
-
# Print the chapter number
|
667 |
-
# print(chapter_number)
|
668 |
|
669 |
-
url = baseurl + chapter_number
|
670 |
|
671 |
-
# print(url)
|
672 |
|
673 |
-
### all Texts in each chapter
|
674 |
|
675 |
-
response = requests.get(url)
|
676 |
-
if response.status_code == 200:
|
677 |
-
|
678 |
|
679 |
-
|
680 |
-
|
681 |
|
682 |
-
|
683 |
|
684 |
-
|
685 |
-
|
686 |
|
687 |
-
|
688 |
|
689 |
-
|
690 |
-
|
691 |
|
692 |
-
|
693 |
-
|
694 |
-
|
695 |
-
|
696 |
-
|
697 |
-
|
698 |
-
|
699 |
|
700 |
-
|
701 |
-
|
702 |
-
|
703 |
|
704 |
-
### link to each Text in each chapter
|
705 |
-
text_page = text_number[0]
|
706 |
|
707 |
-
# Split the text by spaces
|
708 |
-
words = text_page.split()
|
709 |
|
710 |
-
# Find the text representing the number
|
711 |
-
text_number = words[1].strip(":") # Assuming the number text is the second word
|
712 |
|
713 |
-
# print(f"chapter_number - {chapter_number} : text_number - {text_number}")
|
714 |
-
texturl = baseurl + chapter_number + "/" + text_number
|
715 |
|
716 |
-
# print(texturl)
|
717 |
|
718 |
-
main(url=texturl)
|
719 |
|
720 |
-
st.title("Display HTML File in Streamlit")
|
721 |
|
722 |
-
# Path to the HTML file
|
723 |
-
html_file_path = "../Transformers/Bg. 1.1.html"
|
724 |
|
725 |
-
try:
|
726 |
-
|
727 |
-
|
728 |
-
|
729 |
|
730 |
-
|
731 |
-
|
732 |
-
|
733 |
-
|
734 |
-
|
735 |
-
|
736 |
-
except FileNotFoundError:
|
737 |
-
|
738 |
|
739 |
-
import streamlit as st
|
740 |
|
741 |
|
742 |
-
st.title("Streamlit Tabs Example")
|
743 |
|
744 |
-
# Add tabs to the sidebar
|
745 |
-
tabs = st.sidebar.radio("Navigation", ["Home", "About", "Settings"])
|
746 |
|
747 |
-
# Display different content based on the selected tab
|
748 |
-
if tabs == "Home":
|
749 |
-
|
750 |
-
|
751 |
|
752 |
-
elif tabs == "About":
|
753 |
-
|
754 |
-
|
755 |
|
756 |
-
elif tabs == "Settings":
|
757 |
-
|
758 |
-
|
759 |
|
760 |
-
st.title("Netflix-like Grid Display")
|
761 |
|
762 |
|
763 |
|
764 |
-
import streamlit as st
|
765 |
-
import os
|
766 |
-
import streamlit.components.v1 as components
|
767 |
-
|
768 |
-
# Define movie data
|
769 |
-
movies = [
|
770 |
-
|
771 |
-
|
772 |
-
|
773 |
-
|
774 |
-
|
775 |
-
|
776 |
-
|
777 |
-
|
778 |
-
]
|
779 |
|
780 |
# Display movies in a grid
|
781 |
# num_columns = 4
|
|
|
525 |
# print(f"An error occurred: {e}")
|
526 |
|
527 |
|
528 |
+
# import streamlit as st
|
529 |
+
# import requests
|
530 |
+
# from bs4 import BeautifulSoup
|
531 |
|
532 |
+
# def fetch_html(url):
|
533 |
+
# # Fetch the webpage content
|
534 |
+
# response = requests.get(url)
|
535 |
+
# if response.status_code == 200:
|
536 |
+
# return response.content
|
537 |
+
# else:
|
538 |
+
# st.error(f"Failed to fetch webpage. Status code: {response.status_code}")
|
539 |
|
540 |
+
# def scrape_data(html_content):
|
541 |
+
# # Parse HTML content
|
542 |
+
# soup = BeautifulSoup(html_content, "html.parser")
|
543 |
|
544 |
+
# # Scrape data (replace this with your specific scraping logic)
|
545 |
+
# data = soup.find_all(class_="container first-container")
|
546 |
|
547 |
+
# return data
|
548 |
|
549 |
+
# def main(url):
|
550 |
+
# st.title("Webpage Scraper")
|
551 |
|
552 |
+
# # User input for webpage URL
|
553 |
+
# url = st.text_input("Enter the URL of the webpage:", value=url)
|
554 |
|
555 |
+
# # Convert webpage to HTML and scrape data
|
556 |
+
# if st.button("Scrape Data"):
|
557 |
+
# if url:
|
558 |
+
# html_content = fetch_html(url)
|
559 |
+
# str_content = """ """
|
560 |
+
# if html_content:
|
561 |
+
# data = scrape_data(html_content)
|
562 |
+
# # st.title("HTML Page Display")
|
563 |
+
# # st.components.v1.html(html_content, height=1600, width=800)
|
564 |
+
# # Display scraped data in a new tab
|
565 |
+
# with st.expander("Scraped Data", expanded=True):
|
566 |
+
# for item in data:
|
567 |
+
# # Convert item to string and display
|
568 |
+
# str_content += str(item)
|
569 |
+
# # st.write(str(item))
|
570 |
+
# # st.title("HTML Page Display")
|
571 |
+
# # st.components.v1.html(data, height=1600, width=800)
|
572 |
+
# # st.title("HTML Page Display")
|
573 |
+
# st.components.v1.html(str_content, height=1600, width=680)
|
574 |
# main()
|
575 |
|
576 |
|
|
|
602 |
|
603 |
|
604 |
|
605 |
+
# import requests
|
606 |
+
# from bs4 import BeautifulSoup
|
607 |
|
608 |
+
# # URL of the webpage
|
609 |
+
# baseurl = "https://vedabase.io/en/library/bg/"
|
610 |
|
611 |
+
# # Fetch the webpage content
|
612 |
+
# response = requests.get(baseurl)
|
613 |
+
# if response.status_code == 200:
|
614 |
+
# html_content = response.content
|
615 |
|
616 |
+
# # Parse HTML content
|
617 |
+
# soup = BeautifulSoup(html_content, "html.parser")
|
618 |
|
619 |
+
# # Find all direct child div elements with class="r-chapter"
|
620 |
+
# direct_child_div_elements = soup.select("div.col-12 > div.r-chapter")
|
621 |
|
622 |
+
# # List to store the extracted text
|
623 |
+
# output = []
|
624 |
|
625 |
+
# # Iterate over each direct child div element
|
626 |
+
# for div in direct_child_div_elements:
|
627 |
+
# # Find the <a> tag within the div
|
628 |
+
# a_tag = div.find("a")
|
629 |
+
# if a_tag:
|
630 |
+
# # Extract the text from the <a> tag and append it to the output list
|
631 |
+
# output.append(a_tag.text.strip())
|
632 |
|
633 |
+
# # Print the output list
|
634 |
+
# # print(output)
|
635 |
+
# # print(len(output))
|
636 |
|
637 |
+
# ### Link to all chapters
|
638 |
+
# import re
|
639 |
|
640 |
+
# # Sample text
|
641 |
+
# chapter = output[4]
|
642 |
|
643 |
+
# text_to_number = {
|
644 |
+
# "One": "1",
|
645 |
+
# "Two": "2",
|
646 |
+
# "Three": "3",
|
647 |
+
# "Four": "4",
|
648 |
+
# "Five": "5",
|
649 |
+
# "Six": "6",
|
650 |
+
# "Seven": "7",
|
651 |
+
# "Eight": "8",
|
652 |
+
# "Nine": "9",
|
653 |
+
# "Ten": "10",
|
654 |
+
# # Add more numbers if needed
|
655 |
+
# }
|
656 |
|
657 |
+
# # Split the text by spaces
|
658 |
+
# words = chapter.split()
|
659 |
|
660 |
+
# # Find the text representing the number
|
661 |
+
# number_text = words[1].strip(":") # Assuming the number text is the second word
|
662 |
|
663 |
+
# # Extract the numeric part
|
664 |
+
# chapter_number = text_to_number[number_text]
|
665 |
|
666 |
+
# # Print the chapter number
|
667 |
+
# # print(chapter_number)
|
668 |
|
669 |
+
# url = baseurl + chapter_number
|
670 |
|
671 |
+
# # print(url)
|
672 |
|
673 |
+
# ### all Texts in each chapter
|
674 |
|
675 |
+
# response = requests.get(url)
|
676 |
+
# if response.status_code == 200:
|
677 |
+
# html_content = response.content
|
678 |
|
679 |
+
# # Parse HTML content
|
680 |
+
# text = BeautifulSoup(html_content, "html.parser")
|
681 |
|
682 |
+
# # print(text)
|
683 |
|
684 |
+
# # Find all direct child div elements with class="r-chapter"
|
685 |
+
# direct_child_div_elements = text.select("div.col-12 > dl.r.r-verse")
|
686 |
|
687 |
+
# # print(direct_child_div_elements)
|
688 |
|
689 |
+
# # List to store the extracted text
|
690 |
+
# text_number = []
|
691 |
|
692 |
+
# # Iterate over each direct child div element
|
693 |
+
# for div in direct_child_div_elements:
|
694 |
+
# # Find the <a> tag within the div
|
695 |
+
# a_tag = div.find("a")
|
696 |
+
# if a_tag:
|
697 |
+
# # Extract the text from the <a> tag and append it to the output list
|
698 |
+
# text_number.append(a_tag.text.strip())
|
699 |
|
700 |
+
# # Print the output list
|
701 |
+
# # print(text_number)
|
702 |
+
# # print(len(text_number))
|
703 |
|
704 |
+
# ### link to each Text in each chapter
|
705 |
+
# text_page = text_number[0]
|
706 |
|
707 |
+
# # Split the text by spaces
|
708 |
+
# words = text_page.split()
|
709 |
|
710 |
+
# # Find the text representing the number
|
711 |
+
# text_number = words[1].strip(":") # Assuming the number text is the second word
|
712 |
|
713 |
+
# # print(f"chapter_number - {chapter_number} : text_number - {text_number}")
|
714 |
+
# texturl = baseurl + chapter_number + "/" + text_number
|
715 |
|
716 |
+
# # print(texturl)
|
717 |
|
718 |
+
# main(url=texturl)
|
719 |
|
720 |
+
# st.title("Display HTML File in Streamlit")
|
721 |
|
722 |
+
# # Path to the HTML file
|
723 |
+
# html_file_path = "../Transformers/Bg. 1.1.html"
|
724 |
|
725 |
+
# try:
|
726 |
+
# # Read the HTML file
|
727 |
+
# with open(html_file_path, "r", encoding="utf-8") as file:
|
728 |
+
# html_content = file.read()
|
729 |
|
730 |
+
# # Display the HTML content using the 'st.components.v1.html' component
|
731 |
+
# expanded = st.checkbox("Expand HTML page")
|
732 |
+
# if expanded:
|
733 |
+
# st.components.v1.html(html_content, height=1600, width=680)
|
734 |
+
# else:
|
735 |
+
# st.components.v1.html(html_content, height=600)
|
736 |
+
# except FileNotFoundError:
|
737 |
+
# st.error(f"HTML file '{html_file_path}' not found!")
|
738 |
|
739 |
+
# import streamlit as st
|
740 |
|
741 |
|
742 |
+
# st.title("Streamlit Tabs Example")
|
743 |
|
744 |
+
# # Add tabs to the sidebar
|
745 |
+
# tabs = st.sidebar.radio("Navigation", ["Home", "About", "Settings"])
|
746 |
|
747 |
+
# # Display different content based on the selected tab
|
748 |
+
# if tabs == "Home":
|
749 |
+
# st.header("Home Page")
|
750 |
+
# st.write("Welcome to the Home page!")
|
751 |
|
752 |
+
# elif tabs == "About":
|
753 |
+
# st.header("About Page")
|
754 |
+
# st.write("This is the About page.")
|
755 |
|
756 |
+
# elif tabs == "Settings":
|
757 |
+
# st.header("Settings Page")
|
758 |
+
# st.write("Here you can configure your settings.")
|
759 |
|
760 |
+
# st.title("Netflix-like Grid Display")
|
761 |
|
762 |
|
763 |
|
764 |
+
# import streamlit as st
|
765 |
+
# import os
|
766 |
+
# import streamlit.components.v1 as components
|
767 |
+
|
768 |
+
# # Define movie data
|
769 |
+
# movies = [
|
770 |
+
# {"title": "Movie 1", "poster_path": "../Transformers/Bg. 1.1.html"},
|
771 |
+
# {"title": "Movie 2", "poster_url": "https://via.placeholder.com/150"},
|
772 |
+
# {"title": "Movie 3", "poster_url": "https://via.placeholder.com/150"},
|
773 |
+
# {"title": "Movie 4", "poster_url": "https://via.placeholder.com/150"},
|
774 |
+
# {"title": "Movie 5", "poster_url": "https://via.placeholder.com/150"},
|
775 |
+
# {"title": "Movie 6", "poster_url": "https://via.placeholder.com/150"},
|
776 |
+
# {"title": "Movie 7", "poster_url": "https://via.placeholder.com/150"},
|
777 |
+
# {"title": "Movie 8", "poster_url": "https://via.placeholder.com/150"},
|
778 |
+
# ]
|
779 |
|
780 |
# Display movies in a grid
|
781 |
# num_columns = 4
|