Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -17,7 +17,7 @@ def convert_to_mobile_url(url):
|
|
17 |
|
18 |
def scrape_naver_blog(url):
|
19 |
"""
|
20 |
-
네이버 블로그의
|
21 |
"""
|
22 |
try:
|
23 |
# 모바일 URL 변환
|
@@ -39,19 +39,12 @@ def scrape_naver_blog(url):
|
|
39 |
elem.get_text(strip=True) for elem in content_elements
|
40 |
) if content_elements else "내용을 찾을 수 없음"
|
41 |
|
42 |
-
# 이미지 URL 스크래핑
|
43 |
-
image_elements = soup.find_all("img", class_="se-image-resource")
|
44 |
-
image_urls = [
|
45 |
-
img["src"] for img in image_elements if "src" in img.attrs
|
46 |
-
]
|
47 |
-
|
48 |
# 디버깅 메시지 출력
|
49 |
print(f"Scraped Title: {title}")
|
50 |
print(f"Scraped Content: {content}")
|
51 |
-
print(f"Scraped Images: {image_urls}")
|
52 |
|
53 |
# 결과 반환
|
54 |
-
result = f"제목: {title}\n\n내용: {content}
|
55 |
return result
|
56 |
|
57 |
except Exception as e:
|
@@ -67,7 +60,7 @@ interface = gr.Interface(
|
|
67 |
inputs=gr.Textbox(label="네이버 블로그 URL"),
|
68 |
outputs=gr.Textbox(label="스크래핑 결과"),
|
69 |
title="네이버 블로그 스크래핑",
|
70 |
-
description="네이버 블로그의
|
71 |
)
|
72 |
|
73 |
if __name__ == "__main__":
|
|
|
17 |
|
18 |
def scrape_naver_blog(url):
|
19 |
"""
|
20 |
+
네이버 블로그의 제목과 내용(텍스트만) 스크래핑.
|
21 |
"""
|
22 |
try:
|
23 |
# 모바일 URL 변환
|
|
|
39 |
elem.get_text(strip=True) for elem in content_elements
|
40 |
) if content_elements else "내용을 찾을 수 없음"
|
41 |
|
|
|
|
|
|
|
|
|
|
|
|
|
42 |
# 디버깅 메시지 출력
|
43 |
print(f"Scraped Title: {title}")
|
44 |
print(f"Scraped Content: {content}")
|
|
|
45 |
|
46 |
# 결과 반환
|
47 |
+
result = f"제목: {title}\n\n내용: {content}"
|
48 |
return result
|
49 |
|
50 |
except Exception as e:
|
|
|
60 |
inputs=gr.Textbox(label="네이버 블로그 URL"),
|
61 |
outputs=gr.Textbox(label="스크래핑 결과"),
|
62 |
title="네이버 블로그 스크래핑",
|
63 |
+
description="네이버 블로그의 제목과 내용을 스크래핑합니다."
|
64 |
)
|
65 |
|
66 |
if __name__ == "__main__":
|