Spaces:

KIMOSSINO
/

hashtagtik

Sleeping

App Files Files Community

KIMOSSINO committed on Dec 10, 2024

Commit

a568782

verified ·

1 Parent(s): 4becc5b

Create app.py

Browse files

Files changed (1) hide show

app.py +134 -0

app.py ADDED Viewed

	@@ -0,0 +1,134 @@

+import gradio as gr
+from collections import Counter
+from bs4 import BeautifulSoup
+import requests
+import re
+from urllib.parse import urlparse
+import json
+from youtube_transcript_api import YouTubeTranscriptApi
+def extract_youtube_id(url):
+    """استخراج معرف فيديو يوتيوب من الرابط"""
+    if match := re.search(r'(?:v=|\/)([0-9A-Za-z_-]{11}).*', url):
+        return match.group(1)
+    return None
+def extract_tiktok_id(url):
+    """استخراج معرف فيديو تيكتوك من الرابط"""
+    if match := re.search(r'video/(\d+)', url):
+        return match.group(1)
+    return None
+def extract_instagram_shortcode(url):
+    """استخراج معرف منشور انستغرام من الرابط"""
+    if match := re.search(r'/(p|reel)/([A-Za-z0-9_-]+)', url):
+        return match.group(2)
+    return None
+def get_hashtags_from_text(text):
+    """استخراج الهاشتاغات من النص"""
+    return re.findall(r'#\w+', text)
+def extract_from_url(url):
+    """استخراج البيانات من الرابط"""
+    domain = urlparse(url).netloc
+    headers = {
+        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36'
+    }
+    try:
+        if 'youtube.com' in domain or 'youtu.be' in domain:
+            video_id = extract_youtube_id(url)
+            if not video_id:
+                return "رابط يوتيوب غير صالح", "", ""
+            api_url = f"https://www.youtube.com/watch?v={video_id}"
+            response = requests.get(api_url, headers=headers)
+            if 'watch-title' in response.text:
+                soup = BeautifulSoup(response.text, 'html.parser')
+                title = soup.find('meta', property='og:title')['content']
+                description = soup.find('meta', property='og:description')['content']
+                hashtags = get_hashtags_from_text(description)
+                return title, description, "\n".join(hashtags)
+        elif 'tiktok.com' in domain:
+            video_id = extract_tiktok_id(url)
+            if not video_id:
+                return "رابط تيكتوك غير صالح", "", ""
+            response = requests.get(url, headers=headers)
+            if response.status_code == 200:
+                soup = BeautifulSoup(response.text, 'html.parser')
+                title = soup.find('meta', property='og:title')['content']
+                description = soup.find('meta', property='og:description')['content']
+                hashtags = get_hashtags_from_text(description)
+                return title, description, "\n".join(hashtags)
+        elif 'instagram.com' in domain:
+            shortcode = extract_instagram_shortcode(url)
+            if not shortcode:
+                return "رابط انستغرام غير صالح", "", ""
+            response = requests.get(url, headers=headers)
+            if response.status_code == 200:
+                soup = BeautifulSoup(response.text, 'html.parser')
+                title = soup.find('meta', property='og:title')['content']
+                description = soup.find('meta', property='og:description')['content']
+                hashtags = get_hashtags_from_text(description)
+                return title, description, "\n".join(hashtags)
+    except Exception as e:
+        return f"حدث خطأ: {str(e)}", "", ""
+    return "لم يتم العثور على بيانات", "", ""
+def gradio_interface():
+    with gr.Blocks() as demo:
+        gr.Markdown("## 📱 محلل روابط وسائل التواصل الاجتماعي")
+        with gr.Row():
+            url_input = gr.Textbox(
+                label="🔗 أدخل رابط يوتيوب/تيكتوك/انستغرام",
+                placeholder="https://..."
+            )
+        with gr.Row():
+            analyze_btn = gr.Button("تحليل الرابط", variant="primary")
+        with gr.Row():
+            title_output = gr.Textbox(
+                label="📝 العنوان",
+                lines=2,
+                interactive=False
+            )
+        with gr.Row():
+            description_output = gr.Textbox(
+                label="📄 الوصف",
+                lines=5,
+                interactive=False
+            )
+        with gr.Row():
+            hashtags_output = gr.Textbox(
+                label="🏷️ الهاشتاغات",
+                lines=5,
+                interactive=False
+            )
+        analyze_btn.click(
+            fn=extract_from_url,
+            inputs=[url_input],
+            outputs=[title_output, description_output, hashtags_output]
+        )
+    return demo
+# Script entry point: build the interface and start the Gradio server.
+if __name__ == "__main__":
+    demo = gradio_interface()
+    demo.launch()