Spaces:

Chrunos
/

mmmm

Running

App Files Files Community

Chrunos committed on Feb 7

Commit

194b841

verified ·

1 Parent(s): b6f4c25

Update app.py

Browse files

Files changed (1) hide show

app.py +51 -1

app.py CHANGED Viewed

@@ -248,6 +248,56 @@ async def get_track_download_url(video_url: str) -> str:
     return {"error": "Download URL not found"}
 async def extract_video_info(video_url: str) -> str:
     api_url = f'https://yt-dl-web.vercel.app/api/info?url={video_url}'
     session = cloudscraper.create_scraper()
@@ -282,7 +332,7 @@ async def extract_video_info(video_url: str) -> str:
 async def test_download(request: Request):
     data = await request.json()
     video_url = data.get('url')
-    response = await extract_video_info(video_url)
     return response

     return {"error": "Download URL not found"}
+import requests
+import re
def process_url(video_url: str, session=None) -> list:
    """Ask the saveporn.net converter for download links to *video_url*.

    ``video_url`` is submitted as form data to the conversion endpoint and
    the HTML that comes back is scanned row by row: every ``<tr>`` that
    contains a ``<td>`` holding a 3-4 digit number (used as the quality
    label) contributes one entry per URL found inside that row.

    Args:
        video_url: Address of the video page to convert.
        session: Optional object exposing a requests-style ``post`` method.
            When omitted, a new ``cloudscraper`` scraper is created for
            this call.

    Returns:
        A list of ``(url, label)`` tuples where ``label`` is formatted as
        ``"<quality>P - MP4"``.  The list is empty when nothing was found
        or when any step failed; failures are printed, never raised.
    """
    api_url = "https://www.saveporn.net/convert/"
    if not video_url:
        print("Error: No URL provided.")
        return []
    try:
        if session is None:
            session = cloudscraper.create_scraper()
        # The request must go to the converter endpoint; the video address
        # only travels inside the form body.  A timeout keeps a stalled
        # upstream from blocking the caller indefinitely.
        response = session.post(api_url, data={"url": video_url}, timeout=30)
        html_text = response.text

        results = []
        # DOTALL lets a table row span several lines of markup.
        for row in re.findall(r'<tr>(.*?)</tr>', html_text, re.DOTALL):
            quality_match = re.search(r'<td>(\d{3,4})</td>', row)
            if quality_match is None:
                # Rows without a numeric quality cell carry no download link.
                continue
            label = f"{quality_match.group(1)}P - MP4"
            # NOTE: the `$-_` span inside the character class is an ASCII
            # range; it is what admits `/`, `:`, `?` and `=` in the match,
            # but it also admits `<`, `>` and `'`, so only a double quote or
            # whitespace reliably terminates a URL here.
            urls = re.findall(
                r'http[s]?://(?:[a-zA-Z]|[0-9]|[$-_@.&+]|[!*\\(\\),]|(?:%[0-9a-fA-F][0-9a-fA-F]))+',
                row,
            )
            results.extend((url, label) for url in urls)

        if not results:
            print("Error: No results found.")
        # Always a list, so callers can iterate without a None check.
        return results
    except Exception as e:
        # Deliberate best-effort: report the failure and hand back no results.
        print(f"An error occurred: {e}")
        return []
 async def extract_video_info(video_url: str) -> str:
     api_url = f'https://yt-dl-web.vercel.app/api/info?url={video_url}'
     session = cloudscraper.create_scraper()
 async def test_download(request: Request):
     """Return the download links found for the URL given in the request body.

     Reads the request's JSON body, takes its ``url`` field and passes it to
     ``process_url``; whatever that returns is sent back unchanged.  When the
     body carries no ``url`` value, an ``{"error": ...}`` dict is returned
     instead.
     """
     import asyncio

     data = await request.json()
     video_url = data.get('url')
     if not video_url:
         return {"error": "Missing 'url' in request body"}
     # process_url is a plain (non-async) function, so awaiting its return
     # value directly raises TypeError.  Running it in the default executor
     # yields something awaitable and keeps its blocking HTTP call off the
     # event loop.
     loop = asyncio.get_running_loop()
     response = await loop.run_in_executor(None, process_url, video_url)
     return response