Spaces:
Running
Running
File size: 1,106 Bytes
212d694 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 |
from mediaunmasked.scrapers.article_scraper import ArticleScraper
import logging
# Configure logging
# Runs at import time: configures the root logger at INFO level so the
# logger.info() progress message in test_scraper() is emitted.
logging.basicConfig(level=logging.INFO)
# Module-level logger named after this module.
logger = logging.getLogger(__name__)
def test_scraper(url=None):
    """Smoke-test ``ArticleScraper`` against a single article URL.

    Scrapes the article and prints its headline, the first 500 characters
    of its content, and the total content length. If the scraper returns a
    falsy result, a failure message is printed instead.

    Any exception raised while scraping or while reading the result is
    logged with its traceback rather than propagated, so this function
    never raises for scraping errors.

    Args:
        url: Article URL to scrape. Defaults to the Channel News Asia
            article this script was originally written against.
    """
    if url is None:
        url = "https://www.channelnewsasia.com/singapore/singapore-mccy-sg-culture-pass-arts-culture-heritage-4951451"

    scraper = ArticleScraper()
    separator = "-" * 50

    # Lazy %-style arguments: the message is only formatted if emitted.
    logger.info("Testing scraper with URL: %s", url)

    try:
        result = scraper.scrape_article(url)
        if not result:
            print("Scraping failed - no result returned")
            return

        print("\nScraping Successful!")
        print(separator)
        print(f"Headline: {result['headline']}")
        print(separator)
        print("Content Preview (first 500 chars):")
        content = result['content']
        print(content[:500])
        print("...")
        print(separator)
        print(f"Total content length: {len(content)} characters")
    except Exception as e:
        # Top-level boundary of a manual smoke test: record the failure
        # (with traceback) instead of crashing the script.
        logger.exception("Error during scraping: %s", e)
# Run the smoke test only when this file is executed as a script,
# not when it is imported.
if __name__ == "__main__":
    test_scraper()