File size: 4,780 Bytes
170f767 13e013d 3a8cc41 4c464b0 c850600 ca2f0f4 170f767 c850600 3a8cc41 ca2f0f4 d874f49 3a8cc41 d874f49 3a8cc41 d874f49 3a8cc41 e392f4c 13e013d 6dc63dd eb779a0 ca2f0f4 c850600 ca2f0f4 d874f49 ca2f0f4 1203cd3 d874f49 1203cd3 d874f49 1203cd3 d874f49 ca2f0f4 c850600 d874f49 ca2f0f4 d874f49 c8dd415 1203cd3 d874f49 1203cd3 c8dd415 1203cd3 d874f49 1203cd3 d874f49 1203cd3 d874f49 1203cd3 c850600 d874f49 ca2f0f4 1203cd3 ca2f0f4 1203cd3 d874f49 1203cd3 144d636 5b3bf54 170f767 eb779a0 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 |
# Project-level settings: this project is rendered as a website.
project:
  type: website
# Website settings: title, repository links, top navbar, and one sidebar per
# navbar entry.
# NOTE(review): the nesting below was reconstructed from key semantics
# (section/href/contents/text) and file paths — confirm the sidebar depth of
# each entry against the rendered site.
website:
  title: "🧭 Einstieg ins Web Scraping - Daten sammeln leicht gemacht"
  page-navigation: true

  # Repository links (edit / view source / report issue).
  repo-actions: [edit, source, issue]
  repo-url: https://huggingface.co/spaces/datenwerkzeuge/CDL-Webscraping-Workshop-2025/
  repo-subdir: src
  repo-link-target: _blank
  issue-url: https://huggingface.co/spaces/datenwerkzeuge/CDL-Webscraping-Workshop-2025/discussions

  # Top navigation bar: one entry per workshop part.
  navbar:
    left:
      - href: index.qmd
        text: "1️⃣ Start"
      - href: basics.qmd
        text: "2️⃣ No Code"
      - href: low_code.qmd
        text: "3️⃣ Low Code"
      - href: use_case.qmd
        text: "4️⃣ Anwendungsfall"

  sidebar:
    # Sidebar for part 1 (setup and preparation).
    - title: "Start"
      contents:
        - href: index.qmd
          section: "Willkommen👋"
          contents:
            - href: 01_setup/agenda.qmd
              text: "Agenda📅"
            - section: "Vorbereitung🛠️"
              href: 01_setup/vorbereitung.qmd
              contents:
                - href: 01_setup/erforderlich/google-konto.qmd
                  text: "Google Konto erstellen"
                - href: 01_setup/erforderlich/colab.qmd
                  text: "Colab nutzen"
                - href: 01_setup/erforderlich/huggingface.qmd
                  text: "Huggingface Ressourcen"
                # NOTE(review): this href targets the rendered .html anchor,
                # unlike the .qmd sources used elsewhere — confirm intentional.
                - section: "Optional"
                  href: 01_setup/vorbereitung.html#optional
                  contents:
                    - href: 01_setup/optional/colab-github.qmd
                      text: "Colab & GitHub🤝"
                    - href: 01_setup/optional/quarto-lokal.qmd
                      text: "Hallo Quarto✨"
            - href: 01_setup/aufbereitung.qmd
              text: "Aufbereitung🤩"
            - href: 01_setup/glossar.qmd
              text: "Glossar"
            - href: 01_setup/ressourcen.qmd
              text: "Weitere Ressourcen"

    # Sidebar for part 2 (no-code tools).
    - title: "No Code"
      contents:
        - href: basics.qmd
          section: "No Code Übersicht"
          contents:
            - section: "PDF📝"
              href: 02_basics/pdf.qmd
              contents:
                - href: 02_basics/pdf/pdf-link-extractor.qmd
                  text: "PDF Sammler🔍"
                - href: 02_basics/pdf/pdf-grouping.qmd
                  text: "PDFs gruppieren🗂️"
            - href: 02_basics/app_market/google-play-search.qmd
              text: "Google Play Search🛒"
            - section: "Webspider🕸️"
              href: 02_basics/webspider.qmd
              contents:
                - href: 02_basics/webspider/website-url-extractor.qmd
                  text: "URL Extractor"
                - href: 02_basics/webspider/webspider.qmd
                  text: "Webspider"

    # Sidebar for part 3 (low-code notebooks).
    - title: "Low Code"
      contents:
        - section: "Low Code Übersicht"
          href: low_code.qmd
          contents:
            - section: "Kataloge erfassen"
              href: 03_low_code/catalogue.qmd
              contents:
                - href: 03_low_code/catalogue/bookstoscrape.ipynb
                  text: "Bücherliste scrapen📚"
                - href: 03_low_code/catalogue/quotes_scraper.ipynb
                  text: "Zitate scrapen💬"
            - href: 03_low_code/app_market_scraping/app_market_scraping.ipynb
              text: "App Markt analysieren📱"
            - section: "Video Transkripte"
              href: 03_low_code/video_transcripts.qmd
              contents:
                - href: 03_low_code/video_transcripts/social-media.qmd
                  text: "Hinweise Scraping Social Media⚠️"
                - href: 03_low_code/video_transcripts/get_videos_for_youtube_channels.ipynb
                  text: "YouTube Channel Videos🎥"
                - href: 03_low_code/video_transcripts/youtube-transcript-extraction.ipynb
                  text: "YouTube Video Transcripts📝"

    # Sidebar for part 4 (use cases and bonus material).
    - title: "Use-Case"
      contents:
        - section: "Anwendungsfall Übersicht"
          href: use_case.qmd
          contents:
            - href: 04_use_case/laws/Gesetze_im_Internet_Aktualitätendienst.ipynb
              text: "Aktualitätendienst Gesetze📜"
            - href: 04_use_case/jobs/Jobboerse_API.ipynb
              text: "Jobbörse💼"
            - href: 04_use_case/forum/buergergeld_forum.ipynb
              text: "Buergergeld Forum💬"
            # NOTE(review): placed under the overview section like the
            # sub-sections of the other sidebars — confirm intended level.
            - section: "Anwendungsfall Bonus"
              contents:
                - href: 04_use_case_bonus/podcasts/aggregate_podcast_episodes_to_markdown.ipynb
                  text: "Podcasts aggregieren"
                - href: 04_use_case_bonus/news/zeitungsartikel.ipynb
                  text: "Nachrichten-Data Mining"
                - href: 04_use_case_bonus/trend-monitoring/innovationsmanagement.ipynb
                  text: "Pytrends & Suchinteresse"
                - href: 04_use_case_bonus/events/veranstaltungen_aggregieren.ipynb
                  # Quote closed on the same line: a line break inside a
                  # double-quoted scalar folds into a trailing space.
                  text: "Veranstaltungen sammeln"
# Output format: HTML pages using the cosmo theme, a custom stylesheet,
# and a table of contents.
format:
  html:
    theme: cosmo
    css: styles.css
    toc: true
|