File size: 4,780 Bytes
170f767
 
 
13e013d
3a8cc41
4c464b0
 
 
 
 
c850600
 
 
 
ca2f0f4
 
 
 
 
 
170f767
c850600
 
 
3a8cc41
ca2f0f4
d874f49
3a8cc41
 
d874f49
 
 
 
 
 
 
 
 
 
 
 
3a8cc41
d874f49
3a8cc41
e392f4c
 
13e013d
 
6dc63dd
eb779a0
ca2f0f4
c850600
ca2f0f4
d874f49
ca2f0f4
1203cd3
d874f49
 
 
1203cd3
d874f49
1203cd3
 
 
 
d874f49
 
 
 
 
 
ca2f0f4
c850600
d874f49
 
ca2f0f4
d874f49
 
 
c8dd415
1203cd3
d874f49
1203cd3
c8dd415
1203cd3
d874f49
 
 
 
1203cd3
d874f49
1203cd3
d874f49
1203cd3
c850600
 
d874f49
 
 
ca2f0f4
1203cd3
ca2f0f4
1203cd3
d874f49
1203cd3
144d636
 
 
5b3bf54
 
 
 
 
 
 
 
170f767
 
 
 
 
eb779a0
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
# Project definition: this configuration describes a project of type `website`.
project:
  type: website
# Site-wide settings: title, page-to-page navigation, and the links back to
# the hosting repository.
website:
  title: "🧭 Einstieg ins Web Scraping - Daten sammeln leicht gemacht"
  page-navigation: true
  # Repository that hosts the site; page sources live in its `src` subfolder.
  repo-url: https://huggingface.co/spaces/datenwerkzeuge/CDL-Webscraping-Workshop-2025/
  repo-subdir: src
  repo-link-target: _blank
  # Repository actions enabled for the pages.
  repo-actions:
    - edit
    - source
    - issue
  # "issue" points at the Space's discussions page.
  issue-url: https://huggingface.co/spaces/datenwerkzeuge/CDL-Webscraping-Workshop-2025/discussions
  # Navigation bar: four numbered entries under `left`, one per workshop part,
  # each pointing at that part's landing page.
  navbar:
    left:
      - href: index.qmd
        text: "1️⃣ Start"
      - href: basics.qmd
        text: "2️⃣ No Code"
      - href: low_code.qmd
        text: "3️⃣ Low Code"
      - href: use_case.qmd
        text: "4️⃣ Anwendungsfall"
  # Sidebars: a list of titled sidebars, each with its own nested contents.
  sidebar:
    # "Start": welcome page, agenda, required and optional setup, and
    # reference material.
    - title: "Start"
      contents:
        - section: "Willkommen👋"
          href: index.qmd
          contents:
            - href: 01_setup/agenda.qmd
              text: "Agenda📅"
            # Required preparation steps.
            - section: "Vorbereitung🛠️"
              href: 01_setup/vorbereitung.qmd
              contents:
                - href: 01_setup/erforderlich/google-konto.qmd
                  text: "Google Konto erstellen"
                - href: 01_setup/erforderlich/colab.qmd
                  text: "Colab nutzen"
                - href: 01_setup/erforderlich/huggingface.qmd
                  text: "Huggingface Ressourcen"
            # Optional preparation; the section header targets the
            # `#optional` anchor of the rendered preparation page.
            - section: "Optional"
              href: 01_setup/vorbereitung.html#optional
              contents:
                - href: 01_setup/optional/colab-github.qmd
                  text: "Colab & GitHub🤝"
                - href: 01_setup/optional/quarto-lokal.qmd
                  text: "Hallo Quarto✨"
            - href: 01_setup/aufbereitung.qmd
              text: "Aufbereitung🤩"
            - href: 01_setup/glossar.qmd
              text: "Glossar"
            - href: 01_setup/ressourcen.qmd
              text: "Weitere Ressourcen"
    # "No Code": overview page plus the PDF, Google Play and web spider pages.
    - title: "No Code"
      contents:
        - section: "No Code Übersicht"
          href: basics.qmd
          contents:
            - section: "PDF📝"
              href: 02_basics/pdf.qmd
              contents:
                - href: 02_basics/pdf/pdf-link-extractor.qmd
                  text: "PDF Sammler🔍"
                - href: 02_basics/pdf/pdf-grouping.qmd
                  text: "PDFs gruppieren🗂️"
            - href: 02_basics/app_market/google-play-search.qmd
              text: "Google Play Search🛒"
            - section: "Webspider🕸️"
              href: 02_basics/webspider.qmd
              contents:
                - href: 02_basics/webspider/website-url-extractor.qmd
                  text: "URL Extractor"
                - href: 02_basics/webspider/webspider.qmd
                  text: "Webspider"
    # "Low Code": overview page plus the catalogue, app market and video
    # transcript notebooks.
    - title: "Low Code"
      contents:
        - section: "Low Code Übersicht"
          href: low_code.qmd
          contents:
            - section: "Kataloge erfassen"
              href: 03_low_code/catalogue.qmd
              contents:
                - href: 03_low_code/catalogue/bookstoscrape.ipynb
                  text: "Bücherliste scrapen📚"
                - href: 03_low_code/catalogue/quotes_scraper.ipynb
                  text: "Zitate scrapen💬"
            - href: 03_low_code/app_market_scraping/app_market_scraping.ipynb
              text: "App Markt analysieren📱"
            - section: "Video Transkripte"
              href: 03_low_code/video_transcripts.qmd
              contents:
                - href: 03_low_code/video_transcripts/social-media.qmd
                  text: "Hinweise Scraping Social Media⚠️"
                - href: 03_low_code/video_transcripts/get_videos_for_youtube_channels.ipynb
                  text: "YouTube Channel Videos🎥"
                - href: 03_low_code/video_transcripts/youtube-transcript-extraction.ipynb
                  text: "YouTube Video Transcripts📝"
    # "Use-Case": overview page with the main use-case notebooks, followed by
    # a bonus section (which has no landing page of its own).
    - title: "Use-Case"
      contents:
        - section: "Anwendungsfall Übersicht"
          href: use_case.qmd
          contents:
            - href: 04_use_case/laws/Gesetze_im_Internet_Aktualitätendienst.ipynb
              text: "Aktualitätendienst Gesetze📜"
            - href: 04_use_case/jobs/Jobboerse_API.ipynb
              text: "Jobbörse💼"
            - href: 04_use_case/forum/buergergeld_forum.ipynb
              text: "Buergergeld Forum💬"
        - section: "Anwendungsfall Bonus"
          contents:
            - href: 04_use_case_bonus/podcasts/aggregate_podcast_episodes_to_markdown.ipynb
              text: "Podcasts aggregieren"
            - href: 04_use_case_bonus/news/zeitungsartikel.ipynb
              text: "Nachrichten-Data Mining"
            - href: 04_use_case_bonus/trend-monitoring/innovationsmanagement.ipynb
              text: "Pytrends & Suchinteresse"
            - href: 04_use_case_bonus/events/veranstaltungen_aggregieren.ipynb
              # Keep the label on one line: a quoted scalar that wraps onto an
              # under-indented line is rejected by strict parsers and gains a
              # trailing space on lenient ones.
              text: "Veranstaltungen sammeln"

# Output format: HTML with the `cosmo` theme, additional rules from
# `styles.css`, and the table of contents switched on.
format:
  html:
    theme: cosmo
    css: styles.css
    toc: true