jeffeux commited on
Commit
21e639d
·
1 Parent(s): afcb081

Add application file

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. README.md +7 -11
  2. crawler_jeff/jeff_crawler_ver1.py +99 -0
  3. crawler_jeff/jeff_crawler_ver2.py +44 -0
  4. data/corpus.json +0 -0
  5. ptt-crawler/.gitignore +136 -0
  6. ptt-crawler/Dockerfile +16 -0
  7. ptt-crawler/Pipfile +19 -0
  8. ptt-crawler/Pipfile.lock +742 -0
  9. ptt-crawler/README.md +113 -0
  10. ptt-crawler/docker-compose.yml +27 -0
  11. ptt-crawler/requirements.txt +8 -0
  12. ptt-crawler/scraptt/__init__.py +0 -0
  13. ptt-crawler/scraptt/configs/__init__.py +4 -0
  14. ptt-crawler/scraptt/configs/configs.py +13 -0
  15. ptt-crawler/scraptt/items/__init__.py +4 -0
  16. ptt-crawler/scraptt/items/items.py +21 -0
  17. ptt-crawler/scraptt/middlewares/__init__.py +4 -0
  18. ptt-crawler/scraptt/middlewares/pyquery.py +13 -0
  19. ptt-crawler/scraptt/models/__init__.py +4 -0
  20. ptt-crawler/scraptt/models/redis.py +13 -0
  21. ptt-crawler/scraptt/pipelines/__init__.py +4 -0
  22. ptt-crawler/scraptt/pipelines/csv.py +45 -0
  23. ptt-crawler/scraptt/settings.py +96 -0
  24. ptt-crawler/scraptt/spiders/__init__.py +4 -0
  25. ptt-crawler/scraptt/spiders/base/__init__.py +4 -0
  26. ptt-crawler/scraptt/spiders/base/base.py +63 -0
  27. ptt-crawler/scraptt/spiders/ptt.py +46 -0
  28. ptt-crawler/scraptt/spiders/utils/parsers/html/__init__.py +12 -0
  29. ptt-crawler/scraptt/spiders/utils/parsers/html/base.py +15 -0
  30. ptt-crawler/scraptt/spiders/utils/parsers/html/index.py +21 -0
  31. ptt-crawler/scraptt/spiders/utils/parsers/html/latest_index.py +36 -0
  32. ptt-crawler/scraptt/spiders/utils/parsers/html/utils.py +18 -0
  33. ptt-crawler/scraptt/spiders/utils/parsers/html/year_backward_index.py +44 -0
  34. ptt-crawler/scraptt/spiders/utils/parsers/posts/comments/__init__.py +4 -0
  35. ptt-crawler/scraptt/spiders/utils/parsers/posts/comments/counter.py +17 -0
  36. ptt-crawler/scraptt/spiders/utils/parsers/posts/ip/__init__.py +5 -0
  37. ptt-crawler/scraptt/spiders/utils/parsers/posts/ip/ip.py +33 -0
  38. ptt-crawler/scraptt/spiders/utils/parsers/posts/ip/location.py +51 -0
  39. ptt-crawler/scraptt/spiders/utils/parsers/posts/meta/__init__.py +3 -0
  40. ptt-crawler/scraptt/spiders/utils/parsers/posts/meta/date.py +22 -0
  41. ptt-crawler/scraptt/spiders/utils/parsers/posts/meta/post.py +29 -0
  42. ptt-crawler/scraptt/spiders/utils/requests/__init__.py +4 -0
  43. ptt-crawler/scraptt/spiders/utils/requests/requests.py +35 -0
  44. ptt-crawler/scrapy.cfg +11 -0
  45. requirements.txt +7 -0
  46. twNLP-app/Dockerfile +20 -0
  47. twNLP-app/LICENSE +201 -0
  48. twNLP-app/Pipfile +18 -0
  49. twNLP-app/Pipfile.lock +953 -0
  50. twNLP-app/README.md +1 -0
README.md CHANGED
@@ -1,12 +1,8 @@
1
- ---
2
- title: Assignment 1 JeffeuxMartin
3
- emoji: 📉
4
- colorFrom: red
5
- colorTo: red
6
- sdk: streamlit
7
- sdk_version: 1.10.0
8
- app_file: app.py
9
- pinned: false
10
- ---
11
 
12
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
 
 
 
 
 
1
+ # PTT 搜尋分析工具 ver 0.1 (modified from **`ckip-cwn-app`**)
 
 
 
 
 
 
 
 
 
2
 
3
+ [![Open in Visual Studio Code](https://classroom.github.com/assets/open-in-vscode-c66648af7eb3fe8bc4f294546bfd86ef473780cde1dea487d3c4ff354943c9ae.svg)](https://classroom.github.com/online_ide?assignment_repo_id=8767745&assignment_repo_type=AssignmentRepo)
4
+
5
+ ## Basic Information
6
+ * 學號:R09942097
7
+ * 姓名:陳建成
8
+ * Streamlit cloud link: https://jeffeuxmartin-assignment-1-jeffeuxmartin-twnlp-appsrcapp-8mil4y.streamlitapp.com/
crawler_jeff/jeff_crawler_ver1.py ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ # -*- coding: utf-8 -*-
3
+ """
4
+ Created on Fri May 29 00:38:13 2020
5
+ @author: ASUS
6
+ """
7
+
8
+
9
+ # 導入 模組(module)
10
+ import requests
11
+ # 導入 BeautifulSoup 模組(module):解析HTML 語法工具
12
+ import bs4
13
+
14
+ # 文章連結
15
+ # URL = "https://www.ptt.cc/bbs/Gossiping/M.1590678355.A.246.html"
16
+ URL = """https://www.ptt.cc/bbs/Gossiping/index.html"""
17
+
18
+
19
+
20
+ from urllib.parse import urlparse
21
+
22
+ def get_host(URL):
23
+ parsed_uri = urlparse(URL)
24
+ result = "{uri.scheme}://{uri.netloc}/".format(uri=parsed_uri)
25
+ return result
26
+
27
+
28
+ def proc(ch, HOSTNAME):
29
+ try:
30
+ [title_a] = ch.select('.title' )[0].select('a')
31
+ except ValueError as err:
32
+ return
33
+
34
+ return dict(
35
+ title= title_a.getText(),
36
+ link= HOSTNAME + '/' + title_a.attrs['href'],
37
+ author=ch.select('.author')[0].getText(),
38
+ date= ch.select('.date' )[0].getText(),
39
+ )
40
+
41
+
42
+ def getall(URL):
43
+ HOSTNAME = get_host(URL)
44
+
45
+
46
+ # 設定Header與Cookie
47
+ # my_headers = {'cookie': 'over18=1;'}
48
+ cookies = {
49
+ 'over18': '1'
50
+ }
51
+
52
+ # 發送get 請求 到 ptt 八卦版
53
+ response = requests.get(URL,
54
+ # headers = my_headers
55
+ cookies=cookies
56
+ )
57
+
58
+
59
+ # 把網頁程式碼(HTML) 丟入 bs4模組分析
60
+ soup = bs4.BeautifulSoup(response.text,"html.parser")
61
+
62
+ all_articles = soup.find("div", class_="r-list-container action-bar-margin bbs-screen")
63
+ mu = []
64
+ for ch in all_articles.children: # .select('div'):
65
+ if isinstance(ch, bs4.element.Tag):
66
+ if ch.attrs['class'] == ['r-ent']:
67
+ output = proc(ch, HOSTNAME)
68
+ if output:
69
+ mu.append(output)
70
+ elif ch.attrs['class'] == ['r-list-sep']:
71
+ break
72
+
73
+
74
+ buttons = soup.select('a.btn.wide')
75
+ prev_page, next_page = None, None
76
+ for button in buttons:
77
+ if '上頁' in button.getText():
78
+ if 'disabled' not in button.attrs['class']:
79
+ prev_page = HOSTNAME + '/' + button.attrs['href']
80
+ else:
81
+ prev_page = None
82
+ if '下頁' in button.getText():
83
+ if 'disabled' not in button.attrs['class']:
84
+ next_page = HOSTNAME + '/' + button.attrs['href']
85
+ else:
86
+ next_page = None
87
+
88
+ return mu, prev_page, next_page
89
+
90
+
91
+ URL = """https://www.ptt.cc/bbs/Gossiping/index.html"""
92
+ RR = []
93
+ from tqdm import tqdm
94
+ for iiii in tqdm(range(100)):
95
+ res, prev_, next_ = getall(URL)
96
+ print(res[0]["date"], end='\t')
97
+ print(res[-1]["date"])
98
+ URL = prev_
99
+ RR.extend(res)
crawler_jeff/jeff_crawler_ver2.py ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from PyPtt import PTT
2
+ ptt_bot = PTT.API()
3
+ ptt_bot.login('jeffchen111', 'ntuee111')
4
+
5
+ def cc(RESRES):
6
+ def crawl_handler(post_info):
7
+
8
+ if post_info.delete_status != PTT.data_type.post_delete_status.NOT_DELETED:
9
+ if post_info.delete_status == PTT.data_type.post_delete_status.MODERATOR:
10
+ # print(f"[板主刪除][{post_info.author}]")
11
+ pass
12
+ elif post_info.delete_status == PTT.data_type.post_delete_status.AUTHOR:
13
+ # print(f"[作者刪除][{post_info.author}]")
14
+ pass
15
+ elif post_info.delete_status == PTT.data_type.post_delete_status.UNKNOWN:
16
+ # print(f"[不明刪除]")
17
+ pass
18
+ return
19
+
20
+ # print(f"[{post_info.aid}][{post_info.title}]")
21
+ # return post_info
22
+ PP = dict(
23
+ aid=post_info.aid,
24
+ index=post_info.index,
25
+ web_url=post_info.web_url,
26
+ title=post_info.title,
27
+ )
28
+ RESRES.append(PP)
29
+ return crawl_handler
30
+
31
+
32
+ boardname = "Gossiping"
33
+ newest = ptt_bot.get_newest_index(PTT.data_type.index_type.BBS, boardname)
34
+ RESRES = []
35
+ error_post_list, del_post_list = ptt_bot.crawl_board(
36
+ PTT.data_type.crawl_type.BBS,
37
+ # crawl_handler,
38
+ cc(RESRES),
39
+ boardname,
40
+ start_index=newest - 1000 * 2,
41
+ end_index=newest, # - 100 * 2,
42
+ # Optional
43
+ query=True,
44
+ )
data/corpus.json ADDED
The diff for this file is too large to render. See raw diff
 
ptt-crawler/.gitignore ADDED
@@ -0,0 +1,136 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Byte-compiled / optimized / DLL files
2
+ __pycache__/
3
+ *.py[cod]
4
+ *$py.class
5
+
6
+ # C extensions
7
+ *.so
8
+
9
+ # Distribution / packaging
10
+ .Python
11
+ build/
12
+ develop-eggs/
13
+ dist/
14
+ downloads/
15
+ eggs/
16
+ .eggs/
17
+ lib/
18
+ lib64/
19
+ parts/
20
+ sdist/
21
+ var/
22
+ wheels/
23
+ pip-wheel-metadata/
24
+ share/python-wheels/
25
+ *.egg-info/
26
+ .installed.cfg
27
+ *.egg
28
+ MANIFEST
29
+
30
+ # PyInstaller
31
+ # Usually these files are written by a python script from a template
32
+ # before PyInstaller builds the exe, so as to inject date/other infos into it.
33
+ *.manifest
34
+ *.spec
35
+
36
+ # Installer logs
37
+ pip-log.txt
38
+ pip-delete-this-directory.txt
39
+
40
+ # Unit test / coverage reports
41
+ htmlcov/
42
+ .tox/
43
+ .nox/
44
+ .coverage
45
+ .coverage.*
46
+ .cache
47
+ nosetests.xml
48
+ coverage.xml
49
+ *.cover
50
+ *.py,cover
51
+ .hypothesis/
52
+ .pytest_cache/
53
+
54
+ # Translations
55
+ *.mo
56
+ *.pot
57
+
58
+ # Django stuff:
59
+ *.log
60
+ local_settings.py
61
+ db.sqlite3
62
+ db.sqlite3-journal
63
+
64
+ # Flask stuff:
65
+ instance/
66
+ .webassets-cache
67
+
68
+ # Scrapy stuff:
69
+ .scrapy
70
+
71
+ # Sphinx documentation
72
+ docs/_build/
73
+
74
+ # PyBuilder
75
+ target/
76
+
77
+ # Jupyter Notebook
78
+ .ipynb_checkpoints
79
+
80
+ # IPython
81
+ profile_default/
82
+ ipython_config.py
83
+
84
+ # pyenv
85
+ .python-version
86
+
87
+ # pipenv
88
+ # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
89
+ # However, in case of collaboration, if having platform-specific dependencies or dependencies
90
+ # having no cross-platform support, pipenv may install dependencies that don't work, or not
91
+ # install all needed dependencies.
92
+ #Pipfile.lock
93
+
94
+ # PEP 582; used by e.g. github.com/David-OConnor/pyflow
95
+ __pypackages__/
96
+
97
+ # Celery stuff
98
+ celerybeat-schedule
99
+ celerybeat.pid
100
+
101
+ # SageMath parsed files
102
+ *.sage.py
103
+
104
+ # Environments
105
+ .env
106
+ .venv
107
+ env/
108
+ venv/
109
+ ENV/
110
+ env.bak/
111
+ venv.bak/
112
+
113
+ # Spyder project settings
114
+ .spyderproject
115
+ .spyproject
116
+
117
+ # Rope project settings
118
+ .ropeproject
119
+
120
+ # mkdocs documentation
121
+ /site
122
+
123
+ # mypy
124
+ .mypy_cache/
125
+ .dmypy.json
126
+ dmypy.json
127
+
128
+ # Pyre type checker
129
+ .pyre/
130
+ *.ipynb
131
+
132
+ # sqlite3 database
133
+ *.db
134
+
135
+ # tempCodeRunnerFile
136
+ tempCodeRunnerFile.py
ptt-crawler/Dockerfile ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ FROM python:3.10-slim
2
+
3
+ WORKDIR /app
4
+
5
+ COPY ./Pipfile* ./
6
+
7
+ RUN pip install pipenv && \
8
+ apt-get update && \
9
+ apt-get install -y --no-install-recommends gcc python3-dev libssl-dev && \
10
+ pipenv install --deploy --system && \
11
+ apt-get remove -y gcc python3-dev libssl-dev && \
12
+ apt-get autoremove -y && \
13
+ pip uninstall pipenv -y
14
+
15
+ COPY ./scrapy.cfg ./
16
+ COPY ./scraptt ./scraptt
ptt-crawler/Pipfile ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [[source]]
2
+ url = "https://pypi.org/simple"
3
+ verify_ssl = true
4
+ name = "pypi"
5
+
6
+ [packages]
7
+ scrapy = "*"
8
+ pyquery = "*"
9
+ pydantic = "*"
10
+ requests = "*"
11
+ scrapy-user-agents = "*"
12
+ scrapy-fake-useragent = "*"
13
+ redis = "*"
14
+ python-dotenv = "*"
15
+
16
+ [dev-packages]
17
+
18
+ [requires]
19
+ python_version = "3.9"
ptt-crawler/Pipfile.lock ADDED
@@ -0,0 +1,742 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_meta": {
3
+ "hash": {
4
+ "sha256": "bc8f4c10537b5ee8c35f567b92a02909bd396375759fc1998d92a19b8d7beccb"
5
+ },
6
+ "pipfile-spec": 6,
7
+ "requires": {
8
+ "python_version": "3.9"
9
+ },
10
+ "sources": [
11
+ {
12
+ "name": "pypi",
13
+ "url": "https://pypi.org/simple",
14
+ "verify_ssl": true
15
+ }
16
+ ]
17
+ },
18
+ "default": {
19
+ "async-timeout": {
20
+ "hashes": [
21
+ "sha256:2163e1640ddb52b7a8c80d0a67a08587e5d245cc9c553a74a847056bc2976b15",
22
+ "sha256:8ca1e4fcf50d07413d66d1a5e416e42cfdf5851c981d679a09851a6853383b3c"
23
+ ],
24
+ "markers": "python_version >= '3.6'",
25
+ "version": "==4.0.2"
26
+ },
27
+ "attrs": {
28
+ "hashes": [
29
+ "sha256:29adc2665447e5191d0e7c568fde78b21f9672d344281d0c6e1ab085429b22b6",
30
+ "sha256:86efa402f67bf2df34f51a335487cf46b1ec130d02b8d39fd248abfd30da551c"
31
+ ],
32
+ "markers": "python_version >= '3.5'",
33
+ "version": "==22.1.0"
34
+ },
35
+ "automat": {
36
+ "hashes": [
37
+ "sha256:7979803c74610e11ef0c0d68a2942b152df52da55336e0c9d58daf1831cbdf33",
38
+ "sha256:b6feb6455337df834f6c9962d6ccf771515b7d939bca142b29c20c2376bc6111"
39
+ ],
40
+ "version": "==20.2.0"
41
+ },
42
+ "certifi": {
43
+ "hashes": [
44
+ "sha256:43dadad18a7f168740e66944e4fa82c6611848ff9056ad910f8f7a3e46ab89e0",
45
+ "sha256:cffdcd380919da6137f76633531a5817e3a9f268575c128249fb637e4f9e73fb"
46
+ ],
47
+ "markers": "python_version >= '3.6'",
48
+ "version": "==2022.6.15.1"
49
+ },
50
+ "cffi": {
51
+ "hashes": [
52
+ "sha256:00a9ed42e88df81ffae7a8ab6d9356b371399b91dbdf0c3cb1e84c03a13aceb5",
53
+ "sha256:03425bdae262c76aad70202debd780501fabeaca237cdfddc008987c0e0f59ef",
54
+ "sha256:04ed324bda3cda42b9b695d51bb7d54b680b9719cfab04227cdd1e04e5de3104",
55
+ "sha256:0e2642fe3142e4cc4af0799748233ad6da94c62a8bec3a6648bf8ee68b1c7426",
56
+ "sha256:173379135477dc8cac4bc58f45db08ab45d228b3363adb7af79436135d028405",
57
+ "sha256:198caafb44239b60e252492445da556afafc7d1e3ab7a1fb3f0584ef6d742375",
58
+ "sha256:1e74c6b51a9ed6589199c787bf5f9875612ca4a8a0785fb2d4a84429badaf22a",
59
+ "sha256:2012c72d854c2d03e45d06ae57f40d78e5770d252f195b93f581acf3ba44496e",
60
+ "sha256:21157295583fe8943475029ed5abdcf71eb3911894724e360acff1d61c1d54bc",
61
+ "sha256:2470043b93ff09bf8fb1d46d1cb756ce6132c54826661a32d4e4d132e1977adf",
62
+ "sha256:285d29981935eb726a4399badae8f0ffdff4f5050eaa6d0cfc3f64b857b77185",
63
+ "sha256:30d78fbc8ebf9c92c9b7823ee18eb92f2e6ef79b45ac84db507f52fbe3ec4497",
64
+ "sha256:320dab6e7cb2eacdf0e658569d2575c4dad258c0fcc794f46215e1e39f90f2c3",
65
+ "sha256:33ab79603146aace82c2427da5ca6e58f2b3f2fb5da893ceac0c42218a40be35",
66
+ "sha256:3548db281cd7d2561c9ad9984681c95f7b0e38881201e157833a2342c30d5e8c",
67
+ "sha256:3799aecf2e17cf585d977b780ce79ff0dc9b78d799fc694221ce814c2c19db83",
68
+ "sha256:39d39875251ca8f612b6f33e6b1195af86d1b3e60086068be9cc053aa4376e21",
69
+ "sha256:3b926aa83d1edb5aa5b427b4053dc420ec295a08e40911296b9eb1b6170f6cca",
70
+ "sha256:3bcde07039e586f91b45c88f8583ea7cf7a0770df3a1649627bf598332cb6984",
71
+ "sha256:3d08afd128ddaa624a48cf2b859afef385b720bb4b43df214f85616922e6a5ac",
72
+ "sha256:3eb6971dcff08619f8d91607cfc726518b6fa2a9eba42856be181c6d0d9515fd",
73
+ "sha256:40f4774f5a9d4f5e344f31a32b5096977b5d48560c5592e2f3d2c4374bd543ee",
74
+ "sha256:4289fc34b2f5316fbb762d75362931e351941fa95fa18789191b33fc4cf9504a",
75
+ "sha256:470c103ae716238bbe698d67ad020e1db9d9dba34fa5a899b5e21577e6d52ed2",
76
+ "sha256:4f2c9f67e9821cad2e5f480bc8d83b8742896f1242dba247911072d4fa94c192",
77
+ "sha256:50a74364d85fd319352182ef59c5c790484a336f6db772c1a9231f1c3ed0cbd7",
78
+ "sha256:54a2db7b78338edd780e7ef7f9f6c442500fb0d41a5a4ea24fff1c929d5af585",
79
+ "sha256:5635bd9cb9731e6d4a1132a498dd34f764034a8ce60cef4f5319c0541159392f",
80
+ "sha256:59c0b02d0a6c384d453fece7566d1c7e6b7bae4fc5874ef2ef46d56776d61c9e",
81
+ "sha256:5d598b938678ebf3c67377cdd45e09d431369c3b1a5b331058c338e201f12b27",
82
+ "sha256:5df2768244d19ab7f60546d0c7c63ce1581f7af8b5de3eb3004b9b6fc8a9f84b",
83
+ "sha256:5ef34d190326c3b1f822a5b7a45f6c4535e2f47ed06fec77d3d799c450b2651e",
84
+ "sha256:6975a3fac6bc83c4a65c9f9fcab9e47019a11d3d2cf7f3c0d03431bf145a941e",
85
+ "sha256:6c9a799e985904922a4d207a94eae35c78ebae90e128f0c4e521ce339396be9d",
86
+ "sha256:70df4e3b545a17496c9b3f41f5115e69a4f2e77e94e1d2a8e1070bc0c38c8a3c",
87
+ "sha256:7473e861101c9e72452f9bf8acb984947aa1661a7704553a9f6e4baa5ba64415",
88
+ "sha256:8102eaf27e1e448db915d08afa8b41d6c7ca7a04b7d73af6514df10a3e74bd82",
89
+ "sha256:87c450779d0914f2861b8526e035c5e6da0a3199d8f1add1a665e1cbc6fc6d02",
90
+ "sha256:8b7ee99e510d7b66cdb6c593f21c043c248537a32e0bedf02e01e9553a172314",
91
+ "sha256:91fc98adde3d7881af9b59ed0294046f3806221863722ba7d8d120c575314325",
92
+ "sha256:94411f22c3985acaec6f83c6df553f2dbe17b698cc7f8ae751ff2237d96b9e3c",
93
+ "sha256:98d85c6a2bef81588d9227dde12db8a7f47f639f4a17c9ae08e773aa9c697bf3",
94
+ "sha256:9ad5db27f9cabae298d151c85cf2bad1d359a1b9c686a275df03385758e2f914",
95
+ "sha256:a0b71b1b8fbf2b96e41c4d990244165e2c9be83d54962a9a1d118fd8657d2045",
96
+ "sha256:a0f100c8912c114ff53e1202d0078b425bee3649ae34d7b070e9697f93c5d52d",
97
+ "sha256:a591fe9e525846e4d154205572a029f653ada1a78b93697f3b5a8f1f2bc055b9",
98
+ "sha256:a5c84c68147988265e60416b57fc83425a78058853509c1b0629c180094904a5",
99
+ "sha256:a66d3508133af6e8548451b25058d5812812ec3798c886bf38ed24a98216fab2",
100
+ "sha256:a8c4917bd7ad33e8eb21e9a5bbba979b49d9a97acb3a803092cbc1133e20343c",
101
+ "sha256:b3bbeb01c2b273cca1e1e0c5df57f12dce9a4dd331b4fa1635b8bec26350bde3",
102
+ "sha256:cba9d6b9a7d64d4bd46167096fc9d2f835e25d7e4c121fb2ddfc6528fb0413b2",
103
+ "sha256:cc4d65aeeaa04136a12677d3dd0b1c0c94dc43abac5860ab33cceb42b801c1e8",
104
+ "sha256:ce4bcc037df4fc5e3d184794f27bdaab018943698f4ca31630bc7f84a7b69c6d",
105
+ "sha256:cec7d9412a9102bdc577382c3929b337320c4c4c4849f2c5cdd14d7368c5562d",
106
+ "sha256:d400bfb9a37b1351253cb402671cea7e89bdecc294e8016a707f6d1d8ac934f9",
107
+ "sha256:d61f4695e6c866a23a21acab0509af1cdfd2c013cf256bbf5b6b5e2695827162",
108
+ "sha256:db0fbb9c62743ce59a9ff687eb5f4afbe77e5e8403d6697f7446e5f609976f76",
109
+ "sha256:dd86c085fae2efd48ac91dd7ccffcfc0571387fe1193d33b6394db7ef31fe2a4",
110
+ "sha256:e00b098126fd45523dd056d2efba6c5a63b71ffe9f2bbe1a4fe1716e1d0c331e",
111
+ "sha256:e229a521186c75c8ad9490854fd8bbdd9a0c9aa3a524326b55be83b54d4e0ad9",
112
+ "sha256:e263d77ee3dd201c3a142934a086a4450861778baaeeb45db4591ef65550b0a6",
113
+ "sha256:ed9cb427ba5504c1dc15ede7d516b84757c3e3d7868ccc85121d9310d27eed0b",
114
+ "sha256:fa6693661a4c91757f4412306191b6dc88c1703f780c8234035eac011922bc01",
115
+ "sha256:fcd131dd944808b5bdb38e6f5b53013c5aa4f334c5cad0c72742f6eba4b73db0"
116
+ ],
117
+ "version": "==1.15.1"
118
+ },
119
+ "charset-normalizer": {
120
+ "hashes": [
121
+ "sha256:5a3d016c7c547f69d6f81fb0db9449ce888b418b5b9952cc5e6e66843e9dd845",
122
+ "sha256:83e9a75d1911279afd89352c68b45348559d1fc0506b054b346651b5e7fee29f"
123
+ ],
124
+ "markers": "python_version >= '3.6'",
125
+ "version": "==2.1.1"
126
+ },
127
+ "constantly": {
128
+ "hashes": [
129
+ "sha256:586372eb92059873e29eba4f9dec8381541b4d3834660707faf8ba59146dfc35",
130
+ "sha256:dd2fa9d6b1a51a83f0d7dd76293d734046aa176e384bf6e33b7e44880eb37c5d"
131
+ ],
132
+ "version": "==15.1.0"
133
+ },
134
+ "cryptography": {
135
+ "hashes": [
136
+ "sha256:0297ffc478bdd237f5ca3a7dc96fc0d315670bfa099c04dc3a4a2172008a405a",
137
+ "sha256:10d1f29d6292fc95acb597bacefd5b9e812099d75a6469004fd38ba5471a977f",
138
+ "sha256:16fa61e7481f4b77ef53991075de29fc5bacb582a1244046d2e8b4bb72ef66d0",
139
+ "sha256:194044c6b89a2f9f169df475cc167f6157eb9151cc69af8a2a163481d45cc407",
140
+ "sha256:1db3d807a14931fa317f96435695d9ec386be7b84b618cc61cfa5d08b0ae33d7",
141
+ "sha256:3261725c0ef84e7592597606f6583385fed2a5ec3909f43bc475ade9729a41d6",
142
+ "sha256:3b72c360427889b40f36dc214630e688c2fe03e16c162ef0aa41da7ab1455153",
143
+ "sha256:3e3a2599e640927089f932295a9a247fc40a5bdf69b0484532f530471a382750",
144
+ "sha256:3fc26e22840b77326a764ceb5f02ca2d342305fba08f002a8c1f139540cdfaad",
145
+ "sha256:5067ee7f2bce36b11d0e334abcd1ccf8c541fc0bbdaf57cdd511fdee53e879b6",
146
+ "sha256:52e7bee800ec869b4031093875279f1ff2ed12c1e2f74923e8f49c916afd1d3b",
147
+ "sha256:64760ba5331e3f1794d0bcaabc0d0c39e8c60bf67d09c93dc0e54189dfd7cfe5",
148
+ "sha256:765fa194a0f3372d83005ab83ab35d7c5526c4e22951e46059b8ac678b44fa5a",
149
+ "sha256:79473cf8a5cbc471979bd9378c9f425384980fcf2ab6534b18ed7d0d9843987d",
150
+ "sha256:896dd3a66959d3a5ddcfc140a53391f69ff1e8f25d93f0e2e7830c6de90ceb9d",
151
+ "sha256:89ed49784ba88c221756ff4d4755dbc03b3c8d2c5103f6d6b4f83a0fb1e85294",
152
+ "sha256:ac7e48f7e7261207d750fa7e55eac2d45f720027d5703cd9007e9b37bbb59ac0",
153
+ "sha256:ad7353f6ddf285aeadfaf79e5a6829110106ff8189391704c1d8801aa0bae45a",
154
+ "sha256:b0163a849b6f315bf52815e238bc2b2346604413fa7c1601eea84bcddb5fb9ac",
155
+ "sha256:b6c9b706316d7b5a137c35e14f4103e2115b088c412140fdbd5f87c73284df61",
156
+ "sha256:c2e5856248a416767322c8668ef1845ad46ee62629266f84a8f007a317141013",
157
+ "sha256:ca9f6784ea96b55ff41708b92c3f6aeaebde4c560308e5fbbd3173fbc466e94e",
158
+ "sha256:d1a5bd52d684e49a36582193e0b89ff267704cd4025abefb9e26803adeb3e5fb",
159
+ "sha256:d3971e2749a723e9084dd507584e2a2761f78ad2c638aa31e80bc7a15c9db4f9",
160
+ "sha256:d4ef6cc305394ed669d4d9eebf10d3a101059bdcf2669c366ec1d14e4fb227bd",
161
+ "sha256:d9e69ae01f99abe6ad646947bba8941e896cb3aa805be2597a0400e0764b5818"
162
+ ],
163
+ "markers": "python_version >= '3.6'",
164
+ "version": "==38.0.1"
165
+ },
166
+ "cssselect": {
167
+ "hashes": [
168
+ "sha256:f612ee47b749c877ebae5bb77035d8f4202c6ad0f0fc1271b3c18ad6c4468ecf",
169
+ "sha256:f95f8dedd925fd8f54edb3d2dfb44c190d9d18512377d3c1e2388d16126879bc"
170
+ ],
171
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3'",
172
+ "version": "==1.1.0"
173
+ },
174
+ "deprecated": {
175
+ "hashes": [
176
+ "sha256:43ac5335da90c31c24ba028af536a91d41d53f9e6901ddb021bcc572ce44e38d",
177
+ "sha256:64756e3e14c8c5eea9795d93c524551432a0be75629f8f29e67ab8caf076c76d"
178
+ ],
179
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3'",
180
+ "version": "==1.2.13"
181
+ },
182
+ "fake-useragent": {
183
+ "hashes": [
184
+ "sha256:c104998b750eb097eefc28ae28e92d66397598d2cf41a31aa45d5559ef1adf35"
185
+ ],
186
+ "version": "==0.1.11"
187
+ },
188
+ "faker": {
189
+ "hashes": [
190
+ "sha256:6db56e2c43a2b74250d1c332ef25fef7dc07dcb6c5fab5329dd7b4467b8ed7b9",
191
+ "sha256:e02c55a5b0586caaf913cc6c254b3de178e08b031c5922e590fd033ebbdbfd02"
192
+ ],
193
+ "markers": "python_version >= '3.6'",
194
+ "version": "==14.2.0"
195
+ },
196
+ "filelock": {
197
+ "hashes": [
198
+ "sha256:55447caa666f2198c5b6b13a26d2084d26fa5b115c00d065664b2124680c4edc",
199
+ "sha256:617eb4e5eedc82fc5f47b6d61e4d11cb837c56cb4544e39081099fa17ad109d4"
200
+ ],
201
+ "markers": "python_version >= '3.7'",
202
+ "version": "==3.8.0"
203
+ },
204
+ "hyperlink": {
205
+ "hashes": [
206
+ "sha256:427af957daa58bc909471c6c40f74c5450fa123dd093fc53efd2e91d2705a56b",
207
+ "sha256:e6b14c37ecb73e89c77d78cdb4c2cc8f3fb59a885c5b3f819ff4ed80f25af1b4"
208
+ ],
209
+ "version": "==21.0.0"
210
+ },
211
+ "idna": {
212
+ "hashes": [
213
+ "sha256:84d9dd047ffa80596e0f246e2eab0b391788b0503584e8945f2368256d2735ff",
214
+ "sha256:9d643ff0a55b762d5cdb124b8eaa99c66322e2157b69160bc32796e824360e6d"
215
+ ],
216
+ "markers": "python_version >= '3.5'",
217
+ "version": "==3.3"
218
+ },
219
+ "incremental": {
220
+ "hashes": [
221
+ "sha256:02f5de5aff48f6b9f665d99d48bfc7ec03b6e3943210de7cfc88856d755d6f57",
222
+ "sha256:92014aebc6a20b78a8084cdd5645eeaa7f74b8933f70fa3ada2cfbd1e3b54321"
223
+ ],
224
+ "version": "==21.3.0"
225
+ },
226
+ "itemadapter": {
227
+ "hashes": [
228
+ "sha256:0e0ab4ddf92c71af57c2386952a61756ae2ecf6c65f976ffaee9ba91ae87a91c",
229
+ "sha256:32c061ec9ab47d5343e8011b268730f48ff632a0192b95292d118b18dbd7687a"
230
+ ],
231
+ "markers": "python_version >= '3.6'",
232
+ "version": "==0.7.0"
233
+ },
234
+ "itemloaders": {
235
+ "hashes": [
236
+ "sha256:248702909af3ab45ae32846f5bdefa0166dc88cffb5f758d662223dcd0953bd9",
237
+ "sha256:8a6b2945a4233a14042a368e17950f447eb1d42494d75634552586342090cb4a"
238
+ ],
239
+ "markers": "python_version >= '3.6'",
240
+ "version": "==1.0.6"
241
+ },
242
+ "jmespath": {
243
+ "hashes": [
244
+ "sha256:02e2e4cc71b5bcab88332eebf907519190dd9e6e82107fa7f83b1003a6252980",
245
+ "sha256:90261b206d6defd58fdd5e85f478bf633a2901798906be2ad389150c5c60edbe"
246
+ ],
247
+ "markers": "python_version >= '3.7'",
248
+ "version": "==1.0.1"
249
+ },
250
+ "lxml": {
251
+ "hashes": [
252
+ "sha256:04da965dfebb5dac2619cb90fcf93efdb35b3c6994fea58a157a834f2f94b318",
253
+ "sha256:0538747a9d7827ce3e16a8fdd201a99e661c7dee3c96c885d8ecba3c35d1032c",
254
+ "sha256:0645e934e940107e2fdbe7c5b6fb8ec6232444260752598bc4d09511bd056c0b",
255
+ "sha256:079b68f197c796e42aa80b1f739f058dcee796dc725cc9a1be0cdb08fc45b000",
256
+ "sha256:0f3f0059891d3254c7b5fb935330d6db38d6519ecd238ca4fce93c234b4a0f73",
257
+ "sha256:10d2017f9150248563bb579cd0d07c61c58da85c922b780060dcc9a3aa9f432d",
258
+ "sha256:1355755b62c28950f9ce123c7a41460ed9743c699905cbe664a5bcc5c9c7c7fb",
259
+ "sha256:13c90064b224e10c14dcdf8086688d3f0e612db53766e7478d7754703295c7c8",
260
+ "sha256:1423631e3d51008871299525b541413c9b6c6423593e89f9c4cfbe8460afc0a2",
261
+ "sha256:1436cf0063bba7888e43f1ba8d58824f085410ea2025befe81150aceb123e345",
262
+ "sha256:1a7c59c6ffd6ef5db362b798f350e24ab2cfa5700d53ac6681918f314a4d3b94",
263
+ "sha256:1e1cf47774373777936c5aabad489fef7b1c087dcd1f426b621fda9dcc12994e",
264
+ "sha256:206a51077773c6c5d2ce1991327cda719063a47adc02bd703c56a662cdb6c58b",
265
+ "sha256:21fb3d24ab430fc538a96e9fbb9b150029914805d551deeac7d7822f64631dfc",
266
+ "sha256:27e590352c76156f50f538dbcebd1925317a0f70540f7dc8c97d2931c595783a",
267
+ "sha256:287605bede6bd36e930577c5925fcea17cb30453d96a7b4c63c14a257118dbb9",
268
+ "sha256:2aaf6a0a6465d39b5ca69688fce82d20088c1838534982996ec46633dc7ad6cc",
269
+ "sha256:32a73c53783becdb7eaf75a2a1525ea8e49379fb7248c3eeefb9412123536387",
270
+ "sha256:41fb58868b816c202e8881fd0f179a4644ce6e7cbbb248ef0283a34b73ec73bb",
271
+ "sha256:4780677767dd52b99f0af1f123bc2c22873d30b474aa0e2fc3fe5e02217687c7",
272
+ "sha256:4878e667ebabe9b65e785ac8da4d48886fe81193a84bbe49f12acff8f7a383a4",
273
+ "sha256:487c8e61d7acc50b8be82bda8c8d21d20e133c3cbf41bd8ad7eb1aaeb3f07c97",
274
+ "sha256:4beea0f31491bc086991b97517b9683e5cfb369205dac0148ef685ac12a20a67",
275
+ "sha256:4cfbe42c686f33944e12f45a27d25a492cc0e43e1dc1da5d6a87cbcaf2e95627",
276
+ "sha256:4d5bae0a37af799207140652a700f21a85946f107a199bcb06720b13a4f1f0b7",
277
+ "sha256:4e285b5f2bf321fc0857b491b5028c5f276ec0c873b985d58d7748ece1d770dd",
278
+ "sha256:57e4d637258703d14171b54203fd6822fda218c6c2658a7d30816b10995f29f3",
279
+ "sha256:5974895115737a74a00b321e339b9c3f45c20275d226398ae79ac008d908bff7",
280
+ "sha256:5ef87fca280fb15342726bd5f980f6faf8b84a5287fcc2d4962ea8af88b35130",
281
+ "sha256:603a464c2e67d8a546ddaa206d98e3246e5db05594b97db844c2f0a1af37cf5b",
282
+ "sha256:6653071f4f9bac46fbc30f3c7838b0e9063ee335908c5d61fb7a4a86c8fd2036",
283
+ "sha256:6ca2264f341dd81e41f3fffecec6e446aa2121e0b8d026fb5130e02de1402785",
284
+ "sha256:6d279033bf614953c3fc4a0aa9ac33a21e8044ca72d4fa8b9273fe75359d5cca",
285
+ "sha256:6d949f53ad4fc7cf02c44d6678e7ff05ec5f5552b235b9e136bd52e9bf730b91",
286
+ "sha256:6daa662aba22ef3258934105be2dd9afa5bb45748f4f702a3b39a5bf53a1f4dc",
287
+ "sha256:6eafc048ea3f1b3c136c71a86db393be36b5b3d9c87b1c25204e7d397cee9536",
288
+ "sha256:830c88747dce8a3e7525defa68afd742b4580df6aa2fdd6f0855481e3994d391",
289
+ "sha256:86e92728ef3fc842c50a5cb1d5ba2bc66db7da08a7af53fb3da79e202d1b2cd3",
290
+ "sha256:8caf4d16b31961e964c62194ea3e26a0e9561cdf72eecb1781458b67ec83423d",
291
+ "sha256:8d1a92d8e90b286d491e5626af53afef2ba04da33e82e30744795c71880eaa21",
292
+ "sha256:8f0a4d179c9a941eb80c3a63cdb495e539e064f8054230844dcf2fcb812b71d3",
293
+ "sha256:9232b09f5efee6a495a99ae6824881940d6447debe272ea400c02e3b68aad85d",
294
+ "sha256:927a9dd016d6033bc12e0bf5dee1dde140235fc8d0d51099353c76081c03dc29",
295
+ "sha256:93e414e3206779ef41e5ff2448067213febf260ba747fc65389a3ddaa3fb8715",
296
+ "sha256:98cafc618614d72b02185ac583c6f7796202062c41d2eeecdf07820bad3295ed",
297
+ "sha256:9c3a88d20e4fe4a2a4a84bf439a5ac9c9aba400b85244c63a1ab7088f85d9d25",
298
+ "sha256:9f36de4cd0c262dd9927886cc2305aa3f2210db437aa4fed3fb4940b8bf4592c",
299
+ "sha256:a60f90bba4c37962cbf210f0188ecca87daafdf60271f4c6948606e4dabf8785",
300
+ "sha256:a614e4afed58c14254e67862456d212c4dcceebab2eaa44d627c2ca04bf86837",
301
+ "sha256:ae06c1e4bc60ee076292e582a7512f304abdf6c70db59b56745cca1684f875a4",
302
+ "sha256:b122a188cd292c4d2fcd78d04f863b789ef43aa129b233d7c9004de08693728b",
303
+ "sha256:b570da8cd0012f4af9fa76a5635cd31f707473e65a5a335b186069d5c7121ff2",
304
+ "sha256:bcaa1c495ce623966d9fc8a187da80082334236a2a1c7e141763ffaf7a405067",
305
+ "sha256:bd34f6d1810d9354dc7e35158aa6cc33456be7706df4420819af6ed966e85448",
306
+ "sha256:be9eb06489bc975c38706902cbc6888f39e946b81383abc2838d186f0e8b6a9d",
307
+ "sha256:c4b2e0559b68455c085fb0f6178e9752c4be3bba104d6e881eb5573b399d1eb2",
308
+ "sha256:c62e8dd9754b7debda0c5ba59d34509c4688f853588d75b53c3791983faa96fc",
309
+ "sha256:c852b1530083a620cb0de5f3cd6826f19862bafeaf77586f1aef326e49d95f0c",
310
+ "sha256:d9fc0bf3ff86c17348dfc5d322f627d78273eba545db865c3cd14b3f19e57fa5",
311
+ "sha256:dad7b164905d3e534883281c050180afcf1e230c3d4a54e8038aa5cfcf312b84",
312
+ "sha256:e5f66bdf0976ec667fc4594d2812a00b07ed14d1b44259d19a41ae3fff99f2b8",
313
+ "sha256:e8f0c9d65da595cfe91713bc1222af9ecabd37971762cb830dea2fc3b3bb2acf",
314
+ "sha256:edffbe3c510d8f4bf8640e02ca019e48a9b72357318383ca60e3330c23aaffc7",
315
+ "sha256:eea5d6443b093e1545ad0210e6cf27f920482bfcf5c77cdc8596aec73523bb7e",
316
+ "sha256:ef72013e20dd5ba86a8ae1aed7f56f31d3374189aa8b433e7b12ad182c0d2dfb",
317
+ "sha256:f05251bbc2145349b8d0b77c0d4e5f3b228418807b1ee27cefb11f69ed3d233b",
318
+ "sha256:f1be258c4d3dc609e654a1dc59d37b17d7fef05df912c01fc2e15eb43a9735f3",
319
+ "sha256:f9ced82717c7ec65a67667bb05865ffe38af0e835cdd78728f1209c8fffe0cad",
320
+ "sha256:fe17d10b97fdf58155f858606bddb4e037b805a60ae023c009f760d8361a4eb8",
321
+ "sha256:fe749b052bb7233fe5d072fcb549221a8cb1a16725c47c37e42b0b9cb3ff2c3f"
322
+ ],
323
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4'",
324
+ "version": "==4.9.1"
325
+ },
326
+ "packaging": {
327
+ "hashes": [
328
+ "sha256:dd47c42927d89ab911e606518907cc2d3a1f38bbd026385970643f9c5b8ecfeb",
329
+ "sha256:ef103e05f519cdc783ae24ea4e2e0f508a9c99b2d4969652eed6a2e1ea5bd522"
330
+ ],
331
+ "markers": "python_version >= '3.6'",
332
+ "version": "==21.3"
333
+ },
334
+ "parsel": {
335
+ "hashes": [
336
+ "sha256:70efef0b651a996cceebc69e55a85eb2233be0890959203ba7c3a03c72725c79",
337
+ "sha256:9e1fa8db1c0b4a878bf34b35c043d89c9d1cbebc23b4d34dbc3c0ec33f2e087d"
338
+ ],
339
+ "version": "==1.6.0"
340
+ },
341
+ "protego": {
342
+ "hashes": [
343
+ "sha256:04419b18f20e8909f1691c6b678392988271cc2a324a72f9663cb3af838b4bf7",
344
+ "sha256:df666d4304dab774e2dc9feb208bb1ac8d71ea5ceec12f4c99eba30fbd642ff2"
345
+ ],
346
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4'",
347
+ "version": "==0.2.1"
348
+ },
349
+ "pyasn1": {
350
+ "hashes": [
351
+ "sha256:014c0e9976956a08139dc0712ae195324a75e142284d5f87f1a87ee1b068a359",
352
+ "sha256:03840c999ba71680a131cfaee6fab142e1ed9bbd9c693e285cc6aca0d555e576",
353
+ "sha256:0458773cfe65b153891ac249bcf1b5f8f320b7c2ce462151f8fa74de8934becf",
354
+ "sha256:08c3c53b75eaa48d71cf8c710312316392ed40899cb34710d092e96745a358b7",
355
+ "sha256:39c7e2ec30515947ff4e87fb6f456dfc6e84857d34be479c9d4a4ba4bf46aa5d",
356
+ "sha256:5c9414dcfede6e441f7e8f81b43b34e834731003427e5b09e4e00e3172a10f00",
357
+ "sha256:6e7545f1a61025a4e58bb336952c5061697da694db1cae97b116e9c46abcf7c8",
358
+ "sha256:78fa6da68ed2727915c4767bb386ab32cdba863caa7dbe473eaae45f9959da86",
359
+ "sha256:7ab8a544af125fb704feadb008c99a88805126fb525280b2270bb25cc1d78a12",
360
+ "sha256:99fcc3c8d804d1bc6d9a099921e39d827026409a58f2a720dcdb89374ea0c776",
361
+ "sha256:aef77c9fb94a3ac588e87841208bdec464471d9871bd5050a287cc9a475cd0ba",
362
+ "sha256:e89bf84b5437b532b0803ba5c9a5e054d21fec423a89952a74f87fa2c9b7bce2",
363
+ "sha256:fec3e9d8e36808a28efb59b489e4528c10ad0f480e57dcc32b4de5c9d8c9fdf3"
364
+ ],
365
+ "version": "==0.4.8"
366
+ },
367
+ "pyasn1-modules": {
368
+ "hashes": [
369
+ "sha256:0845a5582f6a02bb3e1bde9ecfc4bfcae6ec3210dd270522fee602365430c3f8",
370
+ "sha256:0fe1b68d1e486a1ed5473f1302bd991c1611d319bba158e98b106ff86e1d7199",
371
+ "sha256:15b7c67fabc7fc240d87fb9aabf999cf82311a6d6fb2c70d00d3d0604878c811",
372
+ "sha256:426edb7a5e8879f1ec54a1864f16b882c2837bfd06eee62f2c982315ee2473ed",
373
+ "sha256:65cebbaffc913f4fe9e4808735c95ea22d7a7775646ab690518c056784bc21b4",
374
+ "sha256:905f84c712230b2c592c19470d3ca8d552de726050d1d1716282a1f6146be65e",
375
+ "sha256:a50b808ffeb97cb3601dd25981f6b016cbb3d31fbf57a8b8a87428e6158d0c74",
376
+ "sha256:a99324196732f53093a84c4369c996713eb8c89d360a496b599fb1a9c47fc3eb",
377
+ "sha256:b80486a6c77252ea3a3e9b1e360bc9cf28eaac41263d173c032581ad2f20fe45",
378
+ "sha256:c29a5e5cc7a3f05926aff34e097e84f8589cd790ce0ed41b67aed6857b26aafd",
379
+ "sha256:cbac4bc38d117f2a49aeedec4407d23e8866ea4ac27ff2cf7fb3e5b570df19e0",
380
+ "sha256:f39edd8c4ecaa4556e989147ebf219227e2cd2e8a43c7e7fcb1f1c18c5fd6a3d",
381
+ "sha256:fe0644d9ab041506b62782e92b06b8c68cca799e1a9636ec398675459e031405"
382
+ ],
383
+ "version": "==0.2.8"
384
+ },
385
+ "pycparser": {
386
+ "hashes": [
387
+ "sha256:8ee45429555515e1f6b185e78100aea234072576aa43ab53aefcae078162fca9",
388
+ "sha256:e644fdec12f7872f86c58ff790da456218b10f863970249516d60a5eaca77206"
389
+ ],
390
+ "version": "==2.21"
391
+ },
392
+ "pydantic": {
393
+ "hashes": [
394
+ "sha256:05e00dbebbe810b33c7a7362f231893183bcc4251f3f2ff991c31d5c08240c42",
395
+ "sha256:06094d18dd5e6f2bbf93efa54991c3240964bb663b87729ac340eb5014310624",
396
+ "sha256:0b959f4d8211fc964772b595ebb25f7652da3f22322c007b6fed26846a40685e",
397
+ "sha256:19b3b9ccf97af2b7519c42032441a891a5e05c68368f40865a90eb88833c2559",
398
+ "sha256:1b6ee725bd6e83ec78b1aa32c5b1fa67a3a65badddde3976bca5fe4568f27709",
399
+ "sha256:1ee433e274268a4b0c8fde7ad9d58ecba12b069a033ecc4645bb6303c062d2e9",
400
+ "sha256:216f3bcbf19c726b1cc22b099dd409aa371f55c08800bcea4c44c8f74b73478d",
401
+ "sha256:2d0567e60eb01bccda3a4df01df677adf6b437958d35c12a3ac3e0f078b0ee52",
402
+ "sha256:2e05aed07fa02231dbf03d0adb1be1d79cabb09025dd45aa094aa8b4e7b9dcda",
403
+ "sha256:352aedb1d71b8b0736c6d56ad2bd34c6982720644b0624462059ab29bd6e5912",
404
+ "sha256:355639d9afc76bcb9b0c3000ddcd08472ae75318a6eb67a15866b87e2efa168c",
405
+ "sha256:37c90345ec7dd2f1bcef82ce49b6235b40f282b94d3eec47e801baf864d15525",
406
+ "sha256:4b8795290deaae348c4eba0cebb196e1c6b98bdbe7f50b2d0d9a4a99716342fe",
407
+ "sha256:5760e164b807a48a8f25f8aa1a6d857e6ce62e7ec83ea5d5c5a802eac81bad41",
408
+ "sha256:6eb843dcc411b6a2237a694f5e1d649fc66c6064d02b204a7e9d194dff81eb4b",
409
+ "sha256:7b5ba54d026c2bd2cb769d3468885f23f43710f651688e91f5fb1edcf0ee9283",
410
+ "sha256:7c2abc4393dea97a4ccbb4ec7d8658d4e22c4765b7b9b9445588f16c71ad9965",
411
+ "sha256:81a7b66c3f499108b448f3f004801fcd7d7165fb4200acb03f1c2402da73ce4c",
412
+ "sha256:91b8e218852ef6007c2b98cd861601c6a09f1aa32bbbb74fab5b1c33d4a1e410",
413
+ "sha256:9300fcbebf85f6339a02c6994b2eb3ff1b9c8c14f502058b5bf349d42447dcf5",
414
+ "sha256:9cabf4a7f05a776e7793e72793cd92cc865ea0e83a819f9ae4ecccb1b8aa6116",
415
+ "sha256:a1f5a63a6dfe19d719b1b6e6106561869d2efaca6167f84f5ab9347887d78b98",
416
+ "sha256:a4c805731c33a8db4b6ace45ce440c4ef5336e712508b4d9e1aafa617dc9907f",
417
+ "sha256:ae544c47bec47a86bc7d350f965d8b15540e27e5aa4f55170ac6a75e5f73b644",
418
+ "sha256:b97890e56a694486f772d36efd2ba31612739bc6f3caeee50e9e7e3ebd2fdd13",
419
+ "sha256:bb6ad4489af1bac6955d38ebcb95079a836af31e4c4f74aba1ca05bb9f6027bd",
420
+ "sha256:bedf309630209e78582ffacda64a21f96f3ed2e51fbf3962d4d488e503420254",
421
+ "sha256:c1ba1afb396148bbc70e9eaa8c06c1716fdddabaf86e7027c5988bae2a829ab6",
422
+ "sha256:c33602f93bfb67779f9c507e4d69451664524389546bacfe1bee13cae6dc7488",
423
+ "sha256:c4aac8e7103bf598373208f6299fa9a5cfd1fc571f2d40bf1dd1955a63d6eeb5",
424
+ "sha256:c6f981882aea41e021f72779ce2a4e87267458cc4d39ea990729e21ef18f0f8c",
425
+ "sha256:cc78cc83110d2f275ec1970e7a831f4e371ee92405332ebfe9860a715f8336e1",
426
+ "sha256:d49f3db871575e0426b12e2f32fdb25e579dea16486a26e5a0474af87cb1ab0a",
427
+ "sha256:dd3f9a40c16daf323cf913593083698caee97df2804aa36c4b3175d5ac1b92a2",
428
+ "sha256:e0bedafe4bc165ad0a56ac0bd7695df25c50f76961da29c050712596cf092d6d",
429
+ "sha256:e9069e1b01525a96e6ff49e25876d90d5a563bc31c658289a8772ae186552236"
430
+ ],
431
+ "index": "pypi",
432
+ "version": "==1.10.2"
433
+ },
434
+ "pydispatcher": {
435
+ "hashes": [
436
+ "sha256:3d7e4f43c70000a1dca31f92694e99d0101934fa6eab5d5455a758858d86df95"
437
+ ],
438
+ "markers": "platform_python_implementation == 'CPython'",
439
+ "version": "==2.0.6"
440
+ },
441
+ "pyopenssl": {
442
+ "hashes": [
443
+ "sha256:660b1b1425aac4a1bea1d94168a85d99f0b3144c869dd4390d27629d0087f1bf",
444
+ "sha256:ea252b38c87425b64116f808355e8da644ef9b07e429398bfece610f893ee2e0"
445
+ ],
446
+ "markers": "python_version >= '3.6'",
447
+ "version": "==22.0.0"
448
+ },
449
+ "pyparsing": {
450
+ "hashes": [
451
+ "sha256:2b020ecf7d21b687f219b71ecad3631f644a47f01403fa1d1036b0c6416d70fb",
452
+ "sha256:5026bae9a10eeaefb61dab2f09052b9f4307d44aee4eda64b309723d8d206bbc"
453
+ ],
454
+ "markers": "python_full_version >= '3.6.8'",
455
+ "version": "==3.0.9"
456
+ },
457
+ "pyquery": {
458
+ "hashes": [
459
+ "sha256:1fc33b7699455ed25c75282bc8f80ace1ac078b0dda5a933dacbd8b1c1f83963",
460
+ "sha256:a388eefb6bc4a55350de0316fbd97cda999ae669b6743ae5b99102ba54f5aa72"
461
+ ],
462
+ "index": "pypi",
463
+ "version": "==1.4.3"
464
+ },
465
+ "python-dateutil": {
466
+ "hashes": [
467
+ "sha256:0123cacc1627ae19ddf3c27a5de5bd67ee4586fbdd6440d9748f8abb483d3e86",
468
+ "sha256:961d03dc3453ebbc59dbdea9e4e11c5651520a876d0f4db161e8674aae935da9"
469
+ ],
470
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3'",
471
+ "version": "==2.8.2"
472
+ },
473
+ "python-dotenv": {
474
+ "hashes": [
475
+ "sha256:1684eb44636dd462b66c3ee016599815514527ad99965de77f43e0944634a7e5",
476
+ "sha256:b77d08274639e3d34145dfa6c7008e66df0f04b7be7a75fd0d5292c191d79045"
477
+ ],
478
+ "index": "pypi",
479
+ "version": "==0.21.0"
480
+ },
481
+ "queuelib": {
482
+ "hashes": [
483
+ "sha256:4b207267f2642a8699a1f806045c56eb7ad1a85a10c0e249884580d139c2fcd2",
484
+ "sha256:4b96d48f650a814c6fb2fd11b968f9c46178b683aad96d68f930fe13a8574d19"
485
+ ],
486
+ "markers": "python_version >= '3.5'",
487
+ "version": "==1.6.2"
488
+ },
489
+ "redis": {
490
+ "hashes": [
491
+ "sha256:a52d5694c9eb4292770084fa8c863f79367ca19884b329ab574d5cb2036b3e54",
492
+ "sha256:ddf27071df4adf3821c4f2ca59d67525c3a82e5f268bed97b813cb4fabf87880"
493
+ ],
494
+ "index": "pypi",
495
+ "version": "==4.3.4"
496
+ },
497
+ "requests": {
498
+ "hashes": [
499
+ "sha256:7c5599b102feddaa661c826c56ab4fee28bfd17f5abca1ebbe3e7f19d7c97983",
500
+ "sha256:8fefa2a1a1365bf5520aac41836fbee479da67864514bdb821f31ce07ce65349"
501
+ ],
502
+ "index": "pypi",
503
+ "version": "==2.28.1"
504
+ },
505
+ "requests-file": {
506
+ "hashes": [
507
+ "sha256:07d74208d3389d01c38ab89ef403af0cfec63957d53a0081d8eca738d0247d8e",
508
+ "sha256:dfe5dae75c12481f68ba353183c53a65e6044c923e64c24b2209f6c7570ca953"
509
+ ],
510
+ "version": "==1.5.1"
511
+ },
512
+ "scrapy": {
513
+ "hashes": [
514
+ "sha256:53528bcaf8c2c77aca359af11f349dec5dad98845a13d4c0bb9abd07f302298d",
515
+ "sha256:55e21181165f25337105fff1efc8393296375cea7de699a7e703bbd265595f26"
516
+ ],
517
+ "index": "pypi",
518
+ "version": "==2.6.2"
519
+ },
520
+ "scrapy-fake-useragent": {
521
+ "hashes": [
522
+ "sha256:3b17e982e646918dc25080da0672812d07bfb7a92a58377c014c74e0182c665e",
523
+ "sha256:da0589d9245fe6348b491821f3be3387dd6563540146058e6b6c4f1bbe1358bf"
524
+ ],
525
+ "index": "pypi",
526
+ "version": "==1.4.4"
527
+ },
528
+ "scrapy-user-agents": {
529
+ "hashes": [
530
+ "sha256:284c9af555f3128697a2953ab3cdb987b160b091a12896562d969cf9e81d1350",
531
+ "sha256:aa1f78c8cbae42f1a7159c5ea16c2638ac17e78d7d44111d164ed099ec48705f"
532
+ ],
533
+ "index": "pypi",
534
+ "version": "==0.1.1"
535
+ },
536
+ "service-identity": {
537
+ "hashes": [
538
+ "sha256:6e6c6086ca271dc11b033d17c3a8bea9f24ebff920c587da090afc9519419d34",
539
+ "sha256:f0b0caac3d40627c3c04d7a51b6e06721857a0e10a8775f2d1d7e72901b3a7db"
540
+ ],
541
+ "version": "==21.1.0"
542
+ },
543
+ "setuptools": {
544
+ "hashes": [
545
+ "sha256:2e24e0bec025f035a2e72cdd1961119f557d78ad331bb00ff82efb2ab8da8e82",
546
+ "sha256:7732871f4f7fa58fb6bdcaeadb0161b2bd046c85905dbaa066bdcbcc81953b57"
547
+ ],
548
+ "markers": "python_version >= '3.7'",
549
+ "version": "==65.3.0"
550
+ },
551
+ "six": {
552
+ "hashes": [
553
+ "sha256:1e61c37477a1626458e36f7b1d82aa5c9b094fa4802892072e49de9c60c4c926",
554
+ "sha256:8abb2f1d86890a2dfb989f9a77cfcfd3e47c2a354b01111771326f8aa26e0254"
555
+ ],
556
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3'",
557
+ "version": "==1.16.0"
558
+ },
559
+ "tldextract": {
560
+ "hashes": [
561
+ "sha256:35a0260570e214d8d3cfeeb403992fe9e2b686925f63c9b03c5933408ac2aa5a",
562
+ "sha256:fe15ac3205e5a25b61689369f98cb45c7778a8f2af113d7c11559ece5195f2d6"
563
+ ],
564
+ "markers": "python_version >= '3.7'",
565
+ "version": "==3.3.1"
566
+ },
567
+ "twisted": {
568
+ "hashes": [
569
+ "sha256:8d4718d1e48dcc28933f8beb48dc71cfe77a125e37ad1eb7a3d0acc49baf6c99",
570
+ "sha256:e5b60de39f2d1da153fbe1874d885fe3fcbdb21fcc446fa759a53e8fc3513bed"
571
+ ],
572
+ "markers": "python_full_version >= '3.7.1'",
573
+ "version": "==22.8.0"
574
+ },
575
+ "typing-extensions": {
576
+ "hashes": [
577
+ "sha256:25642c956049920a5aa49edcdd6ab1e06d7e5d467fc00e0506c44ac86fbfca02",
578
+ "sha256:e6d2677a32f47fc7eb2795db1dd15c1f34eff616bcaf2cfb5e997f854fa1c4a6"
579
+ ],
580
+ "markers": "python_version >= '3.7'",
581
+ "version": "==4.3.0"
582
+ },
583
+ "ua-parser": {
584
+ "hashes": [
585
+ "sha256:ed3efc695f475ffe56248c9789b3016247e9c20e3556cfa4d5aadc78ab4b26c6",
586
+ "sha256:f97126300df8ac0f8f2c9d8559669532d626a1af529265fd253cba56e73ab36e"
587
+ ],
588
+ "version": "==0.16.1"
589
+ },
590
+ "urllib3": {
591
+ "hashes": [
592
+ "sha256:3fa96cf423e6987997fc326ae8df396db2a8b7c667747d47ddd8ecba91f4a74e",
593
+ "sha256:b930dd878d5a8afb066a637fbb35144fe7901e3b209d1cd4f524bd0e9deee997"
594
+ ],
595
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4, 3.5' and python_version < '4'",
596
+ "version": "==1.26.12"
597
+ },
598
+ "user-agents": {
599
+ "hashes": [
600
+ "sha256:a98c4dc72ecbc64812c4534108806fb0a0b3a11ec3fd1eafe807cee5b0a942e7",
601
+ "sha256:d36d25178db65308d1458c5fa4ab39c9b2619377010130329f3955e7626ead26"
602
+ ],
603
+ "version": "==2.2.0"
604
+ },
605
+ "w3lib": {
606
+ "hashes": [
607
+ "sha256:13df15f8c17b163de0fd5faa892c1ad143e190dfcbdb98534bb975eb37c6c7d6",
608
+ "sha256:c5d966f86ae3fb546854478c769250c3ccb7581515b3221bcd2f864440000188"
609
+ ],
610
+ "markers": "python_version >= '3.6'",
611
+ "version": "==2.0.1"
612
+ },
613
+ "wrapt": {
614
+ "hashes": [
615
+ "sha256:00b6d4ea20a906c0ca56d84f93065b398ab74b927a7a3dbd470f6fc503f95dc3",
616
+ "sha256:01c205616a89d09827986bc4e859bcabd64f5a0662a7fe95e0d359424e0e071b",
617
+ "sha256:02b41b633c6261feff8ddd8d11c711df6842aba629fdd3da10249a53211a72c4",
618
+ "sha256:07f7a7d0f388028b2df1d916e94bbb40624c59b48ecc6cbc232546706fac74c2",
619
+ "sha256:11871514607b15cfeb87c547a49bca19fde402f32e2b1c24a632506c0a756656",
620
+ "sha256:1b376b3f4896e7930f1f772ac4b064ac12598d1c38d04907e696cc4d794b43d3",
621
+ "sha256:21ac0156c4b089b330b7666db40feee30a5d52634cc4560e1905d6529a3897ff",
622
+ "sha256:257fd78c513e0fb5cdbe058c27a0624c9884e735bbd131935fd49e9fe719d310",
623
+ "sha256:2b39d38039a1fdad98c87279b48bc5dce2c0ca0d73483b12cb72aa9609278e8a",
624
+ "sha256:2cf71233a0ed05ccdabe209c606fe0bac7379fdcf687f39b944420d2a09fdb57",
625
+ "sha256:2fe803deacd09a233e4762a1adcea5db5d31e6be577a43352936179d14d90069",
626
+ "sha256:3232822c7d98d23895ccc443bbdf57c7412c5a65996c30442ebe6ed3df335383",
627
+ "sha256:34aa51c45f28ba7f12accd624225e2b1e5a3a45206aa191f6f9aac931d9d56fe",
628
+ "sha256:36f582d0c6bc99d5f39cd3ac2a9062e57f3cf606ade29a0a0d6b323462f4dd87",
629
+ "sha256:380a85cf89e0e69b7cfbe2ea9f765f004ff419f34194018a6827ac0e3edfed4d",
630
+ "sha256:40e7bc81c9e2b2734ea4bc1aceb8a8f0ceaac7c5299bc5d69e37c44d9081d43b",
631
+ "sha256:43ca3bbbe97af00f49efb06e352eae40434ca9d915906f77def219b88e85d907",
632
+ "sha256:4fcc4649dc762cddacd193e6b55bc02edca674067f5f98166d7713b193932b7f",
633
+ "sha256:5a0f54ce2c092aaf439813735584b9537cad479575a09892b8352fea5e988dc0",
634
+ "sha256:5a9a0d155deafd9448baff28c08e150d9b24ff010e899311ddd63c45c2445e28",
635
+ "sha256:5b02d65b9ccf0ef6c34cba6cf5bf2aab1bb2f49c6090bafeecc9cd81ad4ea1c1",
636
+ "sha256:60db23fa423575eeb65ea430cee741acb7c26a1365d103f7b0f6ec412b893853",
637
+ "sha256:642c2e7a804fcf18c222e1060df25fc210b9c58db7c91416fb055897fc27e8cc",
638
+ "sha256:6a9a25751acb379b466ff6be78a315e2b439d4c94c1e99cb7266d40a537995d3",
639
+ "sha256:6b1a564e6cb69922c7fe3a678b9f9a3c54e72b469875aa8018f18b4d1dd1adf3",
640
+ "sha256:6d323e1554b3d22cfc03cd3243b5bb815a51f5249fdcbb86fda4bf62bab9e164",
641
+ "sha256:6e743de5e9c3d1b7185870f480587b75b1cb604832e380d64f9504a0535912d1",
642
+ "sha256:709fe01086a55cf79d20f741f39325018f4df051ef39fe921b1ebe780a66184c",
643
+ "sha256:7b7c050ae976e286906dd3f26009e117eb000fb2cf3533398c5ad9ccc86867b1",
644
+ "sha256:7d2872609603cb35ca513d7404a94d6d608fc13211563571117046c9d2bcc3d7",
645
+ "sha256:7ef58fb89674095bfc57c4069e95d7a31cfdc0939e2a579882ac7d55aadfd2a1",
646
+ "sha256:80bb5c256f1415f747011dc3604b59bc1f91c6e7150bd7db03b19170ee06b320",
647
+ "sha256:81b19725065dcb43df02b37e03278c011a09e49757287dca60c5aecdd5a0b8ed",
648
+ "sha256:833b58d5d0b7e5b9832869f039203389ac7cbf01765639c7309fd50ef619e0b1",
649
+ "sha256:88bd7b6bd70a5b6803c1abf6bca012f7ed963e58c68d76ee20b9d751c74a3248",
650
+ "sha256:8ad85f7f4e20964db4daadcab70b47ab05c7c1cf2a7c1e51087bfaa83831854c",
651
+ "sha256:8c0ce1e99116d5ab21355d8ebe53d9460366704ea38ae4d9f6933188f327b456",
652
+ "sha256:8d649d616e5c6a678b26d15ece345354f7c2286acd6db868e65fcc5ff7c24a77",
653
+ "sha256:903500616422a40a98a5a3c4ff4ed9d0066f3b4c951fa286018ecdf0750194ef",
654
+ "sha256:9736af4641846491aedb3c3f56b9bc5568d92b0692303b5a305301a95dfd38b1",
655
+ "sha256:988635d122aaf2bdcef9e795435662bcd65b02f4f4c1ae37fbee7401c440b3a7",
656
+ "sha256:9cca3c2cdadb362116235fdbd411735de4328c61425b0aa9f872fd76d02c4e86",
657
+ "sha256:9e0fd32e0148dd5dea6af5fee42beb949098564cc23211a88d799e434255a1f4",
658
+ "sha256:9f3e6f9e05148ff90002b884fbc2a86bd303ae847e472f44ecc06c2cd2fcdb2d",
659
+ "sha256:a85d2b46be66a71bedde836d9e41859879cc54a2a04fad1191eb50c2066f6e9d",
660
+ "sha256:a9a52172be0b5aae932bef82a79ec0a0ce87288c7d132946d645eba03f0ad8a8",
661
+ "sha256:aa31fdcc33fef9eb2552cbcbfee7773d5a6792c137b359e82879c101e98584c5",
662
+ "sha256:b014c23646a467558be7da3d6b9fa409b2c567d2110599b7cf9a0c5992b3b471",
663
+ "sha256:b21bb4c09ffabfa0e85e3a6b623e19b80e7acd709b9f91452b8297ace2a8ab00",
664
+ "sha256:b5901a312f4d14c59918c221323068fad0540e34324925c8475263841dbdfe68",
665
+ "sha256:b9b7a708dd92306328117d8c4b62e2194d00c365f18eff11a9b53c6f923b01e3",
666
+ "sha256:d1967f46ea8f2db647c786e78d8cc7e4313dbd1b0aca360592d8027b8508e24d",
667
+ "sha256:d52a25136894c63de15a35bc0bdc5adb4b0e173b9c0d07a2be9d3ca64a332735",
668
+ "sha256:d77c85fedff92cf788face9bfa3ebaa364448ebb1d765302e9af11bf449ca36d",
669
+ "sha256:d79d7d5dc8a32b7093e81e97dad755127ff77bcc899e845f41bf71747af0c569",
670
+ "sha256:dbcda74c67263139358f4d188ae5faae95c30929281bc6866d00573783c422b7",
671
+ "sha256:ddaea91abf8b0d13443f6dac52e89051a5063c7d014710dcb4d4abb2ff811a59",
672
+ "sha256:dee0ce50c6a2dd9056c20db781e9c1cfd33e77d2d569f5d1d9321c641bb903d5",
673
+ "sha256:dee60e1de1898bde3b238f18340eec6148986da0455d8ba7848d50470a7a32fb",
674
+ "sha256:e2f83e18fe2f4c9e7db597e988f72712c0c3676d337d8b101f6758107c42425b",
675
+ "sha256:e3fb1677c720409d5f671e39bac6c9e0e422584e5f518bfd50aa4cbbea02433f",
676
+ "sha256:ee2b1b1769f6707a8a445162ea16dddf74285c3964f605877a20e38545c3c462",
677
+ "sha256:ee6acae74a2b91865910eef5e7de37dc6895ad96fa23603d1d27ea69df545015",
678
+ "sha256:ef3f72c9666bba2bab70d2a8b79f2c6d2c1a42a7f7e2b0ec83bb2f9e383950af"
679
+ ],
680
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4'",
681
+ "version": "==1.14.1"
682
+ },
683
+ "zope.interface": {
684
+ "hashes": [
685
+ "sha256:08f9636e99a9d5410181ba0729e0408d3d8748026ea938f3b970a0249daa8192",
686
+ "sha256:0b465ae0962d49c68aa9733ba92a001b2a0933c317780435f00be7ecb959c702",
687
+ "sha256:0cba8477e300d64a11a9789ed40ee8932b59f9ee05f85276dbb4b59acee5dd09",
688
+ "sha256:0cee5187b60ed26d56eb2960136288ce91bcf61e2a9405660d271d1f122a69a4",
689
+ "sha256:0ea1d73b7c9dcbc5080bb8aaffb776f1c68e807767069b9ccdd06f27a161914a",
690
+ "sha256:0f91b5b948686659a8e28b728ff5e74b1be6bf40cb04704453617e5f1e945ef3",
691
+ "sha256:15e7d1f7a6ee16572e21e3576d2012b2778cbacf75eb4b7400be37455f5ca8bf",
692
+ "sha256:17776ecd3a1fdd2b2cd5373e5ef8b307162f581c693575ec62e7c5399d80794c",
693
+ "sha256:194d0bcb1374ac3e1e023961610dc8f2c78a0f5f634d0c737691e215569e640d",
694
+ "sha256:1c0e316c9add0db48a5b703833881351444398b04111188069a26a61cfb4df78",
695
+ "sha256:205e40ccde0f37496904572035deea747390a8b7dc65146d30b96e2dd1359a83",
696
+ "sha256:273f158fabc5ea33cbc936da0ab3d4ba80ede5351babc4f577d768e057651531",
697
+ "sha256:2876246527c91e101184f63ccd1d716ec9c46519cc5f3d5375a3351c46467c46",
698
+ "sha256:2c98384b254b37ce50eddd55db8d381a5c53b4c10ee66e1e7fe749824f894021",
699
+ "sha256:2e5a26f16503be6c826abca904e45f1a44ff275fdb7e9d1b75c10671c26f8b94",
700
+ "sha256:334701327f37c47fa628fc8b8d28c7d7730ce7daaf4bda1efb741679c2b087fc",
701
+ "sha256:3748fac0d0f6a304e674955ab1365d515993b3a0a865e16a11ec9d86fb307f63",
702
+ "sha256:3c02411a3b62668200910090a0dff17c0b25aaa36145082a5a6adf08fa281e54",
703
+ "sha256:3dd4952748521205697bc2802e4afac5ed4b02909bb799ba1fe239f77fd4e117",
704
+ "sha256:3f24df7124c323fceb53ff6168da70dbfbae1442b4f3da439cd441681f54fe25",
705
+ "sha256:469e2407e0fe9880ac690a3666f03eb4c3c444411a5a5fddfdabc5d184a79f05",
706
+ "sha256:4de4bc9b6d35c5af65b454d3e9bc98c50eb3960d5a3762c9438df57427134b8e",
707
+ "sha256:5208ebd5152e040640518a77827bdfcc73773a15a33d6644015b763b9c9febc1",
708
+ "sha256:52de7fc6c21b419078008f697fd4103dbc763288b1406b4562554bd47514c004",
709
+ "sha256:5bb3489b4558e49ad2c5118137cfeaf59434f9737fa9c5deefc72d22c23822e2",
710
+ "sha256:5dba5f530fec3f0988d83b78cc591b58c0b6eb8431a85edd1569a0539a8a5a0e",
711
+ "sha256:5dd9ca406499444f4c8299f803d4a14edf7890ecc595c8b1c7115c2342cadc5f",
712
+ "sha256:5f931a1c21dfa7a9c573ec1f50a31135ccce84e32507c54e1ea404894c5eb96f",
713
+ "sha256:63b82bb63de7c821428d513607e84c6d97d58afd1fe2eb645030bdc185440120",
714
+ "sha256:66c0061c91b3b9cf542131148ef7ecbecb2690d48d1612ec386de9d36766058f",
715
+ "sha256:6f0c02cbb9691b7c91d5009108f975f8ffeab5dff8f26d62e21c493060eff2a1",
716
+ "sha256:71aace0c42d53abe6fc7f726c5d3b60d90f3c5c055a447950ad6ea9cec2e37d9",
717
+ "sha256:7d97a4306898b05404a0dcdc32d9709b7d8832c0c542b861d9a826301719794e",
718
+ "sha256:7df1e1c05304f26faa49fa752a8c690126cf98b40b91d54e6e9cc3b7d6ffe8b7",
719
+ "sha256:8270252effc60b9642b423189a2fe90eb6b59e87cbee54549db3f5562ff8d1b8",
720
+ "sha256:867a5ad16892bf20e6c4ea2aab1971f45645ff3102ad29bd84c86027fa99997b",
721
+ "sha256:877473e675fdcc113c138813a5dd440da0769a2d81f4d86614e5d62b69497155",
722
+ "sha256:8892f89999ffd992208754851e5a052f6b5db70a1e3f7d54b17c5211e37a98c7",
723
+ "sha256:9a9845c4c6bb56e508651f005c4aeb0404e518c6f000d5a1123ab077ab769f5c",
724
+ "sha256:a1e6e96217a0f72e2b8629e271e1b280c6fa3fe6e59fa8f6701bec14e3354325",
725
+ "sha256:a8156e6a7f5e2a0ff0c5b21d6bcb45145efece1909efcbbbf48c56f8da68221d",
726
+ "sha256:a9506a7e80bcf6eacfff7f804c0ad5350c8c95b9010e4356a4b36f5322f09abb",
727
+ "sha256:af310ec8335016b5e52cae60cda4a4f2a60a788cbb949a4fbea13d441aa5a09e",
728
+ "sha256:b0297b1e05fd128d26cc2460c810d42e205d16d76799526dfa8c8ccd50e74959",
729
+ "sha256:bf68f4b2b6683e52bec69273562df15af352e5ed25d1b6641e7efddc5951d1a7",
730
+ "sha256:d0c1bc2fa9a7285719e5678584f6b92572a5b639d0e471bb8d4b650a1a910920",
731
+ "sha256:d4d9d6c1a455d4babd320203b918ccc7fcbefe308615c521062bc2ba1aa4d26e",
732
+ "sha256:db1fa631737dab9fa0b37f3979d8d2631e348c3b4e8325d6873c2541d0ae5a48",
733
+ "sha256:dd93ea5c0c7f3e25335ab7d22a507b1dc43976e1345508f845efc573d3d779d8",
734
+ "sha256:f44e517131a98f7a76696a7b21b164bcb85291cee106a23beccce454e1f433a4",
735
+ "sha256:f7ee479e96f7ee350db1cf24afa5685a5899e2b34992fb99e1f7c1b0b758d263"
736
+ ],
737
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4'",
738
+ "version": "==5.4.0"
739
+ }
740
+ },
741
+ "develop": {}
742
+ }
ptt-crawler/README.md ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # **批踢踢爬蟲 ptt-crawler**
2
+ ### 學術研究用途,請勿不當使用。
3
+
4
+ This project scrapes the post details from the website [PTT](https://term.ptt.cc/), and writes the scraped items to csv files.
5
+
6
+
7
+ | author | alias |title | date | ip | city | country | ups | downs | comments | url |
8
+ |----|----|----|----|----|----|----|----|----|----|----|
9
+ | jason789780 | majiLove | \[請益\] google問題的精確與方向 | 2022-09-06 10:39:42 | 223.137.68.113 | Yilan | Taiwan | 9 | 0 | 29 | https://www.ptt.cc/bbs/Soft_Job/M.1662431984.A.A3F.html |
10
+ | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
11
+
12
+
13
+
14
+ ## **說明**
15
+ ### 1. Installation
16
+
17
+ 1. Python version
18
+ * `python >= 3.9`
19
+
20
+ 2. Clone repository
21
+
22
+ ```bash
23
+ git clone [email protected]:lopentu/nlp_web.git
24
+ ```
25
+
26
+ 3. Install Requirement
27
+ ```bash
28
+ cd nlp_web/assignments/ptt-crawler && pip install -r requirements.txt
29
+ ```
30
+
31
+
32
+ ### 2. 使用方式
33
+
34
+ 1. Commands
35
+ ```
36
+ scrapy crawl ptt -a boards=BOARDS [-a scrap_all=BOOLEAN]
37
+ [-a index_from=NUMBER -a index_to=NUMBER]
38
+ [-a since=YEAR] [-a data_dir=PATH]
39
+ [-a ip_cache=BOOLEAN]
40
+
41
+ positional arguments:
42
+ -a boards=BOARDS ptt board name (e.g. Soft_Job)
43
+ -a index_from=NUMBER -a index_to=NUMBER html index number from a ptt board
44
+ -a scrap_all=BOOLEAN scrap all posts if true
45
+ -a since=YEAR scrap all posts from a given year
46
+ -a data_dir=PATH output file path (default: ./data)
47
+ -a ip_cache=BOOLEAN enable redis service to cache ip if true
48
+ ```
49
+
50
+ > If you enable `ip_cache`, please make sure you have Redis on your local machine. Otherwise, you can use `docker-compose` to run the crawler.
51
+
52
+
53
+ * Crawl all the posts of a board:
54
+ ```bash
55
+ scrapy crawl ptt -a boards=Soft_Job -a scrap_all=True
56
+ ```
57
+
58
+ * Crawl all the posts of a board from a year in the past:
59
+ ```bash
60
+ scrapy crawl ptt -a boards=Soft_Job -a since=2020
61
+ ```
62
+
63
+ * Crawl the posts of a board based on html indexes:
64
+ ```bash
65
+ scrapy crawl ptt -a boards=Soft_Job -a index_from=1722 -a index_to=1723
66
+ ```
67
+
68
+ > Please make sure the number of `index_from` is greater than `index_to`.
69
+
70
+ * Crawl the posts of multiple boards. For example:
71
+ ```bash
72
+ scrapy crawl ptt -a boards=Soft_Job,Gossiping -a index_from=1722 -a index_to=1723
73
+ ```
74
+
75
+ >Note: the comma in the argument `boards` cannot have spaces. It cannot be `boards=Soft_Job, Baseball` or `boards=["Soft_Job", "Baseball"]`.
76
+
77
+
78
+
79
+ ### 3. 使用 Docker
80
+ A Docker setup is provided for the crawler.
81
+
82
+ To run the crawler, go to the `docker-compose.yml` file to edit the command:
83
+
84
+ ```yaml
85
+ version: "3"
86
+
87
+ services:
88
+ scraptt:
89
+ build: .
90
+ environment:
91
+ - PYTHON_ENV=production
92
+ depends_on:
93
+ - redis
94
+ links:
95
+ - redis
96
+
97
+ # define your crawler here!
98
+ command: bash -c "scrapy crawl ptt -a boards=Soft_Job,Gossiping -a index_from=1722 -a index_to=1723 -a ip_cache=True"
99
+ ```
100
+ > Feel free to change the command as long as it follows the command format as stated above.
101
+
102
+ Now start the crawler:
103
+
104
+ ```bash
105
+ docker-compose up
106
+ ```
107
+
108
+ We suggest setting the argument `ip_cache` to `true` when you run the crawler via Docker. The reason is that the crawler will connect to Redis container, and there is no need for you to have Redis on your local machine. Most importantly, the performance of the crawler will be increased!
109
+
110
+
111
+
112
+ ## Contact
113
+ If you have any suggestion or question, please do not hesitate to email us at [email protected] or [email protected]
ptt-crawler/docker-compose.yml ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ version: "3"
2
+
3
+ services:
4
+ scraptt:
5
+ build: .
6
+ environment:
7
+ - PYTHON_ENV=production
8
+ depends_on:
9
+ - redis
10
+ links:
11
+ - redis
12
+
13
+ # define your crawler here!
14
+ command: bash -c "scrapy crawl ptt -a boards=Soft_Job -a index_from=1500 -a index_to=1500 -a ip_cache=True"
15
+
16
+ volumes:
17
+ - "./data:/app/data"
18
+
19
+ redis:
20
+ image: redis:7
21
+ restart: always
22
+ healthcheck:
23
+ test: "redis-cli ping"
24
+ interval: 3s
25
+ timeout: 3s
26
+ retries: 5
27
+ start_period: 5s
ptt-crawler/requirements.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ redis==4.3.4
2
+ scrapy==2.6.2
3
+ pyquery==1.4.3
4
+ pydantic==1.10.2
5
+ requests==2.28.1
6
+ python-dotenv==0.21.0
7
+ scrapy-user-agents==0.1.1
8
+ scrapy-fake-useragent==1.4.4
ptt-crawler/scraptt/__init__.py ADDED
File without changes
ptt-crawler/scraptt/configs/__init__.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ from .configs import PTT, PTT_BOARD, COOKIES
2
+
3
+
4
+ __all__ = ["PTT", "PTT_BOARD", "COOKIES"]
ptt-crawler/scraptt/configs/configs.py ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # --------------------------------------------------------------------
2
+ # ptt urls
3
+
4
+
5
+ PTT = "https://www.ptt.cc/bbs"
6
+ PTT_BOARD = PTT + "/{}/index{}.html" # template string (board, html index)
7
+
8
+
9
+ # --------------------------------------------------------------------
10
+ # cookies
11
+
12
+
13
+ COOKIES = {"over18": "1"}
ptt-crawler/scraptt/items/__init__.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ from .items import ScrapttItem
2
+
3
+
4
+ __all__ = ["ScrapttItem"]
ptt-crawler/scraptt/items/items.py ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Union
2
+ from pydantic import BaseModel
3
+
4
+
5
+ class ScrapttItem(BaseModel):
6
+ """
7
+ The ScrapttItem object keeps track of an item in inventory.
8
+ """
9
+
10
+ board: str
11
+ author: str
12
+ alias: str
13
+ title: str
14
+ date: str
15
+ ip: str
16
+ city: Union[str, None]
17
+ country: Union[str, None]
18
+ ups: int
19
+ downs: int
20
+ comments: int
21
+ url: str
ptt-crawler/scraptt/middlewares/__init__.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ from .pyquery import PyqueryMiddleware
2
+
3
+
4
+ __all__ = ["PyqueryMiddleware"]
ptt-crawler/scraptt/middlewares/pyquery.py ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from ..configs import PTT
2
+ from pyquery import PyQuery
3
+ from scrapy.http.response.html import HtmlResponse
4
+
5
+
6
+ class PyqueryMiddleware:
7
+ """
8
+ The PyqueryMiddleware object injects PyQuery object into Scrapy `response`.
9
+ """
10
+
11
+ def process_response(self, request, response, spider) -> HtmlResponse:
12
+ response.dom = PyQuery(response.text).make_links_absolute(PTT)
13
+ return response
ptt-crawler/scraptt/models/__init__.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ from .redis import redis_cli
2
+
3
+
4
+ __all__ = ["redis_cli"]
ptt-crawler/scraptt/models/redis.py ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import redis
3
+ from pathlib import Path
4
+ from dotenv import load_dotenv
5
+
6
+ env_path = Path("__file__").resolve().parent / ".env"
7
+ load_dotenv(env_path)
8
+
9
+ is_production = os.environ.get("PYTHON_ENV") == "production"
10
+ host = "redis" if is_production else "localhost"
11
+
12
+ pool = redis.ConnectionPool(host=host, port=6379, decode_responses=True)
13
+ redis_cli = redis.Redis(connection_pool=pool)
ptt-crawler/scraptt/pipelines/__init__.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ from .csv import CsvPipeline
2
+
3
+
4
+ __all__ = ["CsvPipeline"]
ptt-crawler/scraptt/pipelines/csv.py ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from pathlib import Path
2
+ from io import BufferedWriter
3
+ from datetime import datetime
4
+ from ..spiders import PttSpider
5
+ from typing import Any, Dict, Tuple
6
+ from scrapy.exporters import BaseItemExporter, CsvItemExporter
7
+
8
+
9
+ class CsvPipeline:
10
+ """
11
+ The CsvPipeline object writes the scraped item to csv.
12
+ """
13
+
14
+ def open_spider(self, spider: PttSpider) -> None:
15
+ self.exporters_list: Dict[str, Tuple[BaseItemExporter, BufferedWriter]] = {}
16
+
17
+ def _exporter_for_item(
18
+ self, item: Dict[str, Any], spider: PttSpider
19
+ ) -> CsvItemExporter:
20
+ data_dir = spider.data_dir
21
+ board = item.pop("board")
22
+ date = datetime.strptime(item["date"], "%Y-%m-%d %H:%M:%S")
23
+ year = date.year
24
+ month = date.month
25
+ dir_path = f"{data_dir}/{board}/{year}"
26
+ file_path = f"{dir_path}/{board}_{year}_{month}"
27
+ Path(dir_path).mkdir(parents=True, exist_ok=True)
28
+
29
+ if file_path not in self.exporters_list:
30
+ file = open(f"{file_path}.csv", "wb")
31
+ exporter = CsvItemExporter(file)
32
+ exporter.start_exporting()
33
+ self.exporters_list[file_path] = (exporter, file)
34
+
35
+ return self.exporters_list[file_path][0]
36
+
37
+ def process_item(self, item: Dict[str, Any], spider: PttSpider) -> Dict[str, Any]:
38
+ exporter = self._exporter_for_item(item, spider)
39
+ exporter.export_item(item)
40
+ return item
41
+
42
+ def close_spider(self, spider: PttSpider) -> None:
43
+ for exporter, csv_file in self.exporters_list.values():
44
+ exporter.finish_exporting()
45
+ csv_file.close()
ptt-crawler/scraptt/settings.py ADDED
@@ -0,0 +1,96 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Scrapy settings for scraptt project
2
+ #
3
+ # For simplicity, this file contains only settings considered important or
4
+ # commonly used. You can find more settings consulting the documentation:
5
+ #
6
+ # https://docs.scrapy.org/en/latest/topics/settings.html
7
+ # https://docs.scrapy.org/en/latest/topics/downloader-middleware.html
8
+ # https://docs.scrapy.org/en/latest/topics/spider-middleware.html
9
+
10
+ BOT_NAME = "scraptt"
11
+
12
+ SPIDER_MODULES = ["scraptt.spiders"]
13
+ NEWSPIDER_MODULE = "scraptt.spiders"
14
+
15
+
16
+ # Crawl responsibly by identifying yourself (and your website) on the user-agent
17
+ # USER_AGENT = 'scraptt (+http://www.yourdomain.com)'
18
+
19
+ # Obey robots.txt rules
20
+ ROBOTSTXT_OBEY = False
21
+
22
+ # Configure maximum concurrent requests performed by Scrapy (default: 16)
23
+ CONCURRENT_REQUESTS = 16
24
+
25
+ # Configure a delay for requests for the same website (default: 0)
26
+ # See https://docs.scrapy.org/en/latest/topics/settings.html#download-delay
27
+ # See also autothrottle settings and docs
28
+ DOWNLOAD_DELAY = 0.4
29
+ # The download delay setting will honor only one of:
30
+ CONCURRENT_REQUESTS_PER_DOMAIN = 16
31
+ CONCURRENT_REQUESTS_PER_IP = 16
32
+
33
+ # Disable cookies (enabled by default)
34
+ COOKIES_ENABLED = True
35
+
36
+ # Disable Telnet Console (enabled by default)
37
+ TELNETCONSOLE_ENABLED = False
38
+
39
+ # Override the default request headers:
40
+ # DEFAULT_REQUEST_HEADERS = {
41
+ # 'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
42
+ # 'Accept-Language': 'en',
43
+ # }
44
+
45
+ # Enable or disable spider middlewares
46
+ # See https://docs.scrapy.org/en/latest/topics/spider-middleware.html
47
+ # SPIDER_MIDDLEWARES = {
48
+ # 'scraptt.middlewares.ScrapttSpiderMiddleware': 543,
49
+ # }
50
+
51
+ # Enable or disable downloader middlewares
52
+ # See https://docs.scrapy.org/en/latest/topics/downloader-middleware.html
53
+ DOWNLOADER_MIDDLEWARES = {
54
+ # "scraptt.middlewares.ScrapttDownloaderMiddleware": 543,
55
+ "scraptt.middlewares.PyqueryMiddleware": 543,
56
+ "scrapy.downloadermiddlewares.useragent.UserAgentMiddleware": None,
57
+ "scrapy_user_agents.middlewares.RandomUserAgentMiddleware": 400,
58
+ }
59
+
60
+ # Enable or disable extensions
61
+ # See https://docs.scrapy.org/en/latest/topics/extensions.html
62
+ EXTENSIONS = {
63
+ "scrapy.extensions.telnet.TelnetConsole": None,
64
+ }
65
+
66
+ # Configure item pipelines
67
+ # See https://docs.scrapy.org/en/latest/topics/item-pipeline.html
68
+ ITEM_PIPELINES = {
69
+ 'scraptt.pipelines.CsvPipeline': 300,
70
+ }
71
+
72
+ # Enable and configure the AutoThrottle extension (disabled by default)
73
+ # See https://docs.scrapy.org/en/latest/topics/autothrottle.html
74
+ # AUTOTHROTTLE_ENABLED = True
75
+ # The initial download delay
76
+ # AUTOTHROTTLE_START_DELAY = 5
77
+ # The maximum download delay to be set in case of high latencies
78
+ # AUTOTHROTTLE_MAX_DELAY = 60
79
+ # The average number of requests Scrapy should be sending in parallel to
80
+ # each remote server
81
+ # AUTOTHROTTLE_TARGET_CONCURRENCY = 1.0
82
+ # Enable showing throttling stats for every response received:
83
+ # AUTOTHROTTLE_DEBUG = False
84
+
85
+ # Enable and configure HTTP caching (disabled by default)
86
+ # See https://docs.scrapy.org/en/latest/topics/downloader-middleware.html#httpcache-middleware-settings
87
+ # HTTPCACHE_ENABLED = True
88
+ # HTTPCACHE_EXPIRATION_SECS = 0
89
+ # HTTPCACHE_DIR = 'httpcache'
90
+ # HTTPCACHE_IGNORE_HTTP_CODES = []
91
+ # HTTPCACHE_STORAGE = 'scrapy.extensions.httpcache.FilesystemCacheStorage'
92
+
93
+
94
+ RETRY_ENABLED = True
95
+ RETRY_HTTP_CODES = [500, 502, 503, 504, 520, 521, 522, 524, 525, 408, 429]
96
+ RETRY_TIMES = 5
ptt-crawler/scraptt/spiders/__init__.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ from .ptt import PttSpider
2
+
3
+
4
+ __all__ = ["PttSpider"]
ptt-crawler/scraptt/spiders/base/__init__.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ from .base import BaseSpider
2
+
3
+
4
+ __all__ = ["BaseSpider"]
ptt-crawler/scraptt/spiders/base/base.py ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from scrapy import Spider
2
+ from typing import Optional
3
+ from ..utils.parsers.html import (
4
+ IndexParser,
5
+ LatestIndexParser,
6
+ YearBackwardIndexParser,
7
+ get_title_tags,
8
+ )
9
+ from abc import ABC, abstractmethod
10
+ from ..utils.requests import fetch_ptt_boards
11
+ from scrapy.http.response.html import HtmlResponse
12
+
13
+
14
+ class BaseSpider(Spider, ABC):
15
+ """
16
+ The BasePostSpider object defines the behaviour for crawling and parsing ptt posts.
17
+ """
18
+
19
+ allowed_domains = ["ptt.cc"]
20
+
21
+ def __init__(
22
+ self,
23
+ boards: str,
24
+ data_dir: str = "./data",
25
+ ip_cache: bool = False,
26
+ scrap_all: Optional[bool] = None,
27
+ index_from: Optional[int] = None,
28
+ index_to: Optional[int] = None,
29
+ since: Optional[int] = None,
30
+ *args,
31
+ **kwargs
32
+ ) -> None:
33
+ super().__init__(*args, **kwargs)
34
+ self.boards = boards.split(",")
35
+ self.data_dir = data_dir
36
+ self.ip_cache = ip_cache
37
+ self.scrap_all = scrap_all
38
+ self.index_from = index_from
39
+ self.index_to = index_to
40
+ self.since = since
41
+
42
+ def start_requests(self):
43
+ return fetch_ptt_boards(
44
+ self.boards, self.parse_index, self.index_from, self.index_to
45
+ )
46
+
47
+ def parse_index(self, response: HtmlResponse):
48
+ title_tags = get_title_tags(response)
49
+
50
+ if self.scrap_all:
51
+ return LatestIndexParser(self.logger).parse(response, self.parse_index)
52
+ elif self.since:
53
+ return YearBackwardIndexParser(
54
+ self.since,
55
+ title_tags,
56
+ self.logger,
57
+ ).parse(response, callback=self.parse, self_callback=self.parse_index)
58
+ else:
59
+ return IndexParser(title_tags).parse(self.parse)
60
+
61
+ @abstractmethod
62
+ def parse(self, response: HtmlResponse, **kwargs):
63
+ pass
ptt-crawler/scraptt/spiders/ptt.py ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import asyncio
2
+ from .base import BaseSpider
3
+ from ..items import ScrapttItem
4
+ from scrapy.http.response.html import HtmlResponse
5
+ from .utils.parsers.posts.meta import get_meta_data
6
+ from .utils.parsers.posts.ip import get_ip, get_ip_loc
7
+ from .utils.parsers.posts.comments import count_comments
8
+
9
+
10
+ async def get_post_data(response: HtmlResponse):
11
+ return await asyncio.gather(
12
+ *[get_meta_data(response), count_comments(response), get_ip(response)]
13
+ )
14
+
15
+
16
+ class PttSpider(BaseSpider):
17
+ name = "ptt"
18
+
19
+ def __init__(self, **kwargs) -> None:
20
+ super().__init__(**kwargs)
21
+
22
+ def parse(self, response: HtmlResponse):
23
+ post_url = response.url
24
+ meta_data, comment_counter, ip = asyncio.run(get_post_data(response))
25
+ author, alias, board, title, date = meta_data
26
+ ups = comment_counter["推"]
27
+ downs = comment_counter["噓"]
28
+ comments = comment_counter["→"]
29
+ city, country = get_ip_loc(ip, self.ip_cache)
30
+
31
+ data = {
32
+ "board": board,
33
+ "author": author,
34
+ "alias": alias,
35
+ "title": title,
36
+ "date": date,
37
+ "ip": ip,
38
+ "city": city,
39
+ "country": country,
40
+ "ups": ups,
41
+ "downs": downs,
42
+ "comments": comments,
43
+ "url": post_url,
44
+ }
45
+
46
+ yield ScrapttItem(**data).dict()
ptt-crawler/scraptt/spiders/utils/parsers/html/__init__.py ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from .index import IndexParser
2
+ from .utils import get_title_tags
3
+ from .latest_index import LatestIndexParser
4
+ from .year_backward_index import YearBackwardIndexParser
5
+
6
+
7
+ __all__ = [
8
+ "IndexParser",
9
+ "get_title_tags",
10
+ "LatestIndexParser",
11
+ "YearBackwardIndexParser",
12
+ ]
ptt-crawler/scraptt/spiders/utils/parsers/html/base.py ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Callable
2
+ from abc import ABC, abstractmethod
3
+ from scrapy.http.response.html import HtmlResponse
4
+
5
+
6
+ class Parser(ABC):
7
+ """
8
+ The Parser object defines the behaviour for processing the response and
9
+ returning scraped data or more URLs to follow.
10
+ """
11
+
12
+ @abstractmethod
13
+ def parse(self, response: HtmlResponse, callback: Callable, **kwargs):
14
+ """The parse method initiates the parsing processes."""
15
+ pass
ptt-crawler/scraptt/spiders/utils/parsers/html/index.py ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from .base import Parser
2
+ from .....configs import COOKIES
3
+ from typing import Callable, List
4
+ from dataclasses import dataclass
5
+ from scrapy import Request, Selector
6
+
7
+
8
+ @dataclass
9
+ class IndexParser(Parser):
10
+ """
11
+ The IndexParser object parses one of the index.html files.
12
+ """
13
+
14
+ title_tags: List[Selector]
15
+
16
+ def parse(self, callback: Callable):
17
+ tag_lists = list(self.title_tags.items())
18
+
19
+ for title_tag in tag_lists:
20
+ url = title_tag.attr("href")
21
+ yield Request(url, cookies=COOKIES, callback=callback)
ptt-crawler/scraptt/spiders/utils/parsers/html/latest_index.py ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import re
2
+ from .base import Parser
3
+ from scrapy import Request
4
+ from typing import Callable
5
+ from .....configs import COOKIES
6
+ from logging import LoggerAdapter
7
+ from dataclasses import dataclass
8
+ from scrapy.http.response.html import HtmlResponse
9
+
10
+
11
+ @dataclass
12
+ class LatestIndexParser(Parser):
13
+ """
14
+ The LatestIndexParser objects parses the latest index.html file.
15
+ """
16
+
17
+ logger: LoggerAdapter
18
+
19
+ def get_latest_index(self, prev_url: str):
20
+ return int(re.search(r"index(\d{1,6})\.html", prev_url).group(1))
21
+
22
+ def get_board(self, url: str):
23
+ return re.search(r"www\.ptt\.cc\/bbs\/([\w\d\-_]{1,30})\/", url).group(1)
24
+
25
+ def parse(self, response: HtmlResponse, callback: Callable):
26
+ prev_url = response.css('.btn.wide:contains("上頁")::attr(href)').get()
27
+ self.logger.info(f"index link: {prev_url}")
28
+
29
+ latest_index = self.get_latest_index(prev_url)
30
+ board = self.get_board(response.url)
31
+
32
+ for index in range(1, latest_index + 1):
33
+ url = f"https://www.ptt.cc/bbs/{board}/index{index}.html"
34
+ self.logger.info(f"index link: {url}")
35
+
36
+ yield Request(url, cookies=COOKIES, callback=callback)
ptt-crawler/scraptt/spiders/utils/parsers/html/utils.py ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import List
2
+ from scrapy.selector import Selector
3
+ from scrapy.http.response.html import HtmlResponse
4
+
5
+
6
+ def get_title_tags(response: HtmlResponse) -> List[Selector]:
7
+ """The get_title_tags function gets the title tags DOM.
8
+ Args:
9
+ response (HtmlResponse): the scrapy HtmlResponse.
10
+ Returns:
11
+ a list of scrapy anchor tag selectors
12
+ """
13
+ title_css = ".r-ent .title a"
14
+
15
+ if response.url.endswith("index.html"):
16
+ return response.dom(".r-list-sep").prev_all(title_css)
17
+
18
+ return response.dom(title_css)
ptt-crawler/scraptt/spiders/utils/parsers/html/year_backward_index.py ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import re
2
+ from .base import Parser
3
+ from datetime import datetime
4
+ from .....configs import COOKIES
5
+ from logging import LoggerAdapter
6
+ from typing import Callable, List
7
+ from dataclasses import dataclass
8
+ from scrapy import Request, Selector
9
+ from scrapy.http.response.html import HtmlResponse
10
+
11
+
12
+ @dataclass
13
+ class YearBackwardIndexParser(Parser):
14
+ """
15
+ The YearBackwardIndexParser object parses the index.html files from a year in the
16
+ past to the current one.
17
+ """
18
+
19
+ since: str
20
+ title_tags: List[Selector]
21
+ logger: LoggerAdapter
22
+
23
+ def parse(
24
+ self, response: HtmlResponse, callback: Callable, self_callback: Callable
25
+ ):
26
+ for title_tag in reversed(list(self.title_tags.items())):
27
+ title = title_tag.text()
28
+ post_url = title_tag.attr("href")
29
+ timestamp = re.search(r"(\d{10})", post_url).group(1)
30
+
31
+ if int(timestamp) < int(self.since):
32
+ return None
33
+
34
+ self.logger.info(
35
+ f"+ {title}, {post_url}, {datetime.fromtimestamp(int(timestamp))}"
36
+ )
37
+
38
+ yield Request(post_url, cookies=COOKIES, callback=callback)
39
+
40
+ prev_url = response.dom('.btn.wide:contains("上頁")').attr("href")
41
+ self.logger.info(f"index link: {prev_url}")
42
+
43
+ if prev_url:
44
+ yield Request(prev_url, cookies=COOKIES, callback=self_callback)
ptt-crawler/scraptt/spiders/utils/parsers/posts/comments/__init__.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ from .counter import count_comments
2
+
3
+
4
+ __all__ = ["count_comments"]
ptt-crawler/scraptt/spiders/utils/parsers/posts/comments/counter.py ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import List
2
+ from collections import Counter
3
+ from scrapy.http.response.html import HtmlResponse
4
+
5
+
6
+ async def count_comments(response: HtmlResponse) -> Counter:
7
+ """The count_comments function counts the total number of comments in a ptt post.
8
+
9
+ Args:
10
+ response (HtmlResponse): the response to parse
11
+ Returns:
12
+ a Counter object.
13
+ """
14
+
15
+ push_tags: List[str] = response.css('span[class*="push-tag"]::text').getall()
16
+ total_comments = [push_tag.strip() for push_tag in push_tags]
17
+ return Counter(total_comments)
ptt-crawler/scraptt/spiders/utils/parsers/posts/ip/__init__.py ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ from .ip import get_ip
2
+ from .location import get_ip_loc
3
+
4
+
5
+ __all__ = ["get_ip", "get_ip_loc"]
ptt-crawler/scraptt/spiders/utils/parsers/posts/ip/ip.py ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import re
2
+ from scrapy.http.response.html import HtmlResponse
3
+
4
+
5
+ async def get_ip(response: HtmlResponse) -> str:
6
+ """The get_ip function gets the ip address from a ptt post.
7
+
8
+ Args:
9
+ response (HtmlResponse): the response to parse
10
+ Returns:
11
+ a str
12
+ """
13
+ f2_spans = response.dom(".f2")
14
+ old_ip_format = "([0-9.]*)$"
15
+ old_ip = re.search(old_ip_format, f"{f2_spans}").group(1)
16
+
17
+ if old_ip:
18
+ return old_ip
19
+
20
+ f2_spans_list = [f2_span.text() for f2_span in f2_spans.items()]
21
+
22
+ try:
23
+ text = [
24
+ f2_span
25
+ for f2_span in f2_spans_list
26
+ if re.match(r"※ 發信站: 批踢踢實業坊\(ptt\.cc\), 來自:", f2_span)
27
+ ][0]
28
+ return re.search(r"來自: ([0-9.]*)", text).group(1)
29
+
30
+ except:
31
+ ip_match = r"\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3}"
32
+ text = [span for span in f2_spans_list if re.findall(ip_match, span)][-1]
33
+ return re.findall(ip_match, text)[-1]
ptt-crawler/scraptt/spiders/utils/parsers/posts/ip/location.py ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import re
2
+ import requests
3
+ from typing import Tuple
4
+ from ......models import redis_cli
5
+ from requests.adapters import HTTPAdapter, Retry
6
+ from scrapy.http.response.html import HtmlResponse
7
+
8
+
9
+ def fetch_ip(ip: str) -> Tuple[str, str]:
10
+ session = requests.Session()
11
+ retries = Retry(total=5, backoff_factor=1, status_forcelist=[502, 503, 504])
12
+ session.mount("http://", HTTPAdapter(max_retries=retries))
13
+
14
+ response = requests.get(f"http://www.geoplugin.net/json.gp?ip={ip}")
15
+ result = response.json()
16
+ city = result["geoplugin_city"]
17
+ country = result["geoplugin_countryName"]
18
+ return city, country
19
+
20
+
21
+ def fetch_ip_with_cache(ip) -> Tuple[str, str]:
22
+ ip_result = redis_cli.hgetall(ip)
23
+
24
+ if ip_result:
25
+ city = ip_result["city"]
26
+ country = ip_result["country"]
27
+ return city, country
28
+
29
+ city, country = fetch_ip(ip)
30
+
31
+ ttl = 10 * 60
32
+ redis_cli.hset(ip, mapping={"city": city, "country": country})
33
+ redis_cli.expire(name=ip, time=ttl)
34
+
35
+ return city, country
36
+
37
+
38
+ def get_ip_loc(ip: str, ip_cache: bool) -> Tuple[str, str]:
39
+ """The get_ip_loc function get info from an ip.
40
+
41
+ Args:
42
+ ip (str): the ip from a ptt post.
43
+ ip_cache (bool): a boolean that is used to determine whether
44
+ to enable redis service to cache ip.
45
+ Returns:
46
+ a tuple, containing city and country
47
+ """
48
+ if ip_cache:
49
+ return fetch_ip_with_cache(ip)
50
+
51
+ return fetch_ip(ip)
ptt-crawler/scraptt/spiders/utils/parsers/posts/meta/__init__.py ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ from .post import get_meta_data
2
+
3
+ __all__ = ['get_meta_data']
ptt-crawler/scraptt/spiders/utils/parsers/posts/meta/date.py ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import re
2
+ from datetime import datetime
3
+
4
+
5
+ async def format_date(str_date: str) -> str:
6
+ """The format_date function formats dates and times of a ptt post.
7
+
8
+ Args:
9
+ str_date (str): a string date from a ptt post
10
+ Returns:
11
+ a str
12
+ """
13
+ str_format = "%Y-%m-%d %H:%M:%S"
14
+
15
+ try:
16
+ return datetime.strptime(str_date, "%a %b %d %H:%M:%S %Y").strftime(str_format)
17
+ except:
18
+ # handle incomplete date
19
+ str_date = re.match(r"(.*\d{2}:\d{2}:\d{2}).*", str_date).group(1)
20
+ date = datetime.strptime(str_date, "%a %b %d %H:%M:%S")
21
+ date = date.replace(year=datetime.now().year)
22
+ return date.strftime(str_format)
ptt-crawler/scraptt/spiders/utils/parsers/posts/meta/post.py ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import re
2
+ from typing import List
3
+ from .date import format_date
4
+ from scrapy.http.response.html import HtmlResponse
5
+
6
+ meta_tag_selector = '//*[@id="main-content"]/div/span[@class="article-meta-tag"]'
7
+
8
+
9
+ async def get_meta_data(response: HtmlResponse) -> List[str]:
10
+ """The get_meta_data function gets the meta data from a ptt post.
11
+
12
+ Args:
13
+ response (HtmlResponse): the response to parse
14
+ Returns:
15
+ a list of strings
16
+ """
17
+
18
+ meta_tag = response.xpath(
19
+ f"{meta_tag_selector}/following-sibling::*/text()"
20
+ ).getall()
21
+
22
+ author_info = meta_tag[0]
23
+ author = re.search(r"([^(]*)", author_info).group(1).strip()
24
+ alias_match = re.search(r"\((.*)\)", author_info)
25
+ alias = alias_match.group(1) if alias_match else ""
26
+ meta_tag[0] = author
27
+ meta_tag[-1] = await format_date(meta_tag[-1])
28
+ meta_tag.insert(1, alias)
29
+ return meta_tag
ptt-crawler/scraptt/spiders/utils/requests/__init__.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ from .requests import fetch_ptt_boards
2
+
3
+
4
+ __all__ = ["fetch_ptt_boards"]
ptt-crawler/scraptt/spiders/utils/requests/requests.py ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from scrapy import Request
2
+ from ....configs import PTT_BOARD, COOKIES
3
+ from typing import Callable, List, Optional
4
+
5
+
6
+ def fetch_ptt_boards(
7
+ boards_list: List[str],
8
+ callback: Callable,
9
+ index_from: Optional[str] = None,
10
+ index_to: Optional[str] = None,
11
+ ):
12
+ """The fetch_ptt_boards function fetches the ptt boards htm indexes.
13
+
14
+ Args:
15
+ boards_list (list): a list of boards
16
+ callback (Callable): a scrapy parse function
17
+ index_from (str | None): the starting html index
18
+ index_to (str | None): the ending html index
19
+ Returns:
20
+ a scrapy Request.
21
+ """
22
+
23
+ for board in boards_list:
24
+ if index_from is not None and index_to is not None:
25
+ if int(index_from) > int(index_to):
26
+ raise ValueError(
27
+ "the value of `index_from` cannot be greater than `index_to`."
28
+ )
29
+
30
+ for index in range(int(index_from), int(index_to) + 1):
31
+ url = PTT_BOARD.format(board, index)
32
+ yield Request(url, cookies=COOKIES, callback=callback)
33
+ else:
34
+ url = PTT_BOARD.format(board, "")
35
+ yield Request(url, cookies=COOKIES, callback=callback)
ptt-crawler/scrapy.cfg ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Automatically created by: scrapy startproject
2
+ #
3
+ # For more information about the [deploy] section see:
4
+ # https://scrapyd.readthedocs.io/en/latest/deploy.html
5
+
6
+ [settings]
7
+ default = scraptt.settings
8
+
9
+ [deploy]
10
+ #url = http://localhost:6800/
11
+ project = scraptt
requirements.txt ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ aiofiles==0.8.0
2
+ cwngraph==0.4.0
3
+ distiltag==0.2.2
4
+ streamlit==1.12.2
5
+ python-dotenv==0.20.0
6
+ cwnsensetagger==0.1.6
7
+ ckip-transformers==0.3.2
twNLP-app/Dockerfile ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ FROM python:3.7-slim
2
+
3
+ WORKDIR /app
4
+
5
+ COPY ./Pipfile* ./
6
+
7
+ RUN pip install pipenv && \
8
+ apt-get update && \
9
+ apt-get install -y --no-install-recommends gcc python3-dev libssl-dev && \
10
+ pipenv install --deploy --system && \
11
+ apt-get remove -y gcc python3-dev libssl-dev && \
12
+ apt-get autoremove -y && \
13
+ pip uninstall pipenv -y \
14
+ && rm -rf /var/lib/apt/lists/*
15
+
16
+ COPY ./.streamlit ./.streamlit
17
+
18
+ COPY ./src ./src
19
+
20
+ EXPOSE 8501
twNLP-app/LICENSE ADDED
@@ -0,0 +1,201 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Apache License
2
+ Version 2.0, January 2004
3
+ http://www.apache.org/licenses/
4
+
5
+ TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
6
+
7
+ 1. Definitions.
8
+
9
+ "License" shall mean the terms and conditions for use, reproduction,
10
+ and distribution as defined by Sections 1 through 9 of this document.
11
+
12
+ "Licensor" shall mean the copyright owner or entity authorized by
13
+ the copyright owner that is granting the License.
14
+
15
+ "Legal Entity" shall mean the union of the acting entity and all
16
+ other entities that control, are controlled by, or are under common
17
+ control with that entity. For the purposes of this definition,
18
+ "control" means (i) the power, direct or indirect, to cause the
19
+ direction or management of such entity, whether by contract or
20
+ otherwise, or (ii) ownership of fifty percent (50%) or more of the
21
+ outstanding shares, or (iii) beneficial ownership of such entity.
22
+
23
+ "You" (or "Your") shall mean an individual or Legal Entity
24
+ exercising permissions granted by this License.
25
+
26
+ "Source" form shall mean the preferred form for making modifications,
27
+ including but not limited to software source code, documentation
28
+ source, and configuration files.
29
+
30
+ "Object" form shall mean any form resulting from mechanical
31
+ transformation or translation of a Source form, including but
32
+ not limited to compiled object code, generated documentation,
33
+ and conversions to other media types.
34
+
35
+ "Work" shall mean the work of authorship, whether in Source or
36
+ Object form, made available under the License, as indicated by a
37
+ copyright notice that is included in or attached to the work
38
+ (an example is provided in the Appendix below).
39
+
40
+ "Derivative Works" shall mean any work, whether in Source or Object
41
+ form, that is based on (or derived from) the Work and for which the
42
+ editorial revisions, annotations, elaborations, or other modifications
43
+ represent, as a whole, an original work of authorship. For the purposes
44
+ of this License, Derivative Works shall not include works that remain
45
+ separable from, or merely link (or bind by name) to the interfaces of,
46
+ the Work and Derivative Works thereof.
47
+
48
+ "Contribution" shall mean any work of authorship, including
49
+ the original version of the Work and any modifications or additions
50
+ to that Work or Derivative Works thereof, that is intentionally
51
+ submitted to Licensor for inclusion in the Work by the copyright owner
52
+ or by an individual or Legal Entity authorized to submit on behalf of
53
+ the copyright owner. For the purposes of this definition, "submitted"
54
+ means any form of electronic, verbal, or written communication sent
55
+ to the Licensor or its representatives, including but not limited to
56
+ communication on electronic mailing lists, source code control systems,
57
+ and issue tracking systems that are managed by, or on behalf of, the
58
+ Licensor for the purpose of discussing and improving the Work, but
59
+ excluding communication that is conspicuously marked or otherwise
60
+ designated in writing by the copyright owner as "Not a Contribution."
61
+
62
+ "Contributor" shall mean Licensor and any individual or Legal Entity
63
+ on behalf of whom a Contribution has been received by Licensor and
64
+ subsequently incorporated within the Work.
65
+
66
+ 2. Grant of Copyright License. Subject to the terms and conditions of
67
+ this License, each Contributor hereby grants to You a perpetual,
68
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
69
+ copyright license to reproduce, prepare Derivative Works of,
70
+ publicly display, publicly perform, sublicense, and distribute the
71
+ Work and such Derivative Works in Source or Object form.
72
+
73
+ 3. Grant of Patent License. Subject to the terms and conditions of
74
+ this License, each Contributor hereby grants to You a perpetual,
75
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
76
+ (except as stated in this section) patent license to make, have made,
77
+ use, offer to sell, sell, import, and otherwise transfer the Work,
78
+ where such license applies only to those patent claims licensable
79
+ by such Contributor that are necessarily infringed by their
80
+ Contribution(s) alone or by combination of their Contribution(s)
81
+ with the Work to which such Contribution(s) was submitted. If You
82
+ institute patent litigation against any entity (including a
83
+ cross-claim or counterclaim in a lawsuit) alleging that the Work
84
+ or a Contribution incorporated within the Work constitutes direct
85
+ or contributory patent infringement, then any patent licenses
86
+ granted to You under this License for that Work shall terminate
87
+ as of the date such litigation is filed.
88
+
89
+ 4. Redistribution. You may reproduce and distribute copies of the
90
+ Work or Derivative Works thereof in any medium, with or without
91
+ modifications, and in Source or Object form, provided that You
92
+ meet the following conditions:
93
+
94
+ (a) You must give any other recipients of the Work or
95
+ Derivative Works a copy of this License; and
96
+
97
+ (b) You must cause any modified files to carry prominent notices
98
+ stating that You changed the files; and
99
+
100
+ (c) You must retain, in the Source form of any Derivative Works
101
+ that You distribute, all copyright, patent, trademark, and
102
+ attribution notices from the Source form of the Work,
103
+ excluding those notices that do not pertain to any part of
104
+ the Derivative Works; and
105
+
106
+ (d) If the Work includes a "NOTICE" text file as part of its
107
+ distribution, then any Derivative Works that You distribute must
108
+ include a readable copy of the attribution notices contained
109
+ within such NOTICE file, excluding those notices that do not
110
+ pertain to any part of the Derivative Works, in at least one
111
+ of the following places: within a NOTICE text file distributed
112
+ as part of the Derivative Works; within the Source form or
113
+ documentation, if provided along with the Derivative Works; or,
114
+ within a display generated by the Derivative Works, if and
115
+ wherever such third-party notices normally appear. The contents
116
+ of the NOTICE file are for informational purposes only and
117
+ do not modify the License. You may add Your own attribution
118
+ notices within Derivative Works that You distribute, alongside
119
+ or as an addendum to the NOTICE text from the Work, provided
120
+ that such additional attribution notices cannot be construed
121
+ as modifying the License.
122
+
123
+ You may add Your own copyright statement to Your modifications and
124
+ may provide additional or different license terms and conditions
125
+ for use, reproduction, or distribution of Your modifications, or
126
+ for any such Derivative Works as a whole, provided Your use,
127
+ reproduction, and distribution of the Work otherwise complies with
128
+ the conditions stated in this License.
129
+
130
+ 5. Submission of Contributions. Unless You explicitly state otherwise,
131
+ any Contribution intentionally submitted for inclusion in the Work
132
+ by You to the Licensor shall be under the terms and conditions of
133
+ this License, without any additional terms or conditions.
134
+ Notwithstanding the above, nothing herein shall supersede or modify
135
+ the terms of any separate license agreement you may have executed
136
+ with Licensor regarding such Contributions.
137
+
138
+ 6. Trademarks. This License does not grant permission to use the trade
139
+ names, trademarks, service marks, or product names of the Licensor,
140
+ except as required for reasonable and customary use in describing the
141
+ origin of the Work and reproducing the content of the NOTICE file.
142
+
143
+ 7. Disclaimer of Warranty. Unless required by applicable law or
144
+ agreed to in writing, Licensor provides the Work (and each
145
+ Contributor provides its Contributions) on an "AS IS" BASIS,
146
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
147
+ implied, including, without limitation, any warranties or conditions
148
+ of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
149
+ PARTICULAR PURPOSE. You are solely responsible for determining the
150
+ appropriateness of using or redistributing the Work and assume any
151
+ risks associated with Your exercise of permissions under this License.
152
+
153
+ 8. Limitation of Liability. In no event and under no legal theory,
154
+ whether in tort (including negligence), contract, or otherwise,
155
+ unless required by applicable law (such as deliberate and grossly
156
+ negligent acts) or agreed to in writing, shall any Contributor be
157
+ liable to You for damages, including any direct, indirect, special,
158
+ incidental, or consequential damages of any character arising as a
159
+ result of this License or out of the use or inability to use the
160
+ Work (including but not limited to damages for loss of goodwill,
161
+ work stoppage, computer failure or malfunction, or any and all
162
+ other commercial damages or losses), even if such Contributor
163
+ has been advised of the possibility of such damages.
164
+
165
+ 9. Accepting Warranty or Additional Liability. While redistributing
166
+ the Work or Derivative Works thereof, You may choose to offer,
167
+ and charge a fee for, acceptance of support, warranty, indemnity,
168
+ or other liability obligations and/or rights consistent with this
169
+ License. However, in accepting such obligations, You may act only
170
+ on Your own behalf and on Your sole responsibility, not on behalf
171
+ of any other Contributor, and only if You agree to indemnify,
172
+ defend, and hold each Contributor harmless for any liability
173
+ incurred by, or claims asserted against, such Contributor by reason
174
+ of your accepting any such warranty or additional liability.
175
+
176
+ END OF TERMS AND CONDITIONS
177
+
178
+ APPENDIX: How to apply the Apache License to your work.
179
+
180
+ To apply the Apache License to your work, attach the following
181
+ boilerplate notice, with the fields enclosed by brackets "[]"
182
+ replaced with your own identifying information. (Don't include
183
+ the brackets!) The text should be enclosed in the appropriate
184
+ comment syntax for the file format. We also recommend that a
185
+ file or class name and description of purpose be included on the
186
+ same "printed page" as the copyright notice for easier
187
+ identification within third-party archives.
188
+
189
+ Copyright [yyyy] [name of copyright owner]
190
+
191
+ Licensed under the Apache License, Version 2.0 (the "License");
192
+ you may not use this file except in compliance with the License.
193
+ You may obtain a copy of the License at
194
+
195
+ http://www.apache.org/licenses/LICENSE-2.0
196
+
197
+ Unless required by applicable law or agreed to in writing, software
198
+ distributed under the License is distributed on an "AS IS" BASIS,
199
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
200
+ See the License for the specific language governing permissions and
201
+ limitations under the License.
twNLP-app/Pipfile ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [[source]]
2
+ url = "https://pypi.org/simple"
3
+ verify_ssl = true
4
+ name = "pypi"
5
+
6
+ [packages]
7
+ streamlit = "*"
8
+ ckip-transformers = "*"
9
+ cwngraph = "*"
10
+ distiltag = "*"
11
+ cwnsensetagger = "*"
12
+ aiofiles = "*"
13
+ python-dotenv = "*"
14
+
15
+ [dev-packages]
16
+
17
+ [requires]
18
+ python_version = "3.7"
twNLP-app/Pipfile.lock ADDED
@@ -0,0 +1,953 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_meta": {
3
+ "hash": {
4
+ "sha256": "c3ccdc36761e5f63f4df701a2b449aae3db40ccf5b055b6fc06ba39e61001309"
5
+ },
6
+ "pipfile-spec": 6,
7
+ "requires": {
8
+ "python_version": "3.7"
9
+ },
10
+ "sources": [
11
+ {
12
+ "name": "pypi",
13
+ "url": "https://pypi.org/simple",
14
+ "verify_ssl": true
15
+ }
16
+ ]
17
+ },
18
+ "default": {
19
+ "aiofiles": {
20
+ "hashes": [
21
+ "sha256:7a973fc22b29e9962d0897805ace5856e6a566ab1f0c8e5c91ff6c866519c937",
22
+ "sha256:8334f23235248a3b2e83b2c3a78a22674f39969b96397126cc93664d9a901e59"
23
+ ],
24
+ "index": "pypi",
25
+ "version": "==0.8.0"
26
+ },
27
+ "altair": {
28
+ "hashes": [
29
+ "sha256:0c724848ae53410c13fa28be2b3b9a9dcb7b5caa1a70f7f217bd663bb419935a",
30
+ "sha256:d87d9372e63b48cd96b2a6415f0cf9457f50162ab79dc7a31cd7e024dd840026"
31
+ ],
32
+ "markers": "python_version >= '3.7'",
33
+ "version": "==4.2.0"
34
+ },
35
+ "attrs": {
36
+ "hashes": [
37
+ "sha256:29adc2665447e5191d0e7c568fde78b21f9672d344281d0c6e1ab085429b22b6",
38
+ "sha256:86efa402f67bf2df34f51a335487cf46b1ec130d02b8d39fd248abfd30da551c"
39
+ ],
40
+ "markers": "python_version >= '3.5'",
41
+ "version": "==22.1.0"
42
+ },
43
+ "backports.zoneinfo": {
44
+ "hashes": [
45
+ "sha256:17746bd546106fa389c51dbea67c8b7c8f0d14b5526a579ca6ccf5ed72c526cf",
46
+ "sha256:1b13e654a55cd45672cb54ed12148cd33628f672548f373963b0bff67b217328",
47
+ "sha256:1c5742112073a563c81f786e77514969acb58649bcdf6cdf0b4ed31a348d4546",
48
+ "sha256:4a0f800587060bf8880f954dbef70de6c11bbe59c673c3d818921f042f9954a6",
49
+ "sha256:5c144945a7752ca544b4b78c8c41544cdfaf9786f25fe5ffb10e838e19a27570",
50
+ "sha256:7b0a64cda4145548fed9efc10322770f929b944ce5cee6c0dfe0c87bf4c0c8c9",
51
+ "sha256:8439c030a11780786a2002261569bdf362264f605dfa4d65090b64b05c9f79a7",
52
+ "sha256:8961c0f32cd0336fb8e8ead11a1f8cd99ec07145ec2931122faaac1c8f7fd987",
53
+ "sha256:89a48c0d158a3cc3f654da4c2de1ceba85263fafb861b98b59040a5086259722",
54
+ "sha256:a76b38c52400b762e48131494ba26be363491ac4f9a04c1b7e92483d169f6582",
55
+ "sha256:da6013fd84a690242c310d77ddb8441a559e9cb3d3d59ebac9aca1a57b2e18bc",
56
+ "sha256:e55b384612d93be96506932a786bbcde5a2db7a9e6a4bb4bffe8b733f5b9036b",
57
+ "sha256:e81b76cace8eda1fca50e345242ba977f9be6ae3945af8d46326d776b4cf78d1",
58
+ "sha256:e8236383a20872c0cdf5a62b554b27538db7fa1bbec52429d8d106effbaeca08",
59
+ "sha256:f04e857b59d9d1ccc39ce2da1021d196e47234873820cbeaad210724b1ee28ac",
60
+ "sha256:fadbfe37f74051d024037f223b8e001611eac868b5c5b06144ef4d8b799862f2"
61
+ ],
62
+ "markers": "python_version < '3.9'",
63
+ "version": "==0.2.1"
64
+ },
65
+ "beautifulsoup4": {
66
+ "hashes": [
67
+ "sha256:58d5c3d29f5a36ffeb94f02f0d786cd53014cf9b3b3951d42e0080d8a9498d30",
68
+ "sha256:ad9aa55b65ef2808eb405f46cf74df7fcb7044d5cbc26487f96eb2ef2e436693"
69
+ ],
70
+ "markers": "python_version >= '3.6'",
71
+ "version": "==4.11.1"
72
+ },
73
+ "blinker": {
74
+ "hashes": [
75
+ "sha256:1eb563df6fdbc39eeddc177d953203f99f097e9bf0e2b8f9f3cf18b6ca425e36",
76
+ "sha256:923e5e2f69c155f2cc42dafbbd70e16e3fde24d2d4aa2ab72fbe386238892462"
77
+ ],
78
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4'",
79
+ "version": "==1.5"
80
+ },
81
+ "cachetools": {
82
+ "hashes": [
83
+ "sha256:6a94c6402995a99c3970cc7e4884bb60b4a8639938157eeed436098bf9831757",
84
+ "sha256:f9f17d2aec496a9aa6b76f53e3b614c965223c061982d434d160f930c698a9db"
85
+ ],
86
+ "markers": "python_version ~= '3.7'",
87
+ "version": "==5.2.0"
88
+ },
89
+ "certifi": {
90
+ "hashes": [
91
+ "sha256:84c85a9078b11105f04f3036a9482ae10e4621616db313fe045dd24743a0820d",
92
+ "sha256:fe86415d55e84719d75f8b69414f6438ac3547d2078ab91b67e779ef69378412"
93
+ ],
94
+ "markers": "python_version >= '3.6'",
95
+ "version": "==2022.6.15"
96
+ },
97
+ "charset-normalizer": {
98
+ "hashes": [
99
+ "sha256:5a3d016c7c547f69d6f81fb0db9449ce888b418b5b9952cc5e6e66843e9dd845",
100
+ "sha256:83e9a75d1911279afd89352c68b45348559d1fc0506b054b346651b5e7fee29f"
101
+ ],
102
+ "markers": "python_version >= '3.6'",
103
+ "version": "==2.1.1"
104
+ },
105
+ "ckip-transformers": {
106
+ "hashes": [
107
+ "sha256:48affb723a40e535ccbcc0b4bbb14a86695373167218786eb00b06531cebb22e",
108
+ "sha256:a13c8ec21e209d3854601dae623f91046d2ee2c7f3fcb693752bfd57e896c776"
109
+ ],
110
+ "index": "pypi",
111
+ "version": "==0.3.2"
112
+ },
113
+ "click": {
114
+ "hashes": [
115
+ "sha256:7682dc8afb30297001674575ea00d1814d808d6a36af415a82bd481d37ba7b8e",
116
+ "sha256:bb4d8133cb15a609f44e8213d9b391b0809795062913b383c62be0ee95b1db48"
117
+ ],
118
+ "markers": "python_version >= '3.7'",
119
+ "version": "==8.1.3"
120
+ },
121
+ "commonmark": {
122
+ "hashes": [
123
+ "sha256:452f9dc859be7f06631ddcb328b6919c67984aca654e5fefb3914d54691aed60",
124
+ "sha256:da2f38c92590f83de410ba1a3cbceafbc74fee9def35f9251ba9a971d6d66fd9"
125
+ ],
126
+ "version": "==0.9.1"
127
+ },
128
+ "cwngraph": {
129
+ "hashes": [
130
+ "sha256:20acb3e9b6ac86e724537718d729c0fc81c7634932213bef42d8c03c94ae9236",
131
+ "sha256:bb88150cfa088db51b19094794de156d1214539cb67928f35c424e81ab39c392"
132
+ ],
133
+ "index": "pypi",
134
+ "version": "==0.4.0"
135
+ },
136
+ "cwnsensetagger": {
137
+ "hashes": [
138
+ "sha256:00727031fa61585d8b21465630b134b35be37138b6edbad7b7f43c76769a1ca0",
139
+ "sha256:f3a7a720ab81c452cf87294f84bd9e62357000127db39c32526da19fdeddafa0"
140
+ ],
141
+ "index": "pypi",
142
+ "version": "==0.1.6"
143
+ },
144
+ "decorator": {
145
+ "hashes": [
146
+ "sha256:637996211036b6385ef91435e4fae22989472f9d571faba8927ba8253acbc330",
147
+ "sha256:b8c3f85900b9dc423225913c5aace94729fe1fa9763b38939a95226f02d37186"
148
+ ],
149
+ "markers": "python_version >= '3.5'",
150
+ "version": "==5.1.1"
151
+ },
152
+ "distiltag": {
153
+ "hashes": [
154
+ "sha256:24dff55253d54e237aa1339d5d7252de3e2c832b5082ba0751fd946db1f085bd",
155
+ "sha256:2bc723a952cae40ced3478a04698399a91612f8025142c7fb313fd905a6b7a7e"
156
+ ],
157
+ "index": "pypi",
158
+ "version": "==0.2.2"
159
+ },
160
+ "entrypoints": {
161
+ "hashes": [
162
+ "sha256:b706eddaa9218a19ebcd67b56818f05bb27589b1ca9e8d797b74affad4ccacd4",
163
+ "sha256:f174b5ff827504fd3cd97cc3f8649f3693f51538c7e4bdf3ef002c8429d42f9f"
164
+ ],
165
+ "markers": "python_version >= '3.6'",
166
+ "version": "==0.4"
167
+ },
168
+ "filelock": {
169
+ "hashes": [
170
+ "sha256:55447caa666f2198c5b6b13a26d2084d26fa5b115c00d065664b2124680c4edc",
171
+ "sha256:617eb4e5eedc82fc5f47b6d61e4d11cb837c56cb4544e39081099fa17ad109d4"
172
+ ],
173
+ "markers": "python_version >= '3.7'",
174
+ "version": "==3.8.0"
175
+ },
176
+ "gdown": {
177
+ "hashes": [
178
+ "sha256:8217061063d8afcaad9d8e2d5410fbc0989c2b3f0946a6bd9bfeb9461616cc6a"
179
+ ],
180
+ "version": "==4.5.1"
181
+ },
182
+ "gitdb": {
183
+ "hashes": [
184
+ "sha256:8033ad4e853066ba6ca92050b9df2f89301b8fc8bf7e9324d412a63f8bf1a8fd",
185
+ "sha256:bac2fd45c0a1c9cf619e63a90d62bdc63892ef92387424b855792a6cabe789aa"
186
+ ],
187
+ "markers": "python_version >= '3.6'",
188
+ "version": "==4.0.9"
189
+ },
190
+ "gitpython": {
191
+ "hashes": [
192
+ "sha256:1c885ce809e8ba2d88a29befeb385fcea06338d3640712b59ca623c220bb5704",
193
+ "sha256:5b68b000463593e05ff2b261acff0ff0972df8ab1b70d3cdbd41b546c8b8fc3d"
194
+ ],
195
+ "markers": "python_version >= '3.7'",
196
+ "version": "==3.1.27"
197
+ },
198
+ "huggingface-hub": {
199
+ "hashes": [
200
+ "sha256:6395f26aaf44bbb4a73d3e14aca228fa39534696f651c6c82a6347f8c9f5950b",
201
+ "sha256:7a588046bdeb84e7bc99b3da58bbb4312a56d94ba51ebc60dfe610c18b3d0b9f"
202
+ ],
203
+ "markers": "python_version >= '3.7'",
204
+ "version": "==0.9.1"
205
+ },
206
+ "idna": {
207
+ "hashes": [
208
+ "sha256:84d9dd047ffa80596e0f246e2eab0b391788b0503584e8945f2368256d2735ff",
209
+ "sha256:9d643ff0a55b762d5cdb124b8eaa99c66322e2157b69160bc32796e824360e6d"
210
+ ],
211
+ "markers": "python_version >= '3.5'",
212
+ "version": "==3.3"
213
+ },
214
+ "importlib-metadata": {
215
+ "hashes": [
216
+ "sha256:637245b8bab2b6502fcbc752cc4b7a6f6243bb02b31c5c26156ad103d3d45670",
217
+ "sha256:7401a975809ea1fdc658c3aa4f78cc2195a0e019c5cbc4c06122884e9ae80c23"
218
+ ],
219
+ "markers": "python_version >= '3.7'",
220
+ "version": "==4.12.0"
221
+ },
222
+ "importlib-resources": {
223
+ "hashes": [
224
+ "sha256:5481e97fb45af8dcf2f798952625591c58fe599d0735d86b10f54de086a61681",
225
+ "sha256:f78a8df21a79bcc30cfd400bdc38f314333de7c0fb619763f6b9dabab8268bb7"
226
+ ],
227
+ "markers": "python_version < '3.9'",
228
+ "version": "==5.9.0"
229
+ },
230
+ "jinja2": {
231
+ "hashes": [
232
+ "sha256:31351a702a408a9e7595a8fc6150fc3f43bb6bf7e319770cbc0db9df9437e852",
233
+ "sha256:6088930bfe239f0e6710546ab9c19c9ef35e29792895fed6e6e31a023a182a61"
234
+ ],
235
+ "markers": "python_version >= '3.7'",
236
+ "version": "==3.1.2"
237
+ },
238
+ "joblib": {
239
+ "hashes": [
240
+ "sha256:4158fcecd13733f8be669be0683b96ebdbbd38d23559f54dca7205aea1bf1e35",
241
+ "sha256:f21f109b3c7ff9d95f8387f752d0d9c34a02aa2f7060c2135f465da0e5160ff6"
242
+ ],
243
+ "markers": "python_version >= '3.6'",
244
+ "version": "==1.1.0"
245
+ },
246
+ "jsonschema": {
247
+ "hashes": [
248
+ "sha256:15062f4cc6f591400cd528d2c355f2cfa6a57e44c820dc783aee5e23d36a831f",
249
+ "sha256:9892b8d630a82990521a9ca630d3446bd316b5ad54dbe981338802787f3e0d2d"
250
+ ],
251
+ "markers": "python_version >= '3.7'",
252
+ "version": "==4.14.0"
253
+ },
254
+ "markupsafe": {
255
+ "hashes": [
256
+ "sha256:0212a68688482dc52b2d45013df70d169f542b7394fc744c02a57374a4207003",
257
+ "sha256:089cf3dbf0cd6c100f02945abeb18484bd1ee57a079aefd52cffd17fba910b88",
258
+ "sha256:10c1bfff05d95783da83491be968e8fe789263689c02724e0c691933c52994f5",
259
+ "sha256:33b74d289bd2f5e527beadcaa3f401e0df0a89927c1559c8566c066fa4248ab7",
260
+ "sha256:3799351e2336dc91ea70b034983ee71cf2f9533cdff7c14c90ea126bfd95d65a",
261
+ "sha256:3ce11ee3f23f79dbd06fb3d63e2f6af7b12db1d46932fe7bd8afa259a5996603",
262
+ "sha256:421be9fbf0ffe9ffd7a378aafebbf6f4602d564d34be190fc19a193232fd12b1",
263
+ "sha256:43093fb83d8343aac0b1baa75516da6092f58f41200907ef92448ecab8825135",
264
+ "sha256:46d00d6cfecdde84d40e572d63735ef81423ad31184100411e6e3388d405e247",
265
+ "sha256:4a33dea2b688b3190ee12bd7cfa29d39c9ed176bda40bfa11099a3ce5d3a7ac6",
266
+ "sha256:4b9fe39a2ccc108a4accc2676e77da025ce383c108593d65cc909add5c3bd601",
267
+ "sha256:56442863ed2b06d19c37f94d999035e15ee982988920e12a5b4ba29b62ad1f77",
268
+ "sha256:671cd1187ed5e62818414afe79ed29da836dde67166a9fac6d435873c44fdd02",
269
+ "sha256:694deca8d702d5db21ec83983ce0bb4b26a578e71fbdbd4fdcd387daa90e4d5e",
270
+ "sha256:6a074d34ee7a5ce3effbc526b7083ec9731bb3cbf921bbe1d3005d4d2bdb3a63",
271
+ "sha256:6d0072fea50feec76a4c418096652f2c3238eaa014b2f94aeb1d56a66b41403f",
272
+ "sha256:6fbf47b5d3728c6aea2abb0589b5d30459e369baa772e0f37a0320185e87c980",
273
+ "sha256:7f91197cc9e48f989d12e4e6fbc46495c446636dfc81b9ccf50bb0ec74b91d4b",
274
+ "sha256:86b1f75c4e7c2ac2ccdaec2b9022845dbb81880ca318bb7a0a01fbf7813e3812",
275
+ "sha256:8dc1c72a69aa7e082593c4a203dcf94ddb74bb5c8a731e4e1eb68d031e8498ff",
276
+ "sha256:8e3dcf21f367459434c18e71b2a9532d96547aef8a871872a5bd69a715c15f96",
277
+ "sha256:8e576a51ad59e4bfaac456023a78f6b5e6e7651dcd383bcc3e18d06f9b55d6d1",
278
+ "sha256:96e37a3dc86e80bf81758c152fe66dbf60ed5eca3d26305edf01892257049925",
279
+ "sha256:97a68e6ada378df82bc9f16b800ab77cbf4b2fada0081794318520138c088e4a",
280
+ "sha256:99a2a507ed3ac881b975a2976d59f38c19386d128e7a9a18b7df6fff1fd4c1d6",
281
+ "sha256:a49907dd8420c5685cfa064a1335b6754b74541bbb3706c259c02ed65b644b3e",
282
+ "sha256:b09bf97215625a311f669476f44b8b318b075847b49316d3e28c08e41a7a573f",
283
+ "sha256:b7bd98b796e2b6553da7225aeb61f447f80a1ca64f41d83612e6139ca5213aa4",
284
+ "sha256:b87db4360013327109564f0e591bd2a3b318547bcef31b468a92ee504d07ae4f",
285
+ "sha256:bcb3ed405ed3222f9904899563d6fc492ff75cce56cba05e32eff40e6acbeaa3",
286
+ "sha256:d4306c36ca495956b6d568d276ac11fdd9c30a36f1b6eb928070dc5360b22e1c",
287
+ "sha256:d5ee4f386140395a2c818d149221149c54849dfcfcb9f1debfe07a8b8bd63f9a",
288
+ "sha256:dda30ba7e87fbbb7eab1ec9f58678558fd9a6b8b853530e176eabd064da81417",
289
+ "sha256:e04e26803c9c3851c931eac40c695602c6295b8d432cbe78609649ad9bd2da8a",
290
+ "sha256:e1c0b87e09fa55a220f058d1d49d3fb8df88fbfab58558f1198e08c1e1de842a",
291
+ "sha256:e72591e9ecd94d7feb70c1cbd7be7b3ebea3f548870aa91e2732960fa4d57a37",
292
+ "sha256:e8c843bbcda3a2f1e3c2ab25913c80a3c5376cd00c6e8c4a86a89a28c8dc5452",
293
+ "sha256:efc1913fd2ca4f334418481c7e595c00aad186563bbc1ec76067848c7ca0a933",
294
+ "sha256:f121a1420d4e173a5d96e47e9a0c0dcff965afdf1626d28de1460815f7c4ee7a",
295
+ "sha256:fc7b548b17d238737688817ab67deebb30e8073c95749d55538ed473130ec0c7"
296
+ ],
297
+ "markers": "python_version >= '3.7'",
298
+ "version": "==2.1.1"
299
+ },
300
+ "nltk": {
301
+ "hashes": [
302
+ "sha256:ba3de02490308b248f9b94c8bc1ac0683e9aa2ec49ee78536d8667afb5e3eec8",
303
+ "sha256:d6507d6460cec76d70afea4242a226a7542f85c669177b9c7f562b7cf1b05502"
304
+ ],
305
+ "markers": "python_version >= '3.7'",
306
+ "version": "==3.7"
307
+ },
308
+ "numpy": {
309
+ "hashes": [
310
+ "sha256:1dbe1c91269f880e364526649a52eff93ac30035507ae980d2fed33aaee633ac",
311
+ "sha256:357768c2e4451ac241465157a3e929b265dfac85d9214074985b1786244f2ef3",
312
+ "sha256:3820724272f9913b597ccd13a467cc492a0da6b05df26ea09e78b171a0bb9da6",
313
+ "sha256:4391bd07606be175aafd267ef9bea87cf1b8210c787666ce82073b05f202add1",
314
+ "sha256:4aa48afdce4660b0076a00d80afa54e8a97cd49f457d68a4342d188a09451c1a",
315
+ "sha256:58459d3bad03343ac4b1b42ed14d571b8743dc80ccbf27444f266729df1d6f5b",
316
+ "sha256:5c3c8def4230e1b959671eb959083661b4a0d2e9af93ee339c7dada6759a9470",
317
+ "sha256:5f30427731561ce75d7048ac254dbe47a2ba576229250fb60f0fb74db96501a1",
318
+ "sha256:643843bcc1c50526b3a71cd2ee561cf0d8773f062c8cbaf9ffac9fdf573f83ab",
319
+ "sha256:67c261d6c0a9981820c3a149d255a76918278a6b03b6a036800359aba1256d46",
320
+ "sha256:67f21981ba2f9d7ba9ade60c9e8cbaa8cf8e9ae51673934480e45cf55e953673",
321
+ "sha256:6aaf96c7f8cebc220cdfc03f1d5a31952f027dda050e5a703a0d1c396075e3e7",
322
+ "sha256:7c4068a8c44014b2d55f3c3f574c376b2494ca9cc73d2f1bd692382b6dffe3db",
323
+ "sha256:7c7e5fa88d9ff656e067876e4736379cc962d185d5cd808014a8a928d529ef4e",
324
+ "sha256:7f5ae4f304257569ef3b948810816bc87c9146e8c446053539947eedeaa32786",
325
+ "sha256:82691fda7c3f77c90e62da69ae60b5ac08e87e775b09813559f8901a88266552",
326
+ "sha256:8737609c3bbdd48e380d463134a35ffad3b22dc56295eff6f79fd85bd0eeeb25",
327
+ "sha256:9f411b2c3f3d76bba0865b35a425157c5dcf54937f82bbeb3d3c180789dd66a6",
328
+ "sha256:a6be4cb0ef3b8c9250c19cc122267263093eee7edd4e3fa75395dfda8c17a8e2",
329
+ "sha256:bcb238c9c96c00d3085b264e5c1a1207672577b93fa666c3b14a45240b14123a",
330
+ "sha256:bf2ec4b75d0e9356edea834d1de42b31fe11f726a81dfb2c2112bc1eaa508fcf",
331
+ "sha256:d136337ae3cc69aa5e447e78d8e1514be8c3ec9b54264e680cf0b4bd9011574f",
332
+ "sha256:d4bf4d43077db55589ffc9009c0ba0a94fa4908b9586d6ccce2e0b164c86303c",
333
+ "sha256:d6a96eef20f639e6a97d23e57dd0c1b1069a7b4fd7027482a4c5c451cd7732f4",
334
+ "sha256:d9caa9d5e682102453d96a0ee10c7241b72859b01a941a397fd965f23b3e016b",
335
+ "sha256:dd1c8f6bd65d07d3810b90d02eba7997e32abbdf1277a481d698969e921a3be0",
336
+ "sha256:e31f0bb5928b793169b87e3d1e070f2342b22d5245c755e2b81caa29756246c3",
337
+ "sha256:ecb55251139706669fdec2ff073c98ef8e9a84473e51e716211b41aa0f18e656",
338
+ "sha256:ee5ec40fdd06d62fe5d4084bef4fd50fd4bb6bfd2bf519365f569dc470163ab0",
339
+ "sha256:f17e562de9edf691a42ddb1eb4a5541c20dd3f9e65b09ded2beb0799c0cf29bb",
340
+ "sha256:fdffbfb6832cd0b300995a2b08b8f6fa9f6e856d562800fea9182316d99c4e8e"
341
+ ],
342
+ "markers": "python_version < '3.11' and python_version >= '3.7'",
343
+ "version": "==1.21.6"
344
+ },
345
+ "packaging": {
346
+ "hashes": [
347
+ "sha256:dd47c42927d89ab911e606518907cc2d3a1f38bbd026385970643f9c5b8ecfeb",
348
+ "sha256:ef103e05f519cdc783ae24ea4e2e0f508a9c99b2d4969652eed6a2e1ea5bd522"
349
+ ],
350
+ "markers": "python_version >= '3.6'",
351
+ "version": "==21.3"
352
+ },
353
+ "pandas": {
354
+ "hashes": [
355
+ "sha256:1e4285f5de1012de20ca46b188ccf33521bff61ba5c5ebd78b4fb28e5416a9f1",
356
+ "sha256:2651d75b9a167cc8cc572cf787ab512d16e316ae00ba81874b560586fa1325e0",
357
+ "sha256:2c21778a688d3712d35710501f8001cdbf96eb70a7c587a3d5613573299fdca6",
358
+ "sha256:32e1a26d5ade11b547721a72f9bfc4bd113396947606e00d5b4a5b79b3dcb006",
359
+ "sha256:3345343206546545bc26a05b4602b6a24385b5ec7c75cb6059599e3d56831da2",
360
+ "sha256:344295811e67f8200de2390093aeb3c8309f5648951b684d8db7eee7d1c81fb7",
361
+ "sha256:37f06b59e5bc05711a518aa10beaec10942188dccb48918bb5ae602ccbc9f1a0",
362
+ "sha256:552020bf83b7f9033b57cbae65589c01e7ef1544416122da0c79140c93288f56",
363
+ "sha256:5cce0c6bbeb266b0e39e35176ee615ce3585233092f685b6a82362523e59e5b4",
364
+ "sha256:5f261553a1e9c65b7a310302b9dbac31cf0049a51695c14ebe04e4bfd4a96f02",
365
+ "sha256:60a8c055d58873ad81cae290d974d13dd479b82cbb975c3e1fa2cf1920715296",
366
+ "sha256:62d5b5ce965bae78f12c1c0df0d387899dd4211ec0bdc52822373f13a3a022b9",
367
+ "sha256:7d28a3c65463fd0d0ba8bbb7696b23073efee0510783340a44b08f5e96ffce0c",
368
+ "sha256:8025750767e138320b15ca16d70d5cdc1886e8f9cc56652d89735c016cd8aea6",
369
+ "sha256:8b6dbec5f3e6d5dc80dcfee250e0a2a652b3f28663492f7dab9a24416a48ac39",
370
+ "sha256:a395692046fd8ce1edb4c6295c35184ae0c2bbe787ecbe384251da609e27edcb",
371
+ "sha256:a62949c626dd0ef7de11de34b44c6475db76995c2064e2d99c6498c3dba7fe58",
372
+ "sha256:aaf183a615ad790801fa3cf2fa450e5b6d23a54684fe386f7e3208f8b9bfbef6",
373
+ "sha256:adfeb11be2d54f275142c8ba9bf67acee771b7186a5745249c7d5a06c670136b",
374
+ "sha256:b6b87b2fb39e6383ca28e2829cddef1d9fc9e27e55ad91ca9c435572cdba51bf",
375
+ "sha256:bd971a3f08b745a75a86c00b97f3007c2ea175951286cdda6abe543e687e5f2f",
376
+ "sha256:c69406a2808ba6cf580c2255bcf260b3f214d2664a3a4197d0e640f573b46fd3",
377
+ "sha256:d3bc49af96cd6285030a64779de5b3688633a07eb75c124b0747134a63f4c05f",
378
+ "sha256:fd541ab09e1f80a2a1760032d665f6e032d8e44055d602d65eeea6e6e85498cb",
379
+ "sha256:fe95bae4e2d579812865db2212bb733144e34d0c6785c0685329e5b60fcb85dd"
380
+ ],
381
+ "markers": "python_full_version >= '3.7.1'",
382
+ "version": "==1.3.5"
383
+ },
384
+ "pillow": {
385
+ "hashes": [
386
+ "sha256:0030fdbd926fb85844b8b92e2f9449ba89607231d3dd597a21ae72dc7fe26927",
387
+ "sha256:030e3460861488e249731c3e7ab59b07c7853838ff3b8e16aac9561bb345da14",
388
+ "sha256:0ed2c4ef2451de908c90436d6e8092e13a43992f1860275b4d8082667fbb2ffc",
389
+ "sha256:136659638f61a251e8ed3b331fc6ccd124590eeff539de57c5f80ef3a9594e58",
390
+ "sha256:13b725463f32df1bfeacbf3dd197fb358ae8ebcd8c5548faa75126ea425ccb60",
391
+ "sha256:1536ad017a9f789430fb6b8be8bf99d2f214c76502becc196c6f2d9a75b01b76",
392
+ "sha256:15928f824870535c85dbf949c09d6ae7d3d6ac2d6efec80f3227f73eefba741c",
393
+ "sha256:17d4cafe22f050b46d983b71c707162d63d796a1235cdf8b9d7a112e97b15bac",
394
+ "sha256:1802f34298f5ba11d55e5bb09c31997dc0c6aed919658dfdf0198a2fe75d5490",
395
+ "sha256:1cc1d2451e8a3b4bfdb9caf745b58e6c7a77d2e469159b0d527a4554d73694d1",
396
+ "sha256:1fd6f5e3c0e4697fa7eb45b6e93996299f3feee73a3175fa451f49a74d092b9f",
397
+ "sha256:254164c57bab4b459f14c64e93df11eff5ded575192c294a0c49270f22c5d93d",
398
+ "sha256:2ad0d4df0f5ef2247e27fc790d5c9b5a0af8ade9ba340db4a73bb1a4a3e5fb4f",
399
+ "sha256:2c58b24e3a63efd22554c676d81b0e57f80e0a7d3a5874a7e14ce90ec40d3069",
400
+ "sha256:2d33a11f601213dcd5718109c09a52c2a1c893e7461f0be2d6febc2879ec2402",
401
+ "sha256:337a74fd2f291c607d220c793a8135273c4c2ab001b03e601c36766005f36885",
402
+ "sha256:37ff6b522a26d0538b753f0b4e8e164fdada12db6c6f00f62145d732d8a3152e",
403
+ "sha256:3d1f14f5f691f55e1b47f824ca4fdcb4b19b4323fe43cc7bb105988cad7496be",
404
+ "sha256:408673ed75594933714482501fe97e055a42996087eeca7e5d06e33218d05aa8",
405
+ "sha256:4134d3f1ba5f15027ff5c04296f13328fecd46921424084516bdb1b2548e66ff",
406
+ "sha256:4ad2f835e0ad81d1689f1b7e3fbac7b01bb8777d5a985c8962bedee0cc6d43da",
407
+ "sha256:50dff9cc21826d2977ef2d2a205504034e3a4563ca6f5db739b0d1026658e004",
408
+ "sha256:510cef4a3f401c246cfd8227b300828715dd055463cdca6176c2e4036df8bd4f",
409
+ "sha256:5aed7dde98403cd91d86a1115c78d8145c83078e864c1de1064f52e6feb61b20",
410
+ "sha256:69bd1a15d7ba3694631e00df8de65a8cb031911ca11f44929c97fe05eb9b6c1d",
411
+ "sha256:6bf088c1ce160f50ea40764f825ec9b72ed9da25346216b91361eef8ad1b8f8c",
412
+ "sha256:6e8c66f70fb539301e064f6478d7453e820d8a2c631da948a23384865cd95544",
413
+ "sha256:727dd1389bc5cb9827cbd1f9d40d2c2a1a0c9b32dd2261db522d22a604a6eec9",
414
+ "sha256:74a04183e6e64930b667d321524e3c5361094bb4af9083db5c301db64cd341f3",
415
+ "sha256:75e636fd3e0fb872693f23ccb8a5ff2cd578801251f3a4f6854c6a5d437d3c04",
416
+ "sha256:7761afe0126d046974a01e030ae7529ed0ca6a196de3ec6937c11df0df1bc91c",
417
+ "sha256:7888310f6214f19ab2b6df90f3f06afa3df7ef7355fc025e78a3044737fab1f5",
418
+ "sha256:7b0554af24df2bf96618dac71ddada02420f946be943b181108cac55a7a2dcd4",
419
+ "sha256:7c7b502bc34f6e32ba022b4a209638f9e097d7a9098104ae420eb8186217ebbb",
420
+ "sha256:808add66ea764ed97d44dda1ac4f2cfec4c1867d9efb16a33d158be79f32b8a4",
421
+ "sha256:831e648102c82f152e14c1a0938689dbb22480c548c8d4b8b248b3e50967b88c",
422
+ "sha256:93689632949aff41199090eff5474f3990b6823404e45d66a5d44304e9cdc467",
423
+ "sha256:96b5e6874431df16aee0c1ba237574cb6dff1dcb173798faa6a9d8b399a05d0e",
424
+ "sha256:9a54614049a18a2d6fe156e68e188da02a046a4a93cf24f373bffd977e943421",
425
+ "sha256:a138441e95562b3c078746a22f8fca8ff1c22c014f856278bdbdd89ca36cff1b",
426
+ "sha256:a647c0d4478b995c5e54615a2e5360ccedd2f85e70ab57fbe817ca613d5e63b8",
427
+ "sha256:a9c9bc489f8ab30906d7a85afac4b4944a572a7432e00698a7239f44a44e6efb",
428
+ "sha256:ad2277b185ebce47a63f4dc6302e30f05762b688f8dc3de55dbae4651872cdf3",
429
+ "sha256:b6d5e92df2b77665e07ddb2e4dbd6d644b78e4c0d2e9272a852627cdba0d75cf",
430
+ "sha256:bc431b065722a5ad1dfb4df354fb9333b7a582a5ee39a90e6ffff688d72f27a1",
431
+ "sha256:bdd0de2d64688ecae88dd8935012c4a72681e5df632af903a1dca8c5e7aa871a",
432
+ "sha256:c79698d4cd9318d9481d89a77e2d3fcaeff5486be641e60a4b49f3d2ecca4e28",
433
+ "sha256:cb6259196a589123d755380b65127ddc60f4c64b21fc3bb46ce3a6ea663659b0",
434
+ "sha256:d5b87da55a08acb586bad5c3aa3b86505f559b84f39035b233d5bf844b0834b1",
435
+ "sha256:dcd7b9c7139dc8258d164b55696ecd16c04607f1cc33ba7af86613881ffe4ac8",
436
+ "sha256:dfe4c1fedfde4e2fbc009d5ad420647f7730d719786388b7de0999bf32c0d9fd",
437
+ "sha256:ea98f633d45f7e815db648fd7ff0f19e328302ac36427343e4432c84432e7ff4",
438
+ "sha256:ec52c351b35ca269cb1f8069d610fc45c5bd38c3e91f9ab4cbbf0aebc136d9c8",
439
+ "sha256:eef7592281f7c174d3d6cbfbb7ee5984a671fcd77e3fc78e973d492e9bf0eb3f",
440
+ "sha256:f07f1f00e22b231dd3d9b9208692042e29792d6bd4f6639415d2f23158a80013",
441
+ "sha256:f3fac744f9b540148fa7715a435d2283b71f68bfb6d4aae24482a890aed18b59",
442
+ "sha256:fa768eff5f9f958270b081bb33581b4b569faabf8774726b283edb06617101dc",
443
+ "sha256:fac2d65901fb0fdf20363fbd345c01958a742f2dc62a8dd4495af66e3ff502a4"
444
+ ],
445
+ "markers": "python_version >= '3.7'",
446
+ "version": "==9.2.0"
447
+ },
448
+ "pkgutil-resolve-name": {
449
+ "hashes": [
450
+ "sha256:357d6c9e6a755653cfd78893817c0853af365dd51ec97f3d358a819373bbd174",
451
+ "sha256:ca27cc078d25c5ad71a9de0a7a330146c4e014c2462d9af19c6b828280649c5e"
452
+ ],
453
+ "markers": "python_version < '3.9'",
454
+ "version": "==1.3.10"
455
+ },
456
+ "protobuf": {
457
+ "hashes": [
458
+ "sha256:06059eb6953ff01e56a25cd02cca1a9649a75a7e65397b5b9b4e929ed71d10cf",
459
+ "sha256:097c5d8a9808302fb0da7e20edf0b8d4703274d140fd25c5edabddcde43e081f",
460
+ "sha256:284f86a6207c897542d7e956eb243a36bb8f9564c1742b253462386e96c6b78f",
461
+ "sha256:32ca378605b41fd180dfe4e14d3226386d8d1b002ab31c969c366549e66a2bb7",
462
+ "sha256:3cc797c9d15d7689ed507b165cd05913acb992d78b379f6014e013f9ecb20996",
463
+ "sha256:62f1b5c4cd6c5402b4e2d63804ba49a327e0c386c99b1675c8a0fefda23b2067",
464
+ "sha256:69ccfdf3657ba59569c64295b7d51325f91af586f8d5793b734260dfe2e94e2c",
465
+ "sha256:6f50601512a3d23625d8a85b1638d914a0970f17920ff39cec63aaef80a93fb7",
466
+ "sha256:7403941f6d0992d40161aa8bb23e12575637008a5a02283a930addc0508982f9",
467
+ "sha256:755f3aee41354ae395e104d62119cb223339a8f3276a0cd009ffabfcdd46bb0c",
468
+ "sha256:77053d28427a29987ca9caf7b72ccafee011257561259faba8dd308fda9a8739",
469
+ "sha256:7e371f10abe57cee5021797126c93479f59fccc9693dafd6bd5633ab67808a91",
470
+ "sha256:9016d01c91e8e625141d24ec1b20fed584703e527d28512aa8c8707f105a683c",
471
+ "sha256:9be73ad47579abc26c12024239d3540e6b765182a91dbc88e23658ab71767153",
472
+ "sha256:adc31566d027f45efe3f44eeb5b1f329da43891634d61c75a5944e9be6dd42c9",
473
+ "sha256:adfc6cf69c7f8c50fd24c793964eef18f0ac321315439d94945820612849c388",
474
+ "sha256:af0ebadc74e281a517141daad9d0f2c5d93ab78e9d455113719a45a49da9db4e",
475
+ "sha256:cb29edb9eab15742d791e1025dd7b6a8f6fcb53802ad2f6e3adcb102051063ab",
476
+ "sha256:cd68be2559e2a3b84f517fb029ee611546f7812b1fdd0aa2ecc9bc6ec0e4fdde",
477
+ "sha256:cdee09140e1cd184ba9324ec1df410e7147242b94b5f8b0c64fc89e38a8ba531",
478
+ "sha256:db977c4ca738dd9ce508557d4fce0f5aebd105e158c725beec86feb1f6bc20d8",
479
+ "sha256:dd5789b2948ca702c17027c84c2accb552fc30f4622a98ab5c51fcfe8c50d3e7",
480
+ "sha256:e250a42f15bf9d5b09fe1b293bdba2801cd520a9f5ea2d7fb7536d4441811d20",
481
+ "sha256:ff8d8fa42675249bb456f5db06c00de6c2f4c27a065955917b28c4f15978b9c3"
482
+ ],
483
+ "markers": "python_version >= '3.7'",
484
+ "version": "==3.20.1"
485
+ },
486
+ "pyarrow": {
487
+ "hashes": [
488
+ "sha256:0238998dc692efcb4e41ae74738d7c1234723271ccf520bd8312dca07d49ef8d",
489
+ "sha256:02b820ecd1da02012092c180447de449fc688d0c3f9ff8526ca301cdd60dacd0",
490
+ "sha256:1c5a073a930c632058461547e0bc572da1e724b17b6b9eb31a97da13f50cb6e0",
491
+ "sha256:29eb3e086e2b26202f3a4678316b93cfb15d0e2ba20f3ec12db8fd9cc07cde63",
492
+ "sha256:2c715eca2092273dcccf6f08437371e04d112f9354245ba2fbe6c801879450b7",
493
+ "sha256:2e753f8fcf07d8e3a0efa0c8bd51fef5c90281ffd4c5637c08ce42cd0ac297de",
494
+ "sha256:3eef8a981f45d89de403e81fb83b8119c20824caddf1404274e41a5d66c73806",
495
+ "sha256:4eebdab05afa23d5d5274b24c1cbeb1ba017d67c280f7d39fd8a8f18cbad2ec9",
496
+ "sha256:5526a3bfb404ff6d31d62ea582cf2466c7378a474a99ee04d1a9b05de5264541",
497
+ "sha256:55328348b9139c2b47450d512d716c2248fd58e2f04e2fc23a65e18726666d42",
498
+ "sha256:767cafb14278165ad539a2918c14c1b73cf20689747c21375c38e3fe62884902",
499
+ "sha256:7fa56cbd415cef912677270b8e41baad70cde04c6d8a8336eeb2aba85aa93706",
500
+ "sha256:7fb02bebc13ab55573d1ae9bb5002a6d20ba767bf8569b52fce5301d42495ab7",
501
+ "sha256:81a60bb291a964f63b2717fb1b28f6615ffab7e8585322bfb8a6738e6b321282",
502
+ "sha256:8ad430cee28ebc4d6661fc7315747c7a18ae2a74e67498dcb039e1c762a2fb67",
503
+ "sha256:92f3977e901db1ef5cba30d6cc1d7942b8d94b910c60f89013e8f7bb86a86eef",
504
+ "sha256:9cef618159567d5f62040f2b79b1c7b38e3885f4ffad0ec97cd2d86f88b67cef",
505
+ "sha256:a5b390bdcfb8c5b900ef543f911cdfec63e88524fafbcc15f83767202a4a2491",
506
+ "sha256:d9eb04db626fa24fdfb83c00f76679ca0d98728cdbaa0481b6402bf793a290c0",
507
+ "sha256:da3e0f319509a5881867effd7024099fb06950a0768dad0d6873668bb88cfaba",
508
+ "sha256:f11a645a41ee531c3a5edda45dea07c42267f52571f818d388971d33fc7e2d4a",
509
+ "sha256:f241bd488c2705df930eedfe304ada71191dcf67d6b98ceda0cc934fd2a8388e",
510
+ "sha256:f59bcd5217a3ae1e17870792f82b2ff92df9f3862996e2c78e156c13e56ff62e",
511
+ "sha256:f8c46bde1030d704e2796182286d1c56846552c50a39ad5bf5a20c0d8159fc35",
512
+ "sha256:fc856628acd8d281652c15b6268ec7f27ebcb015abbe99d9baad17f02adc51f1",
513
+ "sha256:fe2ce795fa1d95e4e940fe5661c3c58aee7181c730f65ac5dd8794a77228de59"
514
+ ],
515
+ "markers": "python_version >= '3.7'",
516
+ "version": "==9.0.0"
517
+ },
518
+ "pydeck": {
519
+ "hashes": [
520
+ "sha256:b446e810e3c615e1604f4364e0e162ba371712805fab97a6b7722200b286b466",
521
+ "sha256:f7dec070b954b88d17795a4a41fe59192843f4f4cd9ecedde4eab167d0096c40"
522
+ ],
523
+ "markers": "python_version >= '3.7'",
524
+ "version": "==0.8.0b1"
525
+ },
526
+ "pygments": {
527
+ "hashes": [
528
+ "sha256:56a8508ae95f98e2b9bdf93a6be5ae3f7d8af858b43e02c5a2ff083726be40c1",
529
+ "sha256:f643f331ab57ba3c9d89212ee4a2dabc6e94f117cf4eefde99a0574720d14c42"
530
+ ],
531
+ "markers": "python_version >= '3.6'",
532
+ "version": "==2.13.0"
533
+ },
534
+ "pympler": {
535
+ "hashes": [
536
+ "sha256:993f1a3599ca3f4fcd7160c7545ad06310c9e12f70174ae7ae8d4e25f6c5d3fa",
537
+ "sha256:d260dda9ae781e1eab6ea15bacb84015849833ba5555f141d2d9b7b7473b307d"
538
+ ],
539
+ "markers": "python_version >= '3.6'",
540
+ "version": "==1.0.1"
541
+ },
542
+ "pyparsing": {
543
+ "hashes": [
544
+ "sha256:2b020ecf7d21b687f219b71ecad3631f644a47f01403fa1d1036b0c6416d70fb",
545
+ "sha256:5026bae9a10eeaefb61dab2f09052b9f4307d44aee4eda64b309723d8d206bbc"
546
+ ],
547
+ "markers": "python_full_version >= '3.6.8'",
548
+ "version": "==3.0.9"
549
+ },
550
+ "pyrsistent": {
551
+ "hashes": [
552
+ "sha256:0e3e1fcc45199df76053026a51cc59ab2ea3fc7c094c6627e93b7b44cdae2c8c",
553
+ "sha256:1b34eedd6812bf4d33814fca1b66005805d3640ce53140ab8bbb1e2651b0d9bc",
554
+ "sha256:4ed6784ceac462a7d6fcb7e9b663e93b9a6fb373b7f43594f9ff68875788e01e",
555
+ "sha256:5d45866ececf4a5fff8742c25722da6d4c9e180daa7b405dc0a2a2790d668c26",
556
+ "sha256:636ce2dc235046ccd3d8c56a7ad54e99d5c1cd0ef07d9ae847306c91d11b5fec",
557
+ "sha256:6455fc599df93d1f60e1c5c4fe471499f08d190d57eca040c0ea182301321286",
558
+ "sha256:6bc66318fb7ee012071b2792024564973ecc80e9522842eb4e17743604b5e045",
559
+ "sha256:7bfe2388663fd18bd8ce7db2c91c7400bf3e1a9e8bd7d63bf7e77d39051b85ec",
560
+ "sha256:7ec335fc998faa4febe75cc5268a9eac0478b3f681602c1f27befaf2a1abe1d8",
561
+ "sha256:914474c9f1d93080338ace89cb2acee74f4f666fb0424896fcfb8d86058bf17c",
562
+ "sha256:b568f35ad53a7b07ed9b1b2bae09eb15cdd671a5ba5d2c66caee40dbf91c68ca",
563
+ "sha256:cdfd2c361b8a8e5d9499b9082b501c452ade8bbf42aef97ea04854f4a3f43b22",
564
+ "sha256:d1b96547410f76078eaf66d282ddca2e4baae8964364abb4f4dcdde855cd123a",
565
+ "sha256:d4d61f8b993a7255ba714df3aca52700f8125289f84f704cf80916517c46eb96",
566
+ "sha256:d7a096646eab884bf8bed965bad63ea327e0d0c38989fc83c5ea7b8a87037bfc",
567
+ "sha256:df46c854f490f81210870e509818b729db4488e1f30f2a1ce1698b2295a878d1",
568
+ "sha256:e24a828f57e0c337c8d8bb9f6b12f09dfdf0273da25fda9e314f0b684b415a07",
569
+ "sha256:e4f3149fd5eb9b285d6bfb54d2e5173f6a116fe19172686797c056672689daf6",
570
+ "sha256:e92a52c166426efbe0d1ec1332ee9119b6d32fc1f0bbfd55d5c1088070e7fc1b",
571
+ "sha256:f87cc2863ef33c709e237d4b5f4502a62a00fab450c9e020892e8e2ede5847f5",
572
+ "sha256:fd8da6d0124efa2f67d86fa70c851022f87c98e205f0594e1fae044e7119a5a6"
573
+ ],
574
+ "markers": "python_version >= '3.7'",
575
+ "version": "==0.18.1"
576
+ },
577
+ "pysocks": {
578
+ "hashes": [
579
+ "sha256:08e69f092cc6dbe92a0fdd16eeb9b9ffbc13cadfe5ca4c7bd92ffb078b293299",
580
+ "sha256:2725bd0a9925919b9b51739eea5f9e2bae91e83288108a9ad338b2e3a4435ee5",
581
+ "sha256:3f8804571ebe159c380ac6de37643bb4685970655d3bba243530d6558b799aa0"
582
+ ],
583
+ "version": "==1.7.1"
584
+ },
585
+ "python-dateutil": {
586
+ "hashes": [
587
+ "sha256:0123cacc1627ae19ddf3c27a5de5bd67ee4586fbdd6440d9748f8abb483d3e86",
588
+ "sha256:961d03dc3453ebbc59dbdea9e4e11c5651520a876d0f4db161e8674aae935da9"
589
+ ],
590
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3'",
591
+ "version": "==2.8.2"
592
+ },
593
+ "python-dotenv": {
594
+ "hashes": [
595
+ "sha256:b7e3b04a59693c42c36f9ab1cc2acc46fa5df8c78e178fc33a8d4cd05c8d498f",
596
+ "sha256:d92a187be61fe482e4fd675b6d52200e7be63a12b724abbf931a40ce4fa92938"
597
+ ],
598
+ "index": "pypi",
599
+ "version": "==0.20.0"
600
+ },
601
+ "pytz": {
602
+ "hashes": [
603
+ "sha256:220f481bdafa09c3955dfbdddb7b57780e9a94f5127e35456a48589b9e0c0197",
604
+ "sha256:cea221417204f2d1a2aa03ddae3e867921971d0d76f14d87abb4414415bbdcf5"
605
+ ],
606
+ "version": "==2022.2.1"
607
+ },
608
+ "pytz-deprecation-shim": {
609
+ "hashes": [
610
+ "sha256:8314c9692a636c8eb3bda879b9f119e350e93223ae83e70e80c31675a0fdc1a6",
611
+ "sha256:af097bae1b616dde5c5744441e2ddc69e74dfdcb0c263129610d85b87445a59d"
612
+ ],
613
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4, 3.5'",
614
+ "version": "==0.1.0.post0"
615
+ },
616
+ "pyyaml": {
617
+ "hashes": [
618
+ "sha256:0283c35a6a9fbf047493e3a0ce8d79ef5030852c51e9d911a27badfde0605293",
619
+ "sha256:055d937d65826939cb044fc8c9b08889e8c743fdc6a32b33e2390f66013e449b",
620
+ "sha256:07751360502caac1c067a8132d150cf3d61339af5691fe9e87803040dbc5db57",
621
+ "sha256:0b4624f379dab24d3725ffde76559cff63d9ec94e1736b556dacdfebe5ab6d4b",
622
+ "sha256:0ce82d761c532fe4ec3f87fc45688bdd3a4c1dc5e0b4a19814b9009a29baefd4",
623
+ "sha256:1e4747bc279b4f613a09eb64bba2ba602d8a6664c6ce6396a4d0cd413a50ce07",
624
+ "sha256:213c60cd50106436cc818accf5baa1aba61c0189ff610f64f4a3e8c6726218ba",
625
+ "sha256:231710d57adfd809ef5d34183b8ed1eeae3f76459c18fb4a0b373ad56bedcdd9",
626
+ "sha256:277a0ef2981ca40581a47093e9e2d13b3f1fbbeffae064c1d21bfceba2030287",
627
+ "sha256:2cd5df3de48857ed0544b34e2d40e9fac445930039f3cfe4bcc592a1f836d513",
628
+ "sha256:40527857252b61eacd1d9af500c3337ba8deb8fc298940291486c465c8b46ec0",
629
+ "sha256:473f9edb243cb1935ab5a084eb238d842fb8f404ed2193a915d1784b5a6b5fc0",
630
+ "sha256:48c346915c114f5fdb3ead70312bd042a953a8ce5c7106d5bfb1a5254e47da92",
631
+ "sha256:50602afada6d6cbfad699b0c7bb50d5ccffa7e46a3d738092afddc1f9758427f",
632
+ "sha256:68fb519c14306fec9720a2a5b45bc9f0c8d1b9c72adf45c37baedfcd949c35a2",
633
+ "sha256:77f396e6ef4c73fdc33a9157446466f1cff553d979bd00ecb64385760c6babdc",
634
+ "sha256:819b3830a1543db06c4d4b865e70ded25be52a2e0631ccd2f6a47a2822f2fd7c",
635
+ "sha256:897b80890765f037df3403d22bab41627ca8811ae55e9a722fd0392850ec4d86",
636
+ "sha256:98c4d36e99714e55cfbaaee6dd5badbc9a1ec339ebfc3b1f52e293aee6bb71a4",
637
+ "sha256:9df7ed3b3d2e0ecfe09e14741b857df43adb5a3ddadc919a2d94fbdf78fea53c",
638
+ "sha256:9fa600030013c4de8165339db93d182b9431076eb98eb40ee068700c9c813e34",
639
+ "sha256:a80a78046a72361de73f8f395f1f1e49f956c6be882eed58505a15f3e430962b",
640
+ "sha256:b3d267842bf12586ba6c734f89d1f5b871df0273157918b0ccefa29deb05c21c",
641
+ "sha256:b5b9eccad747aabaaffbc6064800670f0c297e52c12754eb1d976c57e4f74dcb",
642
+ "sha256:c5687b8d43cf58545ade1fe3e055f70eac7a5a1a0bf42824308d868289a95737",
643
+ "sha256:cba8c411ef271aa037d7357a2bc8f9ee8b58b9965831d9e51baf703280dc73d3",
644
+ "sha256:d15a181d1ecd0d4270dc32edb46f7cb7733c7c508857278d3d378d14d606db2d",
645
+ "sha256:d4db7c7aef085872ef65a8fd7d6d09a14ae91f691dec3e87ee5ee0539d516f53",
646
+ "sha256:d4eccecf9adf6fbcc6861a38015c2a64f38b9d94838ac1810a9023a0609e1b78",
647
+ "sha256:d67d839ede4ed1b28a4e8909735fc992a923cdb84e618544973d7dfc71540803",
648
+ "sha256:daf496c58a8c52083df09b80c860005194014c3698698d1a57cbcfa182142a3a",
649
+ "sha256:e61ceaab6f49fb8bdfaa0f92c4b57bcfbea54c09277b1b4f7ac376bfb7a7c174",
650
+ "sha256:f84fbc98b019fef2ee9a1cb3ce93e3187a6df0b2538a651bfb890254ba9f90b5"
651
+ ],
652
+ "markers": "python_version >= '3.6'",
653
+ "version": "==6.0"
654
+ },
655
+ "regex": {
656
+ "hashes": [
657
+ "sha256:02b6dc102123f5178796dcdb5a90f6e88895607fd1a1d115d8de1af8161ca2b4",
658
+ "sha256:0843cc977b9cc00eb2299b624db6481d25e7f5b093f7a7c2bb727028d4a26eda",
659
+ "sha256:085ca3dc9360c0210e0a70e5d34d66454a06077644e7679fef6358b1f053e62e",
660
+ "sha256:0a9d5a64e974bc5f160f30f76aaf993d49eeddb405676be6bf76a5a2c131e185",
661
+ "sha256:0de0ce11c0835e1117eacbfe8fa6fa98dc0e8e746b486735cb0fdebe46a02222",
662
+ "sha256:1418d3506a9582b23a27373f125ea2b0da523c581e7cf678a6f036254d134faa",
663
+ "sha256:14750172c0a616140a8f496dfef28ed24080e87d06d5838e008f959ad307a8c5",
664
+ "sha256:1b6d2c579ffdcbb3d93f63b6a7f697364594e1c1b6856958b3e61e3ca22c140a",
665
+ "sha256:1df31eaf147ecff3665ba861acb8f78221cd5501df072c9151dfa341dd24599f",
666
+ "sha256:21b6f939916aa61beea56393ebc8a9999060632ac22b8193c2cb67d6fd7cb2c3",
667
+ "sha256:2240fce3af236e4586a045c1be8bbf16c4f8831e68b7df918b72fc31a80143be",
668
+ "sha256:242f546fc5e49bb7395624ac3b4fc168bf454e11ace9804c58c4c3a90d84e38f",
669
+ "sha256:25bffa248b99b53a61b1f20fc7d19f711e38e9f0bc90d44c26670f8dc282ad7d",
670
+ "sha256:2ada67e02fa3fcca9e3b90cf24c2c6bc77f0abc126209937956aea10eeba40c7",
671
+ "sha256:2c198921afc811bc0f105c6e5150fbdebf9520c9b7d43cfc0ab156ca97f506d7",
672
+ "sha256:370b1d7aed26e29915c3fb3e72e327f194824a76cedb60c0b9f6c6af53e89d72",
673
+ "sha256:3aafbbf5076f2a48bcf31ceb42b410323daaa0ddb42544640592957bc906ace6",
674
+ "sha256:3d3d769b3d485b28d6a591b46723dbacc696e6503f48a3ef52e6fc2c90edb482",
675
+ "sha256:3d83fd6dd4263595d0e4f595d4abd54397cbed52c0147f7dd148a7b72910301e",
676
+ "sha256:45cb798095b886e4df6ff4a1f7661eb70620ccdef127e3c3e00a1aaa22d30e53",
677
+ "sha256:4bd9443f7ff6e6288dd4496215c5d903f851e55cbc09d5963587af0c6d565a0a",
678
+ "sha256:4bdfd016ab12c4075ef93f025b3cf4c8962b9b7a5e52bb7039ab64cb7755930c",
679
+ "sha256:4c6554073e3e554fbb3dff88376ada3da32ca789ea1b9e381f684d49ddb61199",
680
+ "sha256:4dad9d68574e93e1e23be53b4ecfb0f083bd5cc08cc7f1984a4ee3ebf12aa446",
681
+ "sha256:4e12a3c2d4781ee5d03f229c940934fa1e4ea4f4995e68ab97a2815b139e0804",
682
+ "sha256:53c9eca0d6070a8a3de42182ad26daf90ba12132eb74a2f45702332762aff84e",
683
+ "sha256:5910bb355f9517309f77101238dbacb7151ede3434a2f1fad26ecc62f13d8324",
684
+ "sha256:5c77eab46f3a2b2cd8bbe06467df783543bf7396df431eb4a144cc4b89e9fb3c",
685
+ "sha256:5d541bc430a74c787684d1ebcd205a5212a88c3de73848143e77489b2c25b911",
686
+ "sha256:5e7c8f9f8824143c219dd93cdc733c20d2c12f154034c89bcb4911db8e45bd92",
687
+ "sha256:5f14430535645712f546f1e07013507d1cc0c8abd851811dacce8c7fb584bf52",
688
+ "sha256:6059ae91667932d256d9dc03abd3512ebcade322b3a42d1b8354bd1db7f66dcc",
689
+ "sha256:61f6966371fa1cbf26c6209771a02bef80336cdaca0c0af4dfa33d51019c0b93",
690
+ "sha256:62d56a9d3c1e5a83076db4da060dad7ea35ac2f3cbd3c53ba5a51fe0caedb500",
691
+ "sha256:634f090a388351eadf1dcc1d168a190718fb68efb4b8fdc1b119cf837ca01905",
692
+ "sha256:64ecfcc386420192fbe98fdde777d993f7f2dfec9552e4f4024d3447d3a3e637",
693
+ "sha256:6af38997f178889d417851bae8fb5c00448f7405cfcab38734d771f1dd5d5973",
694
+ "sha256:6b30c8d299ba48ee919064628fd8bc296bdc6e4827d315491bea39437130d3e1",
695
+ "sha256:6f0c8807bac16984901c0573725bad786f2f004f9bd5df8476c6431097b6c5b3",
696
+ "sha256:6f62c8a59f6b8e608880c61b138ae22668184bc266b025d33200dcf2cebe0872",
697
+ "sha256:74d4aabd612d32282f3cb3ebb4436046fb840d25c754157a755bc9f66e7cd307",
698
+ "sha256:7658d2dfc1dabfb008ffe12ae47b98559e2aedd8237bee12f5aafb74d90479e3",
699
+ "sha256:777ceea2860a48e9e362a4e2a9a691782ea97bd05c24627c92e876fdd2c22e61",
700
+ "sha256:79f34d5833cd0d53ecf48bc030e4da3216bd4846224d17eeb64509be5cb098fd",
701
+ "sha256:7a52d547259495a53e61e37ffc6d5cecf8d298aeb1bc0d9b25289d65ddb31183",
702
+ "sha256:840063aa8eeb1dda07d7d7dee15648838bffef1d415f5f79061854a182a429aa",
703
+ "sha256:8e8ec94d1b1a0a297c2c69a0bf000baf9a79607ca0c084f577f811a9b447c319",
704
+ "sha256:95fb62a3980cf43e76c2fe95edab06ec70dc495b8aa660975eb9f0b2ffdae1e1",
705
+ "sha256:9668da78bcc219542467f51c2cd01894222be6aceec4b5efb806705900b794d8",
706
+ "sha256:99a7c5786de9e92ff5ffee2e8bed745f5d25495206f3f14656c379031e518334",
707
+ "sha256:a1e283ad918df44bad3ccf042c2fe283c63d17617570eb91b8c370ef677b0b83",
708
+ "sha256:a25d251546acb5edb1635631c4ae0e330fa4ec7c6316c01d256728fbfb9bbff2",
709
+ "sha256:abe1adb32e2535aaa171e8b2b2d3f083f863c9974a3e6e7dae6bf4827fc8b983",
710
+ "sha256:ae85112da2d826b65aa7c7369c56ca41d9a89644312172979cbee5cf788e0b09",
711
+ "sha256:b3379a83dc63fe06538c751961f9ed730b5d7f08f96a57bbad8d52db5820df1f",
712
+ "sha256:b3c7c6c4aac19b964c1d12784aecae7f0315314640b0f41dd6f0d4e2bf439072",
713
+ "sha256:b7ddecc80e87acf12c2cf12bf3721def47188c403f04e706f104b5e71fed2f31",
714
+ "sha256:bbaf6785d3f1cd3e617b9d0fb3c5528023ef7bc7cc1356234801dc1941df8ce9",
715
+ "sha256:be6f5b453f7ed2219a9555bb6840663950b9ab1dc034216f68eac64db66633c2",
716
+ "sha256:c2b6404631b22617b5127c6de2355393ccda693ca733a098b6802e7dabb3457a",
717
+ "sha256:c4f6609f6e867a58cdf173e1cbe1f3736d25962108bd5cb01ad5a130875ff2c8",
718
+ "sha256:c76dd2c0615a28de21c97f9f6862e84faef58ff4d700196b4e395ef6a52291e4",
719
+ "sha256:c78c72f7878071a78337510ec78ab856d60b4bdcd3a95fd68b939e7cb30434b3",
720
+ "sha256:cb0c9a1476d279524538ba9a00ecec9eadcef31a6a60b2c8bd2f29f62044a559",
721
+ "sha256:ccb986e80674c929f198464bce55e995178dea26833421e2479ff04a6956afac",
722
+ "sha256:cfa62063c5eafb04e4435459ce15746b4ae6c14efeae8f16bd0e3d2895dad698",
723
+ "sha256:d13bd83284b46c304eb10de93f8a3f2c80361f91f4e8a4e1273caf83e16c4409",
724
+ "sha256:d76e585368388d99ddd2f95989e6ac80a8fe23115e93931faad99fa34550612f",
725
+ "sha256:dc32029b9cc784a529f9201289d4f841cc24a2ae3126a112cd467bc41bbc2f10",
726
+ "sha256:e0b55651db770b4b5a6c7d015f24d1a6ede307296bbdf0c47fc5f6a6adc7abee",
727
+ "sha256:e37886929ee83a5fa5c73164abada00e7f3cc1cbf3f8f6e1e8cfecae9d6cfc47",
728
+ "sha256:f7b88bc7306136b123fd1a9beed16ca02900ee31d1c36e73fa33d9e525a5562d",
729
+ "sha256:fac611bde2609a46fcbd92da7171286faa2f5c191f84d22f61cd7dc27213f51d",
730
+ "sha256:fafed60103132e74cdfbd651abe94801eb87a9765ce275b3dca9af8f3e06622a"
731
+ ],
732
+ "markers": "python_version >= '3.6'",
733
+ "version": "==2022.8.17"
734
+ },
735
+ "requests": {
736
+ "hashes": [
737
+ "sha256:7c5599b102feddaa661c826c56ab4fee28bfd17f5abca1ebbe3e7f19d7c97983",
738
+ "sha256:8fefa2a1a1365bf5520aac41836fbee479da67864514bdb821f31ce07ce65349"
739
+ ],
740
+ "markers": "python_version >= '3.7' and python_version < '4'",
741
+ "version": "==2.28.1"
742
+ },
743
+ "rich": {
744
+ "hashes": [
745
+ "sha256:2eb4e6894cde1e017976d2975ac210ef515d7548bc595ba20e195fb9628acdeb",
746
+ "sha256:63a5c5ce3673d3d5fbbf23cd87e11ab84b6b451436f1b7f19ec54b6bc36ed7ca"
747
+ ],
748
+ "markers": "python_version < '4' and python_full_version >= '3.6.3'",
749
+ "version": "==12.5.1"
750
+ },
751
+ "semver": {
752
+ "hashes": [
753
+ "sha256:ced8b23dceb22134307c1b8abfa523da14198793d9787ac838e70e29e77458d4",
754
+ "sha256:fa0fe2722ee1c3f57eac478820c3a5ae2f624af8264cbdf9000c980ff7f75e3f"
755
+ ],
756
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3'",
757
+ "version": "==2.13.0"
758
+ },
759
+ "six": {
760
+ "hashes": [
761
+ "sha256:1e61c37477a1626458e36f7b1d82aa5c9b094fa4802892072e49de9c60c4c926",
762
+ "sha256:8abb2f1d86890a2dfb989f9a77cfcfd3e47c2a354b01111771326f8aa26e0254"
763
+ ],
764
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3'",
765
+ "version": "==1.16.0"
766
+ },
767
+ "smmap": {
768
+ "hashes": [
769
+ "sha256:2aba19d6a040e78d8b09de5c57e96207b09ed71d8e55ce0959eeee6c8e190d94",
770
+ "sha256:c840e62059cd3be204b0c9c9f74be2c09d5648eddd4580d9314c3ecde0b30936"
771
+ ],
772
+ "markers": "python_version >= '3.6'",
773
+ "version": "==5.0.0"
774
+ },
775
+ "soupsieve": {
776
+ "hashes": [
777
+ "sha256:3b2503d3c7084a42b1ebd08116e5f81aadfaea95863628c80a3b774a11b7c759",
778
+ "sha256:fc53893b3da2c33de295667a0e19f078c14bf86544af307354de5fcf12a3f30d"
779
+ ],
780
+ "markers": "python_version >= '3.6'",
781
+ "version": "==2.3.2.post1"
782
+ },
783
+ "streamlit": {
784
+ "hashes": [
785
+ "sha256:c56d0775feb39116ff90a8b01ee15be27212ee50abb88943607205d26d1d9923",
786
+ "sha256:f0461bebd6c1b58c38f0f602ee9bb6699f66dfe14fd2e05abc25ebe96ff4ba21"
787
+ ],
788
+ "index": "pypi",
789
+ "version": "==1.12.2"
790
+ },
791
+ "tokenizers": {
792
+ "hashes": [
793
+ "sha256:01abe6fbfe55e4131ca0c4c3d1a9d7ef5df424a8d536e998d2a4fc0bc57935f4",
794
+ "sha256:070746f86efa6c873db341e55cf17bb5e7bdd5450330ca8eca542f5c3dab2c66",
795
+ "sha256:0bf2380ad59c50222959a9b6f231339200a826fc5cb2be09ff96d8a59f65fc5e",
796
+ "sha256:2158baf80cbc09259bfd6e0e0fc4597b611e7a72ad5443dad63918a90f1dd304",
797
+ "sha256:230f51a0a82ca7b90077eaca2415f12ff9bd144607888b9c50c2ee543452322e",
798
+ "sha256:258873634406bd1d438c799993a5e44bbc0132ff055985c03c4fe30f702e9a33",
799
+ "sha256:27d93b712aa2d4346aa506ecd4ec9e94edeebeaf2d484357b482cdeffc02b5f5",
800
+ "sha256:28825dade9e52ad464164020758f9d49eb7251c32b6ae146601c506a23c67c0e",
801
+ "sha256:38625595b2fd37bfcce64ff9bfb6868c07e9a7b7f205c909d94a615ce9472287",
802
+ "sha256:3f2647cc256d6a53d18b9dcd71d377828e9f8991fbcbd6fcd8ca2ceb174552b0",
803
+ "sha256:411ebc89228f30218ffa9d9c49d414864b0df5026a47c24820431821c4360460",
804
+ "sha256:419d113e3bcc4fe20a313afc47af81e62906306b08fe1601e1443d747d46af1f",
805
+ "sha256:5188e13fc09edfe05712ca3ae5a44e7f2b0137927b1ca210d0fad90d3e58315a",
806
+ "sha256:53b5f4012ce3ffddd5b00827441b80dc7a0f6b41f4fc5248ae6d36e7d3920c6d",
807
+ "sha256:619728df2551bdfe6f96ff177f9ded958e7ed9e2af94c8d5ac2834d1eb06d112",
808
+ "sha256:62a723bd4b18bc55121f5c34cd8efd6c651f2d3b81f81dd50e5351fb65b8a617",
809
+ "sha256:664f36f0a0d409c24f2201d495161fec4d8bc93e091fbb78814eb426f29905a3",
810
+ "sha256:6a38b2019d4807d42afeff603a119094ee00f63bea2921136524c8814e9003f8",
811
+ "sha256:6a7a106d04154c2159db6cd7d042af2e2e0e53aee432f872fe6c8be45100436a",
812
+ "sha256:7c5c54080a7d5c89c990e0d478e0882dbac88926d43323a3aa236492a3c9455f",
813
+ "sha256:7d43de14b4469b57490dbaf136a31c266cb676fa22320f01f230af9219ae9034",
814
+ "sha256:7f4cb68dc538b52240d1986d2034eb0a6373be2ab5f0787d1be3ad1444ce71b7",
815
+ "sha256:8cea98f3f9577d1541b7bb0f7a3308a911751067e1d83e01485c9d3411bbf087",
816
+ "sha256:8d4339c376b695de2ad8ccaebffa75e4dc1d7857be1103d80e7925b34af8cf78",
817
+ "sha256:91906d725cb84d8ee71ce05fbb155d39d494849622b4f9349e5176a8eb01c49b",
818
+ "sha256:ae6c04b629ac2cd2f695739988cb70b9bd8d5e7f849f5b14c4510e942bee5770",
819
+ "sha256:b9779944559cb7ace6a8516e402895f239b0d9d3c833c67dbaec496310e7e206",
820
+ "sha256:bdbca79726fe883c696088ea163715b2f902aec638a8e24bcf9790ff8fa45019",
821
+ "sha256:cdeba37c2fb44e1aec8a72af4cb369655b59ba313181b1b4b8183f08e759c49c",
822
+ "sha256:d737df0f8f26e093a82bfb106b6cfb510a0e9302d35834568e5b20b73ddc5a9c",
823
+ "sha256:eff5ff411f18a201eec137b7b32fcb55e0c48b372d370bd24f965f5bad471fa4",
824
+ "sha256:f1271224acafb27639c432e1ce4e7d38eab40305ba1c546e871d5c8a32f4f195",
825
+ "sha256:fde8dccb9033fa344ffce3ee1837939a50e7a210a768f1cf2059beeafa755481"
826
+ ],
827
+ "version": "==0.12.1"
828
+ },
829
+ "toml": {
830
+ "hashes": [
831
+ "sha256:806143ae5bfb6a3c6e736a764057db0e6a0e05e338b5630894a5f779cabb4f9b",
832
+ "sha256:b3bda1d108d5dd99f4a20d24d9c348e91c4db7ab1b749200bded2f839ccbe68f"
833
+ ],
834
+ "markers": "python_version >= '2.6' and python_version not in '3.0, 3.1, 3.2, 3.3'",
835
+ "version": "==0.10.2"
836
+ },
837
+ "toolz": {
838
+ "hashes": [
839
+ "sha256:2059bd4148deb1884bb0eb770a3cde70e7f954cfbbdc2285f1f2de01fd21eb6f",
840
+ "sha256:88c570861c440ee3f2f6037c4654613228ff40c93a6c25e0eba70d17282c6194"
841
+ ],
842
+ "markers": "python_version >= '3.5'",
843
+ "version": "==0.12.0"
844
+ },
845
+ "torch": {
846
+ "hashes": [
847
+ "sha256:03e31c37711db2cd201e02de5826de875529e45a55631d317aadce2f1ed45aa8",
848
+ "sha256:0b44601ec56f7dd44ad8afc00846051162ef9c26a8579dda0a02194327f2d55e",
849
+ "sha256:42e115dab26f60c29e298559dbec88444175528b729ae994ec4c65d56fe267dd",
850
+ "sha256:42f639501928caabb9d1d55ddd17f07cd694de146686c24489ab8c615c2871f2",
851
+ "sha256:4e1b9c14cf13fd2ab8d769529050629a0e68a6fc5cb8e84b4a3cc1dd8c4fe541",
852
+ "sha256:68104e4715a55c4bb29a85c6a8d57d820e0757da363be1ba680fa8cc5be17b52",
853
+ "sha256:69fe2cae7c39ccadd65a123793d30e0db881f1c1927945519c5c17323131437e",
854
+ "sha256:6cf6f54b43c0c30335428195589bd00e764a6d27f3b9ba637aaa8c11aaf93073",
855
+ "sha256:743784ccea0dc8f2a3fe6a536bec8c4763bd82c1352f314937cb4008d4805de1",
856
+ "sha256:8a34a2fbbaa07c921e1b203f59d3d6e00ed379f2b384445773bd14e328a5b6c8",
857
+ "sha256:976c3f997cea38ee91a0dd3c3a42322785414748d1761ef926b789dfa97c6134",
858
+ "sha256:9b356aea223772cd754edb4d9ecf2a025909b8615a7668ac7d5130f86e7ec421",
859
+ "sha256:9c038662db894a23e49e385df13d47b2a777ffd56d9bcd5b832593fab0a7e286",
860
+ "sha256:a8320ba9ad87e80ca5a6a016e46ada4d1ba0c54626e135d99b2129a4541c509d",
861
+ "sha256:b5dbcca369800ce99ba7ae6dee3466607a66958afca3b740690d88168752abcf",
862
+ "sha256:bfec2843daa654f04fda23ba823af03e7b6f7650a873cdb726752d0e3718dada",
863
+ "sha256:cd26d8c5640c3a28c526d41ccdca14cf1cbca0d0f2e14e8263a7ac17194ab1d2",
864
+ "sha256:e9c8f4a311ac29fc7e8e955cfb7733deb5dbe1bdaabf5d4af2765695824b7e0d",
865
+ "sha256:f00c721f489089dc6364a01fd84906348fe02243d0af737f944fddb36003400d",
866
+ "sha256:f3b52a634e62821e747e872084ab32fbcb01b7fa7dbb7471b6218279f02a178a"
867
+ ],
868
+ "markers": "python_version >= '3.7'",
869
+ "version": "==1.12.1"
870
+ },
871
+ "tornado": {
872
+ "hashes": [
873
+ "sha256:1d54d13ab8414ed44de07efecb97d4ef7c39f7438cf5e976ccd356bebb1b5fca",
874
+ "sha256:20f638fd8cc85f3cbae3c732326e96addff0a15e22d80f049e00121651e82e72",
875
+ "sha256:5c87076709343557ef8032934ce5f637dbb552efa7b21d08e89ae7619ed0eb23",
876
+ "sha256:5f8c52d219d4995388119af7ccaa0bcec289535747620116a58d830e7c25d8a8",
877
+ "sha256:6fdfabffd8dfcb6cf887428849d30cf19a3ea34c2c248461e1f7d718ad30b66b",
878
+ "sha256:87dcafae3e884462f90c90ecc200defe5e580a7fbbb4365eda7c7c1eb809ebc9",
879
+ "sha256:9b630419bde84ec666bfd7ea0a4cb2a8a651c2d5cccdbdd1972a0c859dfc3c13",
880
+ "sha256:b8150f721c101abdef99073bf66d3903e292d851bee51910839831caba341a75",
881
+ "sha256:ba09ef14ca9893954244fd872798b4ccb2367c165946ce2dd7376aebdde8e3ac",
882
+ "sha256:d3a2f5999215a3a06a4fc218026cd84c61b8b2b40ac5296a6db1f1451ef04c1e",
883
+ "sha256:e5f923aa6a47e133d1cf87d60700889d7eae68988704e20c75fb2d65677a8e4b"
884
+ ],
885
+ "markers": "python_version >= '3.7'",
886
+ "version": "==6.2"
887
+ },
888
+ "tqdm": {
889
+ "hashes": [
890
+ "sha256:40be55d30e200777a307a7585aee69e4eabb46b4ec6a4b4a5f2d9f11e7d5408d",
891
+ "sha256:74a2cdefe14d11442cedf3ba4e21a3b84ff9a2dbdc6cfae2c34addb2a14a5ea6"
892
+ ],
893
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3'",
894
+ "version": "==4.64.0"
895
+ },
896
+ "transformers": {
897
+ "hashes": [
898
+ "sha256:07f3df80144f7f032ad5d367507445980d4aa25855a5d658cfa47ac5fff32aca",
899
+ "sha256:c03c150857e2d8f18f6dcb51e3061207522425ad57a0a6dc6cde407226a45e3e"
900
+ ],
901
+ "markers": "python_version >= '3.7'",
902
+ "version": "==4.21.2"
903
+ },
904
+ "typing-extensions": {
905
+ "hashes": [
906
+ "sha256:25642c956049920a5aa49edcdd6ab1e06d7e5d467fc00e0506c44ac86fbfca02",
907
+ "sha256:e6d2677a32f47fc7eb2795db1dd15c1f34eff616bcaf2cfb5e997f854fa1c4a6"
908
+ ],
909
+ "markers": "python_version >= '3.7'",
910
+ "version": "==4.3.0"
911
+ },
912
+ "tzdata": {
913
+ "hashes": [
914
+ "sha256:21f4f0d7241572efa7f7a4fdabb052e61b55dc48274e6842697ccdf5253e5451",
915
+ "sha256:c3119520447d68ef3eb8187a55a4f44fa455f30eb1b4238fa5691ba094f2b05b"
916
+ ],
917
+ "markers": "python_version >= '3.6'",
918
+ "version": "==2022.2"
919
+ },
920
+ "tzlocal": {
921
+ "hashes": [
922
+ "sha256:89885494684c929d9191c57aa27502afc87a579be5cdd3225c77c463ea043745",
923
+ "sha256:ee5842fa3a795f023514ac2d801c4a81d1743bbe642e3940143326b3a00addd7"
924
+ ],
925
+ "markers": "python_version >= '3.6'",
926
+ "version": "==4.2"
927
+ },
928
+ "urllib3": {
929
+ "hashes": [
930
+ "sha256:3fa96cf423e6987997fc326ae8df396db2a8b7c667747d47ddd8ecba91f4a74e",
931
+ "sha256:b930dd878d5a8afb066a637fbb35144fe7901e3b209d1cd4f524bd0e9deee997"
932
+ ],
933
+ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4, 3.5' and python_version < '4'",
934
+ "version": "==1.26.12"
935
+ },
936
+ "validators": {
937
+ "hashes": [
938
+ "sha256:24148ce4e64100a2d5e267233e23e7afeb55316b47d30faae7eb6e7292bc226a"
939
+ ],
940
+ "markers": "python_version >= '3.4'",
941
+ "version": "==0.20.0"
942
+ },
943
+ "zipp": {
944
+ "hashes": [
945
+ "sha256:05b45f1ee8f807d0cc928485ca40a07cb491cf092ff587c0df9cb1fd154848d2",
946
+ "sha256:47c40d7fe183a6f21403a199b3e4192cca5774656965b0a4988ad2f8feb5f009"
947
+ ],
948
+ "markers": "python_version >= '3.7'",
949
+ "version": "==3.8.1"
950
+ }
951
+ },
952
+ "develop": {}
953
+ }
twNLP-app/README.md ADDED
@@ -0,0 +1 @@
 
 
1
+ # **ckip-cwn-app**