Spaces:
Running
Running
File size: 2,358 Bytes
c149479 fe3c056 c149479 fe3c056 c149479 fe3c056 c149479 fe3c056 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 |
from src.interfaces.aclanthology import AclanthologyPaperList
from src.interfaces.arxiv import ArxivPaperList
from src.utils import dump_paper_list_to_markdown_checklist
if __name__ == "__main__":
    # ------------------------------------------------------------------
    # ACL Anthology searches (currently disabled).
    #
    # Use `bash scripts/get_aclanthology.sh` to download and prepare the
    # anthology data, then uncomment the section below.
    # ------------------------------------------------------------------
    # acl_paper_list = AclanthologyPaperList("cache/aclanthology.json")
    # ee_query = {
    #     "title": [
    #         ["information extraction"],
    #         ["event", "extraction"],
    #         ["event", "argument", "extraction"],
    #         ["event", "detection"],
    #         ["event", "classification"],
    #         ["event", "tracking"],
    #         ["event", "relation", "extraction"],
    #     ],
    #     "venue": [
    #         ["acl"],
    #         ["emnlp"],
    #         ["naacl"],
    #         ["coling"],
    #         ["findings"],
    #         ["tacl"],
    #         ["cl"],
    #     ],
    # }
    # ee_papers = acl_paper_list.search(ee_query)
    # dump_paper_list_to_markdown_checklist(ee_papers, "results/ee-paper-list.md")
    #
    # doc_query = {
    #     "title": [
    #         ["document-level"],
    #     ],
    #     "venue": [
    #         ["acl"],
    #         ["emnlp"],
    #         ["naacl"],
    #         ["coling"],
    #         ["findings"],
    #         ["tacl"],
    #         ["cl"],
    #     ],
    # }
    # doc_papers = acl_paper_list.search(doc_query)
    # dump_paper_list_to_markdown_checklist(doc_papers, "results/doc-paper-list.md")

    # ------------------------------------------------------------------
    # arXiv search: event-extraction / information-extraction papers.
    # ------------------------------------------------------------------
    # The paper list is built from "cache/ee-arxiv.xml" with caching
    # switched on; `title` and `category` are handed to ArxivPaperList
    # unchanged.
    # NOTE(review): presumably `title`/`category` shape the remote arXiv
    # request when the cache is missing -- confirm in ArxivPaperList.
    arxiv_source = ArxivPaperList(
        "cache/ee-arxiv.xml",
        use_cache=True,
        title=(
            "Event Extraction OR Event Argument Extraction OR Event Detection"
            " OR Event Classification OR Event Tracking"
            " OR Event Relation Extraction OR Information Extraction"
        ),
        category="cs.CL",
    )

    # Same title keyword groups as the disabled ACL query above, with the
    # venue restricted to the "cs.CL" category.
    # NOTE(review): the matching rule for the nested lists (which terms
    # are AND-ed vs OR-ed) lives in `search` -- verify there.
    matched_papers = arxiv_source.search(
        {
            "title": [
                ["information extraction"],
                ["event", "extraction"],
                ["event", "argument", "extraction"],
                ["event", "detection"],
                ["event", "classification"],
                ["event", "tracking"],
                ["event", "relation", "extraction"],
            ],
            "venue": [
                ["cs.CL"],
            ],
        }
    )

    # Write the hits out as a markdown checklist.
    dump_paper_list_to_markdown_checklist(
        matched_papers,
        "results/arxiv-ee-paper-list.md",
    )
|