File size: 2,358 Bytes
c149479
fe3c056
c149479
 
 
fe3c056
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
c149479
 
 
 
 
 
 
 
 
 
fe3c056
c149479
 
fe3c056
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
from src.interfaces.aclanthology import AclanthologyPaperList
from src.interfaces.arxiv import ArxivPaperList
from src.utils import dump_paper_list_to_markdown_checklist

if __name__ == "__main__":
    # Script entry point: collect event-extraction related papers from arXiv
    # and write them out as a markdown checklist.

    # ------------------------------------------------------------------
    # Disabled example: the same kind of search against the ACL Anthology.
    # Run `bash scripts/get_aclanthology.sh` first to download and prepare
    # the anthology data, then uncomment the lines below.
    # ------------------------------------------------------------------
    # acl_paper_list = AclanthologyPaperList("cache/aclanthology.json")
    # ee_query = {
    #     "title": [
    #         ["information extraction"],
    #         ["event", "extraction"],
    #         ["event", "argument", "extraction"],
    #         ["event", "detection"],
    #         ["event", "classification"],
    #         ["event", "tracking"],
    #         ["event", "relation", "extraction"],
    #     ],
    #     "venue": [
    #         ["acl"],
    #         ["emnlp"],
    #         ["naacl"],
    #         ["coling"],
    #         ["findings"],
    #         ["tacl"],
    #         ["cl"],
    #     ],
    # }
    # ee_papers = acl_paper_list.search(ee_query)
    # dump_paper_list_to_markdown_checklist(ee_papers, "results/ee-paper-list.md")

    # Disabled example: document-level papers from the same anthology list.
    # doc_query = {
    #     "title": [
    #         ["document-level"],
    #     ],
    #     "venue": [
    #         ["acl"],
    #         ["emnlp"],
    #         ["naacl"],
    #         ["coling"],
    #         ["findings"],
    #         ["tacl"],
    #         ["cl"],
    #     ],
    # }
    # doc_papers = acl_paper_list.search(doc_query)
    # dump_paper_list_to_markdown_checklist(doc_papers, "results/doc-paper-list.md")

    # ------------------------------------------------------------------
    # Active workflow: arXiv.
    # ------------------------------------------------------------------
    arxiv_category = "cs.CL"

    # Phrases combined with " OR " to form the `title` argument handed to
    # ArxivPaperList.
    search_topics = (
        "Event Extraction",
        "Event Argument Extraction",
        "Event Detection",
        "Event Classification",
        "Event Tracking",
        "Event Relation Extraction",
        "Information Extraction",
    )

    # Keyword groups for the local title filter.
    # NOTE(review): presumably each inner list is a set of terms that must
    # all match and the outer list is a set of alternatives -- confirm
    # against the `search` implementation.
    title_keyword_groups = [
        ["information extraction"],
        ["event", "extraction"],
        ["event", "argument", "extraction"],
        ["event", "detection"],
        ["event", "classification"],
        ["event", "tracking"],
        ["event", "relation", "extraction"],
    ]

    paper_source = ArxivPaperList(
        "cache/ee-arxiv.xml",
        use_cache=True,
        title=" OR ".join(search_topics),
        category=arxiv_category,
    )

    matched_papers = paper_source.search(
        {
            "title": title_keyword_groups,
            "venue": [[arxiv_category]],
        }
    )

    dump_paper_list_to_markdown_checklist(
        matched_papers, "results/arxiv-ee-paper-list.md"
    )