File size: 3,250 Bytes
9cb4156
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91

import requests
import re

def get_arxiv_metadata(arxiv_id):
    # 检查arXiv ID格式
    if not re.match(r'^\d{4}\.\d{4,5}(v\d+)?$', arxiv_id):
        raise ValueError("请输入有效的arXiv编号,例如:2301.12345")
    
    # 构建API请求URL
    url = f'http://export.arxiv.org/api/query?id_list={arxiv_id}'
    response = requests.get(url)
    
    if response.status_code != 200:
        raise Exception("无法从arXiv获取数据,请检查网络连接和arXiv编号。")
    
    # 解析XML响应
    import xml.etree.ElementTree as ET
    root = ET.fromstring(response.text)
    ns = {'atom': 'http://www.w3.org/2005/Atom'}
    
    entry = root.find('atom:entry', ns)
    if entry is None:
        raise Exception("未找到该arXiv编号的论文信息。")
    
    # 获取论文标题
    title = entry.find('atom:title', ns).text.strip()
    
    # 获取作者列表
    authors = entry.findall('atom:author/atom:name', ns)
    author_names = [author.text.strip() for author in authors]
    
    # 获取出版年份(使用发表日期的年份)
    published = entry.find('atom:published', ns).text
    year = published[:4]
    
    # 获取版本号
    arxiv_url = entry.find('atom:id', ns).text
    version_search = re.search(r'v(\d+)$', arxiv_url)
    version = version_search.group(0) if version_search else ''
    
    # 返回元数据
    metadata = {
        'title': title,
        'authors': author_names,
        'year': year,
        'arxiv_id': arxiv_id,
        'version': version
    }
    return metadata

def format_citation(metadata, style='APA'):
    authors = metadata['authors']
    title = metadata['title']
    arxiv_id = metadata['arxiv_id']
    version = metadata['version']
    year = metadata['year']
    
    # 处理作者姓名格式
    if style.upper() == 'APA':
        formatted_authors = ', '.join(authors)
        citation = f"{formatted_authors}. ({year}). {title}. *arXiv*预印本arXiv:{arxiv_id}{version}"
    elif style.upper() == 'MLA':
        formatted_authors = '、'.join(authors)
        citation = f"{formatted_authors}。《{title}》。*arXiv*预印本 arXiv:{arxiv_id}{version} ({year})。"
    elif style.upper() == 'CHICAGO':
        formatted_authors = ', '.join(authors)
        citation = f"{formatted_authors}。“{title}。” *arXiv*预印本 arXiv:{arxiv_id}{version}{year}。"
    elif style.upper() == 'IEEE':
        # IEEE风格通常使用英文名,需要将中文名转为拼音或使用英文名
        formatted_authors = ' and '.join(authors)
        citation = f"{formatted_authors}, \"{title},\" *arXiv* preprint arXiv:{arxiv_id}{version}, {year}."
    else:
        raise ValueError("不支持的引用格式。请选择APA、MLA、Chicago或IEEE。")
    
    return citation

def main():
    arxiv_id = input("请输入arXiv编号(例如2301.12345):").strip()
    style = input("请输入引用格式(APA、MLA、Chicago、IEEE):").strip()
    
    try:
        metadata = get_arxiv_metadata(arxiv_id)
        citation = format_citation(metadata, style)
        print("\n生成的引用:\n")
        print(citation)
    except Exception as e:
        print(f"发生错误:{e}")

if __name__ == '__main__':
    main()