zjrwtxtechstudio's picture
Upload 4 files
9cb4156 verified
import requests
import re
def get_arxiv_metadata(arxiv_id):
# 检查arXiv ID格式
if not re.match(r'^\d{4}\.\d{4,5}(v\d+)?$', arxiv_id):
raise ValueError("请输入有效的arXiv编号,例如:2301.12345")
# 构建API请求URL
url = f'http://export.arxiv.org/api/query?id_list={arxiv_id}'
response = requests.get(url)
if response.status_code != 200:
raise Exception("无法从arXiv获取数据,请检查网络连接和arXiv编号。")
# 解析XML响应
import xml.etree.ElementTree as ET
root = ET.fromstring(response.text)
ns = {'atom': 'http://www.w3.org/2005/Atom'}
entry = root.find('atom:entry', ns)
if entry is None:
raise Exception("未找到该arXiv编号的论文信息。")
# 获取论文标题
title = entry.find('atom:title', ns).text.strip()
# 获取作者列表
authors = entry.findall('atom:author/atom:name', ns)
author_names = [author.text.strip() for author in authors]
# 获取出版年份(使用发表日期的年份)
published = entry.find('atom:published', ns).text
year = published[:4]
# 获取版本号
arxiv_url = entry.find('atom:id', ns).text
version_search = re.search(r'v(\d+)$', arxiv_url)
version = version_search.group(0) if version_search else ''
# 返回元数据
metadata = {
'title': title,
'authors': author_names,
'year': year,
'arxiv_id': arxiv_id,
'version': version
}
return metadata
def format_citation(metadata, style='APA'):
authors = metadata['authors']
title = metadata['title']
arxiv_id = metadata['arxiv_id']
version = metadata['version']
year = metadata['year']
# 处理作者姓名格式
if style.upper() == 'APA':
formatted_authors = ', '.join(authors)
citation = f"{formatted_authors}. ({year}). {title}. *arXiv*预印本arXiv:{arxiv_id}{version}"
elif style.upper() == 'MLA':
formatted_authors = '、'.join(authors)
citation = f"{formatted_authors}。《{title}》。*arXiv*预印本 arXiv:{arxiv_id}{version} ({year})。"
elif style.upper() == 'CHICAGO':
formatted_authors = ', '.join(authors)
citation = f"{formatted_authors}。“{title}。” *arXiv*预印本 arXiv:{arxiv_id}{version}{year}。"
elif style.upper() == 'IEEE':
# IEEE风格通常使用英文名,需要将中文名转为拼音或使用英文名
formatted_authors = ' and '.join(authors)
citation = f"{formatted_authors}, \"{title},\" *arXiv* preprint arXiv:{arxiv_id}{version}, {year}."
else:
raise ValueError("不支持的引用格式。请选择APA、MLA、Chicago或IEEE。")
return citation
def main():
arxiv_id = input("请输入arXiv编号(例如2301.12345):").strip()
style = input("请输入引用格式(APA、MLA、Chicago、IEEE):").strip()
try:
metadata = get_arxiv_metadata(arxiv_id)
citation = format_citation(metadata, style)
print("\n生成的引用:\n")
print(citation)
except Exception as e:
print(f"发生错误:{e}")
if __name__ == '__main__':
main()