Spaces:
Build error
Build error
import json | |
input_file = 'XXX.jsonl' | |
output_file = 'YYY.jsonl' | |
with ( | |
open(input_file, 'r', encoding='utf-8') as fin, | |
open(output_file, 'w', encoding='utf-8') as fout, | |
): | |
for line in fin: | |
line = line.strip() | |
if not line: | |
continue | |
data = json.loads(line) | |
item = data | |
# 提取原始数据 | |
org = item.get('org', '') | |
repo = item.get('repo', '') | |
number = str(item.get('number', '')) | |
new_item = {} | |
new_item['repo'] = f'{org}/{repo}' | |
new_item['instance_id'] = f'{org}__{repo}-{number}' | |
new_item['problem_statement'] = ( | |
item['resolved_issues'][0].get('title', '') | |
+ '\n' | |
+ item['resolved_issues'][0].get('body', '') | |
) | |
new_item['FAIL_TO_PASS'] = [] | |
new_item['PASS_TO_PASS'] = [] | |
new_item['base_commit'] = item['base'].get('sha', '') | |
new_item['version'] = '0.1' # depends | |
output_data = new_item | |
fout.write(json.dumps(output_data, ensure_ascii=False) + '\n') | |