File size: 3,137 Bytes
dfe37be |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 |
import json
# One entry per metric that gets ranked and split into levels.
# Layout: (field to rank by, field that receives the level, percentage of the
# records assigned to each level, lowest metric values first).
LEVEL_SPECS = (
    ("line", "line_diff", (17, 17, 17, 17, 17, 15)),
    ("token", "token_diff", (17, 17, 17, 17, 17, 15)),
    ("cyclomatic_complexity", "CC_diff", (17, 17, 17, 17, 17, 15)),
)


def _assign_levels(records, metric, label, percentages):
    """Rank *records* by *metric* and store a level index under *label*.

    The list is sorted in place (ascending, stable) by ``record[metric]``.
    Walking the sorted list, the first ``percentages[0]`` percent of the
    records get level 0, the next ``percentages[1]`` percent get level 1, and
    so on. The last level receives every remaining record, so the final
    percentage is informational only.

    Args:
        records: List of dicts; each must contain *metric*.
        metric: Key whose value determines the rank.
        label: Key under which the level (``0 .. len(percentages) - 1``) is
            written into each record.
        percentages: Share of the records per level, in percent.

    Raises:
        KeyError: If a record has no *metric* key.
    """
    total = len(records)

    # Cumulative upper bounds for every level except the last, kept scaled by
    # 100 so whole-number percentages are compared without float rounding.
    bounds = []
    covered = 0
    for share in percentages[:-1]:
        covered += share
        bounds.append(covered * total)

    records.sort(key=lambda record: record[metric])
    for rank, record in enumerate(records):
        # First level whose cumulative bound lies above this rank; records
        # past every bound fall into the last level.
        record[label] = next(
            (level for level, bound in enumerate(bounds) if rank * 100 < bound),
            len(bounds),
        )


def main(source="humaneval_new.json", target="QS.json"):
    """Annotate every record of *source* with per-metric levels and save it.

    Reads a JSON list of records from *source*, adds the ``line_diff``,
    ``token_diff`` and ``CC_diff`` fields described by ``LEVEL_SPECS``,
    restores ordering by ``id`` and writes the result to *target*.

    Args:
        source: Path of the input JSON file.
        target: Path of the output JSON file (overwritten).
    """
    with open(source, "r", encoding="utf-8") as f:
        data = json.load(f)

    for metric, label, percentages in LEVEL_SPECS:
        _assign_levels(data, metric, label, percentages)

    # Each pass above reorders the list; put it back in id order for output.
    data.sort(key=lambda record: record["id"])

    # Write the updated data back to a JSON file.
    with open(target, "w", encoding="utf-8") as file:
        json.dump(data, file, ensure_ascii=False, indent=4)


if __name__ == "__main__":
    main()
|