Spaces:
Running
Running
import json | |
with open("sub_mbpp.json", "r", encoding="utf-8") as f: | |
data = json.load(f) | |
# token_counts=[12, 12, 12, 12, 13, 13, 13, 13] | |
# token_counts_I=token_counts[0]*0.01*974 | |
# token_counts_II=token_counts[1]*0.01*974 | |
# token_counts_III=token_counts[2]*0.01*974 | |
# token_counts_IV=token_counts[3]*0.01*974 | |
# token_counts_V=token_counts[4]*0.01*974 | |
# token_counts_VI=token_counts[5]*0.01*974 | |
# token_counts_VII=token_counts[6]*0.01*974 | |
# token_counts_VIII=token_counts[7]*0.01*974 | |
# | |
# cyclomatic_complexity=[12, 12, 12, 12, 13, 13, 13, 13] | |
# cyclomatic_complexity_I=cyclomatic_complexity[0]*0.01*974 | |
# cyclomatic_complexity_II=cyclomatic_complexity[1]*0.01*974 | |
# cyclomatic_complexity_III=cyclomatic_complexity[2]*0.01*974 | |
# cyclomatic_complexity_IV=cyclomatic_complexity[3]*0.01*974 | |
# cyclomatic_complexity_V=cyclomatic_complexity[4]*0.01*974 | |
# cyclomatic_complexity_VI=cyclomatic_complexity[5]*0.01*974 | |
# cyclomatic_complexity_VII=cyclomatic_complexity[6]*0.01*974 | |
# cyclomatic_complexity_VIII=cyclomatic_complexity[7]*0.01*974 | |
# print([cyclomatic_complexity_I,cyclomatic_complexity_II,cyclomatic_complexity_III,cyclomatic_complexity_IV,cyclomatic_complexity_V,cyclomatic_complexity_VI,cyclomatic_complexity_VII,cyclomatic_complexity_VIII]) | |
# | |
token_counts=[12, 12, 12, 12, 13, 13, 13, 13] | |
token_counts_I=token_counts[0]*0.01*500 | |
token_counts_II=token_counts[1]*0.01*500 | |
token_counts_III=token_counts[2]*0.01*500 | |
token_counts_IV=token_counts[3]*0.01*500 | |
token_counts_V=token_counts[4]*0.01*500 | |
token_counts_VI=token_counts[5]*0.01*500 | |
token_counts_VII=token_counts[6]*0.01*500 | |
token_counts_VIII=token_counts[7]*0.01*500 | |
cyclomatic_complexity=[12, 12, 12, 12, 13, 13, 13, 13] | |
cyclomatic_complexity_I=cyclomatic_complexity[0]*0.01*500 | |
cyclomatic_complexity_II=cyclomatic_complexity[1]*0.01*500 | |
cyclomatic_complexity_III=cyclomatic_complexity[2]*0.01*500 | |
cyclomatic_complexity_IV=cyclomatic_complexity[3]*0.01*500 | |
cyclomatic_complexity_V=cyclomatic_complexity[4]*0.01*500 | |
cyclomatic_complexity_VI=cyclomatic_complexity[5]*0.01*500 | |
cyclomatic_complexity_VII=cyclomatic_complexity[6]*0.01*500 | |
cyclomatic_complexity_VIII=cyclomatic_complexity[7]*0.01*500 | |
print([cyclomatic_complexity_I,cyclomatic_complexity_II,cyclomatic_complexity_III,cyclomatic_complexity_IV,cyclomatic_complexity_V,cyclomatic_complexity_VI,cyclomatic_complexity_VII,cyclomatic_complexity_VIII]) | |
data.sort(key=lambda x: x['token']) | |
for i, item in enumerate(data): | |
if i < token_counts_I: | |
item['token_diff'] = 0 | |
elif i < token_counts_I + token_counts_II: | |
item['token_diff'] = 1 | |
elif i < token_counts_I + token_counts_II+token_counts_III: | |
item['token_diff'] = 2 | |
elif i < token_counts_I + token_counts_II+token_counts_III+token_counts_IV: | |
item['token_diff'] = 3 | |
elif i < token_counts_I + token_counts_II+token_counts_III+token_counts_IV+token_counts_V: | |
item['token_diff'] = 4 | |
elif i < token_counts_I + token_counts_II + token_counts_III + token_counts_IV + token_counts_V+token_counts_VI: | |
item['token_diff'] = 5 | |
elif i < token_counts_I + token_counts_II + token_counts_III + token_counts_IV + token_counts_V+token_counts_VI+token_counts_VII: | |
item['token_diff'] = 6 | |
else: | |
item['token_diff'] = 7 | |
data.sort(key=lambda x: x['cc']) | |
for i, item in enumerate(data): | |
if i < cyclomatic_complexity_I: | |
item['CC_diff'] = 0 | |
elif i < cyclomatic_complexity_I + cyclomatic_complexity_II: | |
item['CC_diff'] = 1 | |
elif i < cyclomatic_complexity_I + cyclomatic_complexity_II+cyclomatic_complexity_III: | |
item['CC_diff'] = 2 | |
elif i < cyclomatic_complexity_I + cyclomatic_complexity_II+cyclomatic_complexity_III+cyclomatic_complexity_IV: | |
item['CC_diff'] = 3 | |
elif i < cyclomatic_complexity_I + cyclomatic_complexity_II+cyclomatic_complexity_III+cyclomatic_complexity_IV+cyclomatic_complexity_V: | |
item['CC_diff'] = 4 | |
elif i < cyclomatic_complexity_I + cyclomatic_complexity_II+cyclomatic_complexity_III+cyclomatic_complexity_IV+cyclomatic_complexity_V+cyclomatic_complexity_VI: | |
item['CC_diff'] = 5 | |
elif i < cyclomatic_complexity_I + cyclomatic_complexity_II+cyclomatic_complexity_III+cyclomatic_complexity_IV+cyclomatic_complexity_V+cyclomatic_complexity_VI+cyclomatic_complexity_VII: | |
item['CC_diff'] = 6 | |
else: | |
item['CC_diff'] = 7 | |
data.sort(key=lambda x: x['id']) | |
# 将更新后的数据写回JSON文件 | |
with open('QS.json', 'w', encoding='utf-8') as file: | |
json.dump(data, file, ensure_ascii=False, indent=4) | |