Spaces:
Runtime error
Runtime error
File size: 2,236 Bytes
c87c295 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 |
def fix(data):
    """Patch the HumanEval/140, HumanEval/75 and HumanEval/129 entries of ``data``.

    ``data`` is indexed by position (140, 75 and 129) and each selected entry
    is indexed by string keys.  The entries are modified in place and ``data``
    itself is returned.

    Raises ``AssertionError`` when a selected entry does not carry the
    expected ``task_id``, or when entry 75 does not already contain the
    original type-check contract line.
    """
    input_keys = ("base_input", "plus_input")

    # Task 140 -- https://github.com/evalplus/evalplus/issues/3
    # Swap the range expression inside the canonical solution text.
    task_140 = data[140]
    assert task_140["task_id"] == "HumanEval/140"
    old_range = "range(len(text)-1, 2, -1)"
    new_range = "range(len(text), 2, -1)"
    task_140["canonical_solution"] = task_140["canonical_solution"].replace(
        old_range, new_range
    )

    # Task 75 -- https://github.com/evalplus/evalplus/issues/4
    task_75 = data[75]
    assert task_75["task_id"] == "HumanEval/75"
    type_check = '\n assert type(a) == int, "invalid inputs" # $_CONTRACT_$\n'
    bound_check = ' assert a < 100, "invalid inputs" # $_CONTRACT_$\n'
    assert type_check in task_75["contract"]
    # The contract is replaced outright: the type check followed by the bound.
    task_75["contract"] = type_check + bound_check
    # Keep only the inputs whose first argument satisfies the new bound.
    for key in input_keys:
        task_75[key] = [args for args in task_75[key] if args[0] < 100]

    # Task 129 -- https://github.com/evalplus/evalplus/issues/4
    task_129 = data[129]
    assert task_129["task_id"] == "HumanEval/129"
    task_129["contract"] = R"""
assert type(k) == int, "invalid inputs" # $_CONTRACT_$
assert k > 0, "invalid inputs" # $_CONTRACT_$
assert len(grid) >= 2, "invalid inputs" # $_CONTRACT_$
assert all(len(l) == len(grid) for l in grid), "invalid inputs" # $_CONTRACT_$
assert {x for l in grid for x in l} == set(range(1, len(grid) ** 2 + 1)), "invalid inputs" # $_CONTRACT_$
"""

    def holds_every_cell_value(grid):
        """Return True when the grid's distinct values are exactly 1..len(grid)**2."""
        seen = set()
        for row in grid:
            seen.update(row)
        return seen == set(range(1, len(grid) ** 2 + 1))

    # Keep only the inputs whose grid (first argument) passes the value check.
    for key in input_keys:
        task_129[key] = [
            args for args in task_129[key] if holds_every_cell_value(args[0])
        ]

    return data
if __name__ == "__main__":
    import json

    # (source, destination) pairs: every v0.1.1 file is run through fix()
    # and written back out under the matching v0.1.2 name.
    releases = (
        ("HumanEvalPlus-v0.1.1.jsonl", "HumanEvalPlus-v0.1.2.jsonl"),
        ("HumanEvalPlus-Mini-v0.1.1.jsonl", "HumanEvalPlus-Mini-v0.1.2.jsonl"),
    )
    for src, dst in releases:
        # Read as UTF-8 explicitly so decoding matches the UTF-8 output below
        # instead of depending on the platform's default encoding.
        with open(src, encoding="utf-8") as f:
            # Lines read from a file keep their trailing newline, so a blank
            # line is still truthy; test the stripped text to skip it.
            data = [json.loads(line) for line in f if line.strip()]
        data = fix(data)
        # Binary mode writes the "\n" terminators untranslated.
        with open(dst, "wb") as f:
            for x in data:
                f.write((json.dumps(x) + "\n").encode("utf-8"))
|