Kewen Zhao committed on
Commit
53d1889
·
1 Parent(s): 7ddd4d3

merge inputs into references

Browse files
Files changed (1) hide show
  1. code_eval_stdio.py +5 -5
code_eval_stdio.py CHANGED
@@ -145,8 +145,8 @@ class CodeEval(evaluate.Metric):
145
  "predictions": datasets.Sequence(datasets.Value("string")),
146
  "references": datasets.Sequence(
147
  {
148
- "inputs": datasets.Value("string"),
149
- "expected_output": datasets.Value("string"),
150
  }
151
  ),
152
  }
@@ -161,7 +161,7 @@ class CodeEval(evaluate.Metric):
161
  """
162
  Returns the scores
163
  predictions: List[List[str]] the python program
164
- references: List[Tuple[str, str]] test inputs and expected outputs
165
  """
166
 
167
  if os.getenv("HF_ALLOW_CODE_EVAL", 0) != "1":
@@ -176,9 +176,9 @@ class CodeEval(evaluate.Metric):
176
  n_samples = 0
177
  results = defaultdict(list)
178
 
179
- for task_id, (candidates, (input_data, expected_output)) in enumerate(zip(predictions, references)):
180
  for candidate in candidates:
181
- args = (candidate, input_data, expected_output, timeout, task_id, completion_id[task_id])
182
  future = executor.submit(check_correctness, *args)
183
  futures.append(future)
184
  completion_id[task_id] += 1
 
145
  "predictions": datasets.Sequence(datasets.Value("string")),
146
  "references": datasets.Sequence(
147
  {
148
+ "input": datasets.Value("string"),
149
+ "reference_output": datasets.Value("string"),
150
  }
151
  ),
152
  }
 
161
  """
162
  Returns the scores
163
  predictions: List[List[str]] the python program
164
+ references: List[Dict[str, str]] test inputs and reference outputs
165
  """
166
 
167
  if os.getenv("HF_ALLOW_CODE_EVAL", 0) != "1":
 
176
  n_samples = 0
177
  results = defaultdict(list)
178
 
179
+ for task_id, (candidates, reference) in enumerate(zip(predictions, references)):
180
  for candidate in candidates:
181
+ args = (candidate, reference['input'], reference['reference_output'], timeout, task_id, completion_id[task_id])
182
  future = executor.submit(check_correctness, *args)
183
  futures.append(future)
184
  completion_id[task_id] += 1