# In-context-learning task list.
#
# Every entry below has icl_task_type `code_evaluation` and shares the same
# settings (num_fewshot, pass_at_k, num_beams, batch_size); only `label` and
# `dataset_uri` differ between entries.
#
# NOTE(review): dataset_uri values are relative paths — presumably resolved
# against the directory the evaluation is launched from; confirm with the
# loader before moving this file.
icl_tasks:
-
  label: human_eval
  dataset_uri: eval/local_data/programming/human_eval.jsonl
  num_fewshot: [0]
  pass_at_k: 1
  num_beams: 20
  batch_size: 1
  icl_task_type: code_evaluation

# NOTE(review): the `_cpp` / `_js` suffixes presumably denote C++ and
# JavaScript variants of the dataset — confirm against the data files.
-
  label: human_eval_cpp
  dataset_uri: eval/local_data/programming/processed_human_eval_cpp.jsonl
  num_fewshot: [0]
  pass_at_k: 1
  num_beams: 20
  batch_size: 1
  icl_task_type: code_evaluation
-
  label: human_eval_js
  dataset_uri: eval/local_data/programming/processed_human_eval_js.jsonl
  num_fewshot: [0]
  pass_at_k: 1
  num_beams: 20
  batch_size: 1
  icl_task_type: code_evaluation
-
  label: human_eval_return_simple
  dataset_uri: eval/local_data/programming/human_eval_return_simple.jsonl
  num_fewshot: [0]
  pass_at_k: 1
  num_beams: 20
  batch_size: 1
  icl_task_type: code_evaluation
-
  label: human_eval_return_complex
  dataset_uri: eval/local_data/programming/human_eval_return_complex.jsonl
  num_fewshot: [0]
  pass_at_k: 1
  num_beams: 20
  batch_size: 1
  icl_task_type: code_evaluation

# The three entries below pair labels `_25` / `_50` / `_75` with dataset files
# suffixed `-0.25` / `-0.5` / `-0.75`.
# NOTE(review): the meaning of these fractions is not stated here — verify
# against the dataset preparation scripts.
-
  label: human_eval_25
  dataset_uri: eval/local_data/programming/human_eval-0.25.jsonl
  num_fewshot: [0]
  pass_at_k: 1
  num_beams: 20
  batch_size: 1
  icl_task_type: code_evaluation
-
  label: human_eval_50
  dataset_uri: eval/local_data/programming/human_eval-0.5.jsonl
  num_fewshot: [0]
  pass_at_k: 1
  num_beams: 20
  batch_size: 1
  icl_task_type: code_evaluation
-
  label: human_eval_75
  dataset_uri: eval/local_data/programming/human_eval-0.75.jsonl
  num_fewshot: [0]
  pass_at_k: 1
  num_beams: 20
  batch_size: 1
  icl_task_type: code_evaluation