diff --git a/scripts/eval/yamls/coding_tasks.yaml b/scripts/eval/yamls/coding_tasks.yaml index 065f291ea0..2c1c602250 100644 --- a/scripts/eval/yamls/coding_tasks.yaml +++ b/scripts/eval/yamls/coding_tasks.yaml @@ -24,33 +24,33 @@ icl_tasks: label: human_eval_return_simple dataset_uri: eval/local_data/programming/human_eval_return_simple.jsonl # ADD YOUR OWN DATASET URI num_fewshot: [0] - pass_at_k : 1 + pass_at_k: 1 num_beams: 20 - label: human_eval_return_complex dataset_uri: eval/local_data/programming/human_eval_return_complex.jsonl # ADD YOUR OWN DATASET URI num_fewshot: [0] - pass_at_k : 1 + pass_at_k: 1 num_beams: 20 icl_task_type: code_evaluation - label: human_eval_25 dataset_uri: eval/local_data/programming/split-0.25.jsonl # ADD YOUR OWN DATASET URI num_fewshot: [0] - pass_at_k : 1 + pass_at_k: 1 num_beams: 20 icl_task_type: code_evaluation - label: human_eval_50 dataset_uri: eval/local_data/programming/split-0.5.jsonl # ADD YOUR OWN DATASET URI num_fewshot: [0] - pass_at_k : 1 + pass_at_k: 1 num_beams: 20 icl_task_type: code_evaluation - label: human_eval_75 dataset_uri: eval/local_data/programming/split-0.75.jsonl # ADD YOUR OWN DATASET URI num_fewshot: [0] - pass_at_k : 1 + pass_at_k: 1 num_beams: 20 icl_task_type: code_evaluation diff --git a/scripts/eval/yamls/tasks.yaml b/scripts/eval/yamls/tasks.yaml index 6f082e5893..7481ada872 100644 --- a/scripts/eval/yamls/tasks.yaml +++ b/scripts/eval/yamls/tasks.yaml @@ -198,33 +198,33 @@ icl_tasks: label: human_eval_return_simple dataset_uri: eval/local_data/programming/human_eval_return_simple.jsonl # ADD YOUR OWN DATASET URI num_fewshot: [0] - pass_at_k : 1 + pass_at_k: 1 num_beams: 20 - label: human_eval_return_complex dataset_uri: eval/local_data/programming/human_eval_return_complex.jsonl # ADD YOUR OWN DATASET URI num_fewshot: [0] - pass_at_k : 1 + pass_at_k: 1 num_beams: 20 icl_task_type: code_evaluation - label: human_eval_25 dataset_uri: eval/local_data/programming/human_eval-0.25.jsonl # ADD YOUR OWN DATASET URI num_fewshot: [0] - pass_at_k : 1 + pass_at_k: 1 num_beams: 20 icl_task_type: code_evaluation - label: human_eval_50 dataset_uri: eval/local_data/programming/human_eval-0.5.jsonl # ADD YOUR OWN DATASET URI num_fewshot: [0] - pass_at_k : 1 + pass_at_k: 1 num_beams: 20 icl_task_type: code_evaluation - label: human_eval_75 dataset_uri: eval/local_data/programming/human_eval-0.75.jsonl # ADD YOUR OWN DATASET URI num_fewshot: [0] - pass_at_k : 1 + pass_at_k: 1 num_beams: 20 icl_task_type: code_evaluation