Commit

fix precommit
bmosaicml committed Feb 2, 2024
1 parent 6276cf2 commit 9e31ec0
Showing 4 changed files with 21 additions and 20 deletions.
6 changes: 3 additions & 3 deletions llmfoundry/utils/builders.py
@@ -507,9 +507,9 @@ def _validate_cfg(icl_cfg: DictConfig):
dist.barrier()
early_stopping_criteria = icl_cfg.get('early_stopping_criteria',
None)
-early_stopping_criteria = list(
-    early_stopping_criteria
-) if early_stopping_criteria is not None else None
+# early_stopping_criteria = list(
+#     early_stopping_criteria
+# ) if early_stopping_criteria is not None else None
dataloaders = get_icl_task_dataloader(
icl_cfg.icl_task_type,
icl_cfg.dataset_uri,
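
This hunk comments out the explicit coercion of early_stopping_criteria to a Python list. A likely reason, given the companion change in scripts/eval/eval.py below, is that the ICL task config is now popped with convert=True and so arrives as plain Python containers, but that is an inference from this diff rather than something stated in it. A minimal sketch of the conversion being removed, assuming the value is an OmegaConf ListConfig or None:

# Minimal sketch, not the repository's code: coerce an optional OmegaConf
# list value to a plain Python list, mirroring the expression commented out above.
from typing import List, Optional

from omegaconf import OmegaConf


def as_plain_list(value) -> Optional[List[str]]:
    """Return None when the value is absent, otherwise a plain list copy."""
    return list(value) if value is not None else None


stop_strings = OmegaConf.create(["\n\n", "Question:"])  # a ListConfig; values are illustrative
print(as_plain_list(stop_strings))  # ['\n\n', 'Question:']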
3 changes: 2 additions & 1 deletion scripts/eval/eval.py
@@ -268,7 +268,8 @@ def main(cfg: DictConfig) -> Tuple[List[Trainer], pd.DataFrame]:
# Mandatory Evaluation Parameters
icl_tasks: Union[str, ListConfig] = pop_config(cfg,
'icl_tasks',
-must_exist=True)
+must_exist=True,
+convert=True)
max_seq_len: int = pop_config(cfg, 'max_seq_len', must_exist=True)
device_eval_batch_size: int = pop_config(cfg,
'device_eval_batch_size',
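
The only functional change here is the added convert=True when popping icl_tasks. The exact behavior of llm-foundry's pop_config is not shown in this diff, so the following is a hedged sketch of what a pop-with-convert helper typically does, assuming it delegates to OmegaConf.to_container:

# Hedged sketch of a pop-with-convert helper. This is an assumption about what
# pop_config(cfg, key, must_exist=True, convert=True) does, not the repository's
# actual implementation.
from typing import Any

from omegaconf import DictConfig, OmegaConf


def pop_config_sketch(cfg: DictConfig,
                      key: str,
                      must_exist: bool = True,
                      convert: bool = False) -> Any:
    if key not in cfg:
        if must_exist:
            raise NameError(f'Config key `{key}` must be set.')
        return None
    value = cfg.pop(key)
    if convert and OmegaConf.is_config(value):
        # Turn DictConfig/ListConfig nodes into plain dicts/lists so downstream
        # code never has to special-case OmegaConf container types.
        value = OmegaConf.to_container(value, resolve=True)
    return value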
4 changes: 2 additions & 2 deletions scripts/eval/yamls/hf_eval.yaml
@@ -43,5 +43,5 @@ device_eval_batch_size: 4
# forward_prefetch: True
# limit_all_gathers: True

-icl_tasks: 'eval/yamls/tasks_v0.3.yaml'
-eval_gauntlet: 'eval/yamls/eval_gauntlet_v0.3.yaml'
+icl_tasks: "eval/yamls/tasks_v0.3.yaml"
+eval_gauntlet: "eval/yamls/eval_gauntlet_v0.3.yaml"
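
For plain path strings like these, single and double quotes parse to the same value, so this is a style-only cleanup consistent with the commit's pre-commit fix. The quoting style does matter for the delimiter strings in tasks_v0.3.yaml below, because YAML only interprets backslash escapes such as \n inside double-quoted scalars. A quick standalone check (standard YAML behavior, not specific to this repository):

# Double quotes interpret backslash escapes; single quotes keep them literal.
import yaml

doc = r'''
double: "\n\nA:"
single: '\n\nA:'
'''
parsed = yaml.safe_load(doc)
print(repr(parsed["double"]))  # '\n\nA:'     -> real newlines
print(repr(parsed["single"]))  # '\\n\\nA:'   -> a literal backslash-n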
28 changes: 14 additions & 14 deletions scripts/eval/yamls/tasks_v0.3.yaml
@@ -1,7 +1,7 @@
icl_tasks:
-
label: human_eval
-dataset_uri: eval/local_data/programming/human_eval.jsonl # ADD YOUR OWN DATASET URI
+dataset_uri: eval/local_data/programming/human_eval.jsonl
num_fewshot: [0]
pass_at_k: 1
num_beams: 5
@@ -12,7 +12,7 @@ icl_tasks:
dataset_uri: eval/local_data/symbolic_problem_solving/gsm8k_prepended_8shot.jsonl
num_fewshot: [0]
icl_task_type: question_answering
-cot_delimiter: 'The answer is '
+cot_delimiter: "The answer is "
continuation_delimiter: "\n\nA:"
question_prelimiter: ""
do_normalization: false
@@ -21,15 +21,15 @@ icl_tasks:
- "Question:"
-
label: human_eval_cpp
-dataset_uri: eval/local_data/programming/processed_human_eval_cpp.jsonl # ADD YOUR OWN DATASET URI
+dataset_uri: eval/local_data/programming/processed_human_eval_cpp.jsonl
num_fewshot: [0]
pass_at_k: 1
num_beams: 5
batch_size: 1
icl_task_type: code_evaluation
-
label: human_eval_js
-dataset_uri: eval/local_data/programming/processed_human_eval_js.jsonl # ADD YOUR OWN DATASET URI
+dataset_uri: eval/local_data/programming/processed_human_eval_js.jsonl
num_fewshot: [0]
pass_at_k: 1
num_beams: 5
@@ -46,7 +46,7 @@ icl_tasks:
dataset_uri: eval/local_data/symbolic_problem_solving/math.jsonl
num_fewshot: [4]
icl_task_type: question_answering
-cot_delimiter: 'The answer is '
+cot_delimiter: "The answer is "
continuation_delimiter: "\n\nA:"
question_prelimiter: "Question: "
do_normalization: false
@@ -58,7 +58,7 @@ icl_tasks:
dataset_uri: eval/local_data/symbolic_problem_solving/agi_eval_sat_math.jsonl
num_fewshot: [3]
icl_task_type: question_answering
-cot_delimiter: 'The answer is '
+cot_delimiter: "The answer is "
continuation_delimiter: "\n\nA:"
question_prelimiter: "Question: "
do_normalization: false
@@ -70,7 +70,7 @@ icl_tasks:
dataset_uri: eval/local_data/symbolic_problem_solving/aqua.jsonl
num_fewshot: [3]
icl_task_type: question_answering
-cot_delimiter: 'The answer is '
+cot_delimiter: "The answer is "
continuation_delimiter: "\n\nA:"
question_prelimiter: "Question: "
do_normalization: false
@@ -82,7 +82,7 @@ icl_tasks:
dataset_uri: eval/local_data/symbolic_problem_solving/svamp.jsonl
num_fewshot: [5]
icl_task_type: question_answering
-cot_delimiter: 'The answer is '
+cot_delimiter: "The answer is "
continuation_delimiter: "\n\nA:"
question_prelimiter: "Question: "
do_normalization: false
@@ -94,7 +94,7 @@ icl_tasks:
dataset_uri: eval/local_data/world_knowledge/jeopardy_all.jsonl
num_fewshot: [3]
icl_task_type: language_modeling
-continuation_delimiter: "\nAnswer: " # this separates questions from answers
+continuation_delimiter: "\nAnswer: "
has_categories: true
-
label: bigbench_qa_wikidata
@@ -106,19 +106,19 @@ icl_tasks:
dataset_uri: eval/local_data/world_knowledge/arc_easy.jsonl
num_fewshot: [3]
icl_task_type: multiple_choice
-continuation_delimiter: "\nAnswer: " # this separates questions from answers
+continuation_delimiter: "\nAnswer: "
-
label: arc_challenge
dataset_uri: eval/local_data/world_knowledge/arc_challenge.jsonl
num_fewshot: [3, 25]
icl_task_type: multiple_choice
-continuation_delimiter: "\nAnswer: " # this separates questions from answers
+continuation_delimiter: "\nAnswer: "
-
label: mmlu
dataset_uri: eval/local_data/world_knowledge/mmlu.jsonl
num_fewshot: [5]
icl_task_type: multiple_choice
-continuation_delimiter: "\nAnswer: " # this separates questions from answers
+continuation_delimiter: "\nAnswer: "
has_categories: true
-
label: copa
@@ -140,7 +140,7 @@ icl_tasks:
dataset_uri: eval/local_data/commonsense_reasoning/piqa.jsonl
num_fewshot: [0]
icl_task_type: multiple_choice
-continuation_delimiter: "\nAnswer: " # this separates questions from answers
+continuation_delimiter: "\nAnswer: "
-
label: openbook_qa
dataset_uri: eval/local_data/commonsense_reasoning/openbook_qa.jsonl
@@ -241,7 +241,7 @@ icl_tasks:
dataset_uri: eval/local_data/reading_comprehension/boolq.jsonl
num_fewshot: [0]
icl_task_type: multiple_choice
-continuation_delimiter: "\nAnswer: " # this separates questions from answers
+continuation_delimiter: "\nAnswer: "
-
label: agi_eval_sat_en
dataset_uri: eval/local_data/reading_comprehension/agi_eval_sat_en.jsonl
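
Several question-answering tasks above set cot_delimiter: "The answer is ". Below is an illustrative sketch of how such a delimiter is commonly used, keeping only the text after its last occurrence as the model's final answer; the real parsing lives in the evaluation harness, not in this YAML:

# Illustrative only; not the harness's implementation.
def extract_final_answer(generation: str,
                         cot_delimiter: str = "The answer is ") -> str:
    if cot_delimiter and cot_delimiter in generation:
        # Keep what follows the last occurrence of the delimiter.
        return generation.rsplit(cot_delimiter, 1)[-1].strip()
    return generation.strip()


sample = "12 - 5 = 7, and 7 + 2 = 9. The answer is 9"
print(extract_final_answer(sample))  # 9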
