From 67b98886306aba93232cb8766f95126566c23a9d Mon Sep 17 00:00:00 2001 From: NanoCode012 Date: Sat, 23 Sep 2023 13:11:27 +0900 Subject: [PATCH] Feat(doc): Add eval_sample_packing to doc (#625) --- README.md | 2 ++ 1 file changed, 2 insertions(+) diff --git a/README.md b/README.md index 6e91158934..6ec81eed3c 100644 --- a/README.md +++ b/README.md @@ -493,6 +493,8 @@ pad_to_sequence_len: max_packed_sequence_len: 1024 # use efficient multi-packing with block diagonal attention and per sequence position_ids. Recommend set to 'true' sample_packing: +# set to 'false' if you get errors during evaluation while sample_packing is enabled. +eval_sample_packing: # you can set these packing optimizations AFTER starting a training at least once. # The trainer will provide recommended values for these values. sample_packing_eff_est: