Feat(doc): Add eval_sample_packing to doc (#625)
Browse files
README.md
CHANGED
@@ -493,6 +493,8 @@ pad_to_sequence_len:
|
|
493 |
max_packed_sequence_len: 1024
|
494 |
# Use efficient multi-packing with block-diagonal attention and per-sequence position_ids. Recommended to set to 'true'.
|
495 |
sample_packing:
|
|
|
|
|
496 |
# You can set these packing optimizations AFTER starting a training run at least once.
|
497 |
# The trainer will provide recommended values for these settings.
|
498 |
sample_packing_eff_est:
|
|
|
493 |
max_packed_sequence_len: 1024
|
494 |
# Use efficient multi-packing with block-diagonal attention and per-sequence position_ids. Recommended to set to 'true'.
|
495 |
sample_packing:
|
496 |
+
# Set to 'false' if you get errors during eval with sample_packing on.
|
497 |
+
eval_sample_packing:
|
498 |
# You can set these packing optimizations AFTER starting a training run at least once.
|
499 |
# The trainer will provide recommended values for these settings.
|
500 |
sample_packing_eff_est:
|