Feat(doc): Add eval_sample_packing to doc (#625)
Browse files
README.md
CHANGED
|
@@ -493,6 +493,8 @@ pad_to_sequence_len:
|
|
| 493 |
max_packed_sequence_len: 1024
|
| 494 |
# Use efficient multi-packing with block diagonal attention and per-sequence position_ids. Recommended to set to 'true'.
|
| 495 |
sample_packing:
|
|
|
|
|
|
|
| 496 |
# You can set these packing optimizations AFTER starting a training run at least once.
|
| 497 |
# The trainer will provide recommended values for these settings.
|
| 498 |
sample_packing_eff_est:
|
|
|
|
| 493 |
max_packed_sequence_len: 1024
|
| 494 |
# Use efficient multi-packing with block diagonal attention and per-sequence position_ids. Recommended to set to 'true'.
|
| 495 |
sample_packing:
|
| 496 |
+
# Set to 'false' if you get errors during eval with sample_packing on.
|
| 497 |
+
eval_sample_packing:
|
| 498 |
# You can set these packing optimizations AFTER starting a training run at least once.
|
| 499 |
# The trainer will provide recommended values for these settings.
|
| 500 |
sample_packing_eff_est:
|