Resolve merge conflicts: unify pretraining utils imports, add alias handling; fix rl.py per new RL dataset API; resolve config schema conflict and add sequence_len_overflow_handling field

2025-08-12 20:45:26 +02:00
parent f5a3e3529e 3d45620008
commit 47b3fe8af3
603 changed files with 37614 additions and 14002 deletions
--- a/examples/orpheus/finetune.yml
+++ b/examples/orpheus/finetune.yml
@@ -18,7 +18,7 @@ output_dir: ./outputs/out

 sequence_len: 8192
 sample_packing: true
-pad_to_sequence_len: true
+

 wandb_project:
 wandb_entity:
@@ -43,10 +43,12 @@ resume_from_checkpoint:
 logging_steps: 1
 flash_attention: true

-warmup_steps: 20
+warmup_ratio: 0.1
 evals_per_epoch: 5
 saves_per_epoch: 5
 weight_decay: 0.05

 special_tokens:
  pad_token: <custom_token_7>
+
+# save_first_step: true  # uncomment this to validate checkpoint saving works with your config