Merge pull request #178 from PocketDocLabs/main

Update README.md to reflect current gradient checkpointing support
Author: NanoCode012 · Date: 2023-06-10 08:26:48 +09:00 · Committed by: GitHub


@@ -387,7 +387,7 @@ train_on_inputs: false
 # don't use this, leads to wonky training (according to someone on the internet)
 group_by_length: false
-# does not work with current implementation of 4-bit LoRA
+# Whether to use gradient checkpointing https://huggingface.co/docs/transformers/v4.18.0/en/performance#gradient-checkpointing
 gradient_checkpointing: false
 # stop training after this many evaluation losses have increased in a row
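For context, the Transformers docs linked in the new comment describe gradient checkpointing as trading extra forward-pass compute for lower activation memory. A minimal, illustrative Python sketch of enabling it directly on a Transformers model (the model name is a placeholder and not part of this commit):

from transformers import AutoModelForCausalLM

# Placeholder model, for illustration only.
model = AutoModelForCausalLM.from_pretrained("gpt2")

# Recompute activations during the backward pass instead of caching them,
# reducing activation memory at the cost of extra forward compute.
model.gradient_checkpointing_enable()

In a Trainer-driven setup the same behavior can be requested via TrainingArguments(gradient_checkpointing=True), which is what a config flag like the one in this diff would typically map to.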