don't resize embeddings to multiples of 32x by default

2023-07-22 01:52:38 -04:00
parent 1b63bf13bc
commit 1066751358
2 changed files with 8 additions and 1 deletions
--- a/README.md
+++ b/README.md
@@ -322,6 +322,9 @@ tokenizer_type: AutoTokenizer
 trust_remote_code:
 # use_fast option for tokenizer loading from_pretrained, default to True
 tokenizer_use_fast:
+# when new tokens are added, resize the model embeddings to a multiple of 32
+# this is reported to improve training speed on some models
+resize_token_embeddings_to_32x:

 # whether you are training a 4-bit GPTQ quantized model
 gptq: true