various bugfixes

This commit is contained in:
Wing Lian
2023-04-14 21:37:07 -04:00
parent 45f77dd51e
commit 80b2ed29d8
5 changed files with 33 additions and 26 deletions

View File

@@ -1,4 +1,4 @@
-base_model: decapoda-research/llama-65b-hf
+base_model: huggyllama/llama-7b
model_type: LlamaForCausalLM
tokenizer_type: LlamaTokenizer
load_in_8bit: true
@@ -33,8 +33,8 @@ num_epochs: 5
learning_rate: 0.00003
train_on_inputs: false
group_by_length: false
-bf16: True
-tf32: True
+bf16: true
+tf32: true
resume_from_checkpoint:
local_rank:
deepspeed: