Add eval_batch_size for evaluation
This commit is contained in:
@@ -85,6 +85,7 @@ output_dir: ./completed-model
|
|||||||
# training hyperparameters
|
# training hyperparameters
|
||||||
batch_size: 8
|
batch_size: 8
|
||||||
micro_batch_size: 2
|
micro_batch_size: 2
|
||||||
|
eval_batch_size: 2
|
||||||
num_epochs: 3
|
num_epochs: 3
|
||||||
warmup_steps: 100
|
warmup_steps: 100
|
||||||
learning_rate: 0.00003
|
learning_rate: 0.00003
|
||||||
|
|||||||
@@ -47,6 +47,7 @@ def setup_trainer(cfg, train_dataset, eval_dataset, model, tokenizer):
|
|||||||
|
|
||||||
training_args = transformers.TrainingArguments(
|
training_args = transformers.TrainingArguments(
|
||||||
per_device_train_batch_size=cfg.micro_batch_size,
|
per_device_train_batch_size=cfg.micro_batch_size,
|
||||||
|
per_device_eval_batch_size=cfg.eval_batch_size,
|
||||||
gradient_accumulation_steps=cfg.gradient_accumulation_steps,
|
gradient_accumulation_steps=cfg.gradient_accumulation_steps,
|
||||||
num_train_epochs=cfg.num_epochs,
|
num_train_epochs=cfg.num_epochs,
|
||||||
learning_rate=cfg.learning_rate,
|
learning_rate=cfg.learning_rate,
|
||||||
|
|||||||
Reference in New Issue
Block a user