Compare commits
2 Commits
fix/merge-
...
fix/diffus
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
08c8f3f22f | ||
|
|
76f0fe2621 |
@@ -30,7 +30,7 @@ eval_sample_packing: true
|
||||
gradient_accumulation_steps: 4
|
||||
micro_batch_size: 4
|
||||
num_epochs: 1
|
||||
warmup_steps: 0.1
|
||||
warmup_ratio: 0.1
|
||||
|
||||
optimizer: adamw_8bit
|
||||
lr_scheduler: cosine
|
||||
@@ -44,7 +44,7 @@ resume_from_checkpoint:
|
||||
sdp_attention: true
|
||||
|
||||
logging_steps: 1
|
||||
save_strategy: best
|
||||
save_strategy: epoch
|
||||
eval_strategy: epoch
|
||||
|
||||
special_tokens:
|
||||
|
||||
@@ -631,7 +631,9 @@ class AxolotlTrainer(
|
||||
logs["tokens_per_second_per_gpu"] = round(
|
||||
self.state.last_tokens_per_second.item() / self.args.logging_steps, 2
|
||||
)
|
||||
logs["total_tokens"] = int(self.state.total_tokens.item())
|
||||
|
||||
if hasattr(self.state, "total_tokens"):
|
||||
logs["total_tokens"] = int(self.state.total_tokens.item())
|
||||
|
||||
del self._stored_metrics[train_eval]
|
||||
|
||||
|
||||
Reference in New Issue
Block a user