Fix: shorten memory logs to 2 decimal places and rename N-D docs (#3011) [skip ci]

* fix: shorten memory logs

* fix: title name
This commit is contained in:
NanoCode012
2025-08-04 21:23:36 +07:00
committed by GitHub
parent 5691992d34
commit a54c1be972
2 changed files with 7 additions and 5 deletions

View File

@@ -1,4 +1,6 @@
# N-D Parallelism
---
title: "N-D Parallelism"
---
Axolotl enables training models at scale by composing different parallelism techniques. This is essential when:

View File

@@ -567,10 +567,10 @@ class AxolotlTrainer(
# Add memory usage
try:
active, allocated, reserved = get_gpu_memory_usage()
logs["memory/max_memory_active"] = active
logs["memory/max_memory_allocated"] = allocated
logs["memory/device_memory_reserved"] = reserved
except (ValueError, FileNotFoundError):
logs["memory/max_memory_active(gib)"] = round(active, 2)
logs["memory/max_memory_allocated(gib)"] = round(allocated, 2)
logs["memory/device_memory_reserved(gib)"] = round(reserved, 2)
except (ValueError, TypeError, FileNotFoundError):
pass
del self._stored_metrics[train_eval]