Basic evaluate CLI command / codepath (#2188)
* basic evaluate CLI command / codepath * tests for evaluate CLI command * fixes and cleanup * review comments; slightly DRYing up things --------- Co-authored-by: Dan Saunders <danjsaund@gmail.com>
This commit is contained in:
@@ -26,7 +26,7 @@ from axolotl.logging_config import configure_logging
|
|||||||
from axolotl.utils.dict import DictDefault
|
from axolotl.utils.dict import DictDefault
|
||||||
from axolotl.utils.freeze import freeze_layers_except
|
from axolotl.utils.freeze import freeze_layers_except
|
||||||
from axolotl.utils.models import load_model, load_processor, load_tokenizer
|
from axolotl.utils.models import load_model, load_processor, load_tokenizer
|
||||||
from axolotl.utils.trainer import setup_trainer
|
from axolotl.utils.trainer import set_pytorch_cuda_alloc_conf, setup_trainer
|
||||||
|
|
||||||
try:
|
try:
|
||||||
from optimum.bettertransformer import BetterTransformer
|
from optimum.bettertransformer import BetterTransformer
|
||||||
|
|||||||
@@ -512,6 +512,17 @@ def prepare_opinionated_env(cfg):
|
|||||||
os.environ["TOKENIZERS_PARALLELISM"] = "false"
|
os.environ["TOKENIZERS_PARALLELISM"] = "false"
|
||||||
|
|
||||||
|
|
||||||
|
def set_pytorch_cuda_alloc_conf():
|
||||||
|
"""Set up CUDA allocation config if using PyTorch >= 2.2"""
|
||||||
|
torch_version = torch.__version__.split(".")
|
||||||
|
torch_major, torch_minor = int(torch_version[0]), int(torch_version[1])
|
||||||
|
if torch_major == 2 and torch_minor >= 2:
|
||||||
|
if os.getenv("PYTORCH_CUDA_ALLOC_CONF") is None:
|
||||||
|
os.environ[
|
||||||
|
"PYTORCH_CUDA_ALLOC_CONF"
|
||||||
|
] = "expandable_segments:True,roundup_power2_divisions:16"
|
||||||
|
|
||||||
|
|
||||||
def setup_trainer(
|
def setup_trainer(
|
||||||
cfg, train_dataset, eval_dataset, model, tokenizer, processor, total_num_steps
|
cfg, train_dataset, eval_dataset, model, tokenizer, processor, total_num_steps
|
||||||
):
|
):
|
||||||
|
|||||||
Reference in New Issue
Block a user