* support for mamba * more mamba fixes * use fork for mamba kwargs fix * grad checkpointing doesn't work * fix extras for mamaba * mamba loss fix * use fp32 and remove verbose logging * mamba fixes * fix collator for mamba * set model_type on training_args * don't save safetensors for mamba * update mamba config to disable safetensor checkpooints, install for tests * no evals for mamba tests * handle save_pretrained * handle unused safetensors arg
59 lines
1.8 KiB
Python
59 lines
1.8 KiB
Python
"""setup.py for axolotl"""
|
|
|
|
from setuptools import find_packages, setup
|
|
|
|
|
|
def parse_requirements():
|
|
_install_requires = []
|
|
_dependency_links = []
|
|
with open("./requirements.txt", encoding="utf-8") as requirements_file:
|
|
lines = [r.strip() for r in requirements_file.readlines()]
|
|
for line in lines:
|
|
if line.startswith("--extra-index-url"):
|
|
# Handle custom index URLs
|
|
_, url = line.split()
|
|
_dependency_links.append(url)
|
|
elif (
|
|
"flash-attn" not in line
|
|
and "deepspeed" not in line
|
|
and line
|
|
and line[0] != "#"
|
|
):
|
|
# Handle standard packages
|
|
_install_requires.append(line)
|
|
|
|
# TODO(wing) remove once xformers release supports torch 2.1.0
|
|
if "torch==2.1.0" in _install_requires:
|
|
_install_requires.pop(_install_requires.index("xformers>=0.0.22"))
|
|
_install_requires.append(
|
|
"xformers @ git+https://github.com/facebookresearch/xformers.git@main"
|
|
)
|
|
|
|
return _install_requires, _dependency_links
|
|
|
|
|
|
install_requires, dependency_links = parse_requirements()
|
|
|
|
|
|
setup(
|
|
name="axolotl",
|
|
version="0.3.0",
|
|
description="LLM Trainer",
|
|
long_description="Axolotl is a tool designed to streamline the fine-tuning of various AI models, offering support for multiple configurations and architectures.",
|
|
package_dir={"": "src"},
|
|
packages=find_packages(),
|
|
install_requires=install_requires,
|
|
dependency_links=dependency_links,
|
|
extras_require={
|
|
"flash-attn": [
|
|
"flash-attn==2.3.3",
|
|
],
|
|
"deepspeed": [
|
|
"deepspeed",
|
|
],
|
|
"mamba-ssm": [
|
|
"mamba-ssm==1.0.1",
|
|
],
|
|
},
|
|
)
|