Compare commits
6 Commits
moekernels
...
ec94d632f3
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
ec94d632f3 | ||
|
|
e8bd3b0b3b | ||
|
|
5a08b94668 | ||
|
|
ecb8c1f4b3 | ||
|
|
ab57be6526 | ||
|
|
c9640bca2c |
2
.github/workflows/preview-docs.yml
vendored
2
.github/workflows/preview-docs.yml
vendored
@@ -10,7 +10,7 @@ on:
|
|||||||
- '**/*.qmd' # any Quarto file
|
- '**/*.qmd' # any Quarto file
|
||||||
- '_quarto.yml'
|
- '_quarto.yml'
|
||||||
- docs/scripts/generate_config_docs.py
|
- docs/scripts/generate_config_docs.py
|
||||||
- src/axolotl/utils/schemas/**.py
|
- src/axolotl/**/*.py
|
||||||
|
|
||||||
permissions:
|
permissions:
|
||||||
checks: write
|
checks: write
|
||||||
|
|||||||
10
TODO.md
10
TODO.md
@@ -1,10 +0,0 @@
|
|||||||
# todo list
|
|
||||||
|
|
||||||
- [] Validation of parameters for combinations that won't work
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
## things that are known not to work
|
|
||||||
|
|
||||||
- FSDP offload and gradient_checkpointing - https://github.com/pytorch/pytorch/issues/82203
|
|
||||||
- adamw_bnb_8bit doesn't play well with FSDP offload
|
|
||||||
@@ -74,7 +74,9 @@ def generate_config_files(config: str, sweep: str | None) -> Iterator[tuple[str,
|
|||||||
sweep: Sweep configuration file
|
sweep: Sweep configuration file
|
||||||
|
|
||||||
Yields:
|
Yields:
|
||||||
Tuple of configuration file name and whether this is a group of configurations
|
tuple[str, bool]: (config_file, is_group)
|
||||||
|
- config_file: configuration file path
|
||||||
|
- is_group: whether this is a group of configurations
|
||||||
"""
|
"""
|
||||||
|
|
||||||
if not sweep:
|
if not sweep:
|
||||||
|
|||||||
Reference in New Issue
Block a user