* upgrade dependencies * don't use reset sessions * downgrade transformers, upgrade other deps * upgrade bnb to 0.49.0 * restore s3 cache * explicit use local files w hub * decompress and strip top level dir * use 2 levels for strip components * try to preserve permissions for symlinks * use updated tar * fix #3293 for distributed * downgrade bnb * fast fail after 4 * fix total tokens device * patch accelerate CP/SP (#3309) --------- Co-authored-by: salman <salman.mohammadi@outlook.com>
26 lines
852 B
Bash
Executable File
26 lines
852 B
Bash
Executable File
#!/bin/bash
#
# Runs the multi-GPU end-to-end test suites under pytest in three passes
# (general, solo, patched), accumulating coverage for the `axolotl` package
# across the passes, and finally uploads the XML coverage report to Codecov
# when a token is provided.
#
# Environment:
#   CODECOV_TOKEN    - if non-empty, the coverage report is uploaded.
#   PYTORCH_VERSION  - appended to the `pytorch-` Codecov flag.

# Abort on the first failing command, so a failed pytest pass stops the
# script before the later passes and the upload step.
set -e

# Only run two tests at a time to avoid OOM on GPU (with coverage collection).
# The solo and patched directories are excluded here because they get their
# own passes below; --maxfail=4 stops this pass after four failures.
pytest -v --durations=10 -n2 --maxfail=4 \
  --ignore=/workspace/axolotl/tests/e2e/multigpu/solo/ \
  --ignore=/workspace/axolotl/tests/e2e/multigpu/patched/ \
  /workspace/axolotl/tests/e2e/multigpu/ \
  --cov=axolotl

# Run solo tests one at a time, appending to the coverage data collected above.
pytest -v --durations=10 -n1 \
  /workspace/axolotl/tests/e2e/multigpu/solo/ \
  --cov=axolotl \
  --cov-append

# Run patched tests one at a time, appending coverage again; as the last pass,
# this one also writes the combined report to multigpu-coverage.xml.
pytest -v --durations=10 -n1 /workspace/axolotl/tests/e2e/multigpu/patched/ \
  --cov=axolotl \
  --cov-append \
  --cov-report=xml:multigpu-coverage.xml

# Upload coverage to Codecov if CODECOV_TOKEN is available.
if [[ -n "${CODECOV_TOKEN}" ]]; then
  # Best-effort: `|| true` keeps an upload failure from failing the test job.
  codecov upload-process -t "${CODECOV_TOKEN}" -f multigpu-coverage.xml \
    -F "multigpu,docker-tests,pytorch-${PYTORCH_VERSION}" || true
fi