[bitsandbytes] Simplify bnb int8 dequant #27909
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
name: Fast tests for PRs | |
on: | |
pull_request: | |
branches: | |
- main | |
paths: | |
- "src/diffusers/**.py" | |
- "benchmarks/**.py" | |
- "examples/**.py" | |
- "scripts/**.py" | |
- "tests/**.py" | |
- ".github/**.yml" | |
- "utils/**.py" | |
push: | |
branches: | |
- ci-* | |
concurrency: | |
group: ${{ github.workflow }}-${{ github.head_ref || github.run_id }} | |
cancel-in-progress: true | |
env: | |
DIFFUSERS_IS_CI: yes | |
HF_HUB_ENABLE_HF_TRANSFER: 1 | |
OMP_NUM_THREADS: 4 | |
MKL_NUM_THREADS: 4 | |
PYTEST_TIMEOUT: 60 | |
jobs: | |
check_code_quality: | |
runs-on: ubuntu-22.04 | |
steps: | |
- uses: actions/checkout@v3 | |
- name: Set up Python | |
uses: actions/setup-python@v4 | |
with: | |
python-version: "3.8" | |
- name: Install dependencies | |
run: | | |
python -m pip install --upgrade pip | |
pip install .[quality] | |
- name: Check quality | |
run: make quality | |
- name: Check if failure | |
if: ${{ failure() }} | |
run: | | |
echo "Quality check failed. Please ensure the right dependency versions are installed with 'pip install -e .[quality]' and run 'make style && make quality'" >> $GITHUB_STEP_SUMMARY | |
check_repository_consistency: | |
needs: check_code_quality | |
runs-on: ubuntu-22.04 | |
steps: | |
- uses: actions/checkout@v3 | |
- name: Set up Python | |
uses: actions/setup-python@v4 | |
with: | |
python-version: "3.8" | |
- name: Install dependencies | |
run: | | |
python -m pip install --upgrade pip | |
pip install .[quality] | |
- name: Check repo consistency | |
run: | | |
python utils/check_copies.py | |
python utils/check_dummies.py | |
make deps_table_check_updated | |
- name: Check if failure | |
if: ${{ failure() }} | |
run: | | |
echo "Repo consistency check failed. Please ensure the right dependency versions are installed with 'pip install -e .[quality]' and run 'make fix-copies'" >> $GITHUB_STEP_SUMMARY | |
run_fast_tests: | |
needs: [check_code_quality, check_repository_consistency] | |
strategy: | |
fail-fast: false | |
matrix: | |
config: | |
- name: Fast PyTorch Pipeline CPU tests | |
framework: pytorch_pipelines | |
runner: aws-highmemory-32-plus | |
image: diffusers/diffusers-pytorch-cpu | |
report: torch_cpu_pipelines | |
- name: Fast PyTorch Models & Schedulers CPU tests | |
framework: pytorch_models | |
runner: aws-general-8-plus | |
image: diffusers/diffusers-pytorch-cpu | |
report: torch_cpu_models_schedulers | |
- name: Fast Flax CPU tests | |
framework: flax | |
runner: aws-general-8-plus | |
image: diffusers/diffusers-flax-cpu | |
report: flax_cpu | |
- name: PyTorch Example CPU tests | |
framework: pytorch_examples | |
runner: aws-general-8-plus | |
image: diffusers/diffusers-pytorch-cpu | |
report: torch_example_cpu | |
name: ${{ matrix.config.name }} | |
runs-on: | |
group: ${{ matrix.config.runner }} | |
container: | |
image: ${{ matrix.config.image }} | |
options: --shm-size "16gb" --ipc host -v /mnt/hf_cache:/mnt/cache/ | |
defaults: | |
run: | |
shell: bash | |
steps: | |
- name: Checkout diffusers | |
uses: actions/checkout@v3 | |
with: | |
fetch-depth: 2 | |
- name: Install dependencies | |
run: | | |
python -m venv /opt/venv && export PATH="/opt/venv/bin:$PATH" | |
python -m uv pip install -e [quality,test] | |
python -m uv pip install accelerate | |
- name: Environment | |
run: | | |
python -m venv /opt/venv && export PATH="/opt/venv/bin:$PATH" | |
python utils/print_env.py | |
- name: Run fast PyTorch Pipeline CPU tests | |
if: ${{ matrix.config.framework == 'pytorch_pipelines' }} | |
run: | | |
python -m venv /opt/venv && export PATH="/opt/venv/bin:$PATH" | |
python -m pytest -n 8 --max-worker-restart=0 --dist=loadfile \ | |
-s -v -k "not Flax and not Onnx" \ | |
--make-reports=tests_${{ matrix.config.report }} \ | |
tests/pipelines | |
- name: Run fast PyTorch Model Scheduler CPU tests | |
if: ${{ matrix.config.framework == 'pytorch_models' }} | |
run: | | |
python -m venv /opt/venv && export PATH="/opt/venv/bin:$PATH" | |
python -m pytest -n 4 --max-worker-restart=0 --dist=loadfile \ | |
-s -v -k "not Flax and not Onnx and not Dependency" \ | |
--make-reports=tests_${{ matrix.config.report }} \ | |
tests/models tests/schedulers tests/others | |
- name: Run fast Flax TPU tests | |
if: ${{ matrix.config.framework == 'flax' }} | |
run: | | |
python -m venv /opt/venv && export PATH="/opt/venv/bin:$PATH" | |
python -m pytest -n 4 --max-worker-restart=0 --dist=loadfile \ | |
-s -v -k "Flax" \ | |
--make-reports=tests_${{ matrix.config.report }} \ | |
tests | |
- name: Run example PyTorch CPU tests | |
if: ${{ matrix.config.framework == 'pytorch_examples' }} | |
run: | | |
python -m venv /opt/venv && export PATH="/opt/venv/bin:$PATH" | |
python -m uv pip install peft timm | |
python -m pytest -n 4 --max-worker-restart=0 --dist=loadfile \ | |
--make-reports=tests_${{ matrix.config.report }} \ | |
examples | |
- name: Failure short reports | |
if: ${{ failure() }} | |
run: cat reports/tests_${{ matrix.config.report }}_failures_short.txt | |
- name: Test suite reports artifacts | |
if: ${{ always() }} | |
uses: actions/upload-artifact@v4 | |
with: | |
name: pr_${{ matrix.config.framework }}_${{ matrix.config.report }}_test_reports | |
path: reports | |
run_staging_tests: | |
needs: [check_code_quality, check_repository_consistency] | |
strategy: | |
fail-fast: false | |
matrix: | |
config: | |
- name: Hub tests for models, schedulers, and pipelines | |
framework: hub_tests_pytorch | |
runner: | |
group: aws-general-8-plus | |
image: diffusers/diffusers-pytorch-cpu | |
report: torch_hub | |
name: ${{ matrix.config.name }} | |
runs-on: ${{ matrix.config.runner }} | |
container: | |
image: ${{ matrix.config.image }} | |
options: --shm-size "16gb" --ipc host -v /mnt/hf_cache:/mnt/cache/ | |
defaults: | |
run: | |
shell: bash | |
steps: | |
- name: Checkout diffusers | |
uses: actions/checkout@v3 | |
with: | |
fetch-depth: 2 | |
- name: Install dependencies | |
run: | | |
python -m venv /opt/venv && export PATH="/opt/venv/bin:$PATH" | |
python -m uv pip install -e [quality,test] | |
- name: Environment | |
run: | | |
python -m venv /opt/venv && export PATH="/opt/venv/bin:$PATH" | |
python utils/print_env.py | |
- name: Run Hub tests for models, schedulers, and pipelines on a staging env | |
if: ${{ matrix.config.framework == 'hub_tests_pytorch' }} | |
run: | | |
python -m venv /opt/venv && export PATH="/opt/venv/bin:$PATH" | |
HUGGINGFACE_CO_STAGING=true python -m pytest \ | |
-m "is_staging_test" \ | |
--make-reports=tests_${{ matrix.config.report }} \ | |
tests | |
- name: Failure short reports | |
if: ${{ failure() }} | |
run: cat reports/tests_${{ matrix.config.report }}_failures_short.txt | |
- name: Test suite reports artifacts | |
if: ${{ always() }} | |
uses: actions/upload-artifact@v4 | |
with: | |
name: pr_${{ matrix.config.report }}_test_reports | |
path: reports | |
run_lora_tests: | |
needs: [check_code_quality, check_repository_consistency] | |
strategy: | |
fail-fast: false | |
name: LoRA tests with PEFT main | |
runs-on: | |
group: aws-general-8-plus | |
container: | |
image: diffusers/diffusers-pytorch-cpu | |
options: --shm-size "16gb" --ipc host -v /mnt/hf_cache:/mnt/cache/ | |
defaults: | |
run: | |
shell: bash | |
steps: | |
- name: Checkout diffusers | |
uses: actions/checkout@v3 | |
with: | |
fetch-depth: 2 | |
- name: Install dependencies | |
run: | | |
python -m venv /opt/venv && export PATH="/opt/venv/bin:$PATH" | |
python -m uv pip install -e [quality,test] | |
# TODO (sayakpaul, DN6): revisit `--no-deps` | |
python -m pip install -U peft@git+https://github.com/huggingface/peft.git --no-deps | |
python -m uv pip install -U transformers@git+https://github.com/huggingface/transformers.git --no-deps | |
python -m uv pip install -U tokenizers | |
pip uninstall accelerate -y && python -m uv pip install -U accelerate@git+https://github.com/huggingface/accelerate.git --no-deps | |
- name: Environment | |
run: | | |
python -m venv /opt/venv && export PATH="/opt/venv/bin:$PATH" | |
python utils/print_env.py | |
- name: Run fast PyTorch LoRA tests with PEFT | |
run: | | |
python -m venv /opt/venv && export PATH="/opt/venv/bin:$PATH" | |
python -m pytest -n 4 --max-worker-restart=0 --dist=loadfile \ | |
-s -v \ | |
--make-reports=tests_peft_main \ | |
tests/lora/ | |
python -m pytest -n 4 --max-worker-restart=0 --dist=loadfile \ | |
-s -v \ | |
--make-reports=tests_models_lora_peft_main \ | |
tests/models/ -k "lora" | |
- name: Failure short reports | |
if: ${{ failure() }} | |
run: | | |
cat reports/tests_lora_failures_short.txt | |
cat reports/tests_models_lora_failures_short.txt | |
- name: Test suite reports artifacts | |
if: ${{ always() }} | |
uses: actions/upload-artifact@v4 | |
with: | |
name: pr_main_test_reports | |
path: reports | |