Fix .to() method for all attention biases (fairinternal/xformers#1278) #628

Workflow file for this run

	name: wheels

	on:
	pull_request:
	paths:
	- ".github/compute_wheel_version.py"
	- ".github/workflows/wheel*"
	- ".github/actions/setup-build-cuda/action.yml"
	- "setup.py"
	- "requirements*.txt"
	push:
	branches:
	- main
	tags:
	- "v[0-9]+*"

	jobs:
	target_determinator:
	runs-on: ubuntu-latest
	outputs:
	matrix: ${{ steps.set-matrix.outputs.matrix }}
	steps:
	- id: set-matrix
	shell: python
	run: \|
	import os
	import json
	import itertools
	environ = os.environ

	PY_VERSIONS = ['3.9', '3.10', '3.11', '3.12']
	# NOTE: Don't forget to update `upload_pt`'s matrix
	# when changing the CUDA/ROCM versions below!
	CU_VERSIONS = ['118', '121', '124']
	ROCM_VERSIONS = ["6.1"] # <- 6.0 broken in `manylinux_2_28`
	PY_CU = list(itertools.product(PY_VERSIONS, CU_VERSIONS))
	PY_ROCM = list(itertools.product(PY_VERSIONS, ROCM_VERSIONS))
	print("Full matrix PY_CU", PY_CU)
	if os.environ["GITHUB_EVENT_NAME"] == "pull_request":
	print("pull-request: limiting matrix to save resources")
	PY_CU = [(PY_VERSIONS[0], CU_VERSIONS[0])]
	for cu in CU_VERSIONS[1:]:
	PY_CU.append((PY_VERSIONS[-1], cu))
	print("Limited matrix PY_CU", PY_CU)
	PY_ROCM = [(PY_VERSIONS[-1], ROCM_VERSIONS[-1])]

	include = []
	for os in ['8-core-ubuntu', 'windows-8-core']:
	for torch_version in ['2.5.1']:
	# CUDA builds
	for python, cuda_short_version in PY_CU:
	if cuda_short_version != "124" and "windows" in os:
	print("Windows builder no longer compatible with cu<124")
	continue
	include.append(dict(
	os=os,
	python=python,
	torch_version=torch_version,
	toolkit_type="cuda",
	toolkit_short_version=cuda_short_version,
	))
	print(include[-1])
	# ROCM builds
	for python, rocm_short_version in PY_ROCM:
	if os == 'windows-8-core':
	continue
	include.append(dict(
	os="16-core-ubuntu", # use for ROCm wheels only to avoid CI timeouts
	python=python,
	torch_version=torch_version,
	toolkit_type="rocm",
	toolkit_short_version=rocm_short_version,
	))
	print(include[-1])
	matrix = {'include': include}
	print(json.dumps(matrix))
	with open(environ["GITHUB_OUTPUT"], "a") as fd:
	fd.write("matrix="+json.dumps(matrix))
	build:
	needs: target_determinator
	strategy:
	fail-fast: false
	matrix: ${{ fromJson(needs.target_determinator.outputs.matrix) }}

	uses: ./.github/workflows/wheels_build.yml
	if: github.repository == 'facebookresearch/xformers' \|\| github.event_name == 'pull_request'
	with:
	os: ${{ matrix.os }}
	python: ${{ matrix.python }}
	torch_version: ${{ matrix.torch_version }}
	toolkit_type: ${{ matrix.toolkit_type }}
	toolkit_short_version: ${{ matrix.toolkit_short_version }}

	upload_pip:
	needs: build
	uses: ./.github/workflows/wheels_upload_pip.yml
	with:
	twine_username: __token__
	filter: "torch2.5.1+cu121"
	execute: ${{ github.repository == 'facebookresearch/xformers' && github.event_name != 'pull_request' }}
	secrets:
	twine_password: ${{ secrets.PYPI_TOKEN }}

	upload_pt:
	needs: build
	strategy:
	fail-fast: false
	matrix:
	suffix:
	- cu118
	- cu121
	- cu124
	- rocm6.1
	uses: ./.github/workflows/wheels_upload_s3.yml
	with:
	aws_role: "arn:aws:iam::749337293305:role/pytorch_bot_uploader_role"
	s3_path: s3://pytorch/whl/${{ matrix.suffix }}/
	aws_s3_cp_extra_args: --acl public-read
	filter: "torch2.5.1+${{ matrix.suffix }}"
	execute: ${{ github.repository == 'facebookresearch/xformers' && github.ref_type == 'tag' }}

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Fix .to() method for all attention biases (fairinternal/xformers#1278) #628

Workflow file

Fix .to() method for all attention biases (fairinternal/xformers#1278) #628

Jobs

Run details

Workflow file for this run