OSS: Capture triton kernel in ET (#124775) #75148

Workflow file for this run

name: trunk
on:
  push:
    branches:
      - main
      - release/*
      - landchecks/*
    tags:
      - ciflow/trunk/*
  workflow_dispatch:
  schedule:
    - cron: 29 8 * * * # about 1:29am PDT
concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref_name }}-${{ github.ref_type == 'branch' && github.sha }}-${{ github.event_name == 'workflow_dispatch' }}-${{ github.event_name == 'schedule' }}
  cancel-in-progress: true
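# Illustrative reading of the concurrency key above: for a push to a branch such as main,
# the group resolves to something like "trunk-main-<sha>-false-false", so every commit gets
# its own group and branch pushes do not cancel each other. For a ciflow/trunk/* tag push,
# github.ref_type is 'tag', the sha term evaluates to false, and repeated pushes of the same
# tag share one group, so cancel-in-progress cancels the older run.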
permissions: read-all
jobs:
  llm-td:
    name: before-test
    uses: ./.github/workflows/llm_td_retrieval.yml
    permissions:
      id-token: write
      contents: read
  target-determination:
    name: before-test
    uses: ./.github/workflows/target_determination.yml
    needs: llm-td
    permissions:
      id-token: write
      contents: read
  # Build PyTorch with BUILD_CAFFE2=ON
  caffe2-linux-jammy-py3_8-gcc11-build:
    name: caffe2-linux-jammy-py3.8-gcc11
    uses: ./.github/workflows/_linux-build.yml
    with:
      build-environment: caffe2-linux-jammy-py3.8-gcc11
      docker-image-name: pytorch-linux-jammy-py3.8-gcc11
      test-matrix: |
        { include: [
          { config: "default", shard: 1, num_shards: 1 },
        ]}
  linux-focal-cuda12_1-py3_10-gcc9-build:
    name: linux-focal-cuda12.1-py3.10-gcc9
    uses: ./.github/workflows/_linux-build.yml
    with:
      build-environment: linux-focal-cuda12.1-py3.10-gcc9
      docker-image-name: pytorch-linux-focal-cuda12.1-cudnn8-py3-gcc9
      test-matrix: |
        { include: [
          { config: "nogpu_AVX512", shard: 1, num_shards: 1, runner: "linux.2xlarge" },
          { config: "nogpu_NO_AVX2", shard: 1, num_shards: 1, runner: "linux.2xlarge" },
          { config: "jit_legacy", shard: 1, num_shards: 1, runner: "linux.4xlarge.nvidia.gpu" },
        ]}
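  # Note: the matching *-test job below consumes this build job's outputs
  # (needs.linux-focal-cuda12_1-py3_10-gcc9-build.outputs.docker-image and .outputs.test-matrix),
  # so the shard layout declared in test-matrix here determines how the test run is split.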
  linux-focal-cuda12_1-py3_10-gcc9-test:
    name: linux-focal-cuda12.1-py3.10-gcc9
    uses: ./.github/workflows/_linux-test.yml
    needs:
      - linux-focal-cuda12_1-py3_10-gcc9-build
      - target-determination
    with:
      build-environment: linux-focal-cuda12.1-py3.10-gcc9
      docker-image: ${{ needs.linux-focal-cuda12_1-py3_10-gcc9-build.outputs.docker-image }}
      test-matrix: ${{ needs.linux-focal-cuda12_1-py3_10-gcc9-build.outputs.test-matrix }}
  libtorch-linux-focal-cuda12_1-py3_7-gcc9-debug-build:
    name: libtorch-linux-focal-cuda12.1-py3.7-gcc9-debug
    uses: ./.github/workflows/_linux-build.yml
    with:
      build-environment: libtorch-linux-focal-cuda12.1-py3.7-gcc9
      docker-image-name: pytorch-linux-focal-cuda12.1-cudnn8-py3-gcc9
      build-generates-artifacts: false
      runner: linux.4xlarge
      test-matrix: |
        { include: [
          { config: "default", shard: 1, num_shards: 1 },
        ]}
  # no-ops builds test USE_PER_OPERATOR_HEADERS=0 where ATen/ops is not generated
  linux-focal-cuda12_1-py3_10-gcc9-no-ops-build:
    name: linux-focal-cuda12.1-py3.10-gcc9-no-ops
    uses: ./.github/workflows/_linux-build.yml
    with:
      build-environment: linux-focal-cuda12.1-py3.10-gcc9-no-ops
      docker-image-name: pytorch-linux-focal-cuda12.1-cudnn8-py3-gcc9
      test-matrix: |
        { include: [
          { config: "default", shard: 1, num_shards: 1 },
        ]}
  pytorch-linux-focal-py3-clang9-android-ndk-r21e-build:
    name: pytorch-linux-focal-py3-clang9-android-ndk-r21e-build
    uses: ./.github/workflows/_android-full-build-test.yml
    with:
      build-environment: pytorch-linux-focal-py3-clang9-android-ndk-r21e-build
      docker-image-name: pytorch-linux-focal-py3-clang9-android-ndk-r21e
      test-matrix: |
        { include: [
          { config: "default", shard: 1, num_shards: 1, runner: "linux.2xlarge" },
        ]}
  macos-12-py3-arm64-build:
    name: macos-12-py3-arm64
    uses: ./.github/workflows/_mac-build.yml
    with:
      sync-tag: macos-12-py3-arm64-build
      build-environment: macos-12-py3-arm64
      runner-type: macos-m1-stable
      build-generates-artifacts: true
      # To match the one pre-installed in the m1 runners
      python-version: 3.9.12
      # We need to set the environment file here instead of trying to detect it automatically because
      # MacOS arm64 is cross-compiled from x86-64. Specifically, an arm64 conda environment
      # is needed when building PyTorch MacOS arm64 from x86-64.
      environment-file: .github/requirements/conda-env-macOS-ARM64
      test-matrix: |
        { include: [
          { config: "default", shard: 1, num_shards: 3, runner: "macos-m1-stable" },
          { config: "default", shard: 2, num_shards: 3, runner: "macos-m1-stable" },
          { config: "default", shard: 3, num_shards: 3, runner: "macos-m1-stable" },
        ]}
  macos-12-py3-arm64-mps-test:
    name: macos-12-py3-arm64-mps
    uses: ./.github/workflows/_mac-test-mps.yml
    needs: macos-12-py3-arm64-build
    if: needs.macos-12-py3-arm64-build.outputs.build-outcome == 'success'
    with:
      sync-tag: macos-12-py3-arm64-mps-test
      build-environment: macos-12-py3-arm64
      # Same as the build job
      python-version: 3.9.12
      test-matrix: |
        { include: [
          { config: "mps", shard: 1, num_shards: 1, runner: "macos-m1-stable" },
        ]}
  macos-12-py3-arm64-test:
    name: macos-12-py3-arm64
    uses: ./.github/workflows/_mac-test.yml
    needs:
      - macos-12-py3-arm64-build
      - target-determination
    with:
      build-environment: macos-12-py3-arm64
      # Same as the build job
      python-version: 3.9.12
      test-matrix: ${{ needs.macos-12-py3-arm64-build.outputs.test-matrix }}
      arch: arm64
  win-vs2019-cpu-py3-build:
    name: win-vs2019-cpu-py3
    uses: ./.github/workflows/_win-build.yml
    with:
      build-environment: win-vs2019-cpu-py3
      cuda-version: cpu
      sync-tag: win-cpu-build
      test-matrix: |
        { include: [
          { config: "default", shard: 1, num_shards: 3, runner: "windows.4xlarge.nonephemeral" },
          { config: "default", shard: 2, num_shards: 3, runner: "windows.4xlarge.nonephemeral" },
          { config: "default", shard: 3, num_shards: 3, runner: "windows.4xlarge.nonephemeral" },
        ]}
  win-vs2019-cpu-py3-test:
    name: win-vs2019-cpu-py3
    uses: ./.github/workflows/_win-test.yml
    needs:
      - win-vs2019-cpu-py3-build
      - target-determination
    with:
      build-environment: win-vs2019-cpu-py3
      cuda-version: cpu
      test-matrix: ${{ needs.win-vs2019-cpu-py3-build.outputs.test-matrix }}
  win-vs2019-cuda11_8-py3-build:
    name: win-vs2019-cuda11.8-py3
    uses: ./.github/workflows/_win-build.yml
    with:
      build-environment: win-vs2019-cuda11.8-py3
      cuda-version: "11.8"
      sync-tag: win-cuda-build
      test-matrix: |
        { include: [
          { config: "default", shard: 1, num_shards: 6, runner: "windows.g5.4xlarge.nvidia.gpu" },
          { config: "default", shard: 2, num_shards: 6, runner: "windows.g5.4xlarge.nvidia.gpu" },
          { config: "default", shard: 3, num_shards: 6, runner: "windows.g5.4xlarge.nvidia.gpu" },
          { config: "default", shard: 4, num_shards: 6, runner: "windows.g5.4xlarge.nvidia.gpu" },
          { config: "default", shard: 5, num_shards: 6, runner: "windows.g5.4xlarge.nvidia.gpu" },
          { config: "default", shard: 6, num_shards: 6, runner: "windows.g5.4xlarge.nvidia.gpu" },
          { config: "force_on_cpu", shard: 1, num_shards: 1, runner: "windows.4xlarge.nonephemeral" },
        ]}
  linux-focal-rocm6_0-py3_8-build:
    name: linux-focal-rocm6.0-py3.8
    uses: ./.github/workflows/_linux-build-label.yml
    with:
      build-environment: linux-focal-rocm6.0-py3.8
      docker-image-name: pytorch-linux-focal-rocm-n-py3
      sync-tag: rocm-build
      test-matrix: |
        { include: [
          { config: "default", shard: 1, num_shards: 1, runner: "linux.rocm.gpu" },
        ]}
  linux-focal-rocm6_0-py3_8-test:
    permissions:
      id-token: write
      contents: read
    name: linux-focal-rocm6.0-py3.8
    uses: ./.github/workflows/_rocm-test.yml
    needs:
      - linux-focal-rocm6_0-py3_8-build
      - target-determination
    with:
      build-environment: linux-focal-rocm6.0-py3.8
      docker-image: ${{ needs.linux-focal-rocm6_0-py3_8-build.outputs.docker-image }}
      test-matrix: ${{ needs.linux-focal-rocm6_0-py3_8-build.outputs.test-matrix }}
      tests-to-include: "test_nn test_torch test_cuda test_ops test_unary_ufuncs test_binary_ufuncs test_autograd inductor/test_torchinductor"