diff --git a/.github/workflows/pull.yml b/.github/workflows/pull.yml
index 8b32e46cf21..d1b64e75981 100644
--- a/.github/workflows/pull.yml
+++ b/.github/workflows/pull.yml
@@ -395,25 +395,6 @@ jobs:
         # Test llama2
         PYTHON_EXECUTABLE=python bash .ci/scripts/test_llama.sh -model stories110M -build_tool "${BUILD_TOOL}" -mode "${MODE}" -dtype "${DTYPE}" -pt2e_quantize "${PT2E_QUANTIZE}"
 
-  test-qnn-models-linux:
-    name: test-qnn-models-linux
-    uses: pytorch/test-infra/.github/workflows/linux_job.yml@main
-    strategy:
-      fail-fast: false
-    with:
-      runner: linux.2xlarge
-      docker-image: executorch-ubuntu-22.04-qnn-sdk
-      submodules: 'true'
-      ref: ${{ github.event_name == 'pull_request' && github.event.pull_request.head.sha || github.sha }}
-      timeout: 180
-      script: |
-        # The generic Linux job chooses to use base env, not the one setup by the image
-        CONDA_ENV=$(conda env list --json | jq -r ".envs | .[-1]")
-        conda activate "${CONDA_ENV}"
-
-        # placeholder for running test_qnn_delegate.py, can use matrix such that we can trigger different jobs, refers to test-llama-runner-qnn-linux
-        # reminder: make sure each job runs fast
-
   test-phi-3-mini-runner-linux:
     name: test-phi-3-mini-runner-linux
     uses: pytorch/test-infra/.github/workflows/linux_job.yml@main