-
Notifications
You must be signed in to change notification settings - Fork 1.1k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Attempt to remove AWS S3 flaky cache for sccache (#2953)
* backend(trtllm): attempt to remove AWS S3 flaky cache for sccache
* backend(trtllm): what if we expose ENV instead of inline?
* backend(trtllm): and with the right env var for gha sccache
* backend(trtllm): relax the way to detect sccache
* backend(trtllm): make sccache definition manually
* backend(trtllm): ok let's try to define the launchers in build.rs when rustc_wrapper is present
* backend(trtllm): export env variable in run mb?
* backend(trtllm): Cache mode max to cache intermediate layers
* backend(trtllm): inject ompi_version build arg in dependent step
- Loading branch information
1 parent
6cb41a8
commit 40b0027
Showing
4 changed files
with
51 additions
and
80 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -6,11 +6,11 @@ on: | |
hardware: | ||
type: string | ||
description: Hardware | ||
# options: | ||
# - cuda | ||
# - cuda-trtllm | ||
# - rocm | ||
# - intel | ||
# options: | ||
# - cuda | ||
# - cuda-trtllm | ||
# - rocm | ||
# - intel | ||
required: true | ||
release-tests: | ||
description: "Run release integration tests" | ||
|
@@ -41,19 +41,18 @@ jobs: | |
uses: actions/checkout@v4 | ||
- name: Inject slug/short variables | ||
uses: rlespinasse/[email protected] | ||
- name: Inject required variables for sccache to interact with Github Actions Cache | ||
uses: actions/github-script@v7 | ||
with: | ||
script: | | ||
core.exportVariable('ACTIONS_CACHE_URL', process.env.ACTIONS_CACHE_URL || ''); | ||
core.exportVariable('ACTIONS_RUNTIME_TOKEN', process.env.ACTIONS_RUNTIME_TOKEN || ''); | ||
- name: Extract TensorRT-LLM version | ||
run: | | ||
echo "TENSORRT_LLM_VERSION=$(grep -oP '([a-z,0-9]{40})' $GITHUB_WORKSPACE/backends/trtllm/cmake/trtllm.cmake)" >> $GITHUB_ENV | ||
echo "TensorRT-LLM version: ${{ env.TENSORRT_LLM_VERSION }}" | ||
- name: "Configure AWS Credentials" | ||
id: aws-creds | ||
uses: aws-actions/configure-aws-credentials@v4 | ||
with: | ||
aws-region: us-east-1 | ||
role-to-assume: ${{ secrets.AWS_ROLE_GITHUB_TGI_TEST }} | ||
role-duration-seconds: 7200 | ||
output-credentials: true | ||
- name: Construct harware variables | ||
- name: Construct hardware variables | ||
shell: bash | ||
run: | | ||
case ${{ inputs.hardware }} in | ||
|
@@ -75,9 +74,6 @@ jobs: | |
export runs_on="ubuntu-latest" | ||
export platform="" | ||
export extra_pytest="" | ||
export target="ci-runtime" | ||
export sccache_s3_key_prefix="trtllm" | ||
export sccache_region="us-east-1" | ||
export build_type="dev" | ||
;; | ||
rocm) | ||
|
@@ -128,8 +124,6 @@ jobs: | |
echo "EXTRA_PYTEST=${extra_pytest}" >> $GITHUB_ENV | ||
echo REGISTRY_MIRROR=$REGISTRY_MIRROR >> $GITHUB_ENV | ||
echo "TARGET=${target}" >> $GITHUB_ENV | ||
echo "SCCACHE_S3_KEY_PREFIX=${sccache_s3_key_prefix}" >> $GITHUB_ENV | ||
echo "SCCACHE_REGION=${sccache_region}" >> $GITHUB_ENV | ||
echo "BUILD_TYPE=${build_type}" >> $GITHUB_ENV | ||
- name: Initialize Docker Buildx | ||
uses: docker/setup-buildx-action@v3 | ||
|
@@ -196,17 +190,14 @@ jobs: | |
DOCKER_LABEL=sha-${{ env.GITHUB_SHA_SHORT }}${{ env.LABEL }} | ||
PLATFORM=${{ env.PLATFORM }} | ||
build_type=${{ env.BUILD_TYPE }} | ||
is_gha_build=true | ||
aws_access_key_id=${{ steps.aws-creds.outputs.aws-access-key-id }} | ||
aws_secret_access_key=${{ steps.aws-creds.outputs.aws-secret-access-key }} | ||
aws_session_token=${{ steps.aws-creds.outputs.aws-session-token }} | ||
sccache_bucket=${{ secrets.AWS_S3_BUCKET_GITHUB_TGI_TEST }} | ||
sccache_s3_key_prefix=${{ env.SCCACHE_S3_KEY_PREFIX }} | ||
sccache_region=${{ env.SCCACHE_REGION }} | ||
sccache_gha_enabled=on | ||
actions_cache_url=${{ env.ACTIONS_CACHE_URL }} | ||
actions_runtime_token=${{ env.ACTIONS_RUNTIME_TOKEN }} | ||
tags: ${{ steps.meta.outputs.tags || steps.meta-pr.outputs.tags }} | ||
labels: ${{ steps.meta.outputs.labels || steps.meta-pr.outputs.labels }} | ||
cache-from: type=s3,region=us-east-1,bucket=ci-docker-buildx-cache,name=text-generation-inference-cache${{ env.LABEL }},mode=min,access_key_id=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_ACCESS_KEY_ID }},secret_access_key=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_SECRET_ACCESS_KEY }},mode=min | ||
cache-to: type=s3,region=us-east-1,bucket=ci-docker-buildx-cache,name=text-generation-inference-cache${{ env.LABEL }},mode=min,access_key_id=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_ACCESS_KEY_ID }},secret_access_key=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_SECRET_ACCESS_KEY }},mode=min | ||
cache-from: type=s3,region=us-east-1,bucket=ci-docker-buildx-cache,name=text-generation-inference-cache${{ env.LABEL }},mode=min,access_key_id=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_ACCESS_KEY_ID }},secret_access_key=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_SECRET_ACCESS_KEY }},mode=max | ||
cache-to: type=s3,region=us-east-1,bucket=ci-docker-buildx-cache,name=text-generation-inference-cache${{ env.LABEL }},mode=min,access_key_id=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_ACCESS_KEY_ID }},secret_access_key=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_SECRET_ACCESS_KEY }},mode=max | ||
- name: Final | ||
id: final | ||
run: | | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters