Skip to content

Build: Trigger CI for new vllm_backend Triton releases #49

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Draft
wants to merge 111 commits into
base: main
Choose a base branch
from
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
111 commits
Select commit Hold shift + click to select a range
4f59ff5
Create build.sh
nvda-mesharma Jul 23, 2024
5f40521
Rename build.sh to build_source.sh
nvda-mesharma Jul 23, 2024
b19dbb7
Create build_docker.sh
nvda-mesharma Jul 23, 2024
65f979c
Create vllm_version.txt
nvda-mesharma Jul 23, 2024
a12519f
Create triton_version.txt
nvda-mesharma Jul 23, 2024
59b549f
Update build_docker.sh
nvda-mesharma Jul 23, 2024
8ca761d
Update build_source.sh
nvda-mesharma Jul 23, 2024
718c244
Delete ci/build/triton_version.txt
nvda-mesharma Jul 23, 2024
6c1ad63
Delete ci/build/vllm_version.txt
nvda-mesharma Jul 23, 2024
5a251ae
Update build_source.sh
nvda-mesharma Jul 23, 2024
73655f8
Update build_source.sh
nvda-mesharma Jul 23, 2024
450f73b
Update build_docker.sh
nvda-mesharma Jul 23, 2024
915346e
Create trigger_ci.yml
nvda-mesharma Jul 23, 2024
00d10f9
Update trigger_ci.yml
nvda-mesharma Jul 23, 2024
0ff3e8b
Update trigger_ci.yml
nvda-mesharma Jul 23, 2024
1ea7b00
Update build_source.sh
nvda-mesharma Jul 23, 2024
580bbf0
Create verify_latest_vllm.ci
nvda-mesharma Jul 24, 2024
2085c70
Update trigger_ci.yml
nvda-mesharma Jul 24, 2024
6d79abc
Update verify_latest_vllm.ci
nvda-mesharma Jul 24, 2024
3418d12
Update build_source.sh
nvda-mesharma Jul 24, 2024
380fb94
Update build_source.sh
nvda-mesharma Jul 24, 2024
9a1725b
Update build_source.sh
nvda-mesharma Jul 24, 2024
8e182af
Update build_source.sh
nvda-mesharma Jul 24, 2024
93a10a5
Update build_source.sh
nvda-mesharma Jul 24, 2024
50cc924
Update build_source.sh
nvda-mesharma Jul 24, 2024
c800ef4
Update build_source.sh
nvda-mesharma Jul 24, 2024
9dca430
Update build_source.sh
nvda-mesharma Jul 24, 2024
fa1846a
Update build_source.sh
nvda-mesharma Jul 24, 2024
1fd0e56
Update build_source.sh
nvda-mesharma Jul 24, 2024
8209da1
Update build_source.sh
nvda-mesharma Jul 24, 2024
7f6157c
Update build_source.sh
nvda-mesharma Jul 24, 2024
a5e9fc4
Update build_source.sh
nvda-mesharma Jul 24, 2024
0301c04
Update build_source.sh
nvda-mesharma Jul 24, 2024
b6f351e
Update build_source.sh
nvda-mesharma Jul 24, 2024
ba5dba3
Update build_source.sh
nvda-mesharma Jul 24, 2024
bfe7131
Update build_source.sh
nvda-mesharma Jul 24, 2024
d6606d3
Update build_source.sh
nvda-mesharma Jul 24, 2024
223a10b
Update build_source.sh
nvda-mesharma Jul 25, 2024
23865a6
Update build_source.sh
nvda-mesharma Jul 25, 2024
b1c58b3
Update build_source.sh
nvda-mesharma Jul 25, 2024
72ee876
Update build_source.sh
nvda-mesharma Jul 25, 2024
18c6ab6
Update trigger_ci.yml
nvda-mesharma Jul 27, 2024
d4b30c0
Delete .github/workflows/verify_latest_vllm.ci
nvda-mesharma Jul 27, 2024
a2b3058
Update build_source.sh
nvda-mesharma Jul 27, 2024
dd7ccf9
Update build_source.sh
nvda-mesharma Jul 27, 2024
cfa8c48
Delete .github/workflows/pre-commit.yaml
nvda-mesharma Jul 27, 2024
8bdc8e0
Update trigger_ci.yml
nvda-mesharma Jul 27, 2024
07912f2
Create contributor.yml
nvda-mesharma Jul 29, 2024
9268c2f
Update trigger_ci.yml
nvda-mesharma Jul 29, 2024
98f4a3f
Create verified.yml
nvda-mesharma Jul 30, 2024
e0c4ad4
Update verified.yml
nvda-mesharma Jul 30, 2024
013e389
Update verified.yml
nvda-mesharma Jul 30, 2024
20f3d39
Update contributor.yml
nvda-mesharma Jul 31, 2024
2d5098a
Delete .github/workflows/verified.yml
nvda-mesharma Jul 31, 2024
84e14dd
Update trigger_ci.yml
nvda-mesharma Jul 31, 2024
fb20236
Create pre-commit.yaml
nvda-mesharma Aug 5, 2024
29e73ba
fix pre-commit issues
nvda-mesharma Aug 5, 2024
a2e7db3
Update build_source.sh
nvda-mesharma Aug 5, 2024
bfb9466
Update build_source.sh
nvda-mesharma Aug 5, 2024
f348d49
Update README.md
nvda-mesharma Aug 5, 2024
85c53aa
Update build_source.sh
nvda-mesharma Aug 5, 2024
25a71f7
Update README.md
nvda-mesharma Aug 5, 2024
deb13ce
Update trigger_ci.yml
nvda-mesharma Aug 5, 2024
d888f12
Update trigger_ci.yml
nvda-mesharma Aug 5, 2024
7a08c86
Update build_source.sh
nvda-mesharma Aug 5, 2024
e76e209
Update build_source.sh
nvda-mesharma Aug 5, 2024
1b3dbc0
Update build_source.sh
nvda-mesharma Aug 5, 2024
1a93230
Update build_source.sh
nvda-mesharma Aug 6, 2024
1efadc7
Update trigger_ci.yml
nvda-mesharma Aug 6, 2024
3d0110a
Update build_source.sh
nvda-mesharma Aug 6, 2024
f29d9d0
Update build_source.sh
nvda-mesharma Aug 6, 2024
dec1329
Update build_source.sh
nvda-mesharma Aug 6, 2024
52aaded
Update build_source.sh
nvda-mesharma Aug 6, 2024
62fc87c
Update build_source.sh
nvda-mesharma Aug 6, 2024
6605983
Update trigger_ci.yml
nvda-mesharma Aug 6, 2024
98fbc29
Update trigger_ci.yml
nvda-mesharma Aug 6, 2024
f484188
Update trigger_ci.yml
nvda-mesharma Aug 6, 2024
91dc27a
Update trigger_ci.yml
nvda-mesharma Aug 30, 2024
9bf9c12
Update trigger_ci.yml
nvda-mesharma Aug 30, 2024
805ae1e
Update README.md
nvda-mesharma Aug 30, 2024
7ccea9c
Update README.md
nvda-mesharma Aug 30, 2024
d347b1d
Update README.md
nvda-mesharma Aug 30, 2024
fff8f14
Update build_docker.sh
nvda-mesharma Sep 4, 2024
156724a
Update build_docker.sh
nvda-mesharma Sep 4, 2024
4604761
Update build_docker.sh
nvda-mesharma Sep 4, 2024
232787f
Create vllm_release_ci.yml
nvda-mesharma Sep 5, 2024
656c8f5
Rename trigger_ci.yml to triton_update_ci.yml
nvda-mesharma Sep 5, 2024
47b9a91
Update triton_update_ci.yml
nvda-mesharma Sep 5, 2024
047b885
Rename vllm_release_ci.yml to vllm_update_ci.yml
nvda-mesharma Sep 5, 2024
fb7977f
Update vllm_update_ci.yml
nvda-mesharma Sep 5, 2024
2050086
Update vllm_update_ci.yml
nvda-mesharma Sep 5, 2024
9492364
Update triton_update_ci.yml
nvda-mesharma Sep 5, 2024
ce76a76
Update vllm_update_ci.yml
nvda-mesharma Sep 5, 2024
2fafdda
Update vllm_update_ci.yml
nvda-mesharma Sep 5, 2024
5792663
Update README.md
nvda-mesharma Sep 6, 2024
f3258ef
Update README.md
nvda-mesharma Sep 6, 2024
f2c7a89
Update README.md
nvda-mesharma Sep 20, 2024
e45854c
Update README.md
nvda-mesharma Sep 20, 2024
5929f7a
Update README.md
nvda-mesharma Sep 20, 2024
2512b8a
Update triton_update_ci.yml
nvda-mesharma Sep 20, 2024
7c97d9f
Update vllm_update_ci.yml
nvda-mesharma Sep 23, 2024
552db92
Merge branch 'main' into mesharma-ci
nvda-mesharma Sep 30, 2024
65fe72c
Update build_source.sh
nvda-mesharma Nov 21, 2024
3ada940
Update triton_update_ci.yml
nvda-mesharma Nov 21, 2024
760f884
Update build_source.sh
nvda-mesharma Nov 21, 2024
61ba078
Update triton_update_ci.yml
nvda-mesharma Nov 21, 2024
0100f94
Update triton_update_ci.yml
nvda-mesharma Nov 21, 2024
5768b34
Update README.md
nvda-mesharma Nov 21, 2024
ea2120c
Update triton_update_ci.yml
nvda-mesharma Nov 21, 2024
adec735
Update README.md
nvda-mesharma Nov 21, 2024
834e76e
Update README.md
nvda-mesharma Nov 21, 2024
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
21 changes: 21 additions & 0 deletions .github/workflows/contributor.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,21 @@
# Workflow that posts a single reminder comment on a pull request when it is opened.
name: Welcome message
on:
pull_request_target:
# Only the "opened" activity type triggers this workflow.
types: [opened]

jobs:
pr_reminder:
runs-on: ubuntu-latest
steps:
- name: Add first comment
uses: actions/github-script@v6
with:
# The script calls the issues REST endpoint to create a comment on the
# issue/PR number taken from the triggering event context.
script: |
github.rest.issues.createComment({
owner: context.repo.owner,
repo: context.repo.repo,
issue_number: context.issue.number,
body: '👋 Hi! \nThank you for contributing to the project.\n Just a reminder: PRs will trigger full CI run by default. We will add verified labels on the PR once build and tests steps are successful.\n🚀'
})
env:
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
1 change: 0 additions & 1 deletion .github/workflows/pre-commit.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -36,4 +36,3 @@ jobs:
- uses: actions/checkout@v3
- uses: actions/setup-python@v3
- uses: pre-commit/[email protected]

45 changes: 45 additions & 0 deletions .github/workflows/triton_update_ci.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,45 @@
# Workflow run on every pull request: first asks the mirror endpoint to sync,
# then resolves the Triton and vLLM versions and triggers the downstream
# pipeline with BUILD_OPTION=BUILD_SOURCE and TEST_OPTION=ALL_TESTS.
name: Validate Triton Pull request by running our change on the latest version of vLLM
on:
pull_request:
jobs:
mirror_repo:
environment: GITLAB
runs-on: self-hosted
steps:
- name: Sync Mirror Repository
run: |
#!/bin/bash
curl --request POST --header "PRIVATE-TOKEN:${{ secrets.TOKEN }}" "${{ secrets.MIRROR_URL }}"
trigger-ci:
environment: GITLAB
# Runs only after the mirror sync job has finished.
needs: mirror_repo
runs-on: self-hosted
steps:
- name: Trigger Pipeline
run: |
#!/bin/bash
# Get the latest Triton vLLM backend release tag from https://github.com/triton-inference-server/vllm_backend/releases
TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}')
# Strip a leading "v" from the tag to obtain the bare version number.
export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.10
# Fall back to the pinned default 24.10 when the lookup produced an empty value.
if [ -z "$TRITON_CONTAINER_VERSION" ]
then
echo "\$TRITON_CONTAINER_VERSION is NULL, setting it to 24.10"
TRITON_CONTAINER_VERSION=24.10
else
echo "\$TRITON_CONTAINER_VERSION is NOT NULL"
fi
echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}"

# Get the latest vLLM release tag from https://github.com/vllm-project/vllm/releases
TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}')
export VLLM_VERSION=${TAG#v} # example: 0.5.5
# Fall back to the pinned default 0.5.5 when the lookup produced an empty value.
if [ -z "$VLLM_VERSION" ]
then
echo "\$VLLM_VERSION is NULL, setting it to 0.5.5"
VLLM_VERSION=0.5.5
else
echo "\$VLLM_VERSION is NOT NULL"
fi
echo "VLLM_VERSION = ${VLLM_VERSION}"

# Trigger the downstream pipeline on the PR head branch, passing the resolved versions as pipeline variables.
curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD_SOURCE" -F variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[VLLM_VERSION]="${VLLM_VERSION}" -F variables[TEST_OPTION]="ALL_TESTS" "${{ secrets.PIPELINE_URL }}"
36 changes: 36 additions & 0 deletions .github/workflows/vllm_update_ci.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,36 @@
# Scheduled workflow: syncs the mirror, resolves the latest released Triton
# vLLM backend and vLLM versions, and triggers the downstream pipeline with
# BUILD_OPTION=PULL_DOCKER. The trigger is skipped when either version
# cannot be resolved.
name: Validate latest vLLM release from https://github.com/vllm-project/vllm/releases against latest Triton release https://github.com/triton-inference-server/vllm_backend/releases
on:
  schedule:
    - cron: "30 09 */3 * *"
jobs:
  mirror_repo:
    environment: GITLAB
    runs-on: self-hosted
    steps:
      - name: Sync Mirror Repository
        run: |
          #!/bin/bash
          curl --request POST --header "PRIVATE-TOKEN:${{ secrets.TOKEN }}" "${{ secrets.MIRROR_URL }}"
  trigger-ci:
    environment: GITLAB
    # Runs only after the mirror sync job has finished.
    needs: mirror_repo
    runs-on: self-hosted
    steps:
      - name: Trigger Pipeline
        run: |
          #!/bin/bash
          # Get the latest Triton vLLM backend release tag from https://github.com/triton-inference-server/vllm_backend/releases
          TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}')
          # Strip a leading "v" from the tag to obtain the bare version number.
          export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.08
          # Get the latest vLLM release tag from https://github.com/vllm-project/vllm/releases
          TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}')
          export VLLM_VERSION=${TAG#v} # example: 0.5.5
          echo "VLLM_VERSION = ${VLLM_VERSION}"
          # Two separate tests joined by the shell's ||: `||` is not an operator
          # inside `[ ]`, and `]` must be its own word.
          if [ -z "$TRITON_CONTAINER_VERSION" ] || [ -z "$VLLM_VERSION" ]
          then
            echo "Can't find latest Triton or vllm version.. Skipping CI run"
          else
            echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}"
            echo "VLLM_VERSION = ${VLLM_VERSION}"
            # GITHUB_HEAD_REF is only set for pull-request events; on a scheduled
            # run fall back to the branch the workflow is running on.
            # NOTE(review): variables[TEST_OPTION] is sent twice (ALL_HARDWARE, then
            # ALL_TESTS); both are kept as in the original - confirm which one is intended.
            curl --fail --request POST --form "token=${{ secrets.PIPELINE_TOKEN }}" -F "ref=${GITHUB_HEAD_REF:-${GITHUB_REF_NAME}}" -F "variables[BUILD_OPTION]=PULL_DOCKER" -F "variables[TRITON_CONTAINER_VERSION]=${TRITON_CONTAINER_VERSION}" -F "variables[TEST_OPTION]=ALL_HARDWARE" -F "variables[VLLM_VERSION]=${VLLM_VERSION}" -F "variables[TEST_OPTION]=ALL_TESTS" "${{ secrets.PIPELINE_URL }}"
          fi
21 changes: 20 additions & 1 deletion README.md
Original file line number Diff line number Diff line change
Expand Up @@ -27,6 +27,9 @@
-->

[![License](https://img.shields.io/badge/License-BSD3-lightgrey.svg)](https://opensource.org/licenses/BSD-3-Clause)
![Static Badge](https://img.shields.io/badge/Triton-24.10-8A2BE2)
![Static Badge](https://img.shields.io/badge/vLLM-0.5.5-blue)
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

could you please clarify why the version 0.5.5 was picked?

Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

We have a passing pipeline with this version. Hence, I picked this as the default until a new version is tested and verified.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I think we should have the latest version we support, or wait until we have tests, that indicate that we can migrate to the latest. Since we don't support 0.5.5 and vLLM's latest version now is 0.6.1.post2, I can see a confusion, that will arise in users with this badge

Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

done

![Static Badge](https://img.shields.io/badge/CI_Passing-V100%2CA100%2CH100-Green)
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

could you please clarify how these static badges work?

Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Ideally this should be automated. But, it is a manual process at the moment. Once the cron task is finished and the pipeline is green, I'd have to issue a PR to update the badges here.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Do we want to hold on adding badges, until we have an automated workflow in place?


# vLLM Backend

Expand Down Expand Up @@ -82,7 +85,18 @@ latest YY.MM (year.month) of [Triton release](https://github.com/triton-inferenc

```
# YY.MM is the version of Triton.
export TRITON_CONTAINER_VERSION=<YY.MM>
# Get the latest Triton vLLM backend release version from https://github.com/triton-inference-server/vllm_backend/releases
TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}')
export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06
echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}"

# Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases
TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}')
export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1
echo "VLLM_VERSION = ${VLLM_VERSION}"

git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git
cd server
./build.py -v --enable-logging
--enable-stats
--enable-tracing
Expand All @@ -101,6 +115,11 @@ export TRITON_CONTAINER_VERSION=<YY.MM>
--backend=python:r${TRITON_CONTAINER_VERSION}
--backend=vllm:r${TRITON_CONTAINER_VERSION}
--backend=ensemble
--vllm-version=${VLLM_VERSION}
# Build Triton Server
cd build
bash -x ./docker_build

```

### Option 3. Add the vLLM Backend to the Default Triton Container
Expand Down
36 changes: 36 additions & 0 deletions ci/build/build_docker.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,36 @@
#!/bin/bash
# Copyright 2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
# * Redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer.
# * Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in the
# documentation and/or other materials provided with the distribution.
# * Neither the name of NVIDIA CORPORATION nor the names of its
# contributors may be used to endorse or promote products derived
# from this software without specific prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY
# EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
# PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
# CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
# EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
# PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
# OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

# Pull a prebuilt container image.
#
# Usage: build_docker.sh -t <container-image>
#   -t  Image reference to pull. When the flag is omitted, a PROD_CONTAINER
#       value already present in the environment is used instead.
# Exits with status 2 on an unknown option or when no image is available.
while getopts t: flag
do
    case "${flag}" in
        # The arm must match the letter declared in the optstring above;
        # otherwise the argument is parsed but never stored.
        t) PROD_CONTAINER=${OPTARG};;
        *) echo "Usage: $0 -t <container-image>" >&2; exit 2;;
    esac
done

if [ -z "${PROD_CONTAINER:-}" ]; then
    echo "No container image given; pass -t <container-image>" >&2
    exit 2
fi

echo "Pulling container image ${PROD_CONTAINER}"
docker pull "${PROD_CONTAINER}"
63 changes: 63 additions & 0 deletions ci/build/build_source.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,63 @@
#!/bin/bash
# Copyright 2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
# * Redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer.
# * Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in the
# documentation and/or other materials provided with the distribution.
# * Neither the name of NVIDIA CORPORATION nor the names of its
# contributors may be used to endorse or promote products derived
# from this software without specific prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY
# EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
# PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
# CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
# EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
# PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
# OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

# Build Triton Inference Server from source with the Python and vLLM backends.
#
# Usage: build_source.sh -t <triton-version> -v <vllm-version>
#   -t  Triton container version; used for --upstream-container-version and
#       to select the r<version> branches of the python and vllm backends.
#   -v  vLLM version handed to build.py through --vllm-version.
# When a flag is omitted, a value already present in the environment
# (TRITON_CONTAINER_VERSION / VLLM_VERSION) is used instead.
# CI_JOB_TOKEN and CI_REGISTRY are read from the environment for the
# registry login that build.py runs as a container prebuild command.
# Exits with status 2 on bad usage and non-zero when a build step fails.
while getopts t:v: flag
do
    case "${flag}" in
        # The arms must match the letters declared in the optstring above;
        # otherwise the arguments are parsed but never stored.
        t) TRITON_CONTAINER_VERSION=${OPTARG};;
        v) VLLM_VERSION=${OPTARG};;
        *) echo "Usage: $0 -t <triton-version> -v <vllm-version>" >&2; exit 2;;
    esac
done

if [ -z "${TRITON_CONTAINER_VERSION:-}" ] || [ -z "${VLLM_VERSION:-}" ]; then
    echo "Both a Triton version (-t) and a vLLM version (-v) are required" >&2
    exit 2
fi

echo "Triton version is ${TRITON_CONTAINER_VERSION} and vllm version is ${VLLM_VERSION}"
# This change will start working for r24.12 release
#git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git
git clone https://github.com/triton-inference-server/server.git
# Trace the remaining commands; stop if build.py fails so that docker_build
# is not run against a missing or stale build directory.
set -x
python3 server/build.py -v \
    --enable-logging \
    --enable-stats \
    --enable-tracing \
    --enable-metrics \
    --enable-gpu-metrics \
    --enable-cpu-metrics \
    --enable-gpu \
    --no-container-interactive \
    --container-prebuild-command="docker login -u gitlab-ci-token -p ${CI_JOB_TOKEN} ${CI_REGISTRY}" \
    --filesystem=gcs \
    --filesystem=s3 \
    --filesystem=azure_storage \
    --endpoint=http \
    --endpoint=grpc \
    --endpoint=sagemaker \
    --endpoint=vertex-ai \
    "--upstream-container-version=${TRITON_CONTAINER_VERSION}" \
    "--backend=python:r${TRITON_CONTAINER_VERSION}" \
    "--backend=vllm:r${TRITON_CONTAINER_VERSION}" \
    "--vllm-version=${VLLM_VERSION}" 2>&1 || exit $?
# Build Triton Server
cd server/build || exit 1
bash -x ./docker_build
Loading