From 4f59ff5d31a2347b8d2cf039fcaeefe4d7cad781 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 11:07:13 -0700 Subject: [PATCH 001/110] Create build.sh --- ci/build/build.sh | 1 + 1 file changed, 1 insertion(+) create mode 100644 ci/build/build.sh diff --git a/ci/build/build.sh b/ci/build/build.sh new file mode 100644 index 00000000..a0990367 --- /dev/null +++ b/ci/build/build.sh @@ -0,0 +1 @@ +TBD From 5f40521d86c3eda6ccbbaa57b0dee1cf7eb0a4ce Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 11:31:16 -0700 Subject: [PATCH 002/110] Rename build.sh to build_source.sh --- ci/build/{build.sh => build_source.sh} | 0 1 file changed, 0 insertions(+), 0 deletions(-) rename ci/build/{build.sh => build_source.sh} (100%) diff --git a/ci/build/build.sh b/ci/build/build_source.sh similarity index 100% rename from ci/build/build.sh rename to ci/build/build_source.sh From b19dbb7dfbe8dc88ad8c94c2d3584277ea22c380 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 11:31:49 -0700 Subject: [PATCH 003/110] Create build_docker.sh --- ci/build/build_docker.sh | 1 + 1 file changed, 1 insertion(+) create mode 100644 ci/build/build_docker.sh diff --git a/ci/build/build_docker.sh b/ci/build/build_docker.sh new file mode 100644 index 00000000..8b137891 --- /dev/null +++ b/ci/build/build_docker.sh @@ -0,0 +1 @@ + From 65f979ca89beb9fa8e989972e82347f0f3bffbeb Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 11:32:23 -0700 Subject: [PATCH 004/110] Create vllm_version.txt --- ci/build/vllm_version.txt | 1 + 1 file changed, 1 insertion(+) create mode 100644 ci/build/vllm_version.txt diff --git a/ci/build/vllm_version.txt b/ci/build/vllm_version.txt new file mode 100644 index 00000000..8b137891 --- /dev/null +++ 
b/ci/build/vllm_version.txt @@ -0,0 +1 @@ + From a12519f752b0644fec8a47468c0ff81ec0ed70ed Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 11:32:47 -0700 Subject: [PATCH 005/110] Create triton_version.txt --- ci/build/triton_version.txt | 1 + 1 file changed, 1 insertion(+) create mode 100644 ci/build/triton_version.txt diff --git a/ci/build/triton_version.txt b/ci/build/triton_version.txt new file mode 100644 index 00000000..8b137891 --- /dev/null +++ b/ci/build/triton_version.txt @@ -0,0 +1 @@ + From 59b549ffcace0d1170edd29a08645a1c2afb5fdc Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 11:34:24 -0700 Subject: [PATCH 006/110] Update build_docker.sh --- ci/build/build_docker.sh | 28 ++++++++++++++++++++++++++++ 1 file changed, 28 insertions(+) diff --git a/ci/build/build_docker.sh b/ci/build/build_docker.sh index 8b137891..696b8f76 100644 --- a/ci/build/build_docker.sh +++ b/ci/build/build_docker.sh @@ -1 +1,29 @@ +#!/bin/bash +# Copyright 2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved. +# +# Redistribution and use in source and binary forms, with or without +# modification, are permitted provided that the following conditions +# are met: +# * Redistributions of source code must retain the above copyright +# notice, this list of conditions and the following disclaimer. +# * Redistributions in binary form must reproduce the above copyright +# notice, this list of conditions and the following disclaimer in the +# documentation and/or other materials provided with the distribution. +# * Neither the name of NVIDIA CORPORATION nor the names of its +# contributors may be used to endorse or promote products derived +# from this software without specific prior written permission. 
+# +# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY +# EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR +# PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR +# CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, +# EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, +# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR +# PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY +# OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT +# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE +# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. +export TRITON_CONTAINER_VERSION= +docker pull nvcr.io/nvidia/tritonserver:${TRITON_CONTAINER_VERSION}-vllm-python-py3 From 8ca761db79e5ca51e352b19c22b7b74c693110b9 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 12:04:12 -0700 Subject: [PATCH 007/110] Update build_source.sh --- ci/build/build_source.sh | 50 +++++++++++++++++++++++++++++++++++++++- 1 file changed, 49 insertions(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index a0990367..96f2a501 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -1 +1,49 @@ -TBD +#!/bin/bash +# Copyright 2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved. +# +# Redistribution and use in source and binary forms, with or without +# modification, are permitted provided that the following conditions +# are met: +# * Redistributions of source code must retain the above copyright +# notice, this list of conditions and the following disclaimer. 
+# * Redistributions in binary form must reproduce the above copyright +# notice, this list of conditions and the following disclaimer in the +# documentation and/or other materials provided with the distribution. +# * Neither the name of NVIDIA CORPORATION nor the names of its +# contributors may be used to endorse or promote products derived +# from this software without specific prior written permission. +# +# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY +# EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR +# PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR +# CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, +# EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, +# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR +# PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY +# OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT +# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE +# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
+ +export TRITON_CONTAINER_VERSION= +export VLLM_VERSION=0.5.3 # grab this version via curl + +git clone -b mesharma-ci https://github.com/triton-inference-server/server.git +source build.py -v --enable-logging + --enable-stats + --enable-tracing + --enable-metrics + --enable-gpu-metrics + --enable-cpu-metrics + --enable-gpu + --filesystem=gcs + --filesystem=s3 + --filesystem=azure_storage + --endpoint=http + --endpoint=grpc + --endpoint=sagemaker + --endpoint=vertex-ai + --upstream-container-version=${TRITON_CONTAINER_VERSION} + --backend=python:r${TRITON_CONTAINER_VERSION} + --backend=vllm:r${TRITON_CONTAINER_VERSION} + --vllm-version=${VLLM_VERSION} From 718c244816a77ab6897c7d96c017b8ac3e8748c7 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 12:04:45 -0700 Subject: [PATCH 008/110] Delete ci/build/triton_version.txt --- ci/build/triton_version.txt | 1 - 1 file changed, 1 deletion(-) delete mode 100644 ci/build/triton_version.txt diff --git a/ci/build/triton_version.txt b/ci/build/triton_version.txt deleted file mode 100644 index 8b137891..00000000 --- a/ci/build/triton_version.txt +++ /dev/null @@ -1 +0,0 @@ - From 6c1ad63ba2da68c3a44b7847ac12de513d7f5209 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 12:04:57 -0700 Subject: [PATCH 009/110] Delete ci/build/vllm_version.txt --- ci/build/vllm_version.txt | 1 - 1 file changed, 1 deletion(-) delete mode 100644 ci/build/vllm_version.txt diff --git a/ci/build/vllm_version.txt b/ci/build/vllm_version.txt deleted file mode 100644 index 8b137891..00000000 --- a/ci/build/vllm_version.txt +++ /dev/null @@ -1 +0,0 @@ - From 5a251ae170884732ef2912fffd82a064620574e8 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 12:20:40 -0700 Subject: [PATCH 010/110] Update build_source.sh --- ci/build/build_source.sh | 5 
++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 96f2a501..92482a98 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -26,7 +26,10 @@ # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. export TRITON_CONTAINER_VERSION= -export VLLM_VERSION=0.5.3 # grab this version via curl + +# Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases +TAG=$(curl https://api.github.com/repos/triton-inference-server/server/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') +export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 git clone -b mesharma-ci https://github.com/triton-inference-server/server.git source build.py -v --enable-logging From 73655f8e4bb8839f6d41286086155905d040203f Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 12:30:12 -0700 Subject: [PATCH 011/110] Update build_source.sh --- ci/build/build_source.sh | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 92482a98..48eab963 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -25,7 +25,9 @@ # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
-export TRITON_CONTAINER_VERSION= +# Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases +TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') +export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06 # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases TAG=$(curl https://api.github.com/repos/triton-inference-server/server/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') From 450f73bcf8e4babeee63e143ca55a95230de6939 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 12:30:25 -0700 Subject: [PATCH 012/110] Update build_docker.sh --- ci/build/build_docker.sh | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/ci/build/build_docker.sh b/ci/build/build_docker.sh index 696b8f76..571d22d5 100644 --- a/ci/build/build_docker.sh +++ b/ci/build/build_docker.sh @@ -25,5 +25,8 @@ # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
-export TRITON_CONTAINER_VERSION= +# Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases +TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') +export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06 + docker pull nvcr.io/nvidia/tritonserver:${TRITON_CONTAINER_VERSION}-vllm-python-py3 From 915346ebc3773c8aff75401375d38a111a96388d Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 12:37:40 -0700 Subject: [PATCH 013/110] Create trigger_ci.yml --- .github/workflows/trigger_ci.yml | 20 ++++++++++++++++++++ 1 file changed, 20 insertions(+) create mode 100644 .github/workflows/trigger_ci.yml diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml new file mode 100644 index 00000000..cf1bfbbd --- /dev/null +++ b/.github/workflows/trigger_ci.yml @@ -0,0 +1,20 @@ +on: + pull_request: +jobs: + mirror_repo: + environment: GITLAB + runs-on: self-hosted + steps: + - name: Sync Mirror Repository + run: | + #!/bin/bash + curl --request POST --header "PRIVATE-TOKEN:${{ secrets.TOKEN }}" "${{ secrets.MIRROR_URL }}" + trigger-ci: + environment: GITLAB + needs: mirror_repo + runs-on: self-hosted + steps: + - name: Trigger Pipeline + run: | + #!/bin/bash + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} "${{ secrets.PIPELINE_URL }}" From 00d10f923a6ed3d55672c569199714e7eca1843d Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 13:49:27 -0700 Subject: [PATCH 014/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index cf1bfbbd..19ecc8c2 100644 --- a/.github/workflows/trigger_ci.yml +++ 
b/.github/workflows/trigger_ci.yml @@ -17,4 +17,4 @@ jobs: - name: Trigger Pipeline run: | #!/bin/bash - curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} "${{ secrets.PIPELINE_URL }}" + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} variables[BUILD_OPTION]="BUILD-DOCKER" "${{ secrets.PIPELINE_URL }}" From 0ff3e8b5c6d4cfa0107629bce5deb056f75301f6 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 14:06:52 -0700 Subject: [PATCH 015/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index 19ecc8c2..486b6a83 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -17,4 +17,4 @@ jobs: - name: Trigger Pipeline run: | #!/bin/bash - curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} variables[BUILD_OPTION]="BUILD-DOCKER" "${{ secrets.PIPELINE_URL }}" + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD-DOCKER" "${{ secrets.PIPELINE_URL }}" From 1ea7b00f486db257cc2ce5ae049cde06058e6750 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 15:24:45 -0700 Subject: [PATCH 016/110] Update build_source.sh From 580bbf06b57d34801fabcd18f6b28c98cecc81a1 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 18:24:21 -0700 Subject: [PATCH 017/110] Create verify_latest_vllm.ci --- .github/workflows/verify_latest_vllm.ci | 21 +++++++++++++++++++++ 1 file changed, 21 insertions(+) create mode 100644 .github/workflows/verify_latest_vllm.ci diff --git a/.github/workflows/verify_latest_vllm.ci 
b/.github/workflows/verify_latest_vllm.ci new file mode 100644 index 00000000..5538958a --- /dev/null +++ b/.github/workflows/verify_latest_vllm.ci @@ -0,0 +1,21 @@ +on: + schedule: + - cron: '0 0 * * *' +jobs: + mirror_repo: + environment: GITLAB + runs-on: self-hosted + steps: + - name: Sync Mirror Repository + run: | + #!/bin/bash + curl --request POST --header "PRIVATE-TOKEN:${{ secrets.TOKEN }}" "${{ secrets.MIRROR_URL }}" + trigger-ci: + environment: GITLAB + needs: mirror_repo + runs-on: self-hosted + steps: + - name: Trigger Pipeline + run: | + #!/bin/bash + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD-SOURCE" "${{ secrets.PIPELINE_URL }}" From 2085c70c002da4398126b99dd3264bcc64c19788 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 18:24:57 -0700 Subject: [PATCH 018/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index 486b6a83..07deb27b 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -17,4 +17,4 @@ jobs: - name: Trigger Pipeline run: | #!/bin/bash - curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD-DOCKER" "${{ secrets.PIPELINE_URL }}" + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD-SOURCE" "${{ secrets.PIPELINE_URL }}" From 6d79abc95938d3fc4cd5c4683df23a5eda86536b Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 18:26:39 -0700 Subject: [PATCH 019/110] Update verify_latest_vllm.ci --- .github/workflows/verify_latest_vllm.ci | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff 
--git a/.github/workflows/verify_latest_vllm.ci b/.github/workflows/verify_latest_vllm.ci index 5538958a..4816f86c 100644 --- a/.github/workflows/verify_latest_vllm.ci +++ b/.github/workflows/verify_latest_vllm.ci @@ -1,6 +1,6 @@ on: schedule: - - cron: '0 0 * * *' + - cron: '0 20 * * 4' jobs: mirror_repo: environment: GITLAB From 3418d121d98f9a88fea5f274ca6ca9bcc8bc2202 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 20:32:40 -0700 Subject: [PATCH 020/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 48eab963..671ee7cc 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -34,7 +34,7 @@ TAG=$(curl https://api.github.com/repos/triton-inference-server/server/releases/ export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 git clone -b mesharma-ci https://github.com/triton-inference-server/server.git -source build.py -v --enable-logging +source server/build.py -v --enable-logging --enable-stats --enable-tracing --enable-metrics From 380fb942dcbe14c8580e2084c8b5e96a30058bff Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 20:34:33 -0700 Subject: [PATCH 021/110] Update build_source.sh --- ci/build/build_source.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 671ee7cc..e02a2861 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -34,6 +34,7 @@ TAG=$(curl https://api.github.com/repos/triton-inference-server/server/releases/ export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 git clone -b mesharma-ci https://github.com/triton-inference-server/server.git +ls -l source server/build.py -v --enable-logging --enable-stats --enable-tracing From 9a1725b319c12483231814bffdf94f8d041b13c6 Mon Sep 17 00:00:00 2001 
From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 20:38:42 -0700 Subject: [PATCH 022/110] Update build_source.sh --- ci/build/build_source.sh | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index e02a2861..821cc9af 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -34,8 +34,7 @@ TAG=$(curl https://api.github.com/repos/triton-inference-server/server/releases/ export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 git clone -b mesharma-ci https://github.com/triton-inference-server/server.git -ls -l -source server/build.py -v --enable-logging +./server/build.py -v --enable-logging --enable-stats --enable-tracing --enable-metrics From 8e182af8db9a9603b0d78c833f957b00614129a9 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 20:43:26 -0700 Subject: [PATCH 023/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 821cc9af..8b889508 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -34,7 +34,7 @@ TAG=$(curl https://api.github.com/repos/triton-inference-server/server/releases/ export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 git clone -b mesharma-ci https://github.com/triton-inference-server/server.git -./server/build.py -v --enable-logging +python3 server/build.py -v --enable-logging --enable-stats --enable-tracing --enable-metrics From 93a10a5c58155450ba4bb8fc9c0388c63eb8ac80 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 20:47:54 -0700 Subject: [PATCH 024/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 
8b889508..1c05e3d5 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -51,4 +51,4 @@ python3 server/build.py -v --enable-logging --upstream-container-version=${TRITON_CONTAINER_VERSION} --backend=python:r${TRITON_CONTAINER_VERSION} --backend=vllm:r${TRITON_CONTAINER_VERSION} - --vllm-version=${VLLM_VERSION} + --vllm-version=${VLLM_VERSION} 2>&1 From 50cc924d71701998ff15f86170270c48d13a5e79 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 21:07:36 -0700 Subject: [PATCH 025/110] Update build_source.sh --- ci/build/build_source.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 1c05e3d5..19ecf457 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -28,6 +28,7 @@ # Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06 +echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases TAG=$(curl https://api.github.com/repos/triton-inference-server/server/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') From c800ef46c581cda3bc63980fa9af672b6199b079 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 22:12:36 -0700 Subject: [PATCH 026/110] Update build_source.sh --- ci/build/build_source.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 19ecf457..d1ac677d 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -42,6 +42,7 @@ python3 server/build.py -v --enable-logging --enable-gpu-metrics --enable-cpu-metrics 
--enable-gpu + --no-container-interactive --filesystem=gcs --filesystem=s3 --filesystem=azure_storage From 9dca430b243513947ec0e743128036363f52b4af Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 22:20:11 -0700 Subject: [PATCH 027/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index d1ac677d..a670a542 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -35,7 +35,7 @@ TAG=$(curl https://api.github.com/repos/triton-inference-server/server/releases/ export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 git clone -b mesharma-ci https://github.com/triton-inference-server/server.git -python3 server/build.py -v --enable-logging +set -x && python3 server/build.py -v --enable-logging --enable-stats --enable-tracing --enable-metrics From fa1846abe97bcfff1e896201ae35dee6398f0627 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 23 Jul 2024 22:20:55 -0700 Subject: [PATCH 028/110] Update build_source.sh --- ci/build/build_source.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index a670a542..ddffb608 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -53,4 +53,5 @@ set -x && python3 server/build.py -v --enable-logging --upstream-container-version=${TRITON_CONTAINER_VERSION} --backend=python:r${TRITON_CONTAINER_VERSION} --backend=vllm:r${TRITON_CONTAINER_VERSION} - --vllm-version=${VLLM_VERSION} 2>&1 + --vllm-version=${VLLM_VERSION} || RV=$?; 2>&1 +echo "RV=$RV" From 1fd0e5689605a09f9fa46bf69754aac2a90b8299 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 24 Jul 2024 00:27:32 -0700 Subject: [PATCH 029/110] Update build_source.sh --- 
ci/build/build_source.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index ddffb608..f026328a 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -42,6 +42,7 @@ set -x && python3 server/build.py -v --enable-logging --enable-gpu-metrics --enable-cpu-metrics --enable-gpu + --container-prebuild-command="docker login -u gitlab-ci-token -p ${CI_JOB_TOKEN} ${CI_REGISTRY}" --no-container-interactive --filesystem=gcs --filesystem=s3 From 8209da1a25e53cd2e104cd3c0de1f4ba5e856d58 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 24 Jul 2024 00:31:00 -0700 Subject: [PATCH 030/110] Update build_source.sh --- ci/build/build_source.sh | 1 - 1 file changed, 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index f026328a..dc53f5b8 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -43,7 +43,6 @@ set -x && python3 server/build.py -v --enable-logging --enable-cpu-metrics --enable-gpu --container-prebuild-command="docker login -u gitlab-ci-token -p ${CI_JOB_TOKEN} ${CI_REGISTRY}" - --no-container-interactive --filesystem=gcs --filesystem=s3 --filesystem=azure_storage From 7f6157caa1b59c5a3cc2b5cca51628fbaaefd86c Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 24 Jul 2024 00:35:19 -0700 Subject: [PATCH 031/110] Update build_source.sh --- ci/build/build_source.sh | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index dc53f5b8..546622e2 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -34,7 +34,8 @@ echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" TAG=$(curl https://api.github.com/repos/triton-inference-server/server/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 
-git clone -b mesharma-ci https://github.com/triton-inference-server/server.git +# git clone -b mesharma-ci https://github.com/triton-inference-server/server.git +git clone https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v --enable-logging --enable-stats --enable-tracing @@ -52,6 +53,4 @@ set -x && python3 server/build.py -v --enable-logging --endpoint=vertex-ai --upstream-container-version=${TRITON_CONTAINER_VERSION} --backend=python:r${TRITON_CONTAINER_VERSION} - --backend=vllm:r${TRITON_CONTAINER_VERSION} - --vllm-version=${VLLM_VERSION} || RV=$?; 2>&1 -echo "RV=$RV" + --backend=vllm:r${TRITON_CONTAINER_VERSION} 2>&1 From a5e9fc4f7051aab447a836646135888c270e5ff3 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 24 Jul 2024 00:39:25 -0700 Subject: [PATCH 032/110] Update build_source.sh --- ci/build/build_source.sh | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 546622e2..75fe9aa8 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -34,8 +34,7 @@ echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" TAG=$(curl https://api.github.com/repos/triton-inference-server/server/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 -# git clone -b mesharma-ci https://github.com/triton-inference-server/server.git -git clone https://github.com/triton-inference-server/server.git +git clone -b mesharma-ci https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v --enable-logging --enable-stats --enable-tracing @@ -53,4 +52,5 @@ set -x && python3 server/build.py -v --enable-logging --endpoint=vertex-ai --upstream-container-version=${TRITON_CONTAINER_VERSION} --backend=python:r${TRITON_CONTAINER_VERSION} - --backend=vllm:r${TRITON_CONTAINER_VERSION} 2>&1 + 
--backend=vllm:r${TRITON_CONTAINER_VERSION} + --vllm-version=${VLLM_VERSION} 2>&1 From 0301c0431b50ff8e6ff8d546f1e511a3897306e2 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 24 Jul 2024 09:53:22 -0700 Subject: [PATCH 033/110] Update build_source.sh --- ci/build/build_source.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 75fe9aa8..90c6df5c 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -42,6 +42,7 @@ set -x && python3 server/build.py -v --enable-logging --enable-gpu-metrics --enable-cpu-metrics --enable-gpu + --no-container-interactive --container-prebuild-command="docker login -u gitlab-ci-token -p ${CI_JOB_TOKEN} ${CI_REGISTRY}" --filesystem=gcs --filesystem=s3 From b6f351e1244e0a556aa3e8ffadd4feb2a2d5f716 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 24 Jul 2024 12:07:51 -0700 Subject: [PATCH 034/110] Update build_source.sh --- ci/build/build_source.sh | 43 +++++++++++++++++++++------------------- 1 file changed, 23 insertions(+), 20 deletions(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 90c6df5c..c09da14b 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -33,25 +33,28 @@ echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases TAG=$(curl https://api.github.com/repos/triton-inference-server/server/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 +echo "VLLM_VERSION = ${VLLM_VERSION}" git clone -b mesharma-ci https://github.com/triton-inference-server/server.git -set -x && python3 server/build.py -v --enable-logging - --enable-stats - --enable-tracing - --enable-metrics - --enable-gpu-metrics - --enable-cpu-metrics - --enable-gpu - 
--no-container-interactive - --container-prebuild-command="docker login -u gitlab-ci-token -p ${CI_JOB_TOKEN} ${CI_REGISTRY}" - --filesystem=gcs - --filesystem=s3 - --filesystem=azure_storage - --endpoint=http - --endpoint=grpc - --endpoint=sagemaker - --endpoint=vertex-ai - --upstream-container-version=${TRITON_CONTAINER_VERSION} - --backend=python:r${TRITON_CONTAINER_VERSION} - --backend=vllm:r${TRITON_CONTAINER_VERSION} - --vllm-version=${VLLM_VERSION} 2>&1 +set -x && python3 server/build.py -v \ + --enable-logging \ + --enable-stats \ + --enable-tracing \ + --enable-metrics \ + --enable-gpu-metrics \ + --enable-cpu-metrics \ + --enable-gpu \ + --no-container-interactive \ + --container-prebuild-command="docker login -u gitlab-ci-token -p ${CI_JOB_TOKEN} ${CI_REGISTRY}" \ + --filesystem=gcs \ + --filesystem=s3 \ + --filesystem=azure_storage \ + --endpoint=http \ + --endpoint=grpc \ + --endpoint=sagemaker \ + --endpoint=vertex-ai \ + --upstream-container-version=${TRITON_CONTAINER_VERSION} \ + --backend=python:r${TRITON_CONTAINER_VERSION} \ + --backend=vllm:r${TRITON_CONTAINER_VERSION} \ + --vllm-version=${VLLM_VERSION} 2>&1 \ + / From ba5dba3ca2f9574a2d8fd36d11630a800fba6c6e Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 24 Jul 2024 12:11:14 -0700 Subject: [PATCH 035/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index c09da14b..d3cc7239 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -31,7 +31,7 @@ export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06 echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases -TAG=$(curl https://api.github.com/repos/triton-inference-server/server/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') +TAG=$(curl 
https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 echo "VLLM_VERSION = ${VLLM_VERSION}" From bfe71315aae49bcd5ad1064a9400412427db18d9 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 24 Jul 2024 12:25:42 -0700 Subject: [PATCH 036/110] Update build_source.sh --- ci/build/build_source.sh | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index d3cc7239..b9b04755 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -56,5 +56,4 @@ set -x && python3 server/build.py -v \ --upstream-container-version=${TRITON_CONTAINER_VERSION} \ --backend=python:r${TRITON_CONTAINER_VERSION} \ --backend=vllm:r${TRITON_CONTAINER_VERSION} \ - --vllm-version=${VLLM_VERSION} 2>&1 \ - / + --vllm-version=${VLLM_VERSION} 2>&1 From d6606d32510145ec9dc0654f0d0ac957265268cd Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 24 Jul 2024 14:37:11 -0700 Subject: [PATCH 037/110] Update build_source.sh --- ci/build/build_source.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index b9b04755..fe061d48 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -56,4 +56,5 @@ set -x && python3 server/build.py -v \ --upstream-container-version=${TRITON_CONTAINER_VERSION} \ --backend=python:r${TRITON_CONTAINER_VERSION} \ --backend=vllm:r${TRITON_CONTAINER_VERSION} \ - --vllm-version=${VLLM_VERSION} 2>&1 + --vllm-version=${VLLM_VERSION} \ + --dryrun 2>&1 From 223a10b0153668711b0f045266310fa90d0c9dda Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 24 Jul 2024 17:11:00 -0700 Subject: [PATCH 038/110] Update build_source.sh --- ci/build/build_source.sh 
| 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index fe061d48..b9b04755 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -56,5 +56,4 @@ set -x && python3 server/build.py -v \ --upstream-container-version=${TRITON_CONTAINER_VERSION} \ --backend=python:r${TRITON_CONTAINER_VERSION} \ --backend=vllm:r${TRITON_CONTAINER_VERSION} \ - --vllm-version=${VLLM_VERSION} \ - --dryrun 2>&1 + --vllm-version=${VLLM_VERSION} 2>&1 From 23865a622655c4f2d2601f6945c1c4290744241f Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 24 Jul 2024 19:18:01 -0700 Subject: [PATCH 039/110] Update build_source.sh --- ci/build/build_source.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index b9b04755..74c64d50 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -32,7 +32,8 @@ echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') -export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 +# export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 +export VLLM_VERSION=0.5.0.post1 # seeing errors with latest vllm_version echo "VLLM_VERSION = ${VLLM_VERSION}" git clone -b mesharma-ci https://github.com/triton-inference-server/server.git From b1c58b353e4893854d595907cd9ffcd03925db38 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 24 Jul 2024 20:26:03 -0700 Subject: [PATCH 040/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 74c64d50..98c3a148 100644 --- 
a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -33,7 +33,7 @@ echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') # export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 -export VLLM_VERSION=0.5.0.post1 # seeing errors with latest vllm_version +export VLLM_VERSION=0.4.3 # seeing errors with latest vllm_version echo "VLLM_VERSION = ${VLLM_VERSION}" git clone -b mesharma-ci https://github.com/triton-inference-server/server.git From 72ee87613e030e022213110e1e91f0d4d15330fa Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 25 Jul 2024 10:13:07 -0700 Subject: [PATCH 041/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 98c3a148..0ce8aae3 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -36,7 +36,7 @@ TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep export VLLM_VERSION=0.4.3 # seeing errors with latest vllm_version echo "VLLM_VERSION = ${VLLM_VERSION}" -git clone -b mesharma-ci https://github.com/triton-inference-server/server.git +git clone -b mesharma-r24.06 https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ --enable-logging \ --enable-stats \ From 18c6ab65291346c146cf9e7bc3a81c5c361d6c34 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Sat, 27 Jul 2024 00:46:37 -0700 Subject: [PATCH 042/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 18 ++++++++++++++++++ 1 file changed, 18 insertions(+) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index 
07deb27b..2d850bfd 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -18,3 +18,21 @@ jobs: run: | #!/bin/bash curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD-SOURCE" "${{ secrets.PIPELINE_URL }}" + add-ready-label: + environment: GITLAB + needs: trigger-ci + runs-on: self-hosted + if: ${{ github.event.workflow_run.conclusion == 'success' }} + steps: + - name: Add labels + uses: actions/github-script@v5 + with: + script: | + github.rest.issues.addLabels({ + owner: context.repo.owner, + repo: context.repo.repo, + issue_number: context.issue.number, + labels: ['ready', 'verified_on_V100', 'verified_on_A100', 'verified_on_H100'] + }) + env: + GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} From d4b30c053549127ade7562423c1e188432ca30d1 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Sat, 27 Jul 2024 00:50:52 -0700 Subject: [PATCH 043/110] Delete .github/workflows/verify_latest_vllm.ci --- .github/workflows/verify_latest_vllm.ci | 21 --------------------- 1 file changed, 21 deletions(-) delete mode 100644 .github/workflows/verify_latest_vllm.ci diff --git a/.github/workflows/verify_latest_vllm.ci b/.github/workflows/verify_latest_vllm.ci deleted file mode 100644 index 4816f86c..00000000 --- a/.github/workflows/verify_latest_vllm.ci +++ /dev/null @@ -1,21 +0,0 @@ -on: - schedule: - - cron: '0 20 * * 4' -jobs: - mirror_repo: - environment: GITLAB - runs-on: self-hosted - steps: - - name: Sync Mirror Repository - run: | - #!/bin/bash - curl --request POST --header "PRIVATE-TOKEN:${{ secrets.TOKEN }}" "${{ secrets.MIRROR_URL }}" - trigger-ci: - environment: GITLAB - needs: mirror_repo - runs-on: self-hosted - steps: - - name: Trigger Pipeline - run: | - #!/bin/bash - curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD-SOURCE" "${{ 
secrets.PIPELINE_URL }}" From a2b3058555dc81f2e7f4bb9d29d9b5eac51e8bfb Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Sat, 27 Jul 2024 00:53:00 -0700 Subject: [PATCH 044/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 0ce8aae3..c9287974 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -57,4 +57,4 @@ set -x && python3 server/build.py -v \ --upstream-container-version=${TRITON_CONTAINER_VERSION} \ --backend=python:r${TRITON_CONTAINER_VERSION} \ --backend=vllm:r${TRITON_CONTAINER_VERSION} \ - --vllm-version=${VLLM_VERSION} 2>&1 + --vllm-version=${VLLM_VERSION} 2>&1 From dd7ccf91925e1f4554562f458dadcb751d1bb871 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Sat, 27 Jul 2024 00:56:19 -0700 Subject: [PATCH 045/110] Update build_source.sh --- ci/build/build_source.sh | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index c9287974..7866c14d 100644 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -28,15 +28,15 @@ # Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06 -echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" +echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') # export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 export VLLM_VERSION=0.4.3 
# seeing errors with latest vllm_version -echo "VLLM_VERSION = ${VLLM_VERSION}" +echo "VLLM_VERSION = ${VLLM_VERSION}" -git clone -b mesharma-r24.06 https://github.com/triton-inference-server/server.git +git clone -b mesharma-r24.06 https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ --enable-logging \ --enable-stats \ From cfa8c4880c685ae735cc642b18b316a95aa93dfe Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Sat, 27 Jul 2024 01:12:42 -0700 Subject: [PATCH 046/110] Delete .github/workflows/pre-commit.yaml --- .github/workflows/pre-commit.yaml | 39 ------------------------------- 1 file changed, 39 deletions(-) delete mode 100644 .github/workflows/pre-commit.yaml diff --git a/.github/workflows/pre-commit.yaml b/.github/workflows/pre-commit.yaml deleted file mode 100644 index 531cc291..00000000 --- a/.github/workflows/pre-commit.yaml +++ /dev/null @@ -1,39 +0,0 @@ -# Copyright 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved. -# -# Redistribution and use in source and binary forms, with or without -# modification, are permitted provided that the following conditions -# are met: -# * Redistributions of source code must retain the above copyright -# notice, this list of conditions and the following disclaimer. -# * Redistributions in binary form must reproduce the above copyright -# notice, this list of conditions and the following disclaimer in the -# documentation and/or other materials provided with the distribution. -# * Neither the name of NVIDIA CORPORATION nor the names of its -# contributors may be used to endorse or promote products derived -# from this software without specific prior written permission. -# -# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY -# EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE -# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR -# PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL THE COPYRIGHT OWNER OR -# CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, -# EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, -# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR -# PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY -# OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT -# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE -# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. - -name: pre-commit - -on: - pull_request: - -jobs: - pre-commit: - runs-on: ubuntu-22.04 - steps: - - uses: actions/checkout@v3 - - uses: actions/setup-python@v3 - - uses: pre-commit/action@v3.0.0 - From 8bdc8e0cb47307fb90ab98fa6be103907ca6549f Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Sat, 27 Jul 2024 01:47:36 -0700 Subject: [PATCH 047/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index 2d850bfd..d0b3655f 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -20,9 +20,8 @@ jobs: curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD-SOURCE" "${{ secrets.PIPELINE_URL }}" add-ready-label: environment: GITLAB - needs: trigger-ci runs-on: self-hosted - if: ${{ github.event.workflow_run.conclusion == 'success' }} + if: ${{ always() && !cancelled() && needs.*.result == 'success' }} steps: - name: Add labels uses: actions/github-script@v5 From 07912f281b7c677734aa1becc57e30571de14dda Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 29 Jul 2024 12:27:04 -0700 Subject: [PATCH 048/110] Create contributor.yml --- .github/workflows/contributor.yml | 21 
+++++++++++++++++++++ 1 file changed, 21 insertions(+) create mode 100644 .github/workflows/contributor.yml diff --git a/.github/workflows/contributor.yml b/.github/workflows/contributor.yml new file mode 100644 index 00000000..fdf48536 --- /dev/null +++ b/.github/workflows/contributor.yml @@ -0,0 +1,21 @@ +name: Welcome message +on: + pull_request_target: + types: [opened] + +jobs: + pr_reminder: + runs-on: ubuntu-latest + steps: + - name: Add first comment + uses: actions/github-script@v6 + with: + script: | + github.rest.issues.createComment({ + owner: context.repo.owner, + repo: context.repo.repo, + issue_number: context.issue.number, + body: '👋 Hi! \nThank you for contributing to the project.\n Just a reminder: PRs would not trigger full CI run by default. You can run CI tests by commenting `/ready` on the PR.\n🚀' + }) + env: + GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} From 9268c2fb8225cf78118b7969dd9b81ec82813b92 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 29 Jul 2024 12:28:46 -0700 Subject: [PATCH 049/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index d0b3655f..9d743b50 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -18,7 +18,7 @@ jobs: run: | #!/bin/bash curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD-SOURCE" "${{ secrets.PIPELINE_URL }}" - add-ready-label: + add-verified-labels: environment: GITLAB runs-on: self-hosted if: ${{ always() && !cancelled() && needs.*.result == 'success' }} From 98f4a3fcd25137354cf335c212f7ef1cf9f3aaac Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 30 Jul 2024 13:16:02 -0700 Subject: [PATCH 050/110] Create verified.yml ---
.github/workflows/verified.yml | 23 +++++++++++++++++++++++ 1 file changed, 23 insertions(+) create mode 100644 .github/workflows/verified.yml diff --git a/.github/workflows/verified.yml b/.github/workflows/verified.yml new file mode 100644 index 00000000..1c2c005d --- /dev/null +++ b/.github/workflows/verified.yml @@ -0,0 +1,23 @@ +on: + issue_comment: + types: [created] +jobs: + run-test: + runs-on: ubuntu-latest + if: github.event.issue.pull_request && contains(github.event.comment.body, '/ready')add-verified-labels: + environment: GITLAB + runs-on: self-hosted + if: ${{ always() && !cancelled() && needs.*.result == 'success' }} + steps: + - name: Add labels + uses: actions/github-script@v5 + with: + script: | + github.rest.issues.addLabels({ + owner: context.repo.owner, + repo: context.repo.repo, + issue_number: context.issue.number, + labels: ['ready', 'verified_on_V100', 'verified_on_A100', 'verified_on_H100'] + }) + env: + GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} From e0c4ad4a041acd23b92d2c37f0eb416fe90fdcd9 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 30 Jul 2024 13:16:53 -0700 Subject: [PATCH 051/110] Update verified.yml --- .github/workflows/verified.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/verified.yml b/.github/workflows/verified.yml index 1c2c005d..5862bce9 100644 --- a/.github/workflows/verified.yml +++ b/.github/workflows/verified.yml @@ -2,9 +2,9 @@ on: issue_comment: types: [created] jobs: - run-test: + add-verified-labels: runs-on: ubuntu-latest - if: github.event.issue.pull_request && contains(github.event.comment.body, '/ready')add-verified-labels: + if: github.event.issue.pull_request && contains(github.event.comment.body, '/ready') environment: GITLAB runs-on: self-hosted if: ${{ always() && !cancelled() && needs.*.result == 'success' }} From 013e3895e41319e8b28df50e195ef682444ea24a Mon Sep 17 00:00:00 2001 From: Meenakshi
Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 30 Jul 2024 13:26:48 -0700 Subject: [PATCH 052/110] Update verified.yml --- .github/workflows/verified.yml | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/.github/workflows/verified.yml b/.github/workflows/verified.yml index 5862bce9..5f4d731a 100644 --- a/.github/workflows/verified.yml +++ b/.github/workflows/verified.yml @@ -5,10 +5,7 @@ jobs: add-verified-labels: runs-on: ubuntu-latest if: github.event.issue.pull_request && contains(github.event.comment.body, '/ready') - environment: GITLAB - runs-on: self-hosted - if: ${{ always() && !cancelled() && needs.*.result == 'success' }} - steps: + steps: - name: Add labels uses: actions/github-script@v5 with: From 20f3d396b1c56eab4c50628245087de7a0ac34c3 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 31 Jul 2024 10:57:27 -0700 Subject: [PATCH 053/110] Update contributor.yml --- .github/workflows/contributor.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/contributor.yml b/.github/workflows/contributor.yml index fdf48536..606e1b20 100644 --- a/.github/workflows/contributor.yml +++ b/.github/workflows/contributor.yml @@ -15,7 +15,7 @@ jobs: owner: context.repo.owner, repo: context.repo.repo, issue_number: context.issue.number, - body: '👋 Hi! \nThank you for contributing to the project.\n Just a reminder: PRs would not trigger full CI run by default. You can run CI tests by commenting `/ready` on the PR.\n🚀' + body: '👋 Hi! \nThank you for contributing to the project.\n Just a reminder: PRs will trigger full CI run by default.
We will add verified labels on the PR once build and tests steps are successful.\n🚀' }) env: GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} From 2d5098a15bb8479b98f26f0b9a89c9fee8ad68ac Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 31 Jul 2024 11:04:04 -0700 Subject: [PATCH 054/110] Delete .github/workflows/verified.yml --- .github/workflows/verified.yml | 20 -------------------- 1 file changed, 20 deletions(-) delete mode 100644 .github/workflows/verified.yml diff --git a/.github/workflows/verified.yml b/.github/workflows/verified.yml deleted file mode 100644 index 5f4d731a..00000000 --- a/.github/workflows/verified.yml +++ /dev/null @@ -1,20 +0,0 @@ -on: - issue_comment: - types: [created] -jobs: - add-verified-labels: - runs-on: ubuntu-latest - if: github.event.issue.pull_request && contains(github.event.comment.body, '/ready') - steps: - - name: Add labels - uses: actions/github-script@v5 - with: - script: | - github.rest.issues.addLabels({ - owner: context.repo.owner, - repo: context.repo.repo, - issue_number: context.issue.number, - labels: ['ready', 'verified_on_V100', 'verified_on_A100', 'verified_on_H100'] - }) - env: - GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} From 84e14dded0c7b473d847066dbe5861e50c355b3d Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 31 Jul 2024 14:17:29 -0700 Subject: [PATCH 055/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 17 ----------------- 1 file changed, 17 deletions(-) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index 9d743b50..07deb27b 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -18,20 +18,3 @@ jobs: run: | #!/bin/bash curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD-SOURCE" "${{ secrets.PIPELINE_URL }}" - add-verified-labels:
- environment: GITLAB - runs-on: self-hosted - if: ${{ always() && !cancelled() && needs.*.result == 'success' }} - steps: - - name: Add labels - uses: actions/github-script@v5 - with: - script: | - github.rest.issues.addLabels({ - owner: context.repo.owner, - repo: context.repo.repo, - issue_number: context.issue.number, - labels: ['ready', 'verified_on_V100', 'verified_on_A100', 'verified_on_H100'] - }) - env: - GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} From fb2023686d943466977efa9a5c673aff50862ec4 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 5 Aug 2024 12:33:55 -0700 Subject: [PATCH 056/110] Create pre-commit.yaml --- .github/workflows/pre-commit.yaml | 38 +++++++++++++++++++++++++++++++ 1 file changed, 38 insertions(+) create mode 100644 .github/workflows/pre-commit.yaml diff --git a/.github/workflows/pre-commit.yaml b/.github/workflows/pre-commit.yaml new file mode 100644 index 00000000..ab4bd951 --- /dev/null +++ b/.github/workflows/pre-commit.yaml @@ -0,0 +1,38 @@ +# Copyright 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved. +# +# Redistribution and use in source and binary forms, with or without +# modification, are permitted provided that the following conditions +# are met: +# * Redistributions of source code must retain the above copyright +# notice, this list of conditions and the following disclaimer. +# * Redistributions in binary form must reproduce the above copyright +# notice, this list of conditions and the following disclaimer in the +# documentation and/or other materials provided with the distribution. +# * Neither the name of NVIDIA CORPORATION nor the names of its +# contributors may be used to endorse or promote products derived +# from this software without specific prior written permission. 
+# +# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY +# EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR +# PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR +# CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, +# EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, +# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR +# PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY +# OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT +# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE +# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + +name: pre-commit + +on: + pull_request: + +jobs: + pre-commit: + runs-on: ubuntu-22.04 + steps: + - uses: actions/checkout@v3 + - uses: actions/setup-python@v3 + - uses: pre-commit/action@v3.0.0 From 29e73baa400ef96f7d35d0cc86acd034f2df8b38 Mon Sep 17 00:00:00 2001 From: Meenakshi Date: Mon, 5 Aug 2024 12:42:25 -0700 Subject: [PATCH 057/110] fix pre-commit issues --- ci/build/build_docker.sh | 0 ci/build/build_source.sh | 0 2 files changed, 0 insertions(+), 0 deletions(-) mode change 100644 => 100755 ci/build/build_docker.sh mode change 100644 => 100755 ci/build/build_source.sh diff --git a/ci/build/build_docker.sh b/ci/build/build_docker.sh old mode 100644 new mode 100755 diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh old mode 100644 new mode 100755 From a2e7db3647176a932647993eddd72210e35efc52 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 5 Aug 2024 13:32:18 -0700 Subject: [PATCH 058/110] Update build_source.sh --- ci/build/build_source.sh | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 7866c14d..a58c69a6 100755 --- 
a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -33,7 +33,6 @@ echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') # export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 -export VLLM_VERSION=0.4.3 # seeing errors with latest vllm_version echo "VLLM_VERSION = ${VLLM_VERSION}" git clone -b mesharma-r24.06 https://github.com/triton-inference-server/server.git @@ -58,3 +57,6 @@ set -x && python3 server/build.py -v \ --backend=python:r${TRITON_CONTAINER_VERSION} \ --backend=vllm:r${TRITON_CONTAINER_VERSION} \ --vllm-version=${VLLM_VERSION} 2>&1 +# Build Triton Server +cd server/build +bash -x ./docker_build From bfb94668802e4f66e83fce32c6a87e6d9dd8ead7 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 5 Aug 2024 13:34:04 -0700 Subject: [PATCH 059/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index a58c69a6..f77f69dc 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -32,7 +32,7 @@ echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') -# export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 +export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 echo "VLLM_VERSION = ${VLLM_VERSION}" git clone -b mesharma-r24.06 https://github.com/triton-inference-server/server.git From f348d4928a33dbaccd2faf3bcf7a7e23f99cfbed Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 5 Aug 2024 
13:34:37 -0700 Subject: [PATCH 060/110] Update README.md --- README.md | 14 +++++++++++++- 1 file changed, 13 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 13953f58..e51fcc46 100644 --- a/README.md +++ b/README.md @@ -82,7 +82,15 @@ latest YY.MM (year.month) of [Triton release](https://github.com/triton-inferenc ``` # YY.MM is the version of Triton. -export TRITON_CONTAINER_VERSION= +# Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases +TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') +export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06 +echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" + +# Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases +TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') +export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 +echo "VLLM_VERSION = ${VLLM_VERSION}" ./build.py -v --enable-logging --enable-stats --enable-tracing @@ -100,6 +108,10 @@ export TRITON_CONTAINER_VERSION= --upstream-container-version=${TRITON_CONTAINER_VERSION} --backend=python:r${TRITON_CONTAINER_VERSION} --backend=vllm:r${TRITON_CONTAINER_VERSION} + --vllm-version=${VLLM_VERSION} +# Build Triton Server +cd server/build +bash -x ./docker_build ``` ### Option 3. 
Add the vLLM Backend to the Default Triton Container From 85c53aa8c2f46da9ea9dd3f072805b7cf4eb1e9a Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 5 Aug 2024 13:36:23 -0700 Subject: [PATCH 061/110] Update build_source.sh --- ci/build/build_source.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index f77f69dc..2f4ef2e2 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -35,6 +35,7 @@ TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 echo "VLLM_VERSION = ${VLLM_VERSION}" +#git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git git clone -b mesharma-r24.06 https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ --enable-logging \ From 25a71f7ee74c0b803511580786cc6feca036eaf3 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 5 Aug 2024 13:37:00 -0700 Subject: [PATCH 062/110] Update README.md --- README.md | 2 ++ 1 file changed, 2 insertions(+) diff --git a/README.md b/README.md index e51fcc46..82601f62 100644 --- a/README.md +++ b/README.md @@ -91,6 +91,8 @@ echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 echo "VLLM_VERSION = ${VLLM_VERSION}" + +git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git ./build.py -v --enable-logging --enable-stats --enable-tracing From deb13cecdb21254cba11cfe9457f6a079d77c53c Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 5 Aug 2024 13:51:19 -0700 Subject: [PATCH 063/110] Update trigger_ci.yml --- 
.github/workflows/trigger_ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index 07deb27b..985605e9 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -17,4 +17,4 @@ jobs: - name: Trigger Pipeline run: | #!/bin/bash - curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD-SOURCE" "${{ secrets.PIPELINE_URL }}" + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD_SOURCE" "${{ secrets.PIPELINE_URL }}" From d888f12390f0c6a26497d094d7b24b1a49ae39d6 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 5 Aug 2024 13:55:40 -0700 Subject: [PATCH 064/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 12 +++++++++++- 1 file changed, 11 insertions(+), 1 deletion(-) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index 985605e9..19ffa2bd 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -17,4 +17,14 @@ jobs: - name: Trigger Pipeline run: | #!/bin/bash - curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD_SOURCE" "${{ secrets.PIPELINE_URL }}" + # Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases + TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') + export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06 + echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" + + # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases + TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i 
"tag_name" | awk -F '"' '{print $4}') + export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 + echo "VLLM_VERSION = ${VLLM_VERSION}" + + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD_SOURCE" -F variables[TRITON_CONTAINER_VERSION]="TRITON_CONTAINER_VERSION" -F variables[VLLM_VERSION]="VLLM_VERSION" "${{ secrets.PIPELINE_URL }}" From 7a08c86b7db7315de976c59480586f1fc0f3d4a3 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 5 Aug 2024 13:58:20 -0700 Subject: [PATCH 065/110] Update build_source.sh --- ci/build/build_source.sh | 16 +++++++--------- 1 file changed, 7 insertions(+), 9 deletions(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 2f4ef2e2..61f3c600 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -25,15 +25,13 @@ # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
-# Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases -TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') -export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06 -echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" - -# Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases -TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') -export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 -echo "VLLM_VERSION = ${VLLM_VERSION}" +while getopts t:v: flag +do + case "${flag}" in + u) TRITON_CONTAINER_VERSION=${OPTARG};; + a) VLLM_VERSION=${OPTARG};; + esac +done #git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git git clone -b mesharma-r24.06 https://github.com/triton-inference-server/server.git From e76e209d32355baea1d58cc856083bac1377389b Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 5 Aug 2024 14:27:51 -0700 Subject: [PATCH 066/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 61f3c600..3d6157e4 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -34,7 +34,7 @@ do done #git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git -git clone -b mesharma-r24.06 https://github.com/triton-inference-server/server.git +git clone -b mesharma-ci https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ --enable-logging \ --enable-stats \ From 1b3dbc0d7e6345425c2185248cd3a4f00a36ef87 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 5 Aug 2024 15:29:00 
-0700 Subject: [PATCH 067/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 3d6157e4..d1ecd09d 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -34,7 +34,7 @@ do done #git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git -git clone -b mesharma-ci https://github.com/triton-inference-server/server.git +git clone -b mesharma-r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ --enable-logging \ --enable-stats \ From 1a93230ba33e8a16743a264177bdcda545f225f2 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 6 Aug 2024 12:34:48 -0700 Subject: [PATCH 068/110] Update build_source.sh --- ci/build/build_source.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index d1ecd09d..4fdc6731 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -33,6 +33,7 @@ do esac done +echo "Triton version is $TRITON_CONTAINER_VERSION and vllm version is $VLLM_VERSION" #git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git git clone -b mesharma-r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ From 1efadc7b422c9625feec4e5ffc42bc8078116cdf Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 6 Aug 2024 12:54:55 -0700 Subject: [PATCH 069/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index 19ffa2bd..adada373 100644 --- a/.github/workflows/trigger_ci.yml +++ 
b/.github/workflows/trigger_ci.yml @@ -27,4 +27,4 @@ jobs: export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 echo "VLLM_VERSION = ${VLLM_VERSION}" - curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD_SOURCE" -F variables[TRITON_CONTAINER_VERSION]="TRITON_CONTAINER_VERSION" -F variables[VLLM_VERSION]="VLLM_VERSION" "${{ secrets.PIPELINE_URL }}" + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD_SOURCE" -F variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[VLLM_VERSION]="${VLLM_VERSION}" "${{ secrets.PIPELINE_URL }}" From 3d0110a74f7e2bf4dc36da60b8be6a2d3d056a75 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 6 Aug 2024 12:57:20 -0700 Subject: [PATCH 070/110] Update build_source.sh --- ci/build/build_source.sh | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 4fdc6731..c9496354 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -34,8 +34,7 @@ do done echo "Triton version is $TRITON_CONTAINER_VERSION and vllm version is $VLLM_VERSION" -#git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git -git clone -b mesharma-r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git +git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ --enable-logging \ --enable-stats \ From f29d9d04f38b763c170af038b1b34dbe5fe560fb Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 6 Aug 2024 13:07:02 -0700 Subject: [PATCH 071/110] Update build_source.sh --- ci/build/build_source.sh | 1 + 1 file changed, 1 insertion(+) diff --git 
a/ci/build/build_source.sh b/ci/build/build_source.sh index c9496354..409e3b96 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -35,6 +35,7 @@ done echo "Triton version is $TRITON_CONTAINER_VERSION and vllm version is $VLLM_VERSION" git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git +git clone -b rmesharma-r24.06 https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ --enable-logging \ --enable-stats \ From dec1329e77d4ad1e4058da689880f82458e226f7 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 6 Aug 2024 13:07:15 -0700 Subject: [PATCH 072/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 409e3b96..7aa21f84 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -34,7 +34,7 @@ do done echo "Triton version is $TRITON_CONTAINER_VERSION and vllm version is $VLLM_VERSION" -git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git +#git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git git clone -b rmesharma-r24.06 https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ --enable-logging \ From 52aadedd8ec7817b566d8dc2b1306627a603566c Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 6 Aug 2024 13:10:19 -0700 Subject: [PATCH 073/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 7aa21f84..ad5a4e50 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -35,7 +35,7 @@ done echo "Triton version is $TRITON_CONTAINER_VERSION and vllm version is 
$VLLM_VERSION" #git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git -git clone -b rmesharma-r24.06 https://github.com/triton-inference-server/server.git +git clone -b mesharma-ci https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ --enable-logging \ --enable-stats \ From 62fc87c5e097c4f1c1ab297f71d78289cbf5426e Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 6 Aug 2024 13:22:11 -0700 Subject: [PATCH 074/110] Update build_source.sh --- ci/build/build_source.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index ad5a4e50..082672d5 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -33,7 +33,7 @@ do esac done -echo "Triton version is $TRITON_CONTAINER_VERSION and vllm version is $VLLM_VERSION" +echo "Triton version is ${TRITON_CONTAINER_VERSION} and vllm version is ${VLLM_VERSION}" #git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git git clone -b mesharma-ci https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ From 660598348189b7016fefdcf882f934c649047123 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 6 Aug 2024 13:29:01 -0700 Subject: [PATCH 075/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index adada373..623cda83 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -20,11 +20,24 @@ jobs: # Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" 
| awk -F '"' '{print $4}') export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06 + if [ -z "$TRITON_CONTAINER_VERSION" ] + then + echo "\$TRITON_CONTAINER_VERSION is NULL, setting it to 24.07" + else + echo "\$TRITON_CONTAINER_VERSION is NOT NULL" + fi echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 + if [ -z "$VLLM_VERSION" ] + then + echo "\$VLLM_VERSION is NULL, setting it to 0.5.3.post1" + else + echo "\$VLLM_VERSION is NOT NULL" + fi echo "VLLM_VERSION = ${VLLM_VERSION}" + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD_SOURCE" -F variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[VLLM_VERSION]="${VLLM_VERSION}" "${{ secrets.PIPELINE_URL }}" From 98fbc29ffd91598570f4166806c5ef877d40e194 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 6 Aug 2024 13:36:49 -0700 Subject: [PATCH 076/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 2 ++ 1 file changed, 2 insertions(+) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index 623cda83..fa8a520d 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -23,6 +23,7 @@ jobs: if [ -z "$TRITON_CONTAINER_VERSION" ] then echo "\$TRITON_CONTAINER_VERSION is NULL, setting it to 24.07" + TRITON_CONTAINER_VERSION=24.07 else echo "\$TRITON_CONTAINER_VERSION is NOT NULL" fi @@ -34,6 +35,7 @@ jobs: if [ -z "$VLLM_VERSION" ] then echo "\$VLLM_VERSION is NULL, setting it to 0.5.3.post1" + VLLM_VERSION=0.5.3.post1 else echo "\$VLLM_VERSION is NOT NULL" fi From f484188fd1aa314f9f492ac7e97fdf3427a190d7 Mon Sep 17 
00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Tue, 6 Aug 2024 14:55:51 -0700 Subject: [PATCH 077/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 1 - 1 file changed, 1 deletion(-) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index fa8a520d..cefbfa76 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -41,5 +41,4 @@ jobs: fi echo "VLLM_VERSION = ${VLLM_VERSION}" - curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD_SOURCE" -F variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[VLLM_VERSION]="${VLLM_VERSION}" "${{ secrets.PIPELINE_URL }}" From 91dc27ae423d1dccb15019d6e8bc68da9ad1c0c7 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Fri, 30 Aug 2024 11:38:26 -0700 Subject: [PATCH 078/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index cefbfa76..d4343040 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -19,11 +19,11 @@ jobs: #!/bin/bash # Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') - export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06 + export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.08 if [ -z "$TRITON_CONTAINER_VERSION" ] then echo "\$TRITON_CONTAINER_VERSION is NULL, setting it to 24.07" - TRITON_CONTAINER_VERSION=24.07 + TRITON_CONTAINER_VERSION=24.08 else echo "\$TRITON_CONTAINER_VERSION is NOT NULL" fi @@ -31,11 +31,11 @@ jobs: # Get latest VLLM RELEASED VERSION 
from https://github.com/vllm-project/vllm/releases TAG=$(curl https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') - export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 + export VLLM_VERSION=${TAG#v} # example: 0.5.5 if [ -z "$VLLM_VERSION" ] then - echo "\$VLLM_VERSION is NULL, setting it to 0.5.3.post1" - VLLM_VERSION=0.5.3.post1 + echo "\$VLLM_VERSION is NULL, setting it to 0.5.5" + VLLM_VERSION=0.5.5 else echo "\$VLLM_VERSION is NOT NULL" fi From 9bf9c12aef04356788f7850bb63ecedf17fbdf9e Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Fri, 30 Aug 2024 11:47:13 -0700 Subject: [PATCH 079/110] Update trigger_ci.yml --- .github/workflows/trigger_ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/trigger_ci.yml index d4343040..b6546258 100644 --- a/.github/workflows/trigger_ci.yml +++ b/.github/workflows/trigger_ci.yml @@ -22,7 +22,7 @@ jobs: export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.08 if [ -z "$TRITON_CONTAINER_VERSION" ] then - echo "\$TRITON_CONTAINER_VERSION is NULL, setting it to 24.07" + echo "\$TRITON_CONTAINER_VERSION is NULL, setting it to 24.08" TRITON_CONTAINER_VERSION=24.08 else echo "\$TRITON_CONTAINER_VERSION is NOT NULL" From 805ae1e0fd82b87cb7228fc8668b4e5cd48fcab0 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Fri, 30 Aug 2024 12:14:08 -0700 Subject: [PATCH 080/110] Update README.md --- README.md | 3 +++ 1 file changed, 3 insertions(+) diff --git a/README.md b/README.md index 82601f62..517cca02 100644 --- a/README.md +++ b/README.md @@ -27,6 +27,9 @@ --> [![License](https://img.shields.io/badge/License-BSD3-lightgrey.svg)](https://opensource.org/licenses/BSD-3-Clause) +![Static Badge](https://img.shields.io/badge/Triton-24.08-Purple) +![Static 
Badge](https://img.shields.io/badge/vLLM-0.5.5-blue) +![Static Badge](https://img.shields.io/badge/Passing-A100%2CH100%2CGH100-Green) # vLLM Backend From 7ccea9c21deab631fcec4522a96d45c4b5a13bf0 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Fri, 30 Aug 2024 12:15:11 -0700 Subject: [PATCH 081/110] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 517cca02..ee822da0 100644 --- a/README.md +++ b/README.md @@ -27,7 +27,7 @@ --> [![License](https://img.shields.io/badge/License-BSD3-lightgrey.svg)](https://opensource.org/licenses/BSD-3-Clause) -![Static Badge](https://img.shields.io/badge/Triton-24.08-Purple) +![Static Badge](https://img.shields.io/badge/Triton-24.08-8A2BE2) ![Static Badge](https://img.shields.io/badge/vLLM-0.5.5-blue) ![Static Badge](https://img.shields.io/badge/Passing-A100%2CH100%2CGH100-Green) From d347b1dccac45c94e90cda8f17d08a4198238a77 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Fri, 30 Aug 2024 12:21:15 -0700 Subject: [PATCH 082/110] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index ee822da0..9e3b2848 100644 --- a/README.md +++ b/README.md @@ -29,7 +29,7 @@ [![License](https://img.shields.io/badge/License-BSD3-lightgrey.svg)](https://opensource.org/licenses/BSD-3-Clause) ![Static Badge](https://img.shields.io/badge/Triton-24.08-8A2BE2) ![Static Badge](https://img.shields.io/badge/vLLM-0.5.5-blue) -![Static Badge](https://img.shields.io/badge/Passing-A100%2CH100%2CGH100-Green) +![Static Badge](https://img.shields.io/badge/CI_Passing-A100%2CH100%2CGH100-Green) # vLLM Backend From fff8f14946e9345edbacff7a5de395ffa50f0955 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 4 Sep 2024 13:30:37 -0700 Subject: [PATCH 083/110] 
Update build_docker.sh --- ci/build/build_docker.sh | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/ci/build/build_docker.sh b/ci/build/build_docker.sh index 571d22d5..34752a96 100755 --- a/ci/build/build_docker.sh +++ b/ci/build/build_docker.sh @@ -28,5 +28,12 @@ # Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06 +if [ -z "$TRITON_CONTAINER_VERSION" ] + then + echo "\$TRITON_CONTAINER_VERSION is NULL, setting it to 24.08" + TRITON_CONTAINER_VERSION=24.08 + else + echo "\$TRITON_CONTAINER_VERSION is NOT NULL" + fi docker pull nvcr.io/nvidia/tritonserver:${TRITON_CONTAINER_VERSION}-vllm-python-py3 From 156724a0549ad140dc7ed58b4b6f554afb303aaf Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 4 Sep 2024 16:08:05 -0700 Subject: [PATCH 084/110] Update build_docker.sh --- ci/build/build_docker.sh | 18 ++++++++---------- 1 file changed, 8 insertions(+), 10 deletions(-) diff --git a/ci/build/build_docker.sh b/ci/build/build_docker.sh index 34752a96..76ea2ed5 100755 --- a/ci/build/build_docker.sh +++ b/ci/build/build_docker.sh @@ -25,15 +25,13 @@ # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
-# Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases -TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') -export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.06 -if [ -z "$TRITON_CONTAINER_VERSION" ] - then - echo "\$TRITON_CONTAINER_VERSION is NULL, setting it to 24.08" - TRITON_CONTAINER_VERSION=24.08 - else - echo "\$TRITON_CONTAINER_VERSION is NOT NULL" - fi +while getopts t:v: flag +do + case "${flag}" in + u) TRITON_CONTAINER_VERSION=${OPTARG};; + a) VLLM_VERSION=${OPTARG};; + esac +done +echo "Triton version is ${TRITON_CONTAINER_VERSION} and vllm version is ${VLLM_VERSION}" docker pull nvcr.io/nvidia/tritonserver:${TRITON_CONTAINER_VERSION}-vllm-python-py3 From 4604761bc5d13f0154c96a59f9a5619cb92d6cc0 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Wed, 4 Sep 2024 16:24:28 -0700 Subject: [PATCH 085/110] Update build_docker.sh --- ci/build/build_docker.sh | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/ci/build/build_docker.sh b/ci/build/build_docker.sh index 76ea2ed5..46d1a426 100755 --- a/ci/build/build_docker.sh +++ b/ci/build/build_docker.sh @@ -25,13 +25,12 @@ # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
-while getopts t:v: flag +while getopts t: flag do case "${flag}" in - u) TRITON_CONTAINER_VERSION=${OPTARG};; - a) VLLM_VERSION=${OPTARG};; + u) PROD_CONTAINER=${OPTARG};; esac done -echo "Triton version is ${TRITON_CONTAINER_VERSION} and vllm version is ${VLLM_VERSION}" -docker pull nvcr.io/nvidia/tritonserver:${TRITON_CONTAINER_VERSION}-vllm-python-py3 +echo "Pulling container image ${PROD_CONTAINER}" +docker pull ${PROD_CONTAINER} From 232787fee6f9b17f1e06f280f088ade56502fa94 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 5 Sep 2024 12:11:27 -0700 Subject: [PATCH 086/110] Create vllm_release_ci.yml --- .github/workflows/vllm_release_ci.yml | 39 +++++++++++++++++++++++++++ 1 file changed, 39 insertions(+) create mode 100644 .github/workflows/vllm_release_ci.yml diff --git a/.github/workflows/vllm_release_ci.yml b/.github/workflows/vllm_release_ci.yml new file mode 100644 index 00000000..c2c82511 --- /dev/null +++ b/.github/workflows/vllm_release_ci.yml @@ -0,0 +1,39 @@ +name: Validate latest vLLM release from https://github.com/vllm-project/vllm/releases against latest Triton release +on: + schedule: + - cron: "30 09 */3 * *" +jobs: + mirror_repo: + environment: GITLAB + runs-on: self-hosted + steps: + - name: Sync Mirror Repository + run: | + #!/bin/bash + curl --request POST --header "PRIVATE-TOKEN:${{ secrets.TOKEN }}" "${{ secrets.MIRROR_URL }}" + trigger-ci: + environment: GITLAB + needs: mirror_repo + runs-on: self-hosted + steps: + - name: Trigger Pipeline + run: | + #!/bin/bash + # Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases + TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') + export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.08 + + # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases + TAG=$(curl 
https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') + export VLLM_VERSION=${TAG#v} # example: 0.5.5 + echo "VLLM_VERSION = ${VLLM_VERSION}" + + if [ -z "$TRITON_CONTAINER_VERSION" || -z "$VLLM_VERSION"] + then + echo "Can't find latest Triton or vllm version.. Skipping CI run" + else + echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" + echo "VLLM_VERSION = ${VLLM_VERSION}" + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="PULL_DOCKER" -F variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[VLLM_VERSION]="${VLLM_VERSION}" "${{ secrets.PIPELINE_URL }}" + fi + From 656c8f5d057e970eac6a5205c0df421294b7ea1e Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 5 Sep 2024 12:11:54 -0700 Subject: [PATCH 087/110] Rename trigger_ci.yml to triton_update_ci.yml --- .github/workflows/{trigger_ci.yml => triton_update_ci.yml} | 0 1 file changed, 0 insertions(+), 0 deletions(-) rename .github/workflows/{trigger_ci.yml => triton_update_ci.yml} (100%) diff --git a/.github/workflows/trigger_ci.yml b/.github/workflows/triton_update_ci.yml similarity index 100% rename from .github/workflows/trigger_ci.yml rename to .github/workflows/triton_update_ci.yml From 47b9a91312169600b62573ac056155e7363ef764 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 5 Sep 2024 12:13:04 -0700 Subject: [PATCH 088/110] Update triton_update_ci.yml --- .github/workflows/triton_update_ci.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/triton_update_ci.yml b/.github/workflows/triton_update_ci.yml index b6546258..e25b6b69 100644 --- a/.github/workflows/triton_update_ci.yml +++ b/.github/workflows/triton_update_ci.yml @@ -1,3 +1,4 @@ +name: Validate Triton Pull request by running our change on latest 
vLLM release on: pull_request: jobs: From 047b885209bb1fc531a0dd8bc06bb1b6daefb534 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 5 Sep 2024 12:14:23 -0700 Subject: [PATCH 089/110] Rename vllm_release_ci.yml to vllm_update_ci.yml --- .github/workflows/{vllm_release_ci.yml => vllm_update_ci.yml} | 0 1 file changed, 0 insertions(+), 0 deletions(-) rename .github/workflows/{vllm_release_ci.yml => vllm_update_ci.yml} (100%) diff --git a/.github/workflows/vllm_release_ci.yml b/.github/workflows/vllm_update_ci.yml similarity index 100% rename from .github/workflows/vllm_release_ci.yml rename to .github/workflows/vllm_update_ci.yml From fb7977f286f7496568bbdf515a1b69b0ea2835db Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 5 Sep 2024 12:15:35 -0700 Subject: [PATCH 090/110] Update vllm_update_ci.yml --- .github/workflows/vllm_update_ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/vllm_update_ci.yml b/.github/workflows/vllm_update_ci.yml index c2c82511..bdf2cb6f 100644 --- a/.github/workflows/vllm_update_ci.yml +++ b/.github/workflows/vllm_update_ci.yml @@ -1,4 +1,4 @@ -name: Validate latest vLLM release from https://github.com/vllm-project/vllm/releases against latest Triton release +name: Validate latest vLLM release from https://github.com/vllm-project/vllm/releases against latest Triton release https://github.com/triton-inference-server/vllm_backend/releases on: schedule: - cron: "30 09 */3 * *" From 2050086a374ff8ef81eac553bd19bb9b3df231f5 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 5 Sep 2024 12:18:03 -0700 Subject: [PATCH 091/110] Update vllm_update_ci.yml --- .github/workflows/vllm_update_ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/vllm_update_ci.yml b/.github/workflows/vllm_update_ci.yml 
index bdf2cb6f..3e7e9675 100644 --- a/.github/workflows/vllm_update_ci.yml +++ b/.github/workflows/vllm_update_ci.yml @@ -34,6 +34,6 @@ jobs: else echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" echo "VLLM_VERSION = ${VLLM_VERSION}" - curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="PULL_DOCKER" -F variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[VLLM_VERSION]="${VLLM_VERSION}" "${{ secrets.PIPELINE_URL }}" + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="PULL_DOCKER" -F variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[VLLM_VERSION]="${VLLM_VERSION}" -F variables[TEST_OPTION]="ALL_TESTS" "${{ secrets.PIPELINE_URL }}" fi From 94923644c526a4ea29f87ddb89c6712fdb2ae124 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 5 Sep 2024 12:18:27 -0700 Subject: [PATCH 092/110] Update triton_update_ci.yml --- .github/workflows/triton_update_ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/triton_update_ci.yml b/.github/workflows/triton_update_ci.yml index e25b6b69..3faffff2 100644 --- a/.github/workflows/triton_update_ci.yml +++ b/.github/workflows/triton_update_ci.yml @@ -42,4 +42,4 @@ jobs: fi echo "VLLM_VERSION = ${VLLM_VERSION}" - curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD_SOURCE" -F variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[VLLM_VERSION]="${VLLM_VERSION}" "${{ secrets.PIPELINE_URL }}" + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD_SOURCE" -F variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F 
variables[VLLM_VERSION]="${VLLM_VERSION}" -F variables[TEST_OPTION]="ALL_TESTS" "${{ secrets.PIPELINE_URL }}" From ce76a769b68952f45724be5e114cc7ef900f86af Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 5 Sep 2024 12:30:09 -0700 Subject: [PATCH 093/110] Update vllm_update_ci.yml --- .github/workflows/vllm_update_ci.yml | 1 - 1 file changed, 1 deletion(-) diff --git a/.github/workflows/vllm_update_ci.yml b/.github/workflows/vllm_update_ci.yml index 3e7e9675..417baa28 100644 --- a/.github/workflows/vllm_update_ci.yml +++ b/.github/workflows/vllm_update_ci.yml @@ -36,4 +36,3 @@ jobs: echo "VLLM_VERSION = ${VLLM_VERSION}" curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="PULL_DOCKER" -F variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[VLLM_VERSION]="${VLLM_VERSION}" -F variables[TEST_OPTION]="ALL_TESTS" "${{ secrets.PIPELINE_URL }}" fi - From 2fafdda6070fa7ab50e2a2c7d0765c1371ca0ea4 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 5 Sep 2024 12:32:28 -0700 Subject: [PATCH 094/110] Update vllm_update_ci.yml --- .github/workflows/vllm_update_ci.yml | 2 -- 1 file changed, 2 deletions(-) diff --git a/.github/workflows/vllm_update_ci.yml b/.github/workflows/vllm_update_ci.yml index 417baa28..3a3f91fc 100644 --- a/.github/workflows/vllm_update_ci.yml +++ b/.github/workflows/vllm_update_ci.yml @@ -22,12 +22,10 @@ jobs: # Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.08 - # Get latest VLLM RELEASED VERSION from https://github.com/vllm-project/vllm/releases TAG=$(curl 
https://api.github.com/repos/vllm-project/vllm/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') export VLLM_VERSION=${TAG#v} # example: 0.5.5 echo "VLLM_VERSION = ${VLLM_VERSION}" - if [ -z "$TRITON_CONTAINER_VERSION" || -z "$VLLM_VERSION"] then echo "Can't find latest Triton or vllm version.. Skipping CI run" From 57926632ecbdc473266c0bc3bf86f1d37db8451d Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Fri, 6 Sep 2024 11:35:42 -0700 Subject: [PATCH 095/110] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 9e3b2848..3c26fb22 100644 --- a/README.md +++ b/README.md @@ -29,7 +29,7 @@ [![License](https://img.shields.io/badge/License-BSD3-lightgrey.svg)](https://opensource.org/licenses/BSD-3-Clause) ![Static Badge](https://img.shields.io/badge/Triton-24.08-8A2BE2) ![Static Badge](https://img.shields.io/badge/vLLM-0.5.5-blue) -![Static Badge](https://img.shields.io/badge/CI_Passing-A100%2CH100%2CGH100-Green) +![Static Badge](https://img.shields.io/badge/CI_Passing-AV00%2CA100%2CH100-Green) # vLLM Backend From f3258ef2b656082e6ba3f16230819de3602bbea6 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Fri, 6 Sep 2024 11:35:59 -0700 Subject: [PATCH 096/110] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 3c26fb22..3953e652 100644 --- a/README.md +++ b/README.md @@ -29,7 +29,7 @@ [![License](https://img.shields.io/badge/License-BSD3-lightgrey.svg)](https://opensource.org/licenses/BSD-3-Clause) ![Static Badge](https://img.shields.io/badge/Triton-24.08-8A2BE2) ![Static Badge](https://img.shields.io/badge/vLLM-0.5.5-blue) -![Static Badge](https://img.shields.io/badge/CI_Passing-AV00%2CA100%2CH100-Green) +![Static Badge](https://img.shields.io/badge/CI_Passing-V100%2CA100%2CH100-Green) # vLLM Backend From 
f2c7a89fecebaf7ab51c37b57caa629225c6a1a1 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Fri, 20 Sep 2024 16:11:40 -0700 Subject: [PATCH 097/110] Update README.md Co-authored-by: Olga Andreeva <124622579+oandreeva-nv@users.noreply.github.com> --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 3953e652..015ec3ad 100644 --- a/README.md +++ b/README.md @@ -115,7 +115,7 @@ git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-se --backend=vllm:r${TRITON_CONTAINER_VERSION} --vllm-version=${VLLM_VERSION} # Build Triton Server -cd server/build +cd build bash -x ./docker_build ``` From e45854c609a17429292f9190179b675bb9d455ec Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Fri, 20 Sep 2024 16:11:57 -0700 Subject: [PATCH 098/110] Update README.md Co-authored-by: Olga Andreeva <124622579+oandreeva-nv@users.noreply.github.com> --- README.md | 1 + 1 file changed, 1 insertion(+) diff --git a/README.md b/README.md index 015ec3ad..2043ca5d 100644 --- a/README.md +++ b/README.md @@ -96,6 +96,7 @@ export VLLM_VERSION=${TAG#v} # example: 0.5.3.post1 echo "VLLM_VERSION = ${VLLM_VERSION}" git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git +cd server ./build.py -v --enable-logging --enable-stats --enable-tracing From 5929f7a241250418c7957f997eec9ebfb16a35a6 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Fri, 20 Sep 2024 16:16:25 -0700 Subject: [PATCH 099/110] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 2043ca5d..887fe44e 100644 --- a/README.md +++ b/README.md @@ -28,7 +28,7 @@ [![License](https://img.shields.io/badge/License-BSD3-lightgrey.svg)](https://opensource.org/licenses/BSD-3-Clause) ![Static 
Badge](https://img.shields.io/badge/Triton-24.08-8A2BE2) -![Static Badge](https://img.shields.io/badge/vLLM-0.5.5-blue) +![Static Badge](https://img.shields.io/badge/vLLM-0.5.3.post1-blue) ![Static Badge](https://img.shields.io/badge/CI_Passing-V100%2CA100%2CH100-Green) # vLLM Backend From 2512b8ae50da5b295443080b9b4b919e1c1abf6b Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Fri, 20 Sep 2024 16:17:50 -0700 Subject: [PATCH 100/110] Update triton_update_ci.yml --- .github/workflows/triton_update_ci.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/triton_update_ci.yml b/.github/workflows/triton_update_ci.yml index 3faffff2..bf379c06 100644 --- a/.github/workflows/triton_update_ci.yml +++ b/.github/workflows/triton_update_ci.yml @@ -35,8 +35,8 @@ jobs: export VLLM_VERSION=${TAG#v} # example: 0.5.5 if [ -z "$VLLM_VERSION" ] then - echo "\$VLLM_VERSION is NULL, setting it to 0.5.5" - VLLM_VERSION=0.5.5 + echo "\$VLLM_VERSION is NULL, setting it to 0.5.3.post1" + VLLM_VERSION=0.5.3.post1 else echo "\$VLLM_VERSION is NOT NULL" fi From 7c97d9f44bd5d7e9013f95f0c87bf7cee563806e Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Mon, 23 Sep 2024 10:50:09 -0700 Subject: [PATCH 101/110] Update vllm_update_ci.yml --- .github/workflows/vllm_update_ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/vllm_update_ci.yml b/.github/workflows/vllm_update_ci.yml index 3a3f91fc..903b9df8 100644 --- a/.github/workflows/vllm_update_ci.yml +++ b/.github/workflows/vllm_update_ci.yml @@ -32,5 +32,5 @@ jobs: else echo "TRITON_CONTAINER_VERSION = ${TRITON_CONTAINER_VERSION}" echo "VLLM_VERSION = ${VLLM_VERSION}" - curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="PULL_DOCKER" -F 
variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[VLLM_VERSION]="${VLLM_VERSION}" -F variables[TEST_OPTION]="ALL_TESTS" "${{ secrets.PIPELINE_URL }}" + curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="PULL_DOCKER" -F variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[TEST_OPTION]="ALL_HARDWARE" -F variables[VLLM_VERSION]="${VLLM_VERSION}" -F variables[TEST_OPTION]="ALL_TESTS" "${{ secrets.PIPELINE_URL }}" fi From 65fe72c2d12c4f5fbf6118c90447c631ea1eea9e Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 21 Nov 2024 10:50:07 -0800 Subject: [PATCH 102/110] Update build_source.sh --- ci/build/build_source.sh | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 082672d5..7c78b0be 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -34,8 +34,7 @@ do done echo "Triton version is ${TRITON_CONTAINER_VERSION} and vllm version is ${VLLM_VERSION}" -#git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git -git clone -b mesharma-ci https://github.com/triton-inference-server/server.git +git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ --enable-logging \ --enable-stats \ From 3ada940476613c090f8d7e9ae90c1bad928d9372 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 21 Nov 2024 10:54:03 -0800 Subject: [PATCH 103/110] Update triton_update_ci.yml --- .github/workflows/triton_update_ci.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/triton_update_ci.yml b/.github/workflows/triton_update_ci.yml index bf379c06..cb6360a6 100644 --- a/.github/workflows/triton_update_ci.yml +++ 
b/.github/workflows/triton_update_ci.yml @@ -24,7 +24,7 @@ jobs: if [ -z "$TRITON_CONTAINER_VERSION" ] then echo "\$TRITON_CONTAINER_VERSION is NULL, setting it to 24.08" - TRITON_CONTAINER_VERSION=24.08 + TRITON_CONTAINER_VERSION=24.10 else echo "\$TRITON_CONTAINER_VERSION is NOT NULL" fi @@ -35,7 +35,7 @@ jobs: export VLLM_VERSION=${TAG#v} # example: 0.5.5 if [ -z "$VLLM_VERSION" ] then - echo "\$VLLM_VERSION is NULL, setting it to 0.5.3.post1" + echo "\$VLLM_VERSION is NULL, setting it to 0.5.5" VLLM_VERSION=0.5.3.post1 else echo "\$VLLM_VERSION is NOT NULL" From 760f884e056a8636ff742edaf99d90833d2d3f3f Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 21 Nov 2024 11:04:24 -0800 Subject: [PATCH 104/110] Update build_source.sh --- ci/build/build_source.sh | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/ci/build/build_source.sh b/ci/build/build_source.sh index 7c78b0be..e40cf471 100755 --- a/ci/build/build_source.sh +++ b/ci/build/build_source.sh @@ -34,7 +34,9 @@ do done echo "Triton version is ${TRITON_CONTAINER_VERSION} and vllm version is ${VLLM_VERSION}" -git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git +# This change will start working for r24.12 release +#git clone -b r${TRITON_CONTAINER_VERSION} https://github.com/triton-inference-server/server.git +git clone https://github.com/triton-inference-server/server.git set -x && python3 server/build.py -v \ --enable-logging \ --enable-stats \ From 61ba07872b6600853ce625c654c6c6559a04b6d0 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 21 Nov 2024 11:08:53 -0800 Subject: [PATCH 105/110] Update triton_update_ci.yml --- .github/workflows/triton_update_ci.yml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/.github/workflows/triton_update_ci.yml b/.github/workflows/triton_update_ci.yml index 
cb6360a6..8c7886d5 100644 --- a/.github/workflows/triton_update_ci.yml +++ b/.github/workflows/triton_update_ci.yml @@ -1,4 +1,4 @@ -name: Validate Triton Pull request by running our change on latest vLLM release +name: Validate Triton Pull request by running our change on the latest version of vLLM on: pull_request: jobs: @@ -20,10 +20,10 @@ jobs: #!/bin/bash # Get latest VLLM RELEASED VERSION from https://github.com/triton-inference-server/vllm_backend/releases TAG=$(curl https://api.github.com/repos/triton-inference-server/vllm_backend/releases/latest | grep -i "tag_name" | awk -F '"' '{print $4}') - export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.08 + export TRITON_CONTAINER_VERSION=${TAG#v} # example: 24.10 if [ -z "$TRITON_CONTAINER_VERSION" ] then - echo "\$TRITON_CONTAINER_VERSION is NULL, setting it to 24.08" + echo "\$TRITON_CONTAINER_VERSION is NULL, setting it to 24.10" TRITON_CONTAINER_VERSION=24.10 else echo "\$TRITON_CONTAINER_VERSION is NOT NULL" @@ -36,7 +36,7 @@ jobs: if [ -z "$VLLM_VERSION" ] then echo "\$VLLM_VERSION is NULL, setting it to 0.5.5" - VLLM_VERSION=0.5.3.post1 + VLLM_VERSION=0.5.5 else echo "\$VLLM_VERSION is NOT NULL" fi From 0100f947331bbd6185b7c647fd8cd857a205b342 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 21 Nov 2024 11:40:41 -0800 Subject: [PATCH 106/110] Update triton_update_ci.yml --- .github/workflows/triton_update_ci.yml | 38 ++++++++++++++++++++++++++ 1 file changed, 38 insertions(+) diff --git a/.github/workflows/triton_update_ci.yml b/.github/workflows/triton_update_ci.yml index 8c7886d5..7d100d46 100644 --- a/.github/workflows/triton_update_ci.yml +++ b/.github/workflows/triton_update_ci.yml @@ -43,3 +43,41 @@ jobs: echo "VLLM_VERSION = ${VLLM_VERSION}" curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD_SOURCE" -F 
variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[VLLM_VERSION]="${VLLM_VERSION}" -F variables[TEST_OPTION]="ALL_TESTS" "${{ secrets.PIPELINE_URL }}" + add-badges: + environment: GITLAB + needs: trigger-ci + runs-on: self-hosted + steps: + - uses: wow-actions/add-badges@v1 + env: + repo_url: ${{ github.event.repository.html_url }} + repo_name: ${{ github.event.repository.name }} + repo_owner: ${{ github.event.repository.owner.login }} + with: + GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} + center: true + badges: | + [ + [ + { + "badge": "https://img.shields.io/github/license/${{ env.repo_owner }}/${{ env.repo_name }}?style=flat-square", + "alt": "MIT License", + "link": "${{ env.repo_url }}/blob/master/LICENSE" + }, + { + "badge": "https://img.shields.io/badge/Triton-24.10-8A2BE2", + "alt": "Triton", + "link": "https://github.com/triton-inference-server/vllm_backend" + }, + { + "badge": "https://img.shields.io/badge/vLLM-0.5.5-blue", + "alt": "vLLM", + "link": "https://github.com/vllm-project/vllm" + }, + { + "badge": "https://img.shields.io/badge/CI_Passing-V100%2CA100%2CH100-Green", + "alt": "CI", + "link": "https://github.com/triton-inference-server/vllm_backend/actions" + } + ] + ] From 5768b345b3cd032732e948ff6d8b343136152670 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 21 Nov 2024 11:41:48 -0800 Subject: [PATCH 107/110] Update README.md --- README.md | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/README.md b/README.md index 69945106..d8b6900a 100644 --- a/README.md +++ b/README.md @@ -27,9 +27,8 @@ --> [![License](https://img.shields.io/badge/License-BSD3-lightgrey.svg)](https://opensource.org/licenses/BSD-3-Clause) -![Static Badge](https://img.shields.io/badge/Triton-24.08-8A2BE2) -![Static Badge](https://img.shields.io/badge/vLLM-0.5.3.post1-blue) -![Static Badge](https://img.shields.io/badge/CI_Passing-V100%2CA100%2CH100-Green) + + # vLLM 
Backend From ea2120cab66ce5415f22f363f5a6b634479d4ad9 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 21 Nov 2024 11:53:08 -0800 Subject: [PATCH 108/110] Update triton_update_ci.yml --- .github/workflows/triton_update_ci.yml | 38 -------------------------- 1 file changed, 38 deletions(-) diff --git a/.github/workflows/triton_update_ci.yml b/.github/workflows/triton_update_ci.yml index 7d100d46..8c7886d5 100644 --- a/.github/workflows/triton_update_ci.yml +++ b/.github/workflows/triton_update_ci.yml @@ -43,41 +43,3 @@ jobs: echo "VLLM_VERSION = ${VLLM_VERSION}" curl --fail --request POST --form token=${{ secrets.PIPELINE_TOKEN }} -F ref=${GITHUB_HEAD_REF} -F variables[BUILD_OPTION]="BUILD_SOURCE" -F variables[TRITON_CONTAINER_VERSION]="${TRITON_CONTAINER_VERSION}" -F variables[VLLM_VERSION]="${VLLM_VERSION}" -F variables[TEST_OPTION]="ALL_TESTS" "${{ secrets.PIPELINE_URL }}" - add-badges: - environment: GITLAB - needs: trigger-ci - runs-on: self-hosted - steps: - - uses: wow-actions/add-badges@v1 - env: - repo_url: ${{ github.event.repository.html_url }} - repo_name: ${{ github.event.repository.name }} - repo_owner: ${{ github.event.repository.owner.login }} - with: - GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} - center: true - badges: | - [ - [ - { - "badge": "https://img.shields.io/github/license/${{ env.repo_owner }}/${{ env.repo_name }}?style=flat-square", - "alt": "MIT License", - "link": "${{ env.repo_url }}/blob/master/LICENSE" - }, - { - "badge": "https://img.shields.io/badge/Triton-24.10-8A2BE2", - "alt": "Triton", - "link": "https://github.com/triton-inference-server/vllm_backend" - }, - { - "badge": "https://img.shields.io/badge/vLLM-0.5.5-blue", - "alt": "vLLM", - "link": "https://github.com/vllm-project/vllm" - }, - { - "badge": "https://img.shields.io/badge/CI_Passing-V100%2CA100%2CH100-Green", - "alt": "CI", - "link": "https://github.com/triton-inference-server/vllm_backend/actions" - } - ] - 
] From adec7355243144605eac2b52b760409c9ab75f54 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 21 Nov 2024 11:54:55 -0800 Subject: [PATCH 109/110] Update README.md --- README.md | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index d8b6900a..69945106 100644 --- a/README.md +++ b/README.md @@ -27,8 +27,9 @@ --> [![License](https://img.shields.io/badge/License-BSD3-lightgrey.svg)](https://opensource.org/licenses/BSD-3-Clause) - - +![Static Badge](https://img.shields.io/badge/Triton-24.08-8A2BE2) +![Static Badge](https://img.shields.io/badge/vLLM-0.5.3.post1-blue) +![Static Badge](https://img.shields.io/badge/CI_Passing-V100%2CA100%2CH100-Green) # vLLM Backend From 834e76e8135d5a77538f42ed89400b1fb682a6e5 Mon Sep 17 00:00:00 2001 From: Meenakshi Sharma <163925564+nvda-mesharma@users.noreply.github.com> Date: Thu, 21 Nov 2024 11:55:12 -0800 Subject: [PATCH 110/110] Update README.md --- README.md | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index 69945106..a4a9d3fb 100644 --- a/README.md +++ b/README.md @@ -27,8 +27,8 @@ --> [![License](https://img.shields.io/badge/License-BSD3-lightgrey.svg)](https://opensource.org/licenses/BSD-3-Clause) -![Static Badge](https://img.shields.io/badge/Triton-24.08-8A2BE2) -![Static Badge](https://img.shields.io/badge/vLLM-0.5.3.post1-blue) +![Static Badge](https://img.shields.io/badge/Triton-24.10-8A2BE2) +![Static Badge](https://img.shields.io/badge/vLLM-0.5.5-blue) ![Static Badge](https://img.shields.io/badge/CI_Passing-V100%2CA100%2CH100-Green) # vLLM Backend