Skip to content

Commit 75588dc

Browse files
mc-nv, nv-anants, kthui, krishung5
authored
Update main branch post 24.11 (#7829)
Co-authored-by: Anant Sharma <anants@nvidia.com> Co-authored-by: Jacky <18255193+kthui@users.noreply.github.com> Co-authored-by: Kris Hung <krish@nvidia.com>
1 parent 2890779 commit 75588dc

File tree

53 files changed

+196
-184
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

53 files changed

+196
-184
lines changed

CMakeLists.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -221,7 +221,7 @@ ExternalProject_Add(triton-server
221221
-Dre2_DIR:PATH=${TRITON_THIRD_PARTY_INSTALL_PREFIX}/re2/${LIB_DIR}/cmake/re2
222222
-Dabsl_DIR:PATH=${TRITON_THIRD_PARTY_INSTALL_PREFIX}/absl/${LIB_DIR}/cmake/absl
223223
-DCURL_DIR:STRING=${TRITON_THIRD_PARTY_INSTALL_PREFIX}/curl/${LIB_DIR}/cmake/CURL
224-
-Dnlohmann_json_DIR:PATH=${TRITON_THIRD_PARTY_INSTALL_PREFIX}/nlohmann_json/${LIB_DIR}/cmake/nlohmann_json
224+
-Dnlohmann_json_DIR:PATH=${TRITON_THIRD_PARTY_INSTALL_PREFIX}/nlohmann_json/share/cmake/nlohmann_json
225225
-DLibevent_DIR:PATH=${TRITON_THIRD_PARTY_INSTALL_PREFIX}/libevent/lib/cmake/libevent
226226
-Dlibevhtp_DIR:PATH=${TRITON_THIRD_PARTY_INSTALL_PREFIX}/libevhtp/lib/cmake/libevhtp
227227
-Dstorage_client_DIR:PATH=${TRITON_THIRD_PARTY_INSTALL_PREFIX}/google-cloud-cpp/${LIB_DIR}/cmake/storage_client

Dockerfile.QA

Lines changed: 8 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -59,20 +59,19 @@ RUN apt-get update && \
5959
libboost-dev \
6060
python3-dev \
6161
python3-pip \
62+
python3-wheel \
63+
python3-setuptools \
6264
rapidjson-dev \
6365
software-properties-common && \
6466
rm -rf /var/lib/apt/lists/*
6567

66-
RUN pip3 install --upgrade pip && \
67-
pip3 install --upgrade wheel setuptools
68-
6968
RUN apt update -q=2 \
7069
&& apt install -y gpg wget \
7170
&& wget -O - https://apt.kitware.com/keys/kitware-archive-latest.asc 2>/dev/null | gpg --dearmor - | tee /usr/share/keyrings/kitware-archive-keyring.gpg >/dev/null \
7271
&& . /etc/os-release \
7372
&& echo "deb [signed-by=/usr/share/keyrings/kitware-archive-keyring.gpg] https://apt.kitware.com/ubuntu/ $UBUNTU_CODENAME main" | tee /etc/apt/sources.list.d/kitware.list >/dev/null \
7473
&& apt-get update -q=2 \
75-
&& apt-get install -y --no-install-recommends cmake=3.27.7* cmake-data=3.27.7*
74+
&& apt-get install -y --no-install-recommends cmake=3.28.3* cmake-data=3.28.3*
7675

7776
# Add inception_graphdef model to example repo
7877
WORKDIR /workspace/docs/examples/model_repository
@@ -311,20 +310,12 @@ ARG TARGETPLATFORM
311310
ENV DEBIAN_FRONTEND=noninteractive
312311

313312
# install platform specific packages
314-
RUN if [ $(cat /etc/os-release | grep 'VERSION_ID="20.04"' | wc -l) -ne 0 ]; then \
315-
apt-get update && \
316-
apt-get install -y --no-install-recommends \
317-
libpng-dev; \
318-
elif [ $(cat /etc/os-release | grep 'VERSION_ID="22.04"' | wc -l) -ne 0 ]; then \
319-
apt-get update && \
320-
apt-get install -y --no-install-recommends \
321-
libpng-dev; \
322-
elif [ $(cat /etc/os-release | grep 'VERSION_ID="18.04"' | wc -l) -ne 0 ]; then \
313+
RUN if grep -qE '^VERSION_ID="(18\.04|20\.04|22\.04|24\.04)' /etc/os-release; then \
323314
apt-get update && \
324315
apt-get install -y --no-install-recommends \
325316
libpng-dev; \
326317
else \
327-
echo "Ubuntu version must be either 18.04, 20.04 or 22.04" && \
318+
echo "Ubuntu version must be either 18.04, 20.04, 22.04 or 24.04" && \
328319
exit 1; \
329320
fi
330321

@@ -337,14 +328,14 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
337328
libarchive-dev \
338329
libopencv-core-dev \
339330
libzmq3-dev \
340-
maven \
341331
openjdk-11-jdk \
342332
nginx \
343333
npm \
344334
protobuf-compiler \
345335
python3-dev \
346336
python3-pip \
347337
python3-protobuf \
338+
python3-wheel \
348339
python3-setuptools \
349340
swig \
350341
valgrind && \
@@ -354,9 +345,8 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
354345
RUN rm -f /usr/bin/python && \
355346
ln -s /usr/bin/python3 /usr/bin/python
356347

357-
RUN pip3 install --upgrade wheel setuptools && \
358-
pip3 install --upgrade "numpy<2" pillow attrdict future grpcio requests gsutil \
359-
awscli six grpcio-channelz prettytable virtualenv \
348+
RUN pip3 install --upgrade "numpy<2" pillow attrdict future "grpcio<1.68" requests gsutil \
349+
awscli six "grpcio-channelz<1.68" prettytable virtualenv \
360350
check-jsonschema
361351

362352
# go needed for example go client test.

Dockerfile.sdk

Lines changed: 12 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -29,7 +29,7 @@
2929
#
3030

3131
# Base image on the minimum Triton container
32-
ARG BASE_IMAGE=nvcr.io/nvidia/tritonserver:24.10-py3-min
32+
ARG BASE_IMAGE=nvcr.io/nvidia/tritonserver:24.11-py3-min
3333

3434
ARG TRITON_CLIENT_REPO_SUBDIR=clientrepo
3535
ARG TRITON_PA_REPO_SUBDIR=perfanalyzerrepo
@@ -44,7 +44,7 @@ ARG JAVA_BINDINGS_MAVEN_VERSION=3.8.4
4444
ARG JAVA_BINDINGS_JAVACPP_PRESETS_TAG=1.5.8
4545

4646
# DCGM version to install for Model Analyzer
47-
ARG DCGM_VERSION=3.2.6
47+
ARG DCGM_VERSION=3.3.6
4848

4949
ARG NVIDIA_TRITON_SERVER_SDK_VERSION=unknown
5050
ARG NVIDIA_BUILD_ID=unknown
@@ -57,6 +57,7 @@ FROM ${BASE_IMAGE} AS sdk_build
5757

5858
# Ensure apt-get won't prompt for selecting options
5959
ENV DEBIAN_FRONTEND=noninteractive
60+
ENV PIP_BREAK_SYSTEM_PACKAGES=1
6061

6162
RUN apt-get update && \
6263
apt-get install -y --no-install-recommends \
@@ -78,15 +79,15 @@ RUN apt-get update && \
7879
python3 \
7980
python3-pip \
8081
python3-dev \
82+
python3-wheel \
83+
python3-setuptools \
8184
rapidjson-dev \
8285
vim \
8386
wget \
8487
python3-pdfkit \
8588
openjdk-11-jdk \
8689
maven && \
87-
pip3 install --upgrade wheel setuptools && \
88-
pip3 install --upgrade grpcio-tools && \
89-
pip3 install --upgrade pip
90+
pip3 install --upgrade "grpcio-tools<1.68"
9091

9192
# Client build requires recent version of CMake (FetchContent required)
9293
# Using CMake installation instructions from: https://apt.kitware.com/
@@ -96,7 +97,7 @@ RUN apt update -q=2 \
9697
&& . /etc/os-release \
9798
&& echo "deb [signed-by=/usr/share/keyrings/kitware-archive-keyring.gpg] https://apt.kitware.com/ubuntu/ $UBUNTU_CODENAME main" | tee /etc/apt/sources.list.d/kitware.list >/dev/null \
9899
&& apt-get update -q=2 \
99-
&& apt-get install -y --no-install-recommends cmake=3.27.7* cmake-data=3.27.7* \
100+
&& apt-get install -y --no-install-recommends cmake=3.28.3* cmake-data=3.28.3* \
100101
&& cmake --version
101102

102103
# Build expects "python" executable (not python3).
@@ -183,6 +184,7 @@ FROM ${BASE_IMAGE}
183184

184185
# Ensure apt-get won't prompt for selecting options
185186
ENV DEBIAN_FRONTEND=noninteractive
187+
ENV PIP_BREAK_SYSTEM_PACKAGES=1
186188

187189
ARG DCGM_VERSION
188190
ARG TRITON_REPO_ORGANIZATION
@@ -205,14 +207,14 @@ RUN apt-get update && \
205207
python3 \
206208
python3-pip \
207209
python3-dev \
210+
python3-wheel \
211+
python3-setuptools \
208212
vim \
209213
wget \
210214
python3-pdfkit \
211215
maven \
212216
default-jdk && \
213-
pip3 install --upgrade wheel setuptools && \
214-
pip3 install --upgrade grpcio-tools && \
215-
pip3 install --upgrade pip
217+
pip3 install "grpcio<1.68" "grpcio-tools<1.68"
216218

217219
WORKDIR /workspace
218220
COPY TRITON_VERSION .
@@ -250,7 +252,7 @@ RUN pip3 install install/python/genai_perf-*.whl
250252
RUN if [ "$TRITON_ENABLE_GPU" = "ON" ]; then \
251253
[ "$(uname -m)" != "x86_64" ] && arch="sbsa" || arch="x86_64" && \
252254
curl -o /tmp/cuda-keyring.deb \
253-
https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/$arch/cuda-keyring_1.0-1_all.deb \
255+
https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2404/$arch/cuda-keyring_1.1-1_all.deb \
254256
&& apt install /tmp/cuda-keyring.deb && rm /tmp/cuda-keyring.deb && \
255257
apt-get update && apt-get install -y datacenter-gpu-manager=1:${DCGM_VERSION}; \
256258
fi

README.md

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -32,8 +32,8 @@
3232

3333
>[!WARNING]
3434
>You are currently on the `main` branch which tracks under-development progress
35-
>towards the next release. The current release is version [2.51.0](https://github.com/triton-inference-server/server/releases/latest)
36-
>and corresponds to the 24.10 container release on NVIDIA GPU Cloud (NGC).
35+
>towards the next release. The current release is version [2.52.0](https://github.com/triton-inference-server/server/releases/latest)
36+
>and corresponds to the 24.11 container release on NVIDIA GPU Cloud (NGC).
3737
3838
Triton Inference Server is an open source inference serving software that
3939
streamlines AI inferencing. Triton enables teams to deploy any AI model from
@@ -91,16 +91,16 @@ Inference Server with the
9191

9292
```bash
9393
# Step 1: Create the example model repository
94-
git clone -b r24.10 https://github.com/triton-inference-server/server.git
94+
git clone -b r24.11 https://github.com/triton-inference-server/server.git
9595
cd server/docs/examples
9696
./fetch_models.sh
9797

9898
# Step 2: Launch triton from the NGC Triton container
99-
docker run --gpus=1 --rm --net=host -v ${PWD}/model_repository:/models nvcr.io/nvidia/tritonserver:24.10-py3 tritonserver --model-repository=/models
99+
docker run --gpus=1 --rm --net=host -v ${PWD}/model_repository:/models nvcr.io/nvidia/tritonserver:24.11-py3 tritonserver --model-repository=/models
100100

101101
# Step 3: Sending an Inference Request
102102
# In a separate console, launch the image_client example from the NGC Triton SDK container
103-
docker run -it --rm --net=host nvcr.io/nvidia/tritonserver:24.10-py3-sdk
103+
docker run -it --rm --net=host nvcr.io/nvidia/tritonserver:24.11-py3-sdk
104104
/workspace/install/bin/image_client -m densenet_onnx -c 3 -s INCEPTION /workspace/images/mug.jpg
105105

106106
# Inference should return the following

TRITON_VERSION

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
2.53.0dev
1+
2.53.0dev

build.py

Lines changed: 17 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -73,11 +73,11 @@
7373
DEFAULT_TRITON_VERSION_MAP = {
7474
"release_version": "2.53.0dev",
7575
"triton_container_version": "24.12dev",
76-
"upstream_container_version": "24.10",
76+
"upstream_container_version": "24.11",
7777
"ort_version": "1.19.2",
7878
"ort_openvino_version": "2024.4.0",
7979
"standalone_openvino_version": "2024.4.0",
80-
"dcgm_version": "3.2.6",
80+
"dcgm_version": "3.3.6",
8181
"vllm_version": "0.5.5",
8282
"rhel_py_version": "3.12.3",
8383
}
@@ -885,7 +885,7 @@ def install_dcgm_libraries(dcgm_version, target_machine):
885885
ENV DCGM_VERSION {}
886886
# Install DCGM. Steps from https://developer.nvidia.com/dcgm#Downloads
887887
RUN curl -o /tmp/cuda-keyring.deb \\
888-
https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/sbsa/cuda-keyring_1.0-1_all.deb \\
888+
https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2404/sbsa/cuda-keyring_1.1-1_all.deb \\
889889
&& apt install /tmp/cuda-keyring.deb \\
890890
&& rm /tmp/cuda-keyring.deb \\
891891
&& apt-get update \\
@@ -898,7 +898,7 @@ def install_dcgm_libraries(dcgm_version, target_machine):
898898
ENV DCGM_VERSION {}
899899
# Install DCGM. Steps from https://developer.nvidia.com/dcgm#Downloads
900900
RUN curl -o /tmp/cuda-keyring.deb \\
901-
https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/cuda-keyring_1.0-1_all.deb \\
901+
https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2404/x86_64/cuda-keyring_1.1-1_all.deb \\
902902
&& apt install /tmp/cuda-keyring.deb \\
903903
&& rm /tmp/cuda-keyring.deb \\
904904
&& apt-get update \\
@@ -1035,6 +1035,7 @@ def create_dockerfile_buildbase(ddir, dockerfile_name, argmap):
10351035
df += """
10361036
# Ensure apt-get won't prompt for selecting options
10371037
ENV DEBIAN_FRONTEND=noninteractive
1038+
ENV PIP_BREAK_SYSTEM_PACKAGES=1
10381039
10391040
# Install docker and docker buildx
10401041
RUN apt-get update \\
@@ -1071,6 +1072,7 @@ def create_dockerfile_buildbase(ddir, dockerfile_name, argmap):
10711072
patchelf \\
10721073
python3-dev \\
10731074
python3-pip \\
1075+
python3-wheel \\
10741076
python3-setuptools \\
10751077
rapidjson-dev \\
10761078
scons \\
@@ -1085,10 +1087,7 @@ def create_dockerfile_buildbase(ddir, dockerfile_name, argmap):
10851087
wget \\
10861088
&& rm -rf /var/lib/apt/lists/*
10871089
1088-
RUN pip3 install --upgrade pip \\
1089-
&& pip3 install --upgrade \\
1090-
wheel \\
1091-
setuptools \\
1090+
RUN pip3 install --upgrade \\
10921091
docker \\
10931092
virtualenv
10941093
@@ -1106,7 +1105,7 @@ def create_dockerfile_buildbase(ddir, dockerfile_name, argmap):
11061105
&& . /etc/os-release \\
11071106
&& echo "deb [signed-by=/usr/share/keyrings/kitware-archive-keyring.gpg] https://apt.kitware.com/ubuntu/ $UBUNTU_CODENAME main" | tee /etc/apt/sources.list.d/kitware.list >/dev/null \\
11081107
&& apt-get update -q=2 \\
1109-
&& apt-get install -y --no-install-recommends cmake=3.27.7* cmake-data=3.27.7*
1108+
&& apt-get install -y --no-install-recommends cmake=3.28.3* cmake-data=3.28.3*
11101109
"""
11111110

11121111
if FLAGS.enable_gpu:
@@ -1243,7 +1242,6 @@ def create_dockerfile_linux(
12431242
rm -fr ${TRT_ROOT}/bin ${TRT_ROOT}/targets/${ARCH}-linux-gnu/bin ${TRT_ROOT}/data && \\
12441243
rm -fr ${TRT_ROOT}/doc ${TRT_ROOT}/onnx_graphsurgeon ${TRT_ROOT}/python && \\
12451244
rm -fr ${TRT_ROOT}/samples ${TRT_ROOT}/targets/${ARCH}-linux-gnu/samples && \\
1246-
python3 -m pip install --upgrade pip && \\
12471245
pip3 install --no-cache-dir transformers && \\
12481246
find /usr -name libtensorrt_llm.so -exec dirname {} \; > /etc/ld.so.conf.d/tensorrt-llm.conf && \\
12491247
find /opt/tritonserver -name libtritonserver.so -exec dirname {} \; > /etc/ld.so.conf.d/triton-tensorrtllm-worker.conf && \\
@@ -1308,6 +1306,7 @@ def dockerfile_prepare_container_linux(argmap, backends, enable_gpu, target_mach
13081306
# artifacts copied below are assigned to this user.
13091307
ENV TRITON_SERVER_USER=triton-server
13101308
RUN userdel tensorrt-server > /dev/null 2>&1 || true \\
1309+
&& userdel ubuntu > /dev/null 2>&1 || true \\
13111310
&& if ! id -u $TRITON_SERVER_USER > /dev/null 2>&1 ; then \\
13121311
useradd $TRITON_SERVER_USER; \\
13131312
fi \\
@@ -1354,12 +1353,10 @@ def dockerfile_prepare_container_linux(argmap, backends, enable_gpu, target_mach
13541353
libgoogle-perftools-dev \\
13551354
libjemalloc-dev \\
13561355
libnuma-dev \\
1357-
libre2-9 \\
13581356
software-properties-common \\
13591357
wget \\
13601358
{backend_dependencies} \\
13611359
python3-pip \\
1362-
&& python3 -m pip install --upgrade pip \\
13631360
&& rm -rf /var/lib/apt/lists/*
13641361
""".format(
13651362
backend_dependencies=backend_dependencies
@@ -1402,7 +1399,8 @@ def dockerfile_prepare_container_linux(argmap, backends, enable_gpu, target_mach
14021399
if "python" in backends:
14031400
if target_platform() == "rhel":
14041401
df += """
1405-
# python3 and some pip installs required for the python backend
1402+
ENV PIP_BREAK_SYSTEM_PACKAGES=1
1403+
# python3, python3-pip and some pip installs required for the python backend
14061404
RUN yum install -y \\
14071405
libarchive-devel \\
14081406
openssl-devel \\
@@ -1420,16 +1418,17 @@ def dockerfile_prepare_container_linux(argmap, backends, enable_gpu, target_mach
14201418
"""
14211419
else:
14221420
df += """
1423-
# python3 and some pip installs required for the python backend
1421+
ENV PIP_BREAK_SYSTEM_PACKAGES=1
1422+
# python3, python3-pip and some pip installs required for the python backend
14241423
RUN apt-get update \\
14251424
&& apt-get install -y --no-install-recommends \\
14261425
python3 \\
14271426
libarchive-dev \\
1427+
python3-pip \\
1428+
python3-wheel \\
1429+
python3-setuptools \\
14281430
libpython3-dev \\
1429-
&& pip3 install --upgrade pip \\
14301431
&& pip3 install --upgrade \\
1431-
wheel \\
1432-
setuptools \\
14331432
\"numpy<2\" \\
14341433
virtualenv \\
14351434
&& rm -rf /var/lib/apt/lists/*
@@ -1631,7 +1630,7 @@ def create_build_dockerfiles(
16311630
FLAGS.upstream_container_version
16321631
)
16331632
else:
1634-
base_image = "ubuntu:22.04"
1633+
base_image = "ubuntu:24.04"
16351634

16361635
dockerfileargmap = {
16371636
"NVIDIA_BUILD_REF": "" if FLAGS.build_sha is None else FLAGS.build_sha,

deploy/aws/values.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,7 @@
2727
replicaCount: 1
2828

2929
image:
30-
imageName: nvcr.io/nvidia/tritonserver:24.10-py3
30+
imageName: nvcr.io/nvidia/tritonserver:24.11-py3
3131
pullPolicy: IfNotPresent
3232
modelRepositoryPath: s3://triton-inference-server-repository/model_repository
3333
numGpus: 1

deploy/fleetcommand/values.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,7 @@
2727
replicaCount: 1
2828

2929
image:
30-
imageName: nvcr.io/nvidia/tritonserver:24.10-py3
30+
imageName: nvcr.io/nvidia/tritonserver:24.11-py3
3131
pullPolicy: IfNotPresent
3232
numGpus: 1
3333
serverCommand: tritonserver
@@ -47,13 +47,13 @@ image:
4747
#
4848
# To set model control mode, uncomment and configure below
4949
# TODO: Fix the following url, it is invalid
50-
# See https://github.com/triton-inference-server/server/blob/r24.10/docs/model_management.md
50+
# See https://github.com/triton-inference-server/server/blob/r24.11/docs/model_management.md
5151
# for more details
5252
#- --model-control-mode=explicit|poll|none
5353
#
5454
# Additional server args
5555
#
56-
# see https://github.com/triton-inference-server/server/blob/r24.10/README.md
56+
# see https://github.com/triton-inference-server/server/blob/r24.11/README.md
5757
# for more details
5858

5959
service:

deploy/gcp/values.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,7 @@
2727
replicaCount: 1
2828

2929
image:
30-
imageName: nvcr.io/nvidia/tritonserver:24.10-py3
30+
imageName: nvcr.io/nvidia/tritonserver:24.11-py3
3131
pullPolicy: IfNotPresent
3232
modelRepositoryPath: gs://triton-inference-server-repository/model_repository
3333
numGpus: 1

deploy/gke-marketplace-app/benchmark/perf-analyzer-script/triton_client.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -33,7 +33,7 @@ metadata:
3333
namespace: default
3434
spec:
3535
containers:
36-
- image: nvcr.io/nvidia/tritonserver:24.10-py3-sdk
36+
- image: nvcr.io/nvidia/tritonserver:24.11-py3-sdk
3737
imagePullPolicy: Always
3838
name: nv-triton-client
3939
securityContext:

0 commit comments

Comments
 (0)