diff --git a/script/app-mlperf-inference-nvidia/customize.py b/script/app-mlperf-inference-nvidia/customize.py index 70e5d3710..2cb95e75f 100644 --- a/script/app-mlperf-inference-nvidia/customize.py +++ b/script/app-mlperf-inference-nvidia/customize.py @@ -300,7 +300,7 @@ def preprocess(i): if not os.path.exists(fp32_model_path): # download via prehook_deps env['MLC_REQUIRE_GPTJ_MODEL_DOWNLOAD'] = 'yes' - if make_command == "build_engine": + if make_command in ["build_engine", "preprocess_data"]: cmds.append( f"cp -r $MLC_ML_MODEL_FILE_WITH_PATH {fp32_model_path}") diff --git a/script/app-mlperf-inference/meta.yaml b/script/app-mlperf-inference/meta.yaml index 846936234..6a4b6cf3b 100644 --- a/script/app-mlperf-inference/meta.yaml +++ b/script/app-mlperf-inference/meta.yaml @@ -404,6 +404,15 @@ variations: _tp-size.: - MLC_NVIDIA_TP_SIZE + nvidia-original,r5.0-dev_default,gptj_: + docker: + image_name: mlperf-inference-nvidia-v4.1-dev-llm + deps: + - tags: get,ml-model,gptj,_nvidia,_fp8 + update_tags_from_env_with_prefix: + _tp-size.: + - MLC_NVIDIA_TP_SIZE + nvidia-original,r4.1_default: docker: base_image: nvcr.io/nvidia/mlperf/mlperf-inference:mlpinf-v4.1-cuda12.4-pytorch24.04-ubuntu22.04-x86_64-release diff --git a/script/build-mlperf-inference-server-nvidia/meta.yaml b/script/build-mlperf-inference-server-nvidia/meta.yaml index 3530c9482..e8e49748b 100644 --- a/script/build-mlperf-inference-server-nvidia/meta.yaml +++ b/script/build-mlperf-inference-server-nvidia/meta.yaml @@ -276,6 +276,14 @@ versions: - x86_64 MLC_PYTHON_MINOR_VERSION: - 8 + - tags: get,generic-python-lib,_package.cuda-python + names: + - cuda-python + version_max: '12.6' + version_max_usable: '12.3.0' + - tags: get,generic-python-lib,_package.networkx + version_max: '2.9.99' + version_max_usable: '2.8.8' r4.1-dev: default_env: @@ -283,6 +291,14 @@ versions: deps: - tags: get,generic,sys-util,_nlohmann-json3-dev - tags: get,generic,sys-util,_git-lfs + - tags: get,generic-python-lib,_package.cuda-python + names: + - cuda-python + version_max: '12.6' + version_max_usable: '12.3.0' + - tags: get,generic-python-lib,_package.networkx + version_max: '2.9.99' + version_max_usable: '2.8.8' - tags: install,pytorch,from.src,_for-nvidia-mlperf-inference-v4.0 names: - pytorch