mlcommons · arjunsuresh · Dec 24, 2024 · Dec 24, 2024 · Dec 24, 2024 · Dec 24, 2024
@@ -161,6 +161,10 @@ variations:
       - python3
       tags: get,python3
     - tags: get,generic-python-lib,_package.safetensors
+    - tags: get,generic-python-lib,_torch
+      names:
+      - torch
+      - pytorch
   rclone:
     add_deps_recursive:
       dae:

@@ -17,5 +17,5 @@ export DOCKER_RUN_ARGS=" -v ${CM_NVIDIA_MLPERF_SCRATCH_PATH}:/mnt"
 make -C docker run LOCAL_USER=1
 test $? -eq 0 || exit $?
 
-${CM_PYTHON_BIN_WITH_PATH} ${CM_MLPERF_INFERENCE_NVIDIA_CODE_PATH}/code/gptj/tensorrt/onnx_tune.py --fp8-scalers-path=${CM_NVIDIA_MLPERF_SCRATCH_PATH}/models/GPTJ-6B/fp8-quantized-ammo/GPTJ-FP8-quantized/rank0.safetensors --scaler 1.005 --index 15
+PYTHONPATH='' ${CM_PYTHON_BIN_WITH_PATH} ${CM_MLPERF_INFERENCE_NVIDIA_CODE_PATH}/code/gptj/tensorrt/onnx_tune.py --fp8-scalers-path=${CM_NVIDIA_MLPERF_SCRATCH_PATH}/models/GPTJ-6B/fp8-quantized-ammo/GPTJ-FP8-quantized/rank0.safetensors --scaler 1.005 --index 15
 test $? -eq 0 || exit $?
@@ -28,9 +28,8 @@ retinanet:
     target_qps: 850.0
   Server:
     target_qps: 630.0
-sdxl:
+stable-diffusion-xl:
   Offline:
     target_qps: 0.7
   Server:
-    target_qps: 0.3
-
+    target_qps: 0.3
@@ -35,7 +35,7 @@
       target_qps: 8
     Server:
       target_qps: 7
-  sdxl:
+  stable-diffusion-xl:
     Offline:
       target_qps: 1.3
     Server:

@@ -13,7 +13,7 @@ def preprocess(i):
 
     # Not enforcing dev requirement for now
     if env.get('CM_TENSORRT_TAR_FILE_PATH', '') == '' and env.get(
-            'CM_TENSORRT_REQUIRE_DEV1', '') != 'yes' and env.get('CM_HOST_PLATFORM_FLAVOR', '') != 'aarch64':
+            'CM_TENSORRT_REQUIRE_DEV1', '') != 'yes' and env.get('CM_HOST_PLATFORM_FLAVOR_', '') != 'aarch64':
 
         if os_info['platform'] == 'windows':
             extra_pre = ''