test: Validate request correlation ID data type (#7919)

yinggeh · web-flow · commit 48e615dd13c6 · 2025-01-08T11:10:04.000-08:00
diff --git a/qa/L0_sequence_corrid_batcher/sequence_corrid_batcher_test.py b/qa/L0_sequence_corrid_batcher/sequence_corrid_batcher_test.py
@@ -1,6 +1,6 @@
 #!/usr/bin/env python3
 
-# Copyright 2020-2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# Copyright 2020-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 #
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions
@@ -38,6 +38,8 @@
 import numpy as np
 import sequence_util as su
 import test_util as tu
+import tritonclient.http as httpclient
+from tritonclient.utils import InferenceServerException, np_to_triton_dtype
 
 _test_system_shared_memory = bool(int(os.environ.get("TEST_SYSTEM_SHARED_MEMORY", 0)))
 _test_cuda_shared_memory = bool(int(os.environ.get("TEST_CUDA_SHARED_MEMORY", 0)))
@@ -77,6 +79,12 @@ def get_expected_result(self, expected_result, corrid, value, trial, flag_str=No
                     expected_result += corrid
         return expected_result
 
+    def data_type_to_string(self, dtype):
+        if dtype == "TYPE_STRING":
+            return "BYTES"
+        else:
+            return dtype.replace("TYPE_", "")
+
     def test_skip_batch(self):
         # Test model instances together are configured with
         # total-batch-size 4. Send four sequences in parallel where
@@ -221,6 +229,78 @@ def test_skip_batch(self):
                     self.cleanup_shm_regions(precreated_shm2_handles)
                     self.cleanup_shm_regions(precreated_shm3_handles)
 
+    def test_corrid_data_type(self):
+        model_name = "add_sub"
+        expected_corrid_dtype = os.environ["TRITONSERVER_CORRID_DATA_TYPE"]
+
+        for corrid, corrid_dtype in [("corrid", "TYPE_STRING"), (123, "TYPE_UINT64")]:
+            # Check if the corrid data type matches the expected corrid data type specified in the model config
+            dtypes_match = True
+            if (corrid_dtype == "TYPE_STRING") and (
+                expected_corrid_dtype != "TYPE_STRING"
+            ):
+                dtypes_match = False
+            elif (corrid_dtype == "TYPE_UINT64") and (
+                expected_corrid_dtype
+                not in ["TYPE_UINT32", "TYPE_INT32", "TYPE_UINT64", "TYPE_INT64"]
+            ):
+                dtypes_match = False
+
+            with httpclient.InferenceServerClient("localhost:8000") as client:
+                input0_data = np.random.rand(16).astype(np.float32)
+                input1_data = np.random.rand(16).astype(np.float32)
+                inputs = [
+                    httpclient.InferInput(
+                        "INPUT0",
+                        input0_data.shape,
+                        np_to_triton_dtype(input0_data.dtype),
+                    ),
+                    httpclient.InferInput(
+                        "INPUT1",
+                        input1_data.shape,
+                        np_to_triton_dtype(input1_data.dtype),
+                    ),
+                ]
+
+                inputs[0].set_data_from_numpy(input0_data)
+                inputs[1].set_data_from_numpy(input1_data)
+
+                if not dtypes_match:
+                    with self.assertRaises(InferenceServerException) as e:
+                        client.infer(
+                            model_name,
+                            inputs,
+                            sequence_id=corrid,
+                            sequence_start=True,
+                            sequence_end=False,
+                        )
+                    err_str = str(e.exception)
+                    self.assertIn(
+                        f"sequence batching control 'CORRID' data-type is '{self.data_type_to_string(corrid_dtype)}', but model '{model_name}' expects '{self.data_type_to_string(expected_corrid_dtype)}'",
+                        err_str,
+                    )
+                else:
+                    response = client.infer(
+                        model_name,
+                        inputs,
+                        sequence_id=corrid,
+                        sequence_start=True,
+                        sequence_end=False,
+                    )
+                    response.get_response()
+                    output0_data = response.as_numpy("OUTPUT0")
+                    output1_data = response.as_numpy("OUTPUT1")
+
+                    self.assertTrue(
+                        np.allclose(input0_data + input1_data, output0_data),
+                        "add_sub example error: incorrect sum",
+                    )
+
+                    self.assertTrue(
+                        np.allclose(input0_data - input1_data, output1_data),
+                        "add_sub example error: incorrect difference",
+                    )
+
 
 if __name__ == "__main__":
     unittest.main()
diff --git a/qa/L0_sequence_corrid_batcher/test.sh b/qa/L0_sequence_corrid_batcher/test.sh
@@ -1,5 +1,5 @@
 #!/bin/bash
-# Copyright (c) 2020, NVIDIA CORPORATION. All rights reserved.
+# Copyright (c) 2020-2025, NVIDIA CORPORATION. All rights reserved.
 #
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions
@@ -121,6 +121,59 @@ for model_trial in 4; do
     done
 done
 
+# Test correlation ID data type
+mkdir -p corrid_data_type/add_sub/1
+cp ../python_models/add_sub/model.py corrid_data_type/add_sub/1
+
+for corrid_data_type in TYPE_STRING TYPE_UINT32 TYPE_INT32 TYPE_UINT64 TYPE_INT64; do
+    (cd corrid_data_type/add_sub && \
+    cp ../../../python_models/add_sub/config.pbtxt . && \
+    echo "sequence_batching { \
+        control_input [{ \
+            name: \"CORRID\" \
+            control [{ \
+            kind: CONTROL_SEQUENCE_CORRID \
+            data_type: $corrid_data_type \
+            }]
+        }] \
+        }" >> config.pbtxt)
+    MODEL_DIR=corrid_data_type
+
+    for i in test_corrid_data_type ; do
+        export TRITONSERVER_CORRID_DATA_TYPE=$corrid_data_type
+        SERVER_ARGS="--model-repository=`pwd`/$MODEL_DIR"
+        SERVER_LOG="./$i.$MODEL_DIR.server.log"
+        run_server
+        if [ "$SERVER_PID" == "0" ]; then
+            echo -e "\n***\n*** Failed to start $SERVER\n***"
+            cat $SERVER_LOG
+            exit 1
+        fi
+
+        echo "Test: $i, repository $MODEL_DIR" >>$CLIENT_LOG
+
+        set +e
+        python $BATCHER_TEST SequenceCorrIDBatcherTest.$i >>$CLIENT_LOG 2>&1
+        if [ $? -ne 0 ]; then
+            echo -e "\n***\n*** Test $i Failed\n***" >>$CLIENT_LOG
+            echo -e "\n***\n*** Test $i Failed\n***"
+            RET=1
+        else
+            check_test_results $TEST_RESULT_FILE 1
+            if [ $? -ne 0 ]; then
+                cat $CLIENT_LOG
+                echo -e "\n***\n*** Test Result Verification Failed\n***"
+                RET=1
+            fi
+        fi
+        set -e
+
+        unset TRITONSERVER_CORRID_DATA_TYPE
+        kill $SERVER_PID
+        wait $SERVER_PID
+    done
+done
+
 if [ $RET -eq 0 ]; then
     echo -e "\n***\n*** Test Passed\n***"
 else