Add mismatch_key_name model to the TensorFlow GPU I/O test

triton-inference-server · kthui · Dec 8, 2022 · Dec 7, 2022 · Dec 7, 2022 · Dec 7, 2022
commit 9eed25860cb161938dfe48296d1d746f4edda523
diff --git a/qa/L0_tf_gpu_io/mismatch_key_name/1/model.savedmodel/saved_model.pb b/qa/L0_tf_gpu_io/mismatch_key_name/1/model.savedmodel/saved_model.pb
diff --git a/qa/L0_tf_gpu_io/mismatch_key_name/config.pbtxt b/qa/L0_tf_gpu_io/mismatch_key_name/config.pbtxt
@@ -0,0 +1,44 @@
+# Copyright 2022, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+#
+# Redistribution and use in source and binary forms, with or without
+# modification, are permitted provided that the following conditions
+# are met:
+#  * Redistributions of source code must retain the above copyright
+#    notice, this list of conditions and the following disclaimer.
+#  * Redistributions in binary form must reproduce the above copyright
+#    notice, this list of conditions and the following disclaimer in the
+#    documentation and/or other materials provided with the distribution.
+#  * Neither the name of NVIDIA CORPORATION nor the names of its
+#    contributors may be used to endorse or promote products derived
+#    from this software without specific prior written permission.
+#
+# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY
+# EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+# PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE COPYRIGHT OWNER OR
+# CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
+# EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
+# PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
+# OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+name: "mismatch_key_name"
+platform: "tensorflow_savedmodel"
+max_batch_size: 0
+
+input [
+  {
+    name: "INPUT0_key"
+    data_type: TYPE_FP32
+    dims: [ -1 ]
+  }
+]
+output [
+  {
+    name: "OUTPUT0_key"
+    data_type: TYPE_FP32
+    dims: [ -1 ]
+  }
+]
diff --git a/qa/L0_tf_gpu_io/test.sh b/qa/L0_tf_gpu_io/test.sh
@@ -1,5 +1,5 @@
 #!/bin/bash
-# Copyright (c) 2019-2020, NVIDIA CORPORATION. All rights reserved.
+# Copyright 2019-2022, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 #
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions
@@ -42,6 +42,7 @@ export CUDA_VISIBLE_DEVICES=0
 
 CLIENT=../clients/perf_client
 BACKENDS=${BACKENDS:="graphdef savedmodel"}
+MODEL_TYPES="$BACKENDS mismatch_key_name"
 TENSOR_SIZE=16384
 
 DATADIR=/data/inferenceserver/${REPO_VERSION}
@@ -50,24 +51,43 @@ SERVER=/opt/tritonserver/bin/tritonserver
 source ../common/util.sh
 
 RET=0
+rm -f ./*.log
 
 #
 # Use "identity" model for all model types.
 #
-rm -f ./*.log
-for BACKEND in $BACKENDS; do
-    MODEL_NAME=${BACKEND}_zero_1_float32
-    rm -fr models && mkdir -p models
-    cp -r $DATADIR/qa_identity_model_repository/${MODEL_NAME} \
-       models/${MODEL_NAME}_def && \
-    (cd models/${MODEL_NAME}_def && \
-            sed -i 's/_zero_1_float32/&_def/' config.pbtxt) && \
-    # Enable GPU I/O for TensorFlow model
-    cp -r models/${MODEL_NAME}_def models/${MODEL_NAME}_gpu && \
-    (cd models/${MODEL_NAME}_gpu && \
-            sed -i 's/_zero_1_float32_def/_zero_1_float32_gpu/' \
-                config.pbtxt && \
-            echo "optimization { execution_accelerators { gpu_execution_accelerator : [ { name : \"gpu_io\"} ] } }" >> config.pbtxt)
+for MODEL_TYPE in $MODEL_TYPES; do
+
+    # Set up a fresh model repository for this model type
+    rm -rf models && mkdir -p models
+    if [[ " ${BACKENDS[*]} " =~ " ${MODEL_TYPE} " ]]; then
+        MODEL_NAME=${MODEL_TYPE}_zero_1_float32
+        INPUT_NAME="INPUT0"
+        # Copy from qa_identity_model_repository
+        cp -r $DATADIR/qa_identity_model_repository/${MODEL_NAME} \
+                models/${MODEL_NAME}_def && \
+        (cd models/${MODEL_NAME}_def && \
+                sed -i 's/_zero_1_float32/&_def/' config.pbtxt) && \
+        # Enable GPU I/O for TensorFlow model
+        cp -r models/${MODEL_NAME}_def models/${MODEL_NAME}_gpu && \
+        (cd models/${MODEL_NAME}_gpu && \
+                sed -i 's/_zero_1_float32_def/_zero_1_float32_gpu/' \
+                    config.pbtxt && \
+                echo "optimization { execution_accelerators { gpu_execution_accelerator : [ { name : \"gpu_io\"} ] } }" >> config.pbtxt)
+    else
+        MODEL_NAME=${MODEL_TYPE}
+        INPUT_NAME="INPUT0_key"
+        # Copy the special model from the current directory instead of DATADIR
+        cp -r ${MODEL_NAME} models/${MODEL_NAME}_def && \
+        (cd models/${MODEL_NAME}_def && \
+                sed -i "s/${MODEL_NAME}/&_def/" config.pbtxt) && \
+        # Enable GPU I/O for TensorFlow model
+        cp -r models/${MODEL_NAME}_def models/${MODEL_NAME}_gpu && \
+        (cd models/${MODEL_NAME}_gpu && \
+                sed -i "s/${MODEL_NAME}_def/${MODEL_NAME}_gpu/" \
+                    config.pbtxt && \
+                echo "optimization { execution_accelerators { gpu_execution_accelerator : [ { name : \"gpu_io\"} ] } }" >> config.pbtxt)
+    fi
 
     SERVER_ARGS="--model-repository=`pwd`/models --log-verbose=1"
     SERVER_LOG="${MODEL_NAME}.serverlog"
@@ -80,8 +100,8 @@ for BACKEND in $BACKENDS; do
 
     set +e
 
-    $CLIENT -m${MODEL_NAME}_def --shape INPUT0:${TENSOR_SIZE} \
-                >> ${BACKEND}.sanity.log 2>&1
+    $CLIENT -m${MODEL_NAME}_def --shape ${INPUT_NAME}:${TENSOR_SIZE} \
+                >> ${MODEL_TYPE}.sanity.log 2>&1
     if (( $? != 0 )); then
         RET=1
     fi
@@ -92,8 +112,8 @@ for BACKEND in $BACKENDS; do
         RET=1
     fi
 
-    $CLIENT -m${MODEL_NAME}_gpu  --shape INPUT0:${TENSOR_SIZE} \
-             >> ${BACKEND}.gpu.sanity.log 2>&1
+    $CLIENT -m${MODEL_NAME}_gpu  --shape ${INPUT_NAME}:${TENSOR_SIZE} \
+             >> ${MODEL_TYPE}.gpu.sanity.log 2>&1
     if (( $? != 0 )); then
         RET=1
     fi
@@ -105,14 +125,14 @@ for BACKEND in $BACKENDS; do
     fi
 
     # Sample latency results
-    $CLIENT -m${MODEL_NAME}_def --shape INPUT0:${TENSOR_SIZE} \
-             >> ${BACKEND}.log 2>&1
+    $CLIENT -m${MODEL_NAME}_def --shape ${INPUT_NAME}:${TENSOR_SIZE} \
+             >> ${MODEL_TYPE}.log 2>&1
     if (( $? != 0 )); then
         RET=1
     fi
 
-    $CLIENT -m${MODEL_NAME}_gpu --shape INPUT0:${TENSOR_SIZE} \
-            >> ${BACKEND}.gpu.log 2>&1
+    $CLIENT -m${MODEL_NAME}_gpu --shape ${INPUT_NAME}:${TENSOR_SIZE} \
+            >> ${MODEL_TYPE}.gpu.log 2>&1
     if (( $? != 0 )); then
         RET=1
     fi
@@ -123,11 +143,11 @@ for BACKEND in $BACKENDS; do
     wait $SERVER_PID
 done
 
-for BACKEND in $BACKENDS; do
-    echo -e "\n${BACKEND}\n************"
-    cat ${BACKEND}.log
-    echo -e "\n${BACKEND} with GPU I/O\n************"
-    cat ${BACKEND}.gpu.log
+for MODEL_TYPE in $MODEL_TYPES; do
+    echo -e "\n${MODEL_TYPE}\n************"
+    cat ${MODEL_TYPE}.log
+    echo -e "\n${MODEL_TYPE} with GPU I/O\n************"
+    cat ${MODEL_TYPE}.gpu.log
 done
 
 if [ $RET -eq 0 ]; then