| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172 |
- #!/bin/bash
- # Copyright (c) 2019 NVIDIA CORPORATION. All rights reserved.
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- MODEL_NAME=${1:-"bert"}
- MODEL_VERSION=${2:-1}
- BATCH_SIZE=${3:-1}
- MAX_LATENCY=${4:-100}
- MAX_CLIENT_THREADS=${5:-10}
- MAX_CONCURRENCY=${6:-50}
- SERVER_HOSTNAME=${7:-"localhost"}
- if [[ $SERVER_HOSTNAME == *":"* ]]; then
- echo "ERROR! Do not include the port when passing the Server Hostname. These scripts require that the TRITON HTTP endpoint is on Port 8000 and the gRPC endpoint is on Port 8001. Exiting..."
- exit 1
- fi
- if [ "$SERVER_HOSTNAME" = "localhost" ]
- then
- if [ ! "$(docker inspect -f "{{.State.Running}}" triton_server_cont)" = "true" ] ; then
- echo "Launching TRITON server"
- bash triton/scripts/launch_server.sh
- SERVER_LAUNCHED=true
- function cleanup_server {
- echo "Killing TRITON server"
- docker kill triton_server_cont
- }
- # Ensure we cleanup the server on exit
- # trap "exit" INT TERM
- trap cleanup_server EXIT
- fi
- fi
- # Wait until server is up. curl on the health of the server and sleep until its ready
- bash triton/scripts/wait_for_triton_server.sh $SERVER_HOSTNAME
- TIMESTAMP=$(date "+%y%m%d_%H%M")
- bash scripts/docker/launch.sh mkdir -p /results/perf_client/${MODEL_NAME}
- OUTPUT_FILE_CSV="/results/perf_client/${MODEL_NAME}/results_${TIMESTAMP}.csv"
- ARGS="\
- --max-threads ${MAX_CLIENT_THREADS} \
- -m ${MODEL_NAME} \
- -x ${MODEL_VERSION} \
- -p 200000 \
- -d \
- -v -z \
- -i gRPC \
- -u ${SERVER_HOSTNAME}:8001 \
- -b ${BATCH_SIZE} \
- -l ${MAX_LATENCY} \
- -c ${MAX_CONCURRENCY} \
- -f ${OUTPUT_FILE_CSV}"
- echo "Using args: $(echo "$ARGS" | sed -e 's/ -/\n-/g')"
- bash scripts/docker/launch.sh /workspace/install/bin/perf_client $ARGS
|