Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 0 additions & 3 deletions ci/L0_backend_vllm/test.sh
Original file line number Diff line number Diff line change
Expand Up @@ -28,9 +28,6 @@
RET=0
SUBTESTS="accuracy_test request_cancellation enabled_stream vllm_backend metrics_test"

export C_INCLUDE_PATH=/usr/local/cuda/include:$C_INCLUDE_PATH
export TRITON_PTXAS_PATH=/usr/local/cuda/bin/ptxas

python3 -m pip install tritonclient[grpc]

for TEST in ${SUBTESTS}; do
Expand Down
3 changes: 0 additions & 3 deletions ci/L0_multi_gpu_vllm/multi_lora/test.sh
Original file line number Diff line number Diff line change
Expand Up @@ -41,9 +41,6 @@ EXPECTED_NUM_TESTS=2
GENERATE_ENDPOINT="localhost:8000/v2/models/vllm_llama_multi_lora/generate"
CHECK_FOR_ERROR=true

export C_INCLUDE_PATH=/usr/local/cuda/include:$C_INCLUDE_PATH
export TRITON_PTXAS_PATH=/usr/local/cuda/bin/ptxas

make_api_call() {
local endpoint="$1"
local data="$2"
Expand Down
3 changes: 0 additions & 3 deletions ci/L0_multi_gpu_vllm/vllm_backend/test.sh
Original file line number Diff line number Diff line change
Expand Up @@ -36,9 +36,6 @@ CLIENT_PY="./vllm_multi_gpu_test.py"
SAMPLE_MODELS_REPO="../../../samples/model_repository"
EXPECTED_NUM_TESTS=1

export C_INCLUDE_PATH=/usr/local/cuda/include:$C_INCLUDE_PATH
export TRITON_PTXAS_PATH=/usr/local/cuda/bin/ptxas

### Helpers
function validate_file_contains() {
local KEY="${1}"
Expand Down
Loading