Skip to content

Commit f5164d6

Browse files
committed
fix tp2
1 parent b1dda49 commit f5164d6

File tree

2 files changed

+3
-3
lines changed

2 files changed

+3
-3
lines changed

test/ci_use/QwQ-32B/run_server.sh

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -19,13 +19,13 @@ rm -rf log/*
 mkdir -p log

 # 环境变量
-export CUDA_VISIBLE_DEVICES=4,5,6,7
+export CUDA_VISIBLE_DEVICES=0,1
 export INFERENCE_MSG_QUEUE_ID=7679
 export ENABLE_V1_KVCACHE_SCHEDULER=1


 python -m fastdeploy.entrypoints.openai.api_server \
---tensor-parallel-size 4 \
+--tensor-parallel-size 2 \
 --port 8787 \
 --engine-worker-queue-port 7679 \
 --metrics-port 7877 \

test/ci_use/QwQ-32B/run_test.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ BASE_URL="http://$HOST:$PORT"

 TOTAL_ROUNDS=100
 CHAT_REQUESTS_PER_ROUND=5
-export CUDA_VISIBLE_DEVICES=4,5,6,7
+export CUDA_VISIBLE_DEVICES=0,1
 MAX_MEMORY_MB=10240 # 10GB

 # ====================================================

0 commit comments

Comments
 (0)