Skip to content

Commit d780ebe

Browse files
committed
Add splitwise deployment using RDMA
1 parent 98f1ab4 commit d780ebe

File tree

3 files changed

+656
-5
lines changed

3 files changed

+656
-5
lines changed

tests/e2e/test_ernie_03b_pd_router_v1.py renamed to tests/e2e/test_ernie_03b_pd_router_v1_ipc.py

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -12,8 +12,8 @@
1212
# See the License for the specific language governing permissions and
1313
# limitations under the License.
1414

15-
# Test splitwise deployment which uses local_scheduler + router,
16-
# and ENABLE_V1_KVCACHE_SCHEDULER is 1
15+
# Test splitwise deployment: use local_scheduler + router,
16+
# set ENABLE_V1_KVCACHE_SCHEDULER to 1, and use IPC to transfer the cache.
1717

1818
import json
1919
import os
@@ -111,7 +111,7 @@ def setup_and_run_server():
111111
env_prefill["CUDA_VISIBLE_DEVICES"] = "0"
112112
env_prefill["ENABLE_V1_KVCACHE_SCHEDULER"] = "1"
113113
env_prefill["FD_LOG_DIR"] = "log_prefill"
114-
prefill_log_path = "server.log"
114+
prefill_log_path = "prefill.log"
115115
prefill_cmd = [
116116
sys.executable,
117117
"-m",
@@ -161,7 +161,7 @@ def setup_and_run_server():
161161
env_decode["CUDA_VISIBLE_DEVICES"] = "1"
162162
env_decode["ENABLE_V1_KVCACHE_SCHEDULER"] = "1"
163163
env_decode["FD_LOG_DIR"] = "log_decode"
164-
decode_log_path = "decode_server.log"
164+
decode_log_path = "decode.log"
165165
decode_cmd = [
166166
sys.executable,
167167
"-m",
@@ -216,7 +216,7 @@ def setup_and_run_server():
216216
try:
217217
os.killpg(process_prefill.pid, signal.SIGTERM)
218218
os.killpg(process_decode.pid, signal.SIGTERM)
219-
clean_ports()
219+
clean_ports(PORTS_TO_CLEAN)
220220
except Exception as e:
221221
print(f"Failed to kill process group: {e}")
222222
raise RuntimeError(f"API server did not start on port {FD_API_PORT}")

0 commit comments

Comments
 (0)