From 1cb4341fbcca4e58fa1ac5c1d55691eff16bf52b Mon Sep 17 00:00:00 2001 From: Mark McLoughlin Date: Fri, 23 Jan 2026 15:59:04 +0000 Subject: [PATCH] [ROCm][PD] Remove unused moriio connector proxy code (#32939) Signed-off-by: Mark McLoughlin --- .../moriio_toy_proxy_server.py | 22 ------------------- 1 file changed, 22 deletions(-) diff --git a/examples/online_serving/disaggregated_serving/moriio_toy_proxy_server.py b/examples/online_serving/disaggregated_serving/moriio_toy_proxy_server.py index 90ffbef31..ca3318173 100644 --- a/examples/online_serving/disaggregated_serving/moriio_toy_proxy_server.py +++ b/examples/online_serving/disaggregated_serving/moriio_toy_proxy_server.py @@ -166,27 +166,6 @@ async def stream_decode_response(session, response, request_id): await session.close() -async def send_request_to_decode(endpoint, req_data, request_id): - async with aiohttp.ClientSession( - timeout=aiohttp.ClientTimeout(total=6 * 6000 * 6000) - ) as session: - headers = { - "Authorization": f"Bearer {os.environ.get('OPENAI_API_KEY')}", - "X-Request-Id": request_id, - } - async with session.post( - url=endpoint, json=req_data, headers=headers - ) as response: - if response.status == 200: - async for chunk_bytes in response.content.iter_chunked(1024): - yield chunk_bytes - else: - raise RuntimeError( - "send_request_to_decode response.status != 200,response.statuus = ", - response.status, - ) - - def example_round_robin_dp_loader(request_number, dp_size): return request_nums % dp_size @@ -233,7 +212,6 @@ async def handle_request(): ) dip, dport = extract_ip_port_fast(decode_instance_endpoint["request_address"]) - ip, port = extract_ip_port_fast(prefill_instance_endpoint["request_address"]) req_data_to_prefill = copy.deepcopy(req_data) req_data_to_prefill["kv_transfer_params"] = {}