Unverified commit 1cb4341f, authored by Mark McLoughlin and committed by GitHub
Browse files

[ROCm][PD] Remove unused moriio connector proxy code (#32939)


Signed-off-by: Mark McLoughlin <markmc@redhat.com>
parent 1fb648bf
...@@ -166,27 +166,6 @@ async def stream_decode_response(session, response, request_id): ...@@ -166,27 +166,6 @@ async def stream_decode_response(session, response, request_id):
await session.close() await session.close()
async def send_request_to_decode(endpoint, req_data, request_id):
    """Stream the response body of a POST request to ``endpoint``.

    Sends ``req_data`` as the JSON body, with a bearer token taken from the
    ``OPENAI_API_KEY`` environment variable and ``request_id`` in the
    ``X-Request-Id`` header, then yields the response body piece by piece.

    Args:
        endpoint: URL to POST to.
        req_data: JSON-serializable request payload.
        request_id: Value sent in the ``X-Request-Id`` header.

    Yields:
        Chunks of the response body, read at most 1024 bytes at a time.

    Raises:
        RuntimeError: If the response status is not 200.
    """
    # 6 * 6000 * 6000 seconds is about 6.8 years, i.e. effectively no overall
    # timeout on the streamed response.
    timeout = aiohttp.ClientTimeout(total=6 * 6000 * 6000)
    headers = {
        "Authorization": f"Bearer {os.environ.get('OPENAI_API_KEY')}",
        "X-Request-Id": request_id,
    }
    async with aiohttp.ClientSession(timeout=timeout) as session:
        async with session.post(
            url=endpoint, json=req_data, headers=headers
        ) as response:
            if response.status != 200:
                # Format the status into a single message; passing it as a
                # second positional argument would make the exception render
                # as a tuple instead of readable text.
                raise RuntimeError(
                    "send_request_to_decode response.status != 200, "
                    f"response.status = {response.status}"
                )
            async for chunk_bytes in response.content.iter_chunked(1024):
                yield chunk_bytes
def example_round_robin_dp_loader(request_number, dp_size):
    """Return the data-parallel rank for a request, chosen round-robin.

    Args:
        request_number: Running count (or index) of the request.
        dp_size: Number of data-parallel ranks; must be non-zero.

    Returns:
        ``request_number`` modulo ``dp_size``.
    """
    # Use the argument that was passed in; the previous body read the
    # name `request_nums`, which is not a parameter of this function.
    return request_number % dp_size
...@@ -233,7 +212,6 @@ async def handle_request(): ...@@ -233,7 +212,6 @@ async def handle_request():
) )
dip, dport = extract_ip_port_fast(decode_instance_endpoint["request_address"]) dip, dport = extract_ip_port_fast(decode_instance_endpoint["request_address"])
ip, port = extract_ip_port_fast(prefill_instance_endpoint["request_address"])
req_data_to_prefill = copy.deepcopy(req_data) req_data_to_prefill = copy.deepcopy(req_data)
req_data_to_prefill["kv_transfer_params"] = {} req_data_to_prefill["kv_transfer_params"] = {}
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment