Commit 993954a6, authored by Ryan McCormick and committed by GitHub
Browse files

refactor: Replace trtllm example prints with debug logs

parent deb6c7e8
...@@ -77,7 +77,7 @@ class DisaggregatedServingOperator(TritonCoreOperator): ...@@ -77,7 +77,7 @@ class DisaggregatedServingOperator(TritonCoreOperator):
response_sender = request.response_sender() response_sender = request.response_sender()
"""Preprocessing""" """Preprocessing"""
print(request) self._logger.debug(request)
if "text_input" in request.inputs: if "text_input" in request.inputs:
query = request.inputs["text_input"].to_bytes_array() query = request.inputs["text_input"].to_bytes_array()
elif "prompt" in request.inputs: elif "prompt" in request.inputs:
...@@ -102,7 +102,7 @@ class DisaggregatedServingOperator(TritonCoreOperator): ...@@ -102,7 +102,7 @@ class DisaggregatedServingOperator(TritonCoreOperator):
streaming = request.parameters.get("streaming", False) streaming = request.parameters.get("streaming", False)
input_ids, input_lengths = await self._preprocess(query) input_ids, input_lengths = await self._preprocess(query)
print(input_ids, input_lengths) self._logger.debug(input_ids, input_lengths)
prefill_inputs["input_ids"] = input_ids prefill_inputs["input_ids"] = input_ids
prefill_inputs["input_lengths"] = input_lengths prefill_inputs["input_lengths"] = input_lengths
prefill_inputs["request_output_len"] = request_output_len prefill_inputs["request_output_len"] = request_output_len
...@@ -177,7 +177,6 @@ class DisaggregatedServingOperator(TritonCoreOperator): ...@@ -177,7 +177,6 @@ class DisaggregatedServingOperator(TritonCoreOperator):
async def _preprocess(self, query): async def _preprocess(self, query):
start_ids = None start_ids = None
start_lengths = None start_lengths = None
print("here!")
if isinstance(query, str): if isinstance(query, str):
query = [[query]] query = [[query]]
async for preprocess_response in self._preprocess_model.async_infer( async for preprocess_response in self._preprocess_model.async_infer(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment