diff --git a/examples/disaggregated_prefill_v1/load_balance_proxy_layerwise_server_example.py b/examples/disaggregated_prefill_v1/load_balance_proxy_layerwise_server_example.py
index c60015539e9..7e80b55c930 100644
--- a/examples/disaggregated_prefill_v1/load_balance_proxy_layerwise_server_example.py
+++ b/examples/disaggregated_prefill_v1/load_balance_proxy_layerwise_server_example.py
@@ -556,7 +556,15 @@ async def generate_stream():
                                     instance_info.prefiller_idx,
                                     instance_info.prefiller_score)
                                 released_kv = True
-                            chunk_str = chunk.decode("utf-8").strip()
+                            try:
+                                chunk_str = chunk.decode("utf-8").strip()
+                            except UnicodeDecodeError:
+                                # Chunk is not valid UTF-8 by itself: forward
+                                # the raw bytes and skip the parsing below.
+                                logger.debug(
+                                    "Forwarding undecodable chunk: %r", chunk)
+                                yield chunk
+                                continue
                             if not chunk_str:
                                 continue
                             if chunk_str.startswith("data: "):
diff --git a/examples/disaggregated_prefill_v1/load_balance_proxy_server_example.py b/examples/disaggregated_prefill_v1/load_balance_proxy_server_example.py
index 880ed69e5f8..0694aced4af 100644
--- a/examples/disaggregated_prefill_v1/load_balance_proxy_server_example.py
+++ b/examples/disaggregated_prefill_v1/load_balance_proxy_server_example.py
@@ -539,7 +539,15 @@ async def generate_stream():
                                     instance_info.prefiller_idx,
                                     instance_info.prefiller_score)
                                 released_kv = True
-                            chunk_str = chunk.decode("utf-8").strip()
+                            try:
+                                chunk_str = chunk.decode("utf-8").strip()
+                            except UnicodeDecodeError:
+                                # Chunk is not valid UTF-8 by itself: forward
+                                # the raw bytes and skip the parsing below.
+                                logger.debug(
+                                    "Forwarding undecodable chunk: %r", chunk)
+                                yield chunk
+                                continue
                             if not chunk_str:
                                 continue
                             if chunk_str.startswith("data: "):