diff --git a/vllm/entrypoints/grpc/grpc_server.py b/vllm/entrypoints/grpc/grpc_server.py index 795451ae8..a7f6a5031 100644 --- a/vllm/entrypoints/grpc/grpc_server.py +++ b/vllm/entrypoints/grpc/grpc_server.py @@ -236,8 +236,8 @@ async def GenerateStream( last_output_length = len(output.text) last_token_count = len(output.token_ids) - # Accumulate full output for logging - full_output += output.text + # Save full output for logging + full_output = output.text # Edit up the first_response for logging purposes only if first_response is None: