diff --git a/vllm/model_executor/model_loader/spyre.py b/vllm/model_executor/model_loader/spyre.py index 0f87a6c35..b1479c3c6 100644 --- a/vllm/model_executor/model_loader/spyre.py +++ b/vllm/model_executor/model_loader/spyre.py @@ -46,7 +46,9 @@ def __init__( self.past_key_value_states = None self.dtype = torch.float16 if envs.VLLM_SPYRE_DYNAMO_BACKEND == \ 'sendnn_decoder' else torch.float32 - # indices: True unfinished, False for finished or padded sequence + # boolean tensor of length batch size with indices: + # True for unfinished sequences and + # False for finished or padded sequences self.indices = None # Lazy initialized