Skip to content

Commit

Permalink
further stripped down scheduler code
Browse files (browse the repository at this point in the history)
Signed-off-by: Andrew Feldman <afeldman@neuralmagic.com>
  • Loading branch information
afeldman-nm committed Jan 8, 2025
1 parent 8482b5c commit d2fcc64
Show file tree
Hide file tree
Showing 2 changed files with 5 additions and 9 deletions.
6 changes: 1 addition & 5 deletions vllm/v1/core/scheduler.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -460,11 +460,7 @@ def update_from_output(
new_token_ids=request.output_token_ids[-num_new_tokens:],
finished=request.is_finished(),
finish_reason=request.get_finished_reason(),
stop_reason=request.stop_reason,
logprobs_token_ids=[],
logprobs=[],
prompt_logprobs_token_ids=None,
prompt_logprobs=None)
stop_reason=request.stop_reason)
engine_core_outputs.append(output)

# Breakout of the loop.
Expand Down
8 changes: 4 additions & 4 deletions vllm/v1/engine/__init__.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -41,11 +41,11 @@ class EngineCoreOutput(

request_id: str
new_token_ids: List[int]
logprobs: List[torch.Tensor]
logprobs_token_ids: List[torch.Tensor]
prompt_logprobs: Optional[torch.Tensor]
prompt_logprobs_token_ids: Optional[torch.Tensor]
finished: bool
logprobs: List[torch.Tensor] = []
logprobs_token_ids: List[torch.Tensor] = []
prompt_logprobs: Optional[torch.Tensor] = None
prompt_logprobs_token_ids: Optional[torch.Tensor] = None
finish_reason: Optional[str] = None
stop_reason: Union[int, str, None] = None

Expand Down

0 comments on commit d2fcc64

Please sign in to comment.