File tree Expand file tree Collapse file tree 1 file changed +2
-0
lines changed
Expand file tree Collapse file tree 1 file changed +2
-0
lines changed Original file line number Diff line number Diff line change @@ -101,6 +101,7 @@ def __init__(
101101 self .eos_token : List [int ] = [eos_token ] if isinstance (eos_token , int ) else eos_token
102102 self .receive_abort_request = asyncio .Event ()
103103 self .abort_timeout = 5.0
104+ self .lmdeploy_actor_store = None
104105
105106 def init_dist_port (self ):
106107 """Initialize distributed communication ports.
@@ -613,6 +614,7 @@ async def _handle_non_stream_response(
613614 assert finish_reason == "abort" , (
614615 f"routed_experts is None, but finish_reason is { finish_reason } , expected abort. response: { response } "
615616 )
617+ del routed_experts
616618 # NOTE: When set return_token_ids = True, the response must contain valid token_ids/logprobs.
617619 # If not, we consider it as an invalid response and retry it.
618620 # NOTE: !!! When finish_reason is abort, some queries may not return token_ids or logprobs. !!!
You can’t perform that action at this time.
0 commit comments