Skip to content

Commit baa6401

Browse files
committed
get lmdeploy_actor once
1 parent 13ae947 commit baa6401

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

xtuner/v1/ray/rollout/worker.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -101,6 +101,7 @@ def __init__(
101 101
self.eos_token: List[int] = [eos_token] if isinstance(eos_token, int) else eos_token
102 102
self.receive_abort_request = asyncio.Event()
103 103
self.abort_timeout = 5.0
104+
self.lmdeploy_actor_store = None
104 105

105 106
def init_dist_port(self):
106 107
"""Initialize distributed communication ports.
@@ -613,6 +614,7 @@ async def _handle_non_stream_response(
613 614
assert finish_reason == "abort", (
614 615
f"routed_experts is None, but finish_reason is {finish_reason}, expected abort. response: {response}"
615 616
)
617+
del routed_experts
616 618
# NOTE: When set return_token_ids = True, the response must contain valid token_ids/logprobs.
617 619
# If not, we consider it as an invalid response and retry it.
618 620
# NOTE: !!! When finish_reason is abort, some queries may not return token_ids or logprobs. !!!

0 commit comments

Comments
 (0)