Skip to content

Commit 225fc8d

Browse files
Use self.hidden_size instead of self.fd_config.model_config.hidden_size (#7340)
1 parent 4982aa0 commit 225fc8d

File tree

2 files changed

+3
-1
lines changed

2 files changed

+3
-1
lines changed

fastdeploy/model_executor/layers/moe/moe.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -788,7 +788,7 @@ def forward_chunked_moe(
788788
chunk_size = self.fd_config.parallel_config.chunked_moe_size
789789
token_num = x.shape[0]
790790
fake_x = paddle.empty(
791-
shape=[0, self.fd_config.model_config.hidden_size],
791+
shape=[0, self.hidden_size],
792792
dtype=paddle.get_default_dtype(),
793793
)
794794
# input size that is less than a chunk, less than the max size data, or an empty input

tests/distributed/chunked_moe.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -169,6 +169,8 @@ def setup_fused_moe(self):
169169
fused_moe.fd_config = mock_fd_config
170170
fused_moe.quant_method = MockQuantMethod()
171171
fused_moe.enable_routing_replay = None
172+
173+
fused_moe.hidden_size = mock_fd_config.model_config.hidden_size
172174
return fused_moe
173175

174176
def run_model_runner(self):

0 commit comments

Comments
 (0)