File tree Expand file tree Collapse file tree 2 files changed +3
-1
lines changed
fastdeploy/model_executor/layers/moe Expand file tree Collapse file tree 2 files changed +3
-1
lines changed Original file line number Diff line number Diff line change @@ -788,7 +788,7 @@ def forward_chunked_moe(
788788 chunk_size = self .fd_config .parallel_config .chunked_moe_size
789789 token_num = x .shape [0 ]
790790 fake_x = paddle .empty (
791- shape = [0 , self .fd_config . model_config . hidden_size ],
791+ shape = [0 , self .hidden_size ],
792792 dtype = paddle .get_default_dtype (),
793793 )
794794 # inputs that are smaller than a chunk, smaller than the max-size data, or empty
Original file line number Diff line number Diff line change @@ -169,6 +169,8 @@ def setup_fused_moe(self):
169169 fused_moe .fd_config = mock_fd_config
170170 fused_moe .quant_method = MockQuantMethod ()
171171 fused_moe .enable_routing_replay = None
172+
173+ fused_moe .hidden_size = mock_fd_config .model_config .hidden_size
172174 return fused_moe
173175
174176 def run_model_runner (self ):
You can’t perform that action at this time.
0 commit comments