1 file changed: +2 -2 lines changed
File: fastdeploy/model_executor/layers/moe (1 file changed, +2 -2 lines changed)
Columns: Original file line number | Diff line number | Diff line change
@@ -168,12 +168,12 @@ def apply(
168168        Paddle Cutlass compute Fused MoE. 
169169        """ 
170170        if  layer .ep_size  >  1 :
171-             if  layer .fd_config .model_config .moe_phase .phase  ==  "prefill" :
171+             if  layer .fd_config .model_config .moe_phase .phase  ==  "prefill"   and   layer . layer_idx   ==   0 :
172172                if  layer .fd_config .scheduler_config .splitwise_role  ==  "mixed" :
173173                    self .ep_prefill_runner .clean_low_latency_buffer ()
174174                return  self .apply_ep_prefill (layer , x , gate )
175175            else :
176-                 if  layer .fd_config .scheduler_config .splitwise_role  ==  "mixed" :
176+                 if  layer .fd_config .scheduler_config .splitwise_role  ==  "mixed"   and   layer . layer_idx   ==   0 :
177177                    self .ep_decoder_runner .clean_low_latency_buffer ()
178178                return  self .apply_ep_decode (layer , x , gate )
179179        else :
    
 
   
 
     
   
   
          
     
  
    
     
 
    
      
     
 
     
    You can’t perform that action at this time.
  
 
    
  
     
    
      
        
     
 
       
      
     
   
 
    
    
  
 
  
 
     
    
0 commit comments