Skip to content

Commit 3d7d22e

Browse files
committed
[BUGFIX] fix ep mixed bug
1 parent 51f68ae commit 3d7d22e

File tree

1 file changed

+11
-6
lines changed

1 file changed

+11
-6
lines changed

fastdeploy/engine/expert_service.py

Lines changed: 11 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -59,7 +59,7 @@ def __init__(self, cfg, local_data_parallel_id):
59 59
self.cfg.disaggregate_info = None
60 60

61 61
self.scheduler = cfg.scheduler_config.scheduler()
62-
if cfg.splitwise_role != "mixed":
62+
if cfg.scheduler_config.name != "splitwise":
63 63
self.scheduler.reset_nodeid(f"{self.scheduler.infer.nodeid}_{local_data_parallel_id!s}")
64 64

65 65
self.cfg.parallel_config.local_data_parallel_id = local_data_parallel_id
@@ -142,10 +142,11 @@ def start(self, ipc_signal_suffix, local_data_parallel_id):
142 142

143 143
self.token_processor.run()
144 144
self.cfg.init_cache_info()
145-
role = self.cfg.splitwise_role
146-
host_ip = self.cfg.host_ip
147-
disaggregate = self.cfg.disaggregate_info
148-
self.scheduler.start(role, host_ip, disaggregate)
145+
if self.cfg.scheduler_config.name != "splitwise":
146+
role = self.cfg.splitwise_role
147+
host_ip = self.cfg.host_ip
148+
disaggregate = self.cfg.disaggregate_info
149+
self.scheduler.start(role, host_ip, disaggregate)
149 150
self.cfg.print()
150 151

151 152
launched_expert_service_signal_data = np.zeros(
@@ -376,6 +377,10 @@ def start_expert_service(cfg, local_data_parallel_id, ipc_signal_suffix):
376 377
expert_service = ExpertService(cfg, local_data_parallel_id)
377 378
try:
378 379
expert_service.start(ipc_signal_suffix, local_data_parallel_id)
379-
expert_service.split_connector.start_receiver()
380+
if cfg.splitwise_role != "mixed":
381+
expert_service.split_connector.start_receiver()
382+
else:
383+
while True:
384+
time.sleep(100)
380 385
except Exception as e:
381 386
llm_logger.exception(f"Expert service failed to start: {e}, {str(traceback.format_exc())}")

0 commit comments

Comments
 (0)