Skip to content

Commit 49a7cfe

Browse files
committed
Applied a few suggestions from code-assistant
1 parent f81353a commit 49a7cfe

File tree

2 files changed

+5
-3
lines changed

2 files changed

+5
-3
lines changed

vllm/distributed/device_communicators/all2all.py

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -510,8 +510,10 @@ def _ensure_shmem_initialized(self):
510510
logger.debug(
511511
"[rank %s] torch process group shmem init failed: %s",
512512
self.rank, torch_error)
513-
514-
self._shmem_initialized = True
513+
self._shmem_initialized = True
514+
logger.warning(
515+
"[rank %s] Continuing without mori shmem optimization",
516+
self.rank)
515517

516518
except Exception as e:
517519
logger.error("[rank %s] mori shmem initialization failed: %s",

vllm/model_executor/layers/fused_moe/mori_prepare_finalize.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -88,9 +88,9 @@ def prepare(
8888
8989
Args:
9090
a1: Input hidden states [num_tokens, hidden_dim]
91-
a1_scale: Input activation scales
9291
topk_weights: Top-k routing weights [num_experts, experts_per_token]
9392
topk_ids: Top-k expert indices [num_experts, experts_per_token]
93+
apply_router_weight_on_input: Whether to apply router weight
9494
quant_config: Quantization config
9595
9696
Returns:

0 commit comments

Comments
 (0)