Skip to content

Commit 7162b59

Browse files
Copilot and hongbolv authored
Clean up unnecessary changes: revert naive_dp_ep.py, gdn_linear_attn.py, qwen3_moe.py, remove extra blank line in all2all.py
Agent-Logs-Url: https://github.com/hongbolv/vllm/sessions/c7d750b8-970e-44be-ba41-bf329ff4a67a
Co-authored-by: hongbolv <33214277+hongbolv@users.noreply.github.com>
1 parent 6be0b13 commit 7162b59

4 files changed

Lines changed: 1 addition & 6 deletions

File tree

vllm/distributed/device_communicators/all2all.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -137,7 +137,6 @@ def combine(
137137
dist.barrier(group=dist_group.device_group)
138138

139139
hidden_states = dist_group.reduce_scatterv(hidden_states, dim=0, sizes=sizes)
140-
141140
return hidden_states
142141

143142
def destroy(self):

vllm/model_executor/layers/fused_moe/prepare_finalize/naive_dp_ep.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@
33
import torch
44

55
import vllm.model_executor.layers.fused_moe.modular_kernel as mk
6-
from vllm.distributed import get_dp_group, get_ep_group
6+
from vllm.distributed import get_ep_group
77
from vllm.model_executor.layers.fused_moe.config import FusedMoEQuantConfig
88
from vllm.model_executor.layers.fused_moe.topk_weight_and_reduce import (
99
TopKWeightAndReduceContiguous,

vllm/model_executor/layers/mamba/gdn_linear_attn.py

Lines changed: 0 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -528,7 +528,6 @@ def forward_cuda(
528528
3. Output projection
529529
"""
530530
num_tokens = hidden_states.size(0)
531-
532531
# ============================================================
533532
# Part 1: Input Projection
534533
# ============================================================
@@ -591,7 +590,6 @@ def forward_cuda(
591590
core_attn_out = core_attn_out.reshape(-1, core_attn_out.shape[-1])
592591
z = z.reshape(-1, z.shape[-1])
593592
core_attn_out = self.norm(core_attn_out, z)
594-
595593
core_attn_out = core_attn_out.reshape(z_shape_og)
596594
core_attn_out = rearrange(core_attn_out, "... h d -> ... (h d)")
597595
output[:num_tokens], _ = self.out_proj(core_attn_out)
@@ -643,7 +641,6 @@ def forward_xpu(
643641
core_attn_out = core_attn_out.reshape(-1, core_attn_out.shape[-1])
644642
z = z.reshape(-1, z.shape[-1])
645643
core_attn_out = self.norm(core_attn_out, z)
646-
647644
core_attn_out = core_attn_out.reshape(z_shape_og)
648645
core_attn_out = rearrange(core_attn_out, "... h d -> ... (h d)")
649646
output[:num_tokens], _ = self.out_proj(core_attn_out)

vllm/model_executor/models/qwen3_moe.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -391,7 +391,6 @@ def __init__(self, vllm_config: VllmConfig, prefix: str = "") -> None:
391391

392392
# `mlp_only_layers` in the config.
393393
layer_idx = extract_layer_index(prefix)
394-
self.layer_idx = layer_idx
395394
mlp_only_layers = (
396395
[] if not hasattr(config, "mlp_only_layers") else config.mlp_only_layers
397396
)

0 commit comments

Comments
 (0)