@@ -668,8 +668,8 @@ def weight_per_128x128_quant(weight, quant_dtype):
 torch.cuda.manual_seed_all(seed)
 l_dtype = ["bf16", "fp16"][:1]
 # l_dim = [(6144, 4096)]
-l_dim = [(7168, 256)]
-# l_dim = [(3072, 3072)]
+# l_dim = [(7168, 256)]
+l_dim = [(3072, 3072)]
 l_tokenNum = [
     # 1,
     # 2,
@@ -693,8 +693,8 @@ def weight_per_128x128_quant(weight, quant_dtype):
     # (aiter.QuantType.per_Token, dtypes.fp8, dtypes.fp8),  # a8w8
     # (aiter.QuantType.per_Token, dtypes.fp8, torch.int4),  # a8w4
     # (aiter.QuantType.per_1x32, dtypes.fp4x2, dtypes.fp4x2),  # a4w4
-    (aiter.QuantType.per_128x128, dtypes.fp8, dtypes.fp8),  # a8w8
-    # (aiter.QuantType.per_1x32, dtypes.bf16, dtypes.fp4x2),  # a16w4
+    # (aiter.QuantType.per_128x128, dtypes.fp8, dtypes.fp8),  # a8w8
+    (aiter.QuantType.per_1x32, dtypes.bf16, dtypes.fp4x2),  # a16w4
 ]
 l_act = [aiter.ActivationType.Silu, aiter.ActivationType.Gelu][:1]
 l_doweight_stage1 = [False, True][:1]
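
The hunk context names weight_per_128x128_quant, and the diff toggles the per_128x128 a8w8 case off. For orientation, below is a minimal reference sketch of per-128x128 weight quantization: one fp8 scale per 128x128 tile, chosen so the tile's max magnitude maps to the e4m3 maximum (448). The function name, the e4m3 dtype choice, and the padded-shape assertion are assumptions for illustration, not aiter's implementation.

# Hypothetical reference sketch (not aiter's kernel): per-128x128 blockwise
# fp8 quantization, as exercised by the a8w8 case commented out above.
import torch

def ref_weight_per_128x128_quant(weight: torch.Tensor, block: int = 128):
    """Quantize a 2-D weight to fp8 with one scale per 128x128 tile."""
    rows, cols = weight.shape
    assert rows % block == 0 and cols % block == 0  # assumes padded shapes
    fp8_max = torch.finfo(torch.float8_e4m3fn).max  # 448.0 for e4m3
    # View as (row_blocks, 128, col_blocks, 128) so each tile reduces cleanly.
    tiles = weight.view(rows // block, block, cols // block, block)
    amax = tiles.abs().amax(dim=(1, 3), keepdim=True).clamp(min=1e-8)
    scale = amax / fp8_max                      # one scale per tile
    q = (tiles / scale).clamp(-fp8_max, fp8_max).to(torch.float8_e4m3fn)
    return q.view(rows, cols), scale.squeeze(1).squeeze(-1)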
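The newly enabled tuple (per_1x32, bf16, fp4x2) is the a16w4 path: bf16 activations with weights quantized per 1x32 block to 4-bit values packed two per byte (hence fp4x2). A hedged sketch of such quantize-and-pack logic follows; the e2m1 magnitude grid and every name here are assumptions for illustration, not aiter's implementation.

# Hypothetical sketch of per-1x32 fp4 weight quantization with nibble packing.
import torch

# Non-negative magnitudes representable in e2m1 "fp4"; sign is a separate bit.
E2M1_GRID = torch.tensor([0.0, 0.5, 1.0, 1.5, 2.0, 3.0, 4.0, 6.0])

def ref_weight_per_1x32_fp4_quant(weight: torch.Tensor, block: int = 32):
    """Quantize each 1x32 block to 4-bit codes; pack two codes per byte."""
    rows, cols = weight.shape
    assert cols % block == 0  # assumes padded columns
    grid = E2M1_GRID.to(weight.device)
    w = weight.float().view(rows, cols // block, block)
    # One scale per 1x32 block, mapping the block max to the e2m1 max (6.0).
    scale = w.abs().amax(dim=-1, keepdim=True).clamp(min=1e-8) / 6.0
    x = w / scale
    # Round each magnitude to the nearest e2m1 grid point (3-bit code) ...
    mag_code = (x.abs().unsqueeze(-1) - grid).abs().argmin(dim=-1)
    # ... then set bit 3 as the sign bit to form the full 4-bit code.
    code = (mag_code | ((x < 0).long() << 3)).view(rows, cols)
    # Pack adjacent codes two per byte: even columns low nibble, odd high.
    packed = (code[:, 0::2] | (code[:, 1::2] << 4)).to(torch.uint8)
    return packed, scale.squeeze(-1)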