We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 61b7ed6; commit 8175710 (full SHA for 8175710 can be copied from the commit page)
python/sgl_jax/srt/layers/moe.py
@@ -223,12 +223,12 @@ def _expert_parallel_forward_with_shard_map(
223
224
# 转换为静态整数参数(在动态 m 值上使用最大值作为安全的静态值)
225
static_tiling_gate = (
226
- min(optimal_tiling_gate[0], 16384), # 设置合理的最大值
+ optimal_tiling_gate[0], # 设置合理的最大值
227
optimal_tiling_gate[1],
228
optimal_tiling_gate[2],
229
)
230
static_tiling_down = (
231
- min(optimal_tiling_down[0], 16384),
+ optimal_tiling_down[0],
232
optimal_tiling_down[1],
233
optimal_tiling_down[2],
234
0 commit comments