Signed-off-by: Bill Nell <bnell@redhat.com>
This commit is contained in:
Bill Nell
2025-05-28 23:38:19 +00:00
parent 3ca8322b74
commit d86e3f0172

View File

@@ -614,13 +614,10 @@ class BatchedExperts(mk.FusedMoEPermuteExpertsUnpermute):
else:
num = int(expert_num_tokens[expert].item())
tmp = _resize_cache(workspace2, (num, N))
if self.use_fp8_w8a8:
assert False # TBD
else:
input = hidden_states[expert, :num, :] @ w1[expert].transpose(
0, 1)
self.activation(activation, tmp, input)
out[expert, :num, :] = tmp @ w2[expert].transpose(0, 1)
assert not self.use_fp8_w8a8
input = hidden_states[expert, :num, :] @ w1[expert].transpose(0, 1)
self.activation(activation, tmp, input)
out[expert, :num, :] = tmp @ w2[expert].transpose(0, 1)
return out