[Bugfix] Fix deepseek-v2 error: "missing 1 required positional argument: 'residual'" (#13802)
This commit is contained in:
@@ -614,7 +614,7 @@ class DeepseekV2Model(nn.Module):
|
||||
residual = intermediate_tensors["residual"]
|
||||
|
||||
for layer in self.layers[self.start_layer:self.end_layer]:
|
||||
- hidden_states, residual = layer(positions, hidden_states)
|
||||
+ hidden_states, residual = layer(positions, hidden_states, residual)
|
||||
|
||||
if not get_pp_group().is_last_rank:
|
||||
return IntermediateTensors({
|
||||
|
||||
Reference in New Issue
Block a user