Skip to content

Commit

Permalink
reset time_faaaa
Browse files Browse the repository at this point in the history
  • Loading branch information
jahatef committed Oct 13, 2024
1 parent dd441b6 commit a418670
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion megatron/model/rwkv/v6/rwkv.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -279,7 +279,7 @@ def forward(self, x):
H = self.neox_args.num_attention_heads//mpu.get_model_parallel_world_size()
H_tp = H//mpu.get_model_parallel_world_size()

- self.time_faaaa = self.time_faaaa[:self.neox_args.num_attention_heads//2,:]
+ #self.time_faaaa = self.time_faaaa[:self.neox_args.num_attention_heads//2,:]
#self.time_faaaa = scatter_to_model_parallel_region(self.time_faaaa)
r, k, v, g, w = self.jit_func(x)
print(f"shape of r: {r.size()}, k: {k.size()}, v: {v.size()}, g: {g.size()}, w: {w.size()}, H: {H}, B: {B}, T: {T}, C: {C}, time_faaaa: {self.time_faaaa.size()}, \n")
Expand Down

0 comments on commit a418670

Please sign in to comment.