I know it doesn't look like much, but this kwarg (`layer_past` in `CausalSelfAttention.forward`) was not used lol :D

2024-05-18 05:26:03 +02:00 · 2022-03-27 17:48:05 +01:00 · 2022-03-27 17:48:05 +01:00 · 3ed14b2cec
parent 107b6d7e31
commit 3ed14b2cec
1 changed files with 1 additions and 1 deletions
--- a/mingpt/model.py
+++ b/mingpt/model.py
@@ -58,7 +58,7 @@ class CausalSelfAttention(nn.Module):
                                     .view(1, 1, config.block_size, config.block_size))
        self.n_head = config.n_head

-    def forward(self, x, layer_past=None):
+    def forward(self, x):
        B, T, C = x.size() # batch size, sequence length, embedding dimensionality (n_embd)

        # calculate query, key, values for all heads in batch and move head forward to be the batch dim