hotfix: add contiguous_backward to llama

Author: George Hotz
Date: 2025-07-31 15:06:19 -07:00
parent fa66d9772d
commit 474ee9daa5


@@ -111,7 +111,7 @@ class TransformerBlock:
   def __call__(self, x:Tensor, start_pos:Union[Variable,int], freqs_cis:Tensor, mask:Optional[Tensor]):
     h = x + self.attention(self.attention_norm(x), start_pos, freqs_cis, mask)
-    return (h + self.feed_forward(self.ffn_norm(h))).contiguous()
+    return (h + self.feed_forward(self.ffn_norm(h))).contiguous().contiguous_backward()
 # standard openai sampling
 def sample(logits: Tensor, temp: float, k: int, p: float, af: float, ap: float):
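
For context, a minimal standalone sketch (not part of this commit) of the pattern being applied: `.contiguous()` realizes the block output in the forward pass, and `.contiguous_backward()` inserts the same realization barrier into the autograd graph, so the gradient flowing back into each block is materialized as well. The toy tensors and shapes below are illustrative, not taken from llama.py.

```python
from tinygrad import Tensor

# hypothetical stand-in for a transformer block's output computation
x = Tensor.randn(4, 8, requires_grad=True)
w = Tensor.randn(8, 8, requires_grad=True)

# .contiguous() forces the forward result to be realized as its own buffer;
# .contiguous_backward() does the same for the incoming gradient in backward.
y = x.matmul(w).relu().contiguous().contiguous_backward()

y.sum().backward()
print(x.grad.shape)  # (4, 8)
```

Without the backward barrier, the gradient of a block's output can stay fused into downstream kernels; pairing both calls keeps the forward and backward graphs split at the same per-block boundaries.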