add contiguous in BertIntermediate (#13713)

faster step with a lot less recomputation
Author:    chenyu
Committer: GitHub
Date:      2025-12-15 22:37:36 -05:00
Parent:    7589c897b2
Commit:    041e9a41c9


@@ -242,7 +242,8 @@ class BertIntermediate:
   def __call__(self, hidden_states):
     x = self.dense(hidden_states)
     # tinygrad gelu is openai gelu but we need the original bert gelu
-    return gelu(x)
+    # NOTE: contiguous for speed
+    return gelu(x).contiguous()
 
 class BertAttention:
   def __init__(self, hidden_size, num_attention_heads, attention_probs_dropout_prob, hidden_dropout_prob):
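
For context, here is a minimal runnable sketch of the pattern this commit applies. It assumes tinygrad's public API (Tensor.erf, Tensor.contiguous, nn.Linear); the constructor, the layer sizes, and the erf-based gelu are illustrative assumptions rather than verbatim repo code, and only __call__ mirrors the diff above.

import math
from tinygrad import Tensor, nn

def gelu(x: Tensor) -> Tensor:
  # erf-based "original" BERT gelu; tinygrad's built-in Tensor.gelu is the
  # tanh approximation, which is why the model defines its own (assumed form)
  return x * 0.5 * (1.0 + (x / math.sqrt(2.0)).erf())

class BertIntermediate:
  def __init__(self, hidden_size: int, intermediate_size: int):
    # hypothetical wiring: sizes and nn.Linear setup are assumptions here
    self.dense = nn.Linear(hidden_size, intermediate_size)

  def __call__(self, hidden_states: Tensor) -> Tensor:
    x = self.dense(hidden_states)
    # .contiguous() realizes the gelu output into its own buffer once; left
    # lazy, the gelu expression can be fused into (and so recomputed by)
    # every downstream kernel that reads this activation
    return gelu(x).contiguous()

if __name__ == "__main__":
  layer = BertIntermediate(hidden_size=768, intermediate_size=3072)
  out = layer(Tensor.randn(2, 128, 768))
  print(out.shape)  # (2, 128, 3072)

The tradeoff behind the change: contiguous() spends one buffer of memory on the realized activation, but without it tinygrad's lazy scheduler is free to inline the gelu expression into each consumer (the forward use and the backward pass), recomputing it per kernel. That repeated work is the recomputation the commit message refers to, and materializing the activation once is what makes the step faster.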