Fix draft rotary embedding when given 2D position ids (expand them to shape (3, ...))

dcw02 · dcw02 · commit 81966baf2496 · 2025-10-13T04:11:03.000-04:00
diff --git a/specforge/modeling/draft/llama3_eagle.py b/specforge/modeling/draft/llama3_eagle.py
@@ -317,7 +317,9 @@ def _apply_interleaved_mrope(self, freqs: torch.Tensor) -> torch.Tensor:
 
     def forward(self, x, position_ids):
         # In contrast to other models, Qwen-VL variants have different position ids for the grids
-        # So we expand the inv_freq to shape (3, ...)
+        # So we expand the position ids/inv_freq to shape (3, ...)
+        if position_ids.ndim == 2:
+            position_ids = position_ids[None, ...].expand(3, -1, -1)
         inv_freq_expanded = (
             self.inv_freq[None, None, :, None]
             .float()