From 0a23ae08f78a7531f11a8385710248bba8639427 Mon Sep 17 00:00:00 2001 From: NanoCode012 Date: Fri, 6 Mar 2026 23:44:00 +0700 Subject: [PATCH] fix: position_ids cast to int64 for qwen35 patch (#3468) [skip ci] * fix: position_ids cast to int64 for qwen35 patch * fix: use view instead of reshape so non-contiguous input raises an explicit error * chore: lint --- src/axolotl/monkeypatch/models/qwen3_5/modeling.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/src/axolotl/monkeypatch/models/qwen3_5/modeling.py b/src/axolotl/monkeypatch/models/qwen3_5/modeling.py index f88f60555..0b3302d82 100644 --- a/src/axolotl/monkeypatch/models/qwen3_5/modeling.py +++ b/src/axolotl/monkeypatch/models/qwen3_5/modeling.py @@ -35,9 +35,9 @@ def get_cu_seqlens(position_ids): if position_ids.ndim == 3: position_ids = position_ids[0] - tensor_kwargs = {"dtype": torch.long, "device": position_ids.device} - position_ids = position_ids.reshape(-1) - indices_q = (position_ids == 0).nonzero().reshape(-1) + tensor_kwargs = {"dtype": torch.int32, "device": position_ids.device} + position_ids = position_ids.view(-1) + indices_q = (position_ids == 0).nonzero().view(-1) return torch.cat( ( indices_q.to(**tensor_kwargs),