Skip to content

Commit afad283

Browse files
committed
Remove transpose as not required in candle
1 parent 6d88ba7 commit afad283

File tree

1 file changed

+0
-5
lines changed

1 file changed

+0
-5
lines changed

backends/candle/src/models/flash_qwen3.rs

Lines changed: 0 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -146,11 +146,6 @@ impl Qwen3Attention {
  let (q, _res) = self.q_norm.forward(&q, None)?;
  let (k, _res) = self.k_norm.forward(&k, None)?;

- // Transpose to [batch, heads, seq_len, head_dim]
- let q = q.transpose(1, 2)?;
- let k = k.transpose(1, 2)?;
- let v = v.transpose(1, 2)?;
-
  apply_rotary_inplace(&q, &k, &cos, &sin, true)?;

  let attention = flash_attn_varlen(

0 commit comments

Comments
 (0)