1 parent a5907fa · commit 2669a5c
backends/candle/src/models/flash_qwen3.rs
@@ -38,7 +38,7 @@ impl Qwen3Attention {
        let hidden_size = config.hidden_size;

        let query_weight = vb.pp("q_proj").get(
-            (num_attention_heads * attention_head_size, hidden_size),
+            (hidden_size, num_attention_heads * attention_head_size),
            "weight",
        )?;
        let query_bias = if config.attention_bias {
@@ -77,7 +77,7 @@ impl Qwen3Attention {
        let v_proj = Linear::new(value_weight, value_bias, None);

        let o_proj_weight = vb.pp("o_proj").get(
-            (num_attention_heads * attention_head_size, hidden_size),
+            (hidden_size, num_attention_heads * attention_head_size),
            "weight",
        )?;
        let o_proj = Linear::new(o_proj_weight, None, None);
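For context on why the order of the two dimensions matters: candle's `VarBuilder::get` checks the requested shape against the tensor actually stored in the checkpoint, and in Qwen3 the head dimension is configured independently of `hidden_size`, so `num_attention_heads * attention_head_size` and `hidden_size` are generally different numbers and a swapped tuple simply fails to load. The sketch below is not from this repository; it uses an in-memory `VarBuilder` and made-up dimensions purely to show the shape check.

```rust
// Standalone sketch, NOT part of this repository: it only illustrates the
// shape check that VarBuilder::get performs. The checkpoint layout is made up.
use std::collections::HashMap;

use candle_core::{DType, Device, Result, Tensor};
use candle_nn::VarBuilder;

fn main() -> Result<()> {
    let device = Device::Cpu;

    // Hypothetical Qwen3-style dimensions: head_dim comes from the config, and
    // num_attention_heads * head_dim does not have to equal hidden_size.
    let hidden_size = 1024usize;
    let num_attention_heads = 16usize;
    let attention_head_size = 128usize; // 16 * 128 = 2048 != 1024

    // Assume, for the sake of the example, that the checkpoint stores
    // q_proj.weight as (hidden_size, num_attention_heads * attention_head_size),
    // matching the "+" side of the diff above.
    let stored = Tensor::zeros(
        (hidden_size, num_attention_heads * attention_head_size),
        DType::F32,
        &device,
    )?;
    let mut tensors = HashMap::new();
    tensors.insert("q_proj.weight".to_string(), stored);
    let vb = VarBuilder::from_tensors(tensors, DType::F32, &device);

    // Requesting the shape the checkpoint actually uses succeeds.
    let ok = vb
        .pp("q_proj")
        .get((hidden_size, num_attention_heads * attention_head_size), "weight")?;
    println!("loaded q_proj.weight with dims {:?}", ok.dims());

    // Requesting the swapped shape fails, because the two dimensions differ.
    let swapped = vb
        .pp("q_proj")
        .get((num_attention_heads * attention_head_size, hidden_size), "weight");
    println!("swapped shape -> {:?}", swapped.err());

    Ok(())
}
```

Passing an explicit shape to `get` is what turns a transposed or mislabeled checkpoint tensor into an immediate load-time error instead of a silent dimension mismatch in a later matmul.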