We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
o_proj
1 parent 106fd19, commit 6d88ba7 (Copy full SHA for 6d88ba7)
backends/candle/src/models/flash_qwen3.rs
@@ -77,7 +77,7 @@ impl Qwen3Attention {
77
let v_proj = Linear::new(value_weight, value_bias, None);
78
79
let o_proj_weight = vb.pp("o_proj").get(
80
- (num_attention_heads * attention_head_size, hidden_size),
+ (hidden_size, num_attention_heads * attention_head_size),
81
"weight",
82
)?;
83
let o_proj = Linear::new(o_proj_weight, None, None);
0 commit comments