Upload folder using huggingface_hub
Browse files
- modeling_qwen3.py +1 -1
modeling_qwen3.py
CHANGED
|
@@ -694,7 +694,7 @@ class Qwen3SummaryAttention(Qwen3Attention):
|
|
| 694 |
else:
|
| 695 |
self._sliding_chunk_num = int(val)
|
| 696 |
|
| 697 |
-
if config.summary_independent_parameters:
|
| 698 |
self.q_proj_summary = nn.Linear(
|
| 699 |
config.hidden_size, config.num_attention_heads * self.head_dim, bias=config.attention_bias
|
| 700 |
)
|
|
|
|
| 694 |
else:
|
| 695 |
self._sliding_chunk_num = int(val)
|
| 696 |
|
| 697 |
+
if config.summary_independent_parameters and config.mix_coeff > 0:
|
| 698 |
self.q_proj_summary = nn.Linear(
|
| 699 |
config.hidden_size, config.num_attention_heads * self.head_dim, bias=config.attention_bias
|
| 700 |
)
|