Update configuration_neollm.py
Browse files- configuration_neollm.py +1 -1
configuration_neollm.py
CHANGED
|
@@ -598,7 +598,7 @@ class NeoLLMConfig(PretrainedConfig):
|
|
| 598 |
use_laurel_lr=False,
|
| 599 |
laurel_lr_rank=32,
|
| 600 |
# ── Interleaved Head Attention (Duvvuri et al., 2026) ─────────────
|
| 601 |
-
use_iha=
|
| 602 |
iha_num_pseudo_heads=2, # P=2 → 2×2=4 patrones por head
|
| 603 |
iha_local_global_pattern="LLLLG", # 4 locales + 1 global (paper §5.1)
|
| 604 |
iha_sliding_window=None, # auto = N // (2*P^2) usando la longitud real del batch
|
|
|
|
| 598 |
use_laurel_lr=False,
|
| 599 |
laurel_lr_rank=32,
|
| 600 |
# ── Interleaved Head Attention (Duvvuri et al., 2026) ─────────────
|
| 601 |
+
use_iha=True,
|
| 602 |
iha_num_pseudo_heads=2, # P=2 → 2×2=4 patrones por head
|
| 603 |
iha_local_global_pattern="LLLLG", # 4 locales + 1 global (paper §5.1)
|
| 604 |
iha_sliding_window=None, # auto = N // (2*P^2) usando la longitud real del batch
|