Update configuration_llama_nsa.py
Browse files
configuration_llama_nsa.py
CHANGED
|
@@ -185,6 +185,7 @@ class LlamaNSAConfig(PretrainedConfig):
|
|
| 185 |
block_size=64,
|
| 186 |
block_counts=16,
|
| 187 |
window_size=512,
|
|
|
|
| 188 |
**kwargs,
|
| 189 |
):
|
| 190 |
self.vocab_size = vocab_size
|
|
@@ -214,6 +215,7 @@ class LlamaNSAConfig(PretrainedConfig):
|
|
| 214 |
self.block_size = block_size # debug
|
| 215 |
self.block_counts = block_counts
|
| 216 |
self.window_size = window_size
|
|
|
|
| 217 |
|
| 218 |
# Validate the correctness of rotary position embeddings parameters
|
| 219 |
# BC: if there is a 'type' field, copy it to 'rope_type'.
|
|
@@ -230,4 +232,4 @@ class LlamaNSAConfig(PretrainedConfig):
|
|
| 230 |
)
|
| 231 |
|
| 232 |
|
| 233 |
-
__all__ = ["LlamaNSAConfig"]
|
|
|
|
| 185 |
block_size=64,
|
| 186 |
block_counts=16,
|
| 187 |
window_size=512,
|
| 188 |
+
inference_mode="sparse",
|
| 189 |
**kwargs,
|
| 190 |
):
|
| 191 |
self.vocab_size = vocab_size
|
|
|
|
| 215 |
self.block_size = block_size # debug
|
| 216 |
self.block_counts = block_counts
|
| 217 |
self.window_size = window_size
|
| 218 |
+
self.inference_mode = inference_mode
|
| 219 |
|
| 220 |
# Validate the correctness of rotary position embeddings parameters
|
| 221 |
# BC: if there is a 'type' field, copy it to 'rope_type'.
|
|
|
|
| 232 |
)
|
| 233 |
|
| 234 |
|
| 235 |
+
__all__ = ["LlamaNSAConfig"]
|