Update modeling_i3.py
Browse files
- modeling_i3.py +3 -3
modeling_i3.py
CHANGED
|
@@ -1,13 +1,13 @@
|
|
| 1 |
import torch
|
| 2 |
from torch import nn
|
| 3 |
from transformers import PreTrainedModel, PretrainedConfig
|
| 4 |
-
from i3_modules import i3Model # import your original i3Model
|
| 5 |
|
| 6 |
class i3Config(PretrainedConfig):
|
| 7 |
model_type = "i3"
|
| 8 |
|
| 9 |
-
def __init__(self, vocab_size=
|
| 10 |
-
max_seq_len=
|
| 11 |
super().__init__(**kwargs)
|
| 12 |
self.vocab_size = vocab_size
|
| 13 |
self.d_model = d_model
|
|
|
|
| 1 |
import torch
|
| 2 |
from torch import nn
|
| 3 |
from transformers import PreTrainedModel, PretrainedConfig
|
| 4 |
+
from i3_modules import i3Model # import your original i3Model class
|
| 5 |
|
| 6 |
class i3Config(PretrainedConfig):
|
| 7 |
model_type = "i3"
|
| 8 |
|
| 9 |
+
def __init__(self, vocab_size=34, d_model=256, n_layers=6, n_heads=8,
|
| 10 |
+
max_seq_len=128, rank=8, d_state=16, **kwargs):
|
| 11 |
super().__init__(**kwargs)
|
| 12 |
self.vocab_size = vocab_size
|
| 13 |
self.d_model = d_model
|