Update configuration_i3.py
Browse files
- configuration_i3.py +3 -12
configuration_i3.py
CHANGED
|
@@ -1,19 +1,10 @@
|
|
| 1 |
-
from transformers
|
| 2 |
|
| 3 |
class I3Config(PretrainedConfig):
|
| 4 |
model_type = "i3"
|
| 5 |
|
| 6 |
-
def __init__(
|
| 7 |
-
|
| 8 |
-
vocab_size=50000,
|
| 9 |
-
d_model=512,
|
| 10 |
-
n_layers=12,
|
| 11 |
-
n_heads=8,
|
| 12 |
-
max_seq_len=256,
|
| 13 |
-
rank=64,
|
| 14 |
-
d_state=32,
|
| 15 |
-
**kwargs,
|
| 16 |
-
):
|
| 17 |
super().__init__(**kwargs)
|
| 18 |
self.vocab_size = vocab_size
|
| 19 |
self.d_model = d_model
|
|
|
|
| 1 |
+
from transformers import PretrainedConfig
|
| 2 |
|
| 3 |
class I3Config(PretrainedConfig):
|
| 4 |
model_type = "i3"
|
| 5 |
|
| 6 |
+
def __init__(self, vocab_size=4466, d_model=512, n_layers=12, n_heads=16,
|
| 7 |
+
max_seq_len=256, rank=128, d_state=64, **kwargs):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8 |
super().__init__(**kwargs)
|
| 9 |
self.vocab_size = vocab_size
|
| 10 |
self.d_model = d_model
|