Merge branch 'main' of https://huggingface.co/normalcomputing/extended-mind-mpt-7b into main
Browse files
- blocks.py +1 -1
- config.json +2 -2
- modeling_mpt.py +4 -4
blocks.py
CHANGED
|
@@ -7,7 +7,7 @@
|
|
| 7 |
from typing import Dict, Optional, Tuple
|
| 8 |
import torch
|
| 9 |
import torch.nn as nn
|
| 10 |
-
from
|
| 11 |
from llmfoundry.models.layers.norm import NORM_CLASS_REGISTRY
|
| 12 |
|
| 13 |
class MPTMLP(nn.Module):
|
|
|
|
| 7 |
from typing import Dict, Optional, Tuple
|
| 8 |
import torch
|
| 9 |
import torch.nn as nn
|
| 10 |
+
from attention import ATTN_CLASS_REGISTRY
|
| 11 |
from llmfoundry.models.layers.norm import NORM_CLASS_REGISTRY
|
| 12 |
|
| 13 |
class MPTMLP(nn.Module):
|
config.json
CHANGED
|
@@ -21,8 +21,8 @@
|
|
| 21 |
"use_active_externalism": true
|
| 22 |
},
|
| 23 |
"auto_map": {
|
| 24 |
-
"AutoConfig": "
|
| 25 |
-
"AutoModelForCausalLM": "
|
| 26 |
},
|
| 27 |
"d_model": 4096,
|
| 28 |
"emb_pdrop": 0,
|
|
|
|
| 21 |
"use_active_externalism": true
|
| 22 |
},
|
| 23 |
"auto_map": {
|
| 24 |
+
"AutoConfig": "configuration.ExtendedMPTConfig",
|
| 25 |
+
"AutoModelForCausalLM": "modeling_mpt.ExtendedMPTForCausalLM"
|
| 26 |
},
|
| 27 |
"d_model": 4096,
|
| 28 |
"emb_pdrop": 0,
|
modeling_mpt.py
CHANGED
|
@@ -27,10 +27,10 @@ from llmfoundry.models.layers.custom_embedding import SharedEmbedding
|
|
| 27 |
from llmfoundry.models.layers.norm import NORM_CLASS_REGISTRY
|
| 28 |
from llmfoundry.models.utils.param_init_fns import MODEL_INIT_REGISTRY
|
| 29 |
|
| 30 |
-
from
|
| 31 |
-
from
|
| 32 |
-
from
|
| 33 |
-
from
|
| 34 |
|
| 35 |
Tokenizer = Union[PreTrainedTokenizer, PreTrainedTokenizerFast]
|
| 36 |
|
|
|
|
| 27 |
from llmfoundry.models.layers.norm import NORM_CLASS_REGISTRY
|
| 28 |
from llmfoundry.models.utils.param_init_fns import MODEL_INIT_REGISTRY
|
| 29 |
|
| 30 |
+
from configuration import ExtendedMPTConfig
|
| 31 |
+
from attention import attn_bias_shape, build_attn_bias
|
| 32 |
+
from blocks import MPTBlock
|
| 33 |
+
from utils import instantiate_from_config
|
| 34 |
|
| 35 |
Tokenizer = Union[PreTrainedTokenizer, PreTrainedTokenizerFast]
|
| 36 |
|