Commit
·
d16379a
1
Parent(s):
81beb99
Configure custom GPT for AutoModel loading
Browse files
- __init__.py +10 -0
- config.json +7 -2
__init__.py
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
"""Package initializer for the custom GPT model.

Pulls ``GPT`` and ``GPTConfig`` from ``.model`` into the package namespace
and, if ``transformers`` is importable, registers them with ``AutoConfig``
and ``AutoModel`` under the model type ``"gpt"``.
"""

from .model import GPT, GPTConfig

try:
    from transformers import AutoConfig, AutoModel

    # Both registrations deliberately live inside the ``try`` so that an
    # ImportError raised while registering is ignored the same way as a
    # failed ``transformers`` import.
    AutoConfig.register(model_type="gpt", config=GPTConfig)
    AutoModel.register(config_class=GPTConfig, model_class=GPT)
except ImportError:
    # Best-effort hook: skip Auto* registration when the import fails.
    # NOTE(review): presumably transformers is an optional dependency here;
    # confirm before making this failure louder.
    pass
|
config.json
CHANGED
@@ -6,7 +6,12 @@
|
|
6 |
"n_layer": 6,
|
7 |
"n_head": 6,
|
8 |
"n_embd": 384,
|
|
|
|
|
9 |
"auto_map": {
|
|
|
10 |
"AutoModel": "model.GPT"
|
11 |
-
}
|
12 |
-
|
|
|
|
|
|
6 |
"n_layer": 6,
|
7 |
"n_head": 6,
|
8 |
"n_embd": 384,
|
9 |
+
"dropout": 0.0,
|
10 |
+
"bias": true,
|
11 |
"auto_map": {
|
12 |
+
"AutoConfig": "model.GPTConfig",
|
13 |
"AutoModel": "model.GPT"
|
14 |
+
},
|
15 |
+
"torch_dtype": "float32",
|
16 |
+
"transformers_version": "4.42.0"
|
17 |
+
}
|