Exquisique committed on
Commit
d16379a
·
1 Parent(s): 81beb99

Configure custom GPT for AutoModel loading

Browse files
Files changed (2) hide show
  1. __init__.py +10 -0
  2. config.json +7 -2
__init__.py ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ # __init__.py
2
+
3
+ from .model import GPTConfig, GPT
4
+
5
+ try:
6
+ from transformers import AutoConfig, AutoModel
7
+ AutoConfig.register("gpt", GPTConfig)
8
+ AutoModel.register(GPTConfig, GPT)
9
+ except ImportError:
10
+ pass
config.json CHANGED
@@ -6,7 +6,12 @@
6
  "n_layer": 6,
7
  "n_head": 6,
8
  "n_embd": 384,
 
 
9
  "auto_map": {
 
10
  "AutoModel": "model.GPT"
11
- }
12
- }
 
 
 
6
  "n_layer": 6,
7
  "n_head": 6,
8
  "n_embd": 384,
9
+ "dropout": 0.0,
10
+ "bias": true,
11
  "auto_map": {
12
+ "AutoConfig": "model.GPTConfig",
13
  "AutoModel": "model.GPT"
14
+ },
15
+ "torch_dtype": "float32",
16
+ "transformers_version": "4.42.0"
17
+ }