Joshua Oehms committed on
Commit
658a0b3
·
1 Parent(s): f958d61

Cross-attention tied to dbmdz/bert-base-german-cased

Browse files
Files changed (2) hide show
  1. config.json +3 -1
  2. pytorch_model.bin +2 -2
config.json CHANGED
@@ -1,6 +1,7 @@
1
  {
2
- "_name_or_path": "dbmdz/german-gpt2",
3
  "activation_function": "gelu_new",
 
4
  "architectures": [
5
  "GPT2LMHeadModel"
6
  ],
@@ -10,6 +11,7 @@
10
  "eos_token_id": 1,
11
  "gradient_checkpointing": false,
12
  "initializer_range": 0.02,
 
13
  "layer_norm_epsilon": 1e-05,
14
  "model_type": "gpt2",
15
  "n_ctx": 1024,
 
1
  {
2
+ "_name_or_path": "josh-oo/german-gpt2-easy",
3
  "activation_function": "gelu_new",
4
+ "add_cross_attention": true,
5
  "architectures": [
6
  "GPT2LMHeadModel"
7
  ],
 
11
  "eos_token_id": 1,
12
  "gradient_checkpointing": false,
13
  "initializer_range": 0.02,
14
+ "is_decoder": true,
15
  "layer_norm_epsilon": 1e-05,
16
  "model_type": "gpt2",
17
  "n_ctx": 1024,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd0841fa8bdd2afb18a1b73972a84da2caaf09e56e007a8253d407f78d12b2cb
3
- size 510421097
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebc33e88b9e55cc9f0686af4790da8c8cfa5f041aef3a45e868dbbb4cf81fe46
3
+ size 636511097