cammy committed on
Commit
c9402a6
1 Parent(s): c41b2b6

Training in progress, epoch 1

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "allenai/led-large-16384-arxiv",
3
+ "_num_labels": 3,
4
+ "activation_dropout": 0.0,
5
+ "activation_function": "gelu",
6
+ "architectures": [
7
+ "LEDForConditionalGeneration"
8
+ ],
9
+ "attention_dropout": 0.0,
10
+ "attention_window": [
11
+ 1024,
12
+ 1024,
13
+ 1024,
14
+ 1024,
15
+ 1024,
16
+ 1024,
17
+ 1024,
18
+ 1024,
19
+ 1024,
20
+ 1024,
21
+ 1024,
22
+ 1024
23
+ ],
24
+ "bos_token_id": 0,
25
+ "classif_dropout": 0.0,
26
+ "classifier_dropout": 0.0,
27
+ "d_model": 1024,
28
+ "decoder_attention_heads": 16,
29
+ "decoder_ffn_dim": 4096,
30
+ "decoder_layerdrop": 0.0,
31
+ "decoder_layers": 12,
32
+ "decoder_start_token_id": 2,
33
+ "dropout": 0.1,
34
+ "encoder_attention_heads": 16,
35
+ "encoder_ffn_dim": 4096,
36
+ "encoder_layerdrop": 0.0,
37
+ "encoder_layers": 12,
38
+ "eos_token_id": 2,
39
+ "gradient_checkpointing": false,
40
+ "id2label": {
41
+ "0": "LABEL_0",
42
+ "1": "LABEL_1",
43
+ "2": "LABEL_2"
44
+ },
45
+ "init_std": 0.02,
46
+ "is_encoder_decoder": true,
47
+ "label2id": {
48
+ "LABEL_0": 0,
49
+ "LABEL_1": 1,
50
+ "LABEL_2": 2
51
+ },
52
+ "max_decoder_position_embeddings": 1024,
53
+ "max_encoder_position_embeddings": 16384,
54
+ "max_length": 512,
55
+ "max_position_embeddings": 1024,
56
+ "model_type": "led",
57
+ "num_beams": 4,
58
+ "num_hidden_layers": 12,
59
+ "output_past": false,
60
+ "pad_token_id": 1,
61
+ "prefix": " ",
62
+ "torch_dtype": "float32",
63
+ "transformers_version": "4.16.2",
64
+ "use_cache": true,
65
+ "vocab_size": 50265
66
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:934705092c3f5bbf6b02e141e45ad78ca06eb9d2cbebb31657927587d4e64a1c
3
+ size 1839628337
runs/Mar17_17-58-32_DESKTOP-AUUC0F6/1647511128.4571788/events.out.tfevents.1647511128.DESKTOP-AUUC0F6.13576.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb2bfaf3110c20830769b85f82b4cd2bb4d87df85a040fa4503e547f380657e3
3
+ size 5069
runs/Mar17_17-58-32_DESKTOP-AUUC0F6/events.out.tfevents.1647511128.DESKTOP-AUUC0F6.13576.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f9acc9ede124a338c6f6670d30b35d6c28d5f82b6b89bbf92827255ef0b6e99
3
+ size 4749
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "eos_token": {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "unk_token": {"content": "<unk>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "sep_token": {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "pad_token": {"content": "<pad>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "cls_token": {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true}}
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": {"content": "<unk>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "bos_token": {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "eos_token": {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "add_prefix_space": false, "errors": "replace", "sep_token": {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "cls_token": {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "pad_token": {"content": "<pad>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "trim_offsets": true, "model_max_length": 16384, "special_tokens_map_file": "C:\\Users\\User/.cache\\huggingface\\transformers\\644496eac19670e4eae039a730bc2e3b219ecc44fcb1eb6827fe78d6590ee9bc.cb2244924ab24d706b02fd7fcedaea4531566537687a539ebb94db511fd122a0", "name_or_path": "allenai/led-large-16384-arxiv", "tokenizer_class": "LEDTokenizer"}
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b931a4eaaba30ec5a2ce2629e90951f1927e2d18690fefa7ebc0f984baf871c
3
+ size 3183
vocab.json ADDED
The diff for this file is too large to render. See raw diff