adityaprakhar committed on
Commit
6cdfbc4
·
verified ·
1 Parent(s): 90fc7d5

Training in progress, step 500

Browse files
config.json CHANGED
@@ -1,65 +1,62 @@
1
  {
2
- "_name_or_path": "adityaprakhar/LayoutLMv1_March_14_2024_100_epochs",
3
  "architectures": [
4
  "LayoutLMForTokenClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
- "bos_token_id": 0,
8
- "eos_token_id": 2,
9
- "gradient_checkpointing": false,
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
13
  "id2label": {
14
- "0": "attorneys for plaintiff",
15
- "1": "attorney for defendant/cross-complainant/cross-defendant",
16
- "2": "address",
17
- "3": "lawfirm",
18
- "4": "other",
19
- "5": "attorneys for co-counsel",
20
- "6": "email",
21
- "7": "co-counsel for plaintiff",
22
- "8": "attorney_name",
23
- "9": "attorneys for defendant",
24
- "10": "parties",
25
- "11": "SBN",
26
- "12": "attorneys for co-defendant",
27
- "13": "fax",
28
- "14": "telephone",
29
- "15": "counsel for plaintiff"
30
  },
31
  "initializer_range": 0.02,
32
  "intermediate_size": 3072,
33
  "label2id": {
34
- "SBN": 11,
35
- "address": 2,
36
- "attorney for defendant/cross-complainant/cross-defendant": 1,
37
- "attorney_name": 8,
38
- "attorneys for co-counsel": 5,
39
- "attorneys for co-defendant": 12,
40
- "attorneys for defendant": 9,
41
- "attorneys for plaintiff": 0,
42
- "co-counsel for plaintiff": 7,
43
- "counsel for plaintiff": 15,
44
- "email": 6,
45
- "fax": 13,
46
- "lawfirm": 3,
47
- "other": 4,
48
- "parties": 10,
49
- "telephone": 14
50
  },
51
- "layer_norm_eps": 1e-05,
52
  "max_2d_position_embeddings": 1024,
53
- "max_position_embeddings": 514,
54
  "model_type": "layoutlm",
55
  "num_attention_heads": 12,
56
  "num_hidden_layers": 12,
57
- "pad_token_id": 1,
 
58
  "position_embedding_type": "absolute",
59
- "tokenizer_class": "RobertaTokenizer",
60
  "torch_dtype": "float32",
61
  "transformers_version": "4.39.0.dev0",
62
- "type_vocab_size": 1,
63
  "use_cache": true,
64
- "vocab_size": 50265
65
  }
 
1
  {
2
+ "_name_or_path": "microsoft/layoutlm-base-uncased",
3
  "architectures": [
4
  "LayoutLMForTokenClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
 
 
 
7
  "hidden_act": "gelu",
8
  "hidden_dropout_prob": 0.1,
9
  "hidden_size": 768,
10
  "id2label": {
11
+ "0": "SBN",
12
+ "1": "address",
13
+ "2": "attorney for defendant/cross-complainant/cross-defendant",
14
+ "3": "attorney_name",
15
+ "4": "attorneys for co-counsel",
16
+ "5": "attorneys for co-defendant",
17
+ "6": "attorneys for defendant",
18
+ "7": "attorneys for plaintiff",
19
+ "8": "co-counsel for plaintiff",
20
+ "9": "counsel for plaintiff",
21
+ "10": "email",
22
+ "11": "fax",
23
+ "12": "lawfirm",
24
+ "13": "other",
25
+ "14": "parties",
26
+ "15": "telephone"
27
  },
28
  "initializer_range": 0.02,
29
  "intermediate_size": 3072,
30
  "label2id": {
31
+ "SBN": 0,
32
+ "address": 1,
33
+ "attorney for defendant/cross-complainant/cross-defendant": 2,
34
+ "attorney_name": 3,
35
+ "attorneys for co-counsel": 4,
36
+ "attorneys for co-defendant": 5,
37
+ "attorneys for defendant": 6,
38
+ "attorneys for plaintiff": 7,
39
+ "co-counsel for plaintiff": 8,
40
+ "counsel for plaintiff": 9,
41
+ "email": 10,
42
+ "fax": 11,
43
+ "lawfirm": 12,
44
+ "other": 13,
45
+ "parties": 14,
46
+ "telephone": 15
47
  },
48
+ "layer_norm_eps": 1e-12,
49
  "max_2d_position_embeddings": 1024,
50
+ "max_position_embeddings": 512,
51
  "model_type": "layoutlm",
52
  "num_attention_heads": 12,
53
  "num_hidden_layers": 12,
54
+ "output_past": true,
55
+ "pad_token_id": 0,
56
  "position_embedding_type": "absolute",
 
57
  "torch_dtype": "float32",
58
  "transformers_version": "4.39.0.dev0",
59
+ "type_vocab_size": 2,
60
  "use_cache": true,
61
+ "vocab_size": 30522
62
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91019c590ba6cb1518b07c03f72aec4f36ee40239af96131ce5d56c863d4707a
3
- size 511239464
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:426fc30233f066b24d33b2e9adf413c8770fc760809ea35966db48342c635937
3
+ size 450585896
runs/Mar15_04-26-50_a738b175db70/events.out.tfevents.1710476811.a738b175db70.640.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e5ed67762e431abb611dda872a625fb056850eb4b1e025138fc17b44f9c2b94
3
+ size 5438
runs/Mar15_05-09-02_a738b175db70/events.out.tfevents.1710479343.a738b175db70.640.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff7f450e63603ac879a110de4ec8367d4ada2dbc378d97ee6e1812879ae81380
3
+ size 7753
runs/Mar15_05-10-27_a738b175db70/events.out.tfevents.1710479428.a738b175db70.640.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b4481c538f8961ecd94a95a3508ef7062e2d5d4eddddfe3a0b5f35d2dc5e956
3
+ size 5527
runs/Mar15_05-10-40_a738b175db70/events.out.tfevents.1710479441.a738b175db70.640.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d81617d57f543437ffa8a2dfd284f30c08527d65800460b517ebd2b071e39fd
3
+ size 8090
tokenizer.json CHANGED
@@ -6,16 +6,7 @@
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
- "padding": {
10
- "strategy": {
11
- "Fixed": 512
12
- },
13
- "direction": "Right",
14
- "pad_to_multiple_of": null,
15
- "pad_id": 0,
16
- "pad_type_id": 0,
17
- "pad_token": "[PAD]"
18
- },
19
  "added_tokens": [
20
  {
21
  "id": 0,
 
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
+ "padding": null,
 
 
 
 
 
 
 
 
 
10
  "added_tokens": [
11
  {
12
  "id": 0,
tokenizer_config.json CHANGED
@@ -41,40 +41,16 @@
41
  "special": true
42
  }
43
  },
44
- "additional_special_tokens": [],
45
- "apply_ocr": false,
46
  "clean_up_tokenization_spaces": true,
47
  "cls_token": "[CLS]",
48
- "cls_token_box": [
49
- 0,
50
- 0,
51
- 0,
52
- 0
53
- ],
54
- "do_basic_tokenize": true,
55
  "do_lower_case": true,
56
  "mask_token": "[MASK]",
 
57
  "model_max_length": 512,
58
- "never_split": null,
59
- "only_label_first_subword": true,
60
  "pad_token": "[PAD]",
61
- "pad_token_box": [
62
- 0,
63
- 0,
64
- 0,
65
- 0
66
- ],
67
- "pad_token_label": -100,
68
- "processor_class": "LayoutLMv2Processor",
69
  "sep_token": "[SEP]",
70
- "sep_token_box": [
71
- 1000,
72
- 1000,
73
- 1000,
74
- 1000
75
- ],
76
  "strip_accents": null,
77
  "tokenize_chinese_chars": true,
78
- "tokenizer_class": "LayoutLMv2Tokenizer",
79
  "unk_token": "[UNK]"
80
  }
 
41
  "special": true
42
  }
43
  },
 
 
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
 
 
 
 
 
 
 
46
  "do_lower_case": true,
47
  "mask_token": "[MASK]",
48
+ "max_len": 512,
49
  "model_max_length": 512,
 
 
50
  "pad_token": "[PAD]",
 
 
 
 
 
 
 
 
51
  "sep_token": "[SEP]",
 
 
 
 
 
 
52
  "strip_accents": null,
53
  "tokenize_chinese_chars": true,
54
+ "tokenizer_class": "LayoutLMTokenizer",
55
  "unk_token": "[UNK]"
56
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb267664c88410ec285ff352a2025bf27e5098514fbd76dbac42ab7887fb7630
3
  size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43c4e79aadf045e89982d6e95ea6046773154367159de0bae998da2375bfed0a
3
  size 4856