pierreguillou committed
Commit • 541b089
1 Parent(s): c3d2988

Training in progress, step 400
Browse files
- .gitattributes +0 -1
- {checkpoint-100 → checkpoint-200}/config.json +0 -0
- {checkpoint-100 → checkpoint-200}/optimizer.pt +1 -1
- {checkpoint-100 → checkpoint-200}/pytorch_model.bin +1 -1
- {checkpoint-100 → checkpoint-200}/rng_state.pth +1 -1
- {checkpoint-100 → checkpoint-200}/scaler.pt +1 -1
- {checkpoint-100 → checkpoint-200}/scheduler.pt +1 -1
- {checkpoint-100 → checkpoint-200}/special_tokens_map.json +0 -0
- {checkpoint-100 → checkpoint-200}/tokenizer.json +0 -0
- {checkpoint-100 → checkpoint-200}/tokenizer_config.json +0 -0
- {checkpoint-100 → checkpoint-200}/trainer_state.json +17 -5
- {checkpoint-100 → checkpoint-200}/training_args.bin +0 -0
- checkpoint-300/config.json +56 -0
- checkpoint-300/optimizer.pt +3 -0
- checkpoint-300/pytorch_model.bin +3 -0
- checkpoint-300/rng_state.pth +3 -0
- checkpoint-300/scaler.pt +3 -0
- checkpoint-300/scheduler.pt +3 -0
- checkpoint-300/special_tokens_map.json +15 -0
- checkpoint-300/tokenizer.json +3 -0
- checkpoint-300/tokenizer_config.json +20 -0
- checkpoint-300/trainer_state.json +52 -0
- checkpoint-300/training_args.bin +3 -0
- checkpoint-400/config.json +56 -0
- checkpoint-400/optimizer.pt +3 -0
- checkpoint-400/pytorch_model.bin +3 -0
- checkpoint-400/rng_state.pth +3 -0
- checkpoint-400/scaler.pt +3 -0
- checkpoint-400/scheduler.pt +3 -0
- checkpoint-400/special_tokens_map.json +15 -0
- checkpoint-400/tokenizer.json +3 -0
- checkpoint-400/tokenizer_config.json +20 -0
- checkpoint-400/trainer_state.json +64 -0
- checkpoint-400/training_args.bin +3 -0
- pytorch_model.bin +1 -1
- runs/Feb15_07-53-26_e220f522c880/events.out.tfevents.1676447621.e220f522c880.495.0 +2 -2
.gitattributes
CHANGED
@@ -32,5 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
-checkpoint-100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 tokenizer.json filter=lfs diff=lfs merge=lfs -text
{checkpoint-100 → checkpoint-200}/config.json
RENAMED
File without changes
{checkpoint-100 → checkpoint-200}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:c7cdf79d3146238ae659f3724cb61a9f3eef1d94bdc25b29615f00c8f24590c2
 size 2265827717
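The large checkpoint files above are stored as Git LFS pointers: a version line, the SHA-256 of the real payload (oid), and its size in bytes. As a minimal sketch (the local path is illustrative; the oid and size are the ones from the pointer above), a downloaded file can be checked against its pointer like this:

    import hashlib
    import os

    def sha256_of(path, chunk_size=1 << 20):
        # Stream the file so multi-GB checkpoints do not need to fit in memory.
        h = hashlib.sha256()
        with open(path, "rb") as f:
            for chunk in iter(lambda: f.read(chunk_size), b""):
                h.update(chunk)
        return h.hexdigest()

    path = "checkpoint-200/optimizer.pt"  # illustrative local path after download
    assert os.path.getsize(path) == 2265827717  # "size" field of the pointer
    assert sha256_of(path) == "c7cdf79d3146238ae659f3724cb61a9f3eef1d94bdc25b29615f00c8f24590c2"  # "oid" field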
{checkpoint-100 → checkpoint-200}/pytorch_model.bin
RENAMED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:d22e589804912ea5de135343295f3d1d679cdb01de0862367236991e3a9e8f5b
 size 1134425553

{checkpoint-100 → checkpoint-200}/rng_state.pth
RENAMED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:19a5fbfb1d8b3fb183af663f8903b6b2d98760688828d8a5abb54552e6de1d6f
 size 14575

{checkpoint-100 → checkpoint-200}/scaler.pt
RENAMED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:fc28ad4ba690d88b4a64a84b0eb679f0ae2052dd18f66a37a2ec7425463d2024
 size 557

{checkpoint-100 → checkpoint-200}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:f06cf77a584fcbc5eec1e5ddee45214561dae318ae26edcbcc04f742aac3e73b
 size 627
{checkpoint-100 → checkpoint-200}/special_tokens_map.json
RENAMED
File without changes
{checkpoint-100 → checkpoint-200}/tokenizer.json
RENAMED
File without changes
{checkpoint-100 → checkpoint-200}/tokenizer_config.json
RENAMED
File without changes
{checkpoint-100 → checkpoint-200}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
 {
-  "best_metric": 0.
-  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-
-  "epoch": 0.
-  "global_step":
+  "best_metric": 0.7551279108067913,
+  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-200",
+  "epoch": 0.10660980810234541,
+  "global_step": 200,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -18,11 +18,23 @@
       "eval_samples_per_second": 33.717,
       "eval_steps_per_second": 2.119,
       "step": 100
+    },
+    {
+      "epoch": 0.11,
+      "eval_accuracy": 0.7551279108067913,
+      "eval_f1": 0.7551279108067913,
+      "eval_loss": 0.7886354327201843,
+      "eval_precision": 0.7551279108067913,
+      "eval_recall": 0.7551279108067913,
+      "eval_runtime": 48.4163,
+      "eval_samples_per_second": 33.191,
+      "eval_steps_per_second": 2.086,
+      "step": 200
     }
   ],
   "max_steps": 1876,
   "num_train_epochs": 1,
-  "total_flos":
+  "total_flos": 445075582156800.0,
   "trial_name": null,
   "trial_params": null
 }
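trainer_state.json is where the Trainer records the running eval log and the current best checkpoint. A minimal sketch for inspecting it (the local path is illustrative, assuming the checkpoint folder has been downloaded):

    import json

    with open("checkpoint-200/trainer_state.json") as f:  # illustrative local path
        state = json.load(f)

    # Best metric so far and which checkpoint produced it.
    print(state["best_metric"], state["best_model_checkpoint"])

    # Per-step eval F1 from the log history.
    for entry in state["log_history"]:
        if "eval_f1" in entry:
            print(entry["step"], entry["eval_f1"])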
{checkpoint-100 → checkpoint-200}/training_args.bin
RENAMED
File without changes
checkpoint-300/config.json
ADDED
@@ -0,0 +1,56 @@
+{
+  "_name_or_path": "nielsr/lilt-xlm-roberta-base",
+  "architectures": [
+    "LiltForTokenClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "channel_shrink_ratio": 4,
+  "classifier_dropout": null,
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "Caption",
+    "1": "Footnote",
+    "2": "Formula",
+    "3": "List-item",
+    "4": "Page-footer",
+    "5": "Page-header",
+    "6": "Picture",
+    "7": "Section-header",
+    "8": "Table",
+    "9": "Text",
+    "10": "Title"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "Caption": 0,
+    "Footnote": 1,
+    "Formula": 2,
+    "List-item": 3,
+    "Page-footer": 4,
+    "Page-header": 5,
+    "Picture": 6,
+    "Section-header": 7,
+    "Table": 8,
+    "Text": 9,
+    "Title": 10
+  },
+  "layer_norm_eps": 1e-05,
+  "max_2d_position_embeddings": 1024,
+  "max_position_embeddings": 514,
+  "model_type": "lilt",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.26.1",
+  "type_vocab_size": 1,
+  "use_cache": true,
+  "vocab_size": 250002
+}
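This config describes a LiLT token-classification model ("model_type": "lilt") initialized from nielsr/lilt-xlm-roberta-base, with the 11 DocLayNet layout labels as the classification head. A minimal sketch of loading such an intermediate checkpoint for inspection or inference (the local path is illustrative):

    from transformers import AutoTokenizer, LiltForTokenClassification

    ckpt = "checkpoint-300"  # illustrative local path to this checkpoint folder
    tokenizer = AutoTokenizer.from_pretrained(ckpt)
    model = LiltForTokenClassification.from_pretrained(ckpt)

    print(model.config.id2label)  # {0: 'Caption', 1: 'Footnote', ..., 10: 'Title'}

Note that LiLT also expects normalized bounding boxes (the bbox argument) alongside input_ids at inference time, since the layout stream is what the DocLayNet fine-tuning is exploiting.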
checkpoint-300/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5b57c47892e2c979ead028ed133a8e6310573791bcb0ce4b62a32dc49850683e
+size 2265828101

checkpoint-300/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:880a92376813495eb9c614b219a5f3739441875a9dd423f5a5a4c0f194747462
+size 1134425553

checkpoint-300/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2edaa8158eaf8be7cc7f6c6471898dae049ef076acac0f3f1cc542415dc6dfca
+size 14575

checkpoint-300/scaler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:35d89833ad47769c3fd687316799e7acd03e729c4180e72e9a36d6ac51bf9656
+size 557

checkpoint-300/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:40904ad5451576d85b4d1b180d481a37f60db63c24eb116a2d70a90d013a25fd
+size 627
checkpoint-300/special_tokens_map.json
ADDED
@@ -0,0 +1,15 @@
+{
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": {
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "unk_token": "<unk>"
+}

checkpoint-300/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:62c24cdc13d4c9952d63718d6c9fa4c287974249e16b7ade6d5a85e7bbb75626
+size 17082660

checkpoint-300/tokenizer_config.json
ADDED
@@ -0,0 +1,20 @@
+{
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": {
+    "__type": "AddedToken",
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "model_max_length": 512,
+  "name_or_path": "nielsr/lilt-xlm-roberta-base",
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "special_tokens_map_file": null,
+  "tokenizer_class": "XLMRobertaTokenizer",
+  "unk_token": "<unk>"
+}
checkpoint-300/trainer_state.json
ADDED
@@ -0,0 +1,52 @@
+{
+  "best_metric": 0.8248275724395382,
+  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-300",
+  "epoch": 0.15991471215351813,
+  "global_step": 300,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.05,
+      "eval_accuracy": 0.6585185702735884,
+      "eval_f1": 0.6585185702735884,
+      "eval_loss": 0.9875321388244629,
+      "eval_precision": 0.6585185702735884,
+      "eval_recall": 0.6585185702735884,
+      "eval_runtime": 47.6616,
+      "eval_samples_per_second": 33.717,
+      "eval_steps_per_second": 2.119,
+      "step": 100
+    },
+    {
+      "epoch": 0.11,
+      "eval_accuracy": 0.7551279108067913,
+      "eval_f1": 0.7551279108067913,
+      "eval_loss": 0.7886354327201843,
+      "eval_precision": 0.7551279108067913,
+      "eval_recall": 0.7551279108067913,
+      "eval_runtime": 48.4163,
+      "eval_samples_per_second": 33.191,
+      "eval_steps_per_second": 2.086,
+      "step": 200
+    },
+    {
+      "epoch": 0.16,
+      "eval_accuracy": 0.8248275724395381,
+      "eval_f1": 0.8248275724395382,
+      "eval_loss": 0.5894176363945007,
+      "eval_precision": 0.8248275724395381,
+      "eval_recall": 0.8248275724395381,
+      "eval_runtime": 47.5388,
+      "eval_samples_per_second": 33.804,
+      "eval_steps_per_second": 2.125,
+      "step": 300
+    }
+  ],
+  "max_steps": 1876,
+  "num_train_epochs": 1,
+  "total_flos": 667613373235200.0,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-300/training_args.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:575d482dfbe4b5795db81627b295d36a31851f66bb801524d15bc53043f733c4
+size 3707
checkpoint-400/config.json
ADDED
@@ -0,0 +1,56 @@
+{
+  "_name_or_path": "nielsr/lilt-xlm-roberta-base",
+  "architectures": [
+    "LiltForTokenClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "channel_shrink_ratio": 4,
+  "classifier_dropout": null,
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "Caption",
+    "1": "Footnote",
+    "2": "Formula",
+    "3": "List-item",
+    "4": "Page-footer",
+    "5": "Page-header",
+    "6": "Picture",
+    "7": "Section-header",
+    "8": "Table",
+    "9": "Text",
+    "10": "Title"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "Caption": 0,
+    "Footnote": 1,
+    "Formula": 2,
+    "List-item": 3,
+    "Page-footer": 4,
+    "Page-header": 5,
+    "Picture": 6,
+    "Section-header": 7,
+    "Table": 8,
+    "Text": 9,
+    "Title": 10
+  },
+  "layer_norm_eps": 1e-05,
+  "max_2d_position_embeddings": 1024,
+  "max_position_embeddings": 514,
+  "model_type": "lilt",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.26.1",
+  "type_vocab_size": 1,
+  "use_cache": true,
+  "vocab_size": 250002
+}
checkpoint-400/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7bea0ae9c91632ba73324243f693237eedfde07c60552f721ae85502620f6663
+size 2265828101

checkpoint-400/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4727566eb4ffd9fac82a769c6b877c66e5ed779dfa933929c682a8e7337e5fa1
+size 1134425553

checkpoint-400/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6084e517c898c5f3679c65138c00f6e8c42eb251e79e5c86866ef9d34d8a6959
+size 14575

checkpoint-400/scaler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8894add6cf5ff4d4049868d7614fbae0eb98e7ffb617edb8d94b4cd7e15ebd0d
+size 557

checkpoint-400/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:510282233ecb669cc6a91c195a0954011c19ca6b777845a850e4192cef7447aa
+size 627
checkpoint-400/special_tokens_map.json
ADDED
@@ -0,0 +1,15 @@
+{
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": {
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "unk_token": "<unk>"
+}

checkpoint-400/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:62c24cdc13d4c9952d63718d6c9fa4c287974249e16b7ade6d5a85e7bbb75626
+size 17082660

checkpoint-400/tokenizer_config.json
ADDED
@@ -0,0 +1,20 @@
+{
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": {
+    "__type": "AddedToken",
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "model_max_length": 512,
+  "name_or_path": "nielsr/lilt-xlm-roberta-base",
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "special_tokens_map_file": null,
+  "tokenizer_class": "XLMRobertaTokenizer",
+  "unk_token": "<unk>"
+}
checkpoint-400/trainer_state.json
ADDED
@@ -0,0 +1,64 @@
+{
+  "best_metric": 0.8395799854272509,
+  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-400",
+  "epoch": 0.21321961620469082,
+  "global_step": 400,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.05,
+      "eval_accuracy": 0.6585185702735884,
+      "eval_f1": 0.6585185702735884,
+      "eval_loss": 0.9875321388244629,
+      "eval_precision": 0.6585185702735884,
+      "eval_recall": 0.6585185702735884,
+      "eval_runtime": 47.6616,
+      "eval_samples_per_second": 33.717,
+      "eval_steps_per_second": 2.119,
+      "step": 100
+    },
+    {
+      "epoch": 0.11,
+      "eval_accuracy": 0.7551279108067913,
+      "eval_f1": 0.7551279108067913,
+      "eval_loss": 0.7886354327201843,
+      "eval_precision": 0.7551279108067913,
+      "eval_recall": 0.7551279108067913,
+      "eval_runtime": 48.4163,
+      "eval_samples_per_second": 33.191,
+      "eval_steps_per_second": 2.086,
+      "step": 200
+    },
+    {
+      "epoch": 0.16,
+      "eval_accuracy": 0.8248275724395381,
+      "eval_f1": 0.8248275724395382,
+      "eval_loss": 0.5894176363945007,
+      "eval_precision": 0.8248275724395381,
+      "eval_recall": 0.8248275724395381,
+      "eval_runtime": 47.5388,
+      "eval_samples_per_second": 33.804,
+      "eval_steps_per_second": 2.125,
+      "step": 300
+    },
+    {
+      "epoch": 0.21,
+      "eval_accuracy": 0.839579985427251,
+      "eval_f1": 0.8395799854272509,
+      "eval_loss": 0.479428768157959,
+      "eval_precision": 0.839579985427251,
+      "eval_recall": 0.839579985427251,
+      "eval_runtime": 45.3857,
+      "eval_samples_per_second": 35.408,
+      "eval_steps_per_second": 2.225,
+      "step": 400
+    }
+  ],
+  "max_steps": 1876,
+  "num_train_epochs": 1,
+  "total_flos": 890151164313600.0,
+  "trial_name": null,
+  "trial_params": null
+}
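The trainer state makes the evaluation and checkpoint cadence visible: an eval run and a saved checkpoint every 100 steps out of 1876 total steps (1 epoch), with the best checkpoint tracked by F1. A hedged reconstruction of the corresponding TrainingArguments is sketched below; the real values (batch size, learning rate, precision, etc.) live in training_args.bin and are not shown on this page, so every setting here is illustrative, not the author's actual configuration:

    from transformers import TrainingArguments

    # Illustrative only: settings consistent with the logs above, not the contents of training_args.bin.
    args = TrainingArguments(
        output_dir="DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5",
        evaluation_strategy="steps",
        eval_steps=100,              # eval logged at steps 100, 200, 300, 400
        save_strategy="steps",
        save_steps=100,              # checkpoint-100 ... checkpoint-400
        num_train_epochs=1,          # "num_train_epochs": 1, "max_steps": 1876
        load_best_model_at_end=True,
        metric_for_best_model="f1",  # best_metric matches eval_f1
        fp16=True,                   # assumption: a scaler.pt per checkpoint suggests mixed precision
    )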
checkpoint-400/training_args.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:575d482dfbe4b5795db81627b295d36a31851f66bb801524d15bc53043f733c4
+size 3707

pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:4727566eb4ffd9fac82a769c6b877c66e5ed779dfa933929c682a8e7337e5fa1
 size 1134425553

runs/Feb15_07-53-26_e220f522c880/events.out.tfevents.1676447621.e220f522c880.495.0
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
-size
+oid sha256:2c9463d47ba3115fd44ba28de90fc0000cfcf2825b962b5b23499351a1fc9e21
+size 6552