SjardiWillems committed on Mar 3, 2024

Commit

81a3037

verified ·

1 Parent(s): e3f7f77

Training in progress, epoch 1

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model.safetensors +1 -1
run-2/checkpoint-108/config.json +25 -0
run-2/checkpoint-108/model.safetensors +3 -0
run-2/checkpoint-108/optimizer.pt +3 -0
run-2/checkpoint-108/rng_state.pth +3 -0
run-2/checkpoint-108/scheduler.pt +3 -0
run-2/checkpoint-108/special_tokens_map.json +7 -0
run-2/checkpoint-108/tokenizer.json +0 -0
run-2/checkpoint-108/tokenizer_config.json +55 -0
run-2/checkpoint-108/trainer_state.json +62 -0
run-2/checkpoint-108/training_args.bin +3 -0
run-2/checkpoint-108/vocab.txt +0 -0
run-2/checkpoint-135/config.json +25 -0
run-2/checkpoint-135/model.safetensors +3 -0
run-2/checkpoint-135/optimizer.pt +3 -0
run-2/checkpoint-135/rng_state.pth +3 -0
run-2/checkpoint-135/scheduler.pt +3 -0
run-2/checkpoint-135/special_tokens_map.json +7 -0
run-2/checkpoint-135/tokenizer.json +0 -0
run-2/checkpoint-135/tokenizer_config.json +55 -0
run-2/checkpoint-135/trainer_state.json +71 -0
run-2/checkpoint-135/training_args.bin +3 -0
run-2/checkpoint-135/vocab.txt +0 -0
run-2/checkpoint-54/config.json +25 -0
run-2/checkpoint-54/model.safetensors +3 -0
run-2/checkpoint-54/optimizer.pt +3 -0
run-2/checkpoint-54/rng_state.pth +3 -0
run-2/checkpoint-54/scheduler.pt +3 -0
run-2/checkpoint-54/special_tokens_map.json +7 -0
run-2/checkpoint-54/tokenizer.json +0 -0
run-2/checkpoint-54/tokenizer_config.json +55 -0
run-2/checkpoint-54/trainer_state.json +44 -0
run-2/checkpoint-54/training_args.bin +3 -0
run-2/checkpoint-54/vocab.txt +0 -0
run-2/checkpoint-81/config.json +25 -0
run-2/checkpoint-81/model.safetensors +3 -0
run-2/checkpoint-81/optimizer.pt +3 -0
run-2/checkpoint-81/rng_state.pth +3 -0
run-2/checkpoint-81/scheduler.pt +3 -0
run-2/checkpoint-81/special_tokens_map.json +7 -0
run-2/checkpoint-81/tokenizer.json +0 -0
run-2/checkpoint-81/tokenizer_config.json +55 -0
run-2/checkpoint-81/trainer_state.json +53 -0
run-2/checkpoint-81/training_args.bin +3 -0
run-2/checkpoint-81/vocab.txt +0 -0
run-3/checkpoint-14/config.json +25 -0
run-3/checkpoint-14/model.safetensors +3 -0
run-3/checkpoint-14/optimizer.pt +3 -0
run-3/checkpoint-14/rng_state.pth +3 -0
run-3/checkpoint-14/scheduler.pt +3 -0

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:deb089e9ac2ba3e9bfee178463e0a5351fb79b4046211f6167830b3a160bf33d
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:34758dea04f1bea7ab3e4dd1e3a3218a2e99ce16f149b8e02c525be17cfea861
 size 267832560

run-2/checkpoint-108/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "vocab_size": 30522
+}

run-2/checkpoint-108/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:799684ca1e24f982075d992e9e335324f5573e7ef56c67cd5bcb133e8f2f0b6b
+size 267832560

run-2/checkpoint-108/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:610577fdf4659c6f7b9094f14056906c56708303f1aff15389b8b4a6b502c56f
+size 535727290

run-2/checkpoint-108/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:59b6d72b7c13134366148b85305a10efa5c12ac394465f536cb8ec929f115e0b
+size 14244

run-2/checkpoint-108/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:20d21f2ab7fb975821737104762c4b794348af2df3e1c90e1318bd02d3a913ac
+size 1064

run-2/checkpoint-108/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-108/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-108/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-108/trainer_state.json ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+  "best_metric": 0.3357348095160262,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-81",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 108,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5863072276115417,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.5165,
+      "eval_samples_per_second": 2019.464,
+      "eval_steps_per_second": 127.79,
+      "step": 27
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6026574969291687,
+      "eval_matthews_correlation": 0.2013844279302642,
+      "eval_runtime": 0.5047,
+      "eval_samples_per_second": 2066.4,
+      "eval_steps_per_second": 130.76,
+      "step": 54
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.607330322265625,
+      "eval_matthews_correlation": 0.3357348095160262,
+      "eval_runtime": 0.5243,
+      "eval_samples_per_second": 1989.403,
+      "eval_steps_per_second": 125.887,
+      "step": 81
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.7189709544181824,
+      "eval_matthews_correlation": 0.3154257263042179,
+      "eval_runtime": 0.5087,
+      "eval_samples_per_second": 2050.342,
+      "eval_steps_per_second": 129.744,
+      "step": 108
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.425091322202513e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 27
+  }
+}

run-2/checkpoint-108/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e90b8efb5f56f17604458520e4d53f07ee283e90d1f7b6a020b4be6c6503812e
+size 4984

run-2/checkpoint-108/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-135/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "vocab_size": 30522
+}

run-2/checkpoint-135/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:494c8ee337329ce4be4fc474cb1a9c1467c4f48106b62ca8731a04d537c93511
+size 267832560

run-2/checkpoint-135/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3d0c8be98c18c032f8dfa75043d7136ff12a6dca264142ed0ba7a5b8391081d9
+size 535727290

run-2/checkpoint-135/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4c672204aac7a101b6410ac612308b42ce010335d1ac3001c6f663573700fb09
+size 14244

run-2/checkpoint-135/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2c85e8f1bc5d1181d5fa0ae120687b388adfcc66b640e756e8177997e5bc3778
+size 1064

run-2/checkpoint-135/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-135/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-135/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-135/trainer_state.json ADDED Viewed

	@@ -0,0 +1,71 @@

+{
+  "best_metric": 0.3357348095160262,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-81",
+  "epoch": 5.0,
+  "eval_steps": 500,
+  "global_step": 135,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5863072276115417,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.5165,
+      "eval_samples_per_second": 2019.464,
+      "eval_steps_per_second": 127.79,
+      "step": 27
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6026574969291687,
+      "eval_matthews_correlation": 0.2013844279302642,
+      "eval_runtime": 0.5047,
+      "eval_samples_per_second": 2066.4,
+      "eval_steps_per_second": 130.76,
+      "step": 54
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.607330322265625,
+      "eval_matthews_correlation": 0.3357348095160262,
+      "eval_runtime": 0.5243,
+      "eval_samples_per_second": 1989.403,
+      "eval_steps_per_second": 125.887,
+      "step": 81
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.7189709544181824,
+      "eval_matthews_correlation": 0.3154257263042179,
+      "eval_runtime": 0.5087,
+      "eval_samples_per_second": 2050.342,
+      "eval_steps_per_second": 129.744,
+      "step": 108
+    },
+    {
+      "epoch": 5.0,
+      "eval_loss": 0.7904144525527954,
+      "eval_matthews_correlation": 0.330547033474257,
+      "eval_runtime": 0.517,
+      "eval_samples_per_second": 2017.523,
+      "eval_steps_per_second": 127.667,
+      "step": 135
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.425091322202513e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 27
+  }
+}

run-2/checkpoint-135/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e90b8efb5f56f17604458520e4d53f07ee283e90d1f7b6a020b4be6c6503812e
+size 4984

run-2/checkpoint-135/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-54/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "vocab_size": 30522
+}

run-2/checkpoint-54/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e67d42c7b5ce5be69053a13c00a3e983682f24fd86122eca03a4b54bdaf15095
+size 267832560

run-2/checkpoint-54/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8003bab0865001b17f3b0cab5f3a93e3c888c510bc54f8234f473fc73f29882d
+size 535727290

run-2/checkpoint-54/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7cd3af59b7bc57117e33eb85129fb27fe9b99a4d97b80616ed19ab24a60dd7a4
+size 14244

run-2/checkpoint-54/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1c4c727881ab7818c061d58ab3d72eb93859bf6554a1d381415340dc93338332
+size 1064

run-2/checkpoint-54/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-54/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-54/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-54/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.2013844279302642,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-54",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 54,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5863072276115417,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.5165,
+      "eval_samples_per_second": 2019.464,
+      "eval_steps_per_second": 127.79,
+      "step": 27
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6026574969291687,
+      "eval_matthews_correlation": 0.2013844279302642,
+      "eval_runtime": 0.5047,
+      "eval_samples_per_second": 2066.4,
+      "eval_steps_per_second": 130.76,
+      "step": 54
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.425091322202513e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 27
+  }
+}

run-2/checkpoint-54/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e90b8efb5f56f17604458520e4d53f07ee283e90d1f7b6a020b4be6c6503812e
+size 4984

run-2/checkpoint-54/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-81/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "vocab_size": 30522
+}

run-2/checkpoint-81/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7bc2ca71e34d79bf5f4e95b539e7003cc222a659304e2d9f25c9840fbdb2ac5f
+size 267832560

run-2/checkpoint-81/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:adbc2e3aeb472b78064a18c901ab0fadc2ad2c24ad10b5385f8014042aec3298
+size 535727290

run-2/checkpoint-81/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba75ccedb65df6de671761dac259371c3a129942c31ec316e9b2776bdda36507
+size 14244

run-2/checkpoint-81/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a6e867063540d48528730ccc5e97a5778c11fca371a55d7f450fe37f9f8f584b
+size 1064

run-2/checkpoint-81/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-81/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-81/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-81/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": 0.3357348095160262,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-81",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 81,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5863072276115417,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.5165,
+      "eval_samples_per_second": 2019.464,
+      "eval_steps_per_second": 127.79,
+      "step": 27
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6026574969291687,
+      "eval_matthews_correlation": 0.2013844279302642,
+      "eval_runtime": 0.5047,
+      "eval_samples_per_second": 2066.4,
+      "eval_steps_per_second": 130.76,
+      "step": 54
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.607330322265625,
+      "eval_matthews_correlation": 0.3357348095160262,
+      "eval_runtime": 0.5243,
+      "eval_samples_per_second": 1989.403,
+      "eval_steps_per_second": 125.887,
+      "step": 81
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.425091322202513e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 27
+  }
+}

run-2/checkpoint-81/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e90b8efb5f56f17604458520e4d53f07ee283e90d1f7b6a020b4be6c6503812e
+size 4984

run-2/checkpoint-81/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-14/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "vocab_size": 30522
+}

run-3/checkpoint-14/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:34758dea04f1bea7ab3e4dd1e3a3218a2e99ce16f149b8e02c525be17cfea861
+size 267832560

run-3/checkpoint-14/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:de8b8bbf28dd4bfd70fd116511ecea1485ec20bad536edf9b8ff3d6389ab81b9
+size 535727290

run-3/checkpoint-14/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:44f1ba7aab2dfa1d0478d1725b890b6fd7e36f8371ca31185f540f856a92f08a
+size 14244

run-3/checkpoint-14/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc52100d304523553ddf963ecc74beb1a4e173ed77e02db7504af683ece58cc9
+size 1064