Delete checkpoint-6

Files changed (13) hide show

checkpoint-6/config.json DELETED Viewed

@@ -1,39 +0,0 @@
-{
-  "_name_or_path": "MakNeiro",
-  "activation_function": "gelu_new",
-  "architectures": [
-    "MakNeiroLMHeadModel"
-  ],
-  "attn_pdrop": 0.1,
-  "bos_token_id": 50256,
-  "embd_pdrop": 0.1,
-  "eos_token_id": 50256,
-  "initializer_range": 0.02,
-  "layer_norm_epsilon": 1e-05,
-  "model_type": "gpt2",
-  "n_ctx": 1024,
-  "n_embd": 768,
-  "n_head": 12,
-  "n_inner": null,
-  "n_layer": 12,
-  "n_positions": 1024,
-  "reorder_and_upcast_attn": false,
-  "resid_pdrop": 0.1,
-  "scale_attn_by_inverse_layer_idx": false,
-  "scale_attn_weights": true,
-  "summary_activation": null,
-  "summary_first_dropout": 0.1,
-  "summary_proj_to_labels": true,
-  "summary_type": "cls_index",
-  "summary_use_proj": true,
-  "task_specific_params": {
-    "text-generation": {
-      "do_sample": true,
-      "max_length": 50
-    }
-  },
-  "torch_dtype": "float32",
-  "transformers_version": "4.48.1",
-  "use_cache": true,
-  "vocab_size": 50257
-}

checkpoint-6/generation_config.json DELETED Viewed

@@ -1,6 +0,0 @@
-{
-  "_from_model_config": true,
-  "bos_token_id": 50256,
-  "eos_token_id": 50256,
-  "transformers_version": "4.48.1"
-}

checkpoint-6/merges.txt DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-6/model.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:8c3213bf2cd176a6c38baf8b5ce9d2d1e60f9f00ca4be63a49bf2cf7c23153c8
-size 497774208

checkpoint-6/optimizer.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:6c4684019c08c1299d4cd1aaad14d10704267febd848ea5e3cadc6ddbf70c0ea
-size 995638202

checkpoint-6/rng_state.pth DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:b2f03b5fb0d0cfe806763da6c4f1eaab2959746319e12efa4ab79eaaaa752065
-size 13990

checkpoint-6/scheduler.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:fe365bc08501112708f16b93d6f0262855f7de387b03f809ea8a015bd489f1d9
-size 1064

checkpoint-6/special_tokens_map.json DELETED Viewed

@@ -1,6 +0,0 @@
-{
-  "bos_token": "<|endoftext|>",
-  "eos_token": "<|endoftext|>",
-  "pad_token": "<|endoftext|>",
-  "unk_token": "<|endoftext|>"
-}

checkpoint-6/tokenizer.json DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-6/tokenizer_config.json DELETED Viewed

@@ -1,21 +0,0 @@
-{
-  "add_prefix_space": false,
-  "added_tokens_decoder": {
-    "50256": {
-      "content": "<|endoftext|>",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    }
-  },
-  "bos_token": "<|endoftext|>",
-  "clean_up_tokenization_spaces": false,
-  "eos_token": "<|endoftext|>",
-  "extra_special_tokens": {},
-  "model_max_length": 1024,
-  "pad_token": "<|endoftext|>",
-  "tokenizer_class": "GPT2Tokenizer",
-  "unk_token": "<|endoftext|>"
-}

checkpoint-6/trainer_state.json DELETED Viewed

@@ -1,49 +0,0 @@
-{
-  "best_metric": null,
-  "best_model_checkpoint": null,
-  "epoch": 3.0,
-  "eval_steps": 500,
-  "global_step": 6,
-  "is_hyper_param_search": false,
-  "is_local_process_zero": true,
-  "is_world_process_zero": true,
-  "log_history": [
-    {
-      "epoch": 1.0,
-      "eval_loss": 4.320729732513428,
-      "eval_runtime": 0.118,
-      "eval_samples_per_second": 8.475,
-      "eval_steps_per_second": 8.475,
-      "step": 2
-    },
-    {
-      "epoch": 2.0,
-      "eval_loss": 2.3262906074523926,
-      "eval_runtime": 0.11,
-      "eval_samples_per_second": 9.091,
-      "eval_steps_per_second": 9.091,
-      "step": 4
-    }
-  ],
-  "logging_steps": 200,
-  "max_steps": 6,
-  "num_input_tokens_seen": 0,
-  "num_train_epochs": 3,
-  "save_steps": 10000,
-  "stateful_callbacks": {
-    "TrainerControl": {
-      "args": {
-        "should_epoch_stop": false,
-        "should_evaluate": false,
-        "should_log": false,
-        "should_save": true,
-        "should_training_stop": true
-      },
-      "attributes": {}
-    }
-  },
-  "total_flos": 979845120000.0,
-  "train_batch_size": 4,
-  "trial_name": null,
-  "trial_params": null
-}

checkpoint-6/training_args.bin DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:c97fe1a3a61f8156f07f9b504a8243379d1bff62a1c3fd9aad81e14b1ba7d043
-size 5304

checkpoint-6/vocab.json DELETED Viewed

The diff for this file is too large to render. See raw diff