Mak05 committed on
Commit
be8728d
·
verified ·
1 Parent(s): 4839c16

Delete checkpoint-6

Browse files
checkpoint-6/config.json DELETED
@@ -1,39 +0,0 @@
1
- {
2
- "_name_or_path": "MakNeiro",
3
- "activation_function": "gelu_new",
4
- "architectures": [
5
- "MakNeiroLMHeadModel"
6
- ],
7
- "attn_pdrop": 0.1,
8
- "bos_token_id": 50256,
9
- "embd_pdrop": 0.1,
10
- "eos_token_id": 50256,
11
- "initializer_range": 0.02,
12
- "layer_norm_epsilon": 1e-05,
13
- "model_type": "gpt2",
14
- "n_ctx": 1024,
15
- "n_embd": 768,
16
- "n_head": 12,
17
- "n_inner": null,
18
- "n_layer": 12,
19
- "n_positions": 1024,
20
- "reorder_and_upcast_attn": false,
21
- "resid_pdrop": 0.1,
22
- "scale_attn_by_inverse_layer_idx": false,
23
- "scale_attn_weights": true,
24
- "summary_activation": null,
25
- "summary_first_dropout": 0.1,
26
- "summary_proj_to_labels": true,
27
- "summary_type": "cls_index",
28
- "summary_use_proj": true,
29
- "task_specific_params": {
30
- "text-generation": {
31
- "do_sample": true,
32
- "max_length": 50
33
- }
34
- },
35
- "torch_dtype": "float32",
36
- "transformers_version": "4.48.1",
37
- "use_cache": true,
38
- "vocab_size": 50257
39
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-6/generation_config.json DELETED
@@ -1,6 +0,0 @@
1
- {
2
- "_from_model_config": true,
3
- "bos_token_id": 50256,
4
- "eos_token_id": 50256,
5
- "transformers_version": "4.48.1"
6
- }
 
 
 
 
 
 
 
checkpoint-6/merges.txt DELETED
The diff for this file is too large to render. See raw diff
 
checkpoint-6/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c3213bf2cd176a6c38baf8b5ce9d2d1e60f9f00ca4be63a49bf2cf7c23153c8
3
- size 497774208
 
 
 
 
checkpoint-6/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c4684019c08c1299d4cd1aaad14d10704267febd848ea5e3cadc6ddbf70c0ea
3
- size 995638202
 
 
 
 
checkpoint-6/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2f03b5fb0d0cfe806763da6c4f1eaab2959746319e12efa4ab79eaaaa752065
3
- size 13990
 
 
 
 
checkpoint-6/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe365bc08501112708f16b93d6f0262855f7de387b03f809ea8a015bd489f1d9
3
- size 1064
 
 
 
 
checkpoint-6/special_tokens_map.json DELETED
@@ -1,6 +0,0 @@
1
- {
2
- "bos_token": "<|endoftext|>",
3
- "eos_token": "<|endoftext|>",
4
- "pad_token": "<|endoftext|>",
5
- "unk_token": "<|endoftext|>"
6
- }
 
 
 
 
 
 
 
checkpoint-6/tokenizer.json DELETED
The diff for this file is too large to render. See raw diff
 
checkpoint-6/tokenizer_config.json DELETED
@@ -1,21 +0,0 @@
1
- {
2
- "add_prefix_space": false,
3
- "added_tokens_decoder": {
4
- "50256": {
5
- "content": "<|endoftext|>",
6
- "lstrip": false,
7
- "normalized": true,
8
- "rstrip": false,
9
- "single_word": false,
10
- "special": true
11
- }
12
- },
13
- "bos_token": "<|endoftext|>",
14
- "clean_up_tokenization_spaces": false,
15
- "eos_token": "<|endoftext|>",
16
- "extra_special_tokens": {},
17
- "model_max_length": 1024,
18
- "pad_token": "<|endoftext|>",
19
- "tokenizer_class": "GPT2Tokenizer",
20
- "unk_token": "<|endoftext|>"
21
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-6/trainer_state.json DELETED
@@ -1,49 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 3.0,
5
- "eval_steps": 500,
6
- "global_step": 6,
7
- "is_hyper_param_search": false,
8
- "is_local_process_zero": true,
9
- "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 1.0,
13
- "eval_loss": 4.320729732513428,
14
- "eval_runtime": 0.118,
15
- "eval_samples_per_second": 8.475,
16
- "eval_steps_per_second": 8.475,
17
- "step": 2
18
- },
19
- {
20
- "epoch": 2.0,
21
- "eval_loss": 2.3262906074523926,
22
- "eval_runtime": 0.11,
23
- "eval_samples_per_second": 9.091,
24
- "eval_steps_per_second": 9.091,
25
- "step": 4
26
- }
27
- ],
28
- "logging_steps": 200,
29
- "max_steps": 6,
30
- "num_input_tokens_seen": 0,
31
- "num_train_epochs": 3,
32
- "save_steps": 10000,
33
- "stateful_callbacks": {
34
- "TrainerControl": {
35
- "args": {
36
- "should_epoch_stop": false,
37
- "should_evaluate": false,
38
- "should_log": false,
39
- "should_save": true,
40
- "should_training_stop": true
41
- },
42
- "attributes": {}
43
- }
44
- },
45
- "total_flos": 979845120000.0,
46
- "train_batch_size": 4,
47
- "trial_name": null,
48
- "trial_params": null
49
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-6/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:c97fe1a3a61f8156f07f9b504a8243379d1bff62a1c3fd9aad81e14b1ba7d043
3
- size 5304
 
 
 
 
checkpoint-6/vocab.json DELETED
The diff for this file is too large to render. See raw diff