jermyn committed on
Commit
7b84f1c
1 Parent(s): 78c10df

Training in progress, step 10

Browse files
adapter_config.json CHANGED
@@ -16,17 +16,17 @@
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
- "r": 32,
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "up_proj",
24
  "o_proj",
25
- "q_proj",
26
  "k_proj",
27
- "down_proj",
28
  "gate_proj",
29
- "v_proj"
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
+ "r": 16,
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "o_proj",
24
+ "up_proj",
25
  "k_proj",
26
+ "v_proj",
27
  "gate_proj",
28
+ "q_proj",
29
+ "down_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84af51dc250669c92d92b05b429eef31fd02f1396e5504973994a79b49c9acf0
3
- size 60010384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a8c26b2c5d8f6ca20b8846fc26b4c55ea31d8ad614db0a006e672950f40910e
3
+ size 30027544
config.json CHANGED
@@ -12,6 +12,7 @@
12
  "initializer_range": 0.02,
13
  "intermediate_size": 5504,
14
  "max_position_embeddings": 16384,
 
15
  "model_type": "llama",
16
  "num_attention_heads": 16,
17
  "num_hidden_layers": 24,
@@ -40,7 +41,7 @@
40
  "rope_theta": 100000,
41
  "tie_word_embeddings": false,
42
  "torch_dtype": "bfloat16",
43
- "transformers_version": "4.40.2",
44
  "use_cache": false,
45
  "vocab_size": 32256
46
  }
 
12
  "initializer_range": 0.02,
13
  "intermediate_size": 5504,
14
  "max_position_embeddings": 16384,
15
+ "mlp_bias": false,
16
  "model_type": "llama",
17
  "num_attention_heads": 16,
18
  "num_hidden_layers": 24,
 
41
  "rope_theta": 100000,
42
  "tie_word_embeddings": false,
43
  "torch_dtype": "bfloat16",
44
+ "transformers_version": "4.41.1",
45
  "use_cache": false,
46
  "vocab_size": 32256
47
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6debfef838e651f8575f13b65bb3941024e0ca0d85b1b357df704569e0c5aac
3
- size 5880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e16da9b1b8a80a3cdfcd43e7c24a4835abe7dd60daa9ecc48b34fbaba9d72abb
3
+ size 6072