miladalsh committed on
Commit
9dd866e
·
verified ·
1 Parent(s): 629a4d8

Training in progress, step 200

Browse files
adapter_config.json CHANGED
@@ -19,12 +19,12 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "o_proj",
23
  "k_proj",
24
- "down_proj",
25
  "up_proj",
26
- "gate_proj",
27
  "q_proj",
 
 
 
28
  "v_proj"
29
  ],
30
  "task_type": "CAUSAL_LM",
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
 
22
  "k_proj",
 
23
  "up_proj",
 
24
  "q_proj",
25
+ "gate_proj",
26
+ "down_proj",
27
+ "o_proj",
28
  "v_proj"
29
  ],
30
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7f052020c7cd116955fbb297185fedd42fc1054c92ddb5c82fd152e138d0084
3
  size 4785795512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e714f81142ebd87b8bc5bda8999495e860b3fb764a41d9dde496fed29fc7879
3
  size 4785795512
config.json CHANGED
@@ -7,7 +7,6 @@
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 128000,
9
  "eos_token_id": 128001,
10
- "head_dim": 128,
11
  "hidden_act": "silu",
12
  "hidden_size": 4096,
13
  "initializer_range": 0.02,
@@ -24,7 +23,7 @@
24
  "rope_theta": 500000.0,
25
  "tie_word_embeddings": false,
26
  "torch_dtype": "float16",
27
- "transformers_version": "4.46.2",
28
  "use_cache": true,
29
  "vocab_size": 128258
30
  }
 
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 128000,
9
  "eos_token_id": 128001,
 
10
  "hidden_act": "silu",
11
  "hidden_size": 4096,
12
  "initializer_range": 0.02,
 
23
  "rope_theta": 500000.0,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "float16",
26
+ "transformers_version": "4.43.4",
27
  "use_cache": true,
28
  "vocab_size": 128258
29
  }
generation_config.json CHANGED
@@ -5,5 +5,5 @@
5
  "max_length": 4096,
6
  "temperature": 0.6,
7
  "top_p": 0.9,
8
- "transformers_version": "4.46.2"
9
  }
 
5
  "max_length": 4096,
6
  "temperature": 0.6,
7
  "top_p": 0.9,
8
+ "transformers_version": "4.43.4"
9
  }
model-00001-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b10647b1adcff6129f0502db8761269184b30e55d51d287b3faa5c9bd8a33fb
3
  size 1973471736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b43a13c859d8b493e9b3073be9996a694785728af4276a99891c2a00fbff9f5c
3
  size 1973471736
model-00002-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3817910d5adba1370fb2b036f952504fb0480510faafd68ebaf714a82b2c319
3
  size 1895895296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a600444224f16883ed368e53e92063cecdbcb35d0213dca85333eb50d119c292
3
  size 1895895296
model-00003-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:567309864cc6649a32ff19dddd5de662abb27043c3f2ba8ebcd468e9a383d026
3
  size 1979798000
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5769bfd9d23b1e4a0fa1cb476596f7413e49a34647a553c9f9dedb95fd2211cc
3
  size 1979798000
model-00004-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a462811926c00b538a2c2e27a383e40e87441f89c3c1df49f81d4c5209f9c8d6
3
  size 1946227328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4ff06f2ce976dd0effdc5de3a85249b3830e3f226af205f82a24f4bb335a422
3
  size 1946227328
model-00005-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a89768288a42693e691aa62949a168baa9b3658f5fbc522db9d2ef78ff7a3f50
3
  size 1979798024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d630aca1b73f12d743448d32eb66cd720d659d8669b1c9275b9fe548a4ae70a6
3
  size 1979798024
model-00006-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:244c46cd7190c9134a1bdf5878183e2c2ba2283ed650ef4685d22a6a354ddf66
3
  size 1946227328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c55ad3eb4df97651266b9b377a00fde02c5acaa4009975b19635a4d838e3dafa
3
  size 1946227328
model-00007-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0810bd485771b864dbae67113d246e57fb2faf615fb9c5a231a3d8a842e76eaf
3
  size 1979798024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8abe8639f467c3661445a01aef194d7c3f5942afaaa026646ce1111298b4884e
3
  size 1979798024
model-00008-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4725a11d9fa7d15c279594127be33e8b0e455b3bc60947d318555d5a863c1697
3
  size 1308683392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c517af1b07aa80399f5370fcd2981aec0bd3806e1b17086447660d86a16a9725
3
  size 1308683392
model-00009-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:39895c13234ef72001a960a8b1d937946f8bae80635324f3348c8b4b757aa5ce
3
  size 1050689664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7be10146a07f787ddffd34ff35a68e5b68b8d22060db03a635190e3499f99be5
3
  size 1050689664
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:962eae968288b2eae28691f4aa07e607a46c3be430550fed5eb9282004658d80
3
  size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3ae87892af338cee68334d5bcd2e0663f39a73961b0675dd514fb4f4c093256
3
  size 5624