Trained with Unsloth

Files changed (7) hide show

README.md CHANGED Viewed

@@ -1,15 +1,15 @@
 ---
 library_name: transformers
 tags:
 - unsloth
 - trl
 - sft
-license: apache-2.0
-datasets:
-- mlabonne/llmtwin
-language:
-- en
-base_model: meta-llama/Meta-Llama-3.1-8B
 ---
 ![image/png](https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/Ddo6O27iJ0uFiGp7Y5py1.png)

 ---
+base_model: meta-llama/Meta-Llama-3.1-8B
+datasets:
+- mlabonne/llmtwin
+language:
+- en
 library_name: transformers
+license: apache-2.0
 tags:
 - unsloth
 - trl
 - sft
 ---
 ![image/png](https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/Ddo6O27iJ0uFiGp7Y5py1.png)

config.json CHANGED Viewed

@@ -1,12 +1,16 @@
 {
-  "_name_or_path": "unsloth/Meta-Llama-3.1-8B",
   "architectures": [
     "LlamaForCausalLM"
   ],
   "attention_bias": false,
   "attention_dropout": 0.0,
   "bos_token_id": 128000,
-  "eos_token_id": 128001,
   "hidden_act": "silu",
   "hidden_size": 4096,
   "initializer_range": 0.02,
@@ -31,7 +35,7 @@
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.44.2",
-  "unsloth_version": "2024.8",
   "use_cache": true,
   "vocab_size": 128256
 }

 {
+  "_name_or_path": "mlabonne/Llama-3.1-8B",
   "architectures": [
     "LlamaForCausalLM"
   ],
   "attention_bias": false,
   "attention_dropout": 0.0,
   "bos_token_id": 128000,
+  "eos_token_id": [
+    128001,
+    128008,
+    128009
+  ],
   "hidden_act": "silu",
   "hidden_size": 4096,
   "initializer_range": 0.02,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.44.2",
+  "unsloth_version": "2024.9.post4",
   "use_cache": true,
   "vocab_size": 128256
 }

generation_config.json CHANGED Viewed

@@ -1,8 +1,11 @@
 {
-  "_from_model_config": true,
   "bos_token_id": 128000,
   "do_sample": true,
-  "eos_token_id": 128001,
   "max_length": 131072,
   "pad_token_id": 128004,
   "temperature": 0.6,

 {
   "bos_token_id": 128000,
   "do_sample": true,
+  "eos_token_id": [
+    128001,
+    128008,
+    128009
+  ],
   "max_length": 131072,
   "pad_token_id": 128004,
   "temperature": 0.6,

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:75392c61e91fdbd94f2d8fb2403f22282957d81160939a10c28870732f6fa3ab
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:67271b802b4279f0bef010ea71b6934f636cec71cf1519e40ce7a304b04719a5
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d8b17337fb10c5b153636b4c5e0e56fce927df3b31feea11f75af18ee96e993f
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:98bf4aa11a4c6d8cfa58384a7301494789e1334cd9be0f000be07e94f32b9928
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ec7d5edebb2c5e3d4589ed9caf54696e544150597f4f50f70a39d3a0c4bb89e
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:4e3c88e517da80b03decfd01a8750593fb14bdcc5a15e7ffbbbfe2e795c399c6
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e031ee5e5bc29128ad6489bc237b3440c81b0316972f92bf87cc85eec34b2b5a
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:e8629c656223b718a9ff445ca07f26f716746321918a18ceae4514c8d446b9c9
 size 1168138808