namannn committed
Commit 9e204a7 (verified) · Parent(s): 4f6e917

Upload folder using huggingface_hub

config.json CHANGED
@@ -16,7 +16,7 @@
   "max_position_embeddings": 4096,
   "model_type": "baichuan",
   "num_attention_heads": 32,
-  "num_hidden_layers": 24,
+  "num_hidden_layers": 25,
   "pad_token_id": 0,
   "rms_norm_eps": 1e-06,
   "tie_word_embeddings": false,
model-00005-of-00005.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7b63070a92f06996e9761e6e96f4a173cb0009b8282a432927dc6b82df6b7319
-size 2038515408
+oid sha256:1a3fbb8e427a4d4cb32de7d1c2ba2ccc34d15985676c939502a75df9d97c9079
+size 2848050024
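
The shard itself lives in Git LFS, so the diff only touches the pointer file: the sha256 of the new blob and its size in bytes (2,038,515,408 → 2,848,050,024). A small sketch, standard library only, for verifying a downloaded shard against the pointer above:

import hashlib

def sha256_of(path: str, chunk_size: int = 1 << 20) -> str:
    # Stream the file in 1 MiB chunks so multi-GB shards need not fit in RAM.
    digest = hashlib.sha256()
    with open(path, "rb") as f:
        for block in iter(lambda: f.read(chunk_size), b""):
            digest.update(block)
    return digest.hexdigest()

# The oid from the updated LFS pointer.
expected = "1a3fbb8e427a4d4cb32de7d1c2ba2ccc34d15985676c939502a75df9d97c9079"
assert sha256_of("model-00005-of-00005.safetensors") == expected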
model.safetensors.index.json CHANGED
@@ -1,6 +1,6 @@
 {
   "metadata": {
-    "total_size": 21525977088
+    "total_size": 22335510784
   },
   "weight_map": {
     "lm_head.weight": "model-00005-of-00005.safetensors",
@@ -141,6 +141,14 @@
   "model.layers.23.self_attn.W_pack.weight": "model-00005-of-00005.safetensors",
   "model.layers.23.self_attn.o_proj.weight": "model-00005-of-00005.safetensors",
   "model.layers.23.self_attn.rotary_emb.inv_freq": "model-00005-of-00005.safetensors",
+  "model.layers.24.input_layernorm.weight": "model-00005-of-00005.safetensors",
+  "model.layers.24.mlp.down_proj.weight": "model-00005-of-00005.safetensors",
+  "model.layers.24.mlp.gate_proj.weight": "model-00005-of-00005.safetensors",
+  "model.layers.24.mlp.up_proj.weight": "model-00005-of-00005.safetensors",
+  "model.layers.24.post_attention_layernorm.weight": "model-00005-of-00005.safetensors",
+  "model.layers.24.self_attn.W_pack.weight": "model-00005-of-00005.safetensors",
+  "model.layers.24.self_attn.o_proj.weight": "model-00005-of-00005.safetensors",
+  "model.layers.24.self_attn.rotary_emb.inv_freq": "model-00005-of-00005.safetensors",
   "model.layers.3.input_layernorm.weight": "model-00001-of-00005.safetensors",
   "model.layers.3.mlp.down_proj.weight": "model-00001-of-00005.safetensors",
   "model.layers.3.mlp.gate_proj.weight": "model-00001-of-00005.safetensors",