austindavis committed on
Commit
0cfaa55
·
verified ·
1 Parent(s): 0084c97

Trained on 2025-02-27/16-29-15 https://wandb.ai/austinleedavis/train/runs/cb3q0p93

Browse files
Files changed (2) hide show
  1. config.json +2 -1
  2. model.safetensors +1 -1
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "outputs/2025-02-26/13-23-58/checkpoint/../hf_model",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
@@ -10,6 +10,7 @@
10
  "eos_token_id": 2,
11
  "initializer_range": 0.02,
12
  "layer_norm_epsilon": 1e-05,
 
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
15
  "n_embd": 768,
 
1
  {
2
+ "_name_or_path": "outputs/checkpoint/../hf_model",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
10
  "eos_token_id": 2,
11
  "initializer_range": 0.02,
12
  "layer_norm_epsilon": 1e-05,
13
+ "loss_type": "ForCausalLM",
14
  "model_type": "gpt2",
15
  "n_ctx": 1024,
16
  "n_embd": 768,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94f48cb45c303c664768a40bf0831abeb1f93eb1dd4cc57c96a0976d83619004
3
  size 343605888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33e61e0cd2b46e0ac3db0bc3a4b6fdab3ac300f3cfbf51bae7fc26538b735797
3
  size 343605888