philschmid HF staff committed on
Commit
f3bfff4
1 Parent(s): 0edb10c

Synchronizing local compiler cache.

Browse files
.gitattributes CHANGED
@@ -5951,3 +5951,6 @@ neuronxcc-2.15.128.0+56dc5a86/MODULE_5945967229162609153+df3e6f3f/model.neff fil
5951
  neuronxcc-2.15.128.0+56dc5a86/MODULE_6216273858989637920+df3e6f3f/model.neff filter=lfs diff=lfs merge=lfs -text
5952
  neuronxcc-2.15.128.0+56dc5a86/MODULE_7378323632343424858+df3e6f3f/model.neff filter=lfs diff=lfs merge=lfs -text
5953
  neuronxcc-2.15.128.0+56dc5a86/MODULE_8853125480725449932+df3e6f3f/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
5951
  neuronxcc-2.15.128.0+56dc5a86/MODULE_6216273858989637920+df3e6f3f/model.neff filter=lfs diff=lfs merge=lfs -text
5952
  neuronxcc-2.15.128.0+56dc5a86/MODULE_7378323632343424858+df3e6f3f/model.neff filter=lfs diff=lfs merge=lfs -text
5953
  neuronxcc-2.15.128.0+56dc5a86/MODULE_8853125480725449932+df3e6f3f/model.neff filter=lfs diff=lfs merge=lfs -text
5954
+ neuronxcc-2.15.128.0+56dc5a86/MODULE_12094726845982372710+df3e6f3f/model.neff filter=lfs diff=lfs merge=lfs -text
5955
+ neuronxcc-2.15.128.0+56dc5a86/MODULE_15554787448610520234+df3e6f3f/model.neff filter=lfs diff=lfs merge=lfs -text
5956
+ neuronxcc-2.15.128.0+56dc5a86/MODULE_15574943571739609130+df3e6f3f/model.neff filter=lfs diff=lfs merge=lfs -text
neuronxcc-2.15.128.0+56dc5a86/0_REGISTRY/0.0.27.dev0/training/llama/meta-llama/Llama-3.1-8b/3f29fd7fbf155e589bff.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "neuron": {"compiler_version": "2.15.128.0+56dc5a86", "input_specs": {"attention_mask": [1, 1024], "input_ids": [1, 1024], "labels": [1, 1024]}, "model_class": "LlamaForCausalLM", "num_neuron_cores_per_node": 32, "pipeline_parallel_size": 1, "precision": "bfloat16", "tensor_parallel_size": 8, "training": true}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 8.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": false, "vocab_size": 128256}
neuronxcc-2.15.128.0+56dc5a86/MODULE_12094726845982372710+df3e6f3f/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--model-type=transformer", "--distribution-strategy=llm-training", "--enable-saturate-infinity", "--model-type=transformer"]
neuronxcc-2.15.128.0+56dc5a86/MODULE_12094726845982372710+df3e6f3f/model.done ADDED
File without changes
neuronxcc-2.15.128.0+56dc5a86/MODULE_12094726845982372710+df3e6f3f/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69e52f59b8e7dc35fe4375a0d518005067df6e1bfab0acd47315533d34582b80
3
+ size 1101499
neuronxcc-2.15.128.0+56dc5a86/MODULE_12094726845982372710+df3e6f3f/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdeb4922f1c00b519774c1e85e6fc8860617f175589a8da726b6c287d3a8e33b
3
+ size 8018944
neuronxcc-2.15.128.0+56dc5a86/MODULE_15554787448610520234+df3e6f3f/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--model-type=transformer", "--distribution-strategy=llm-training", "--enable-saturate-infinity", "--model-type=transformer"]
neuronxcc-2.15.128.0+56dc5a86/MODULE_15554787448610520234+df3e6f3f/model.done ADDED
File without changes
neuronxcc-2.15.128.0+56dc5a86/MODULE_15554787448610520234+df3e6f3f/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f50a502890f6fd3848f4abeb8559698849b3ec7d4b1bef88403c6e22dd79001
3
+ size 1167881
neuronxcc-2.15.128.0+56dc5a86/MODULE_15554787448610520234+df3e6f3f/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09fc69fd9a18a87cdc66970c5ba0a935ca6d77521a68dbd2ecdee2c868796cd6
3
+ size 10251264
neuronxcc-2.15.128.0+56dc5a86/MODULE_15574943571739609130+df3e6f3f/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--model-type=transformer", "--distribution-strategy=llm-training", "--enable-saturate-infinity", "--model-type=transformer"]
neuronxcc-2.15.128.0+56dc5a86/MODULE_15574943571739609130+df3e6f3f/model.done ADDED
File without changes
neuronxcc-2.15.128.0+56dc5a86/MODULE_15574943571739609130+df3e6f3f/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d803242cbb32c3a077d50287efd102dfbfbbc5e9d390286186801e6bd6b6c19
3
+ size 1168675
neuronxcc-2.15.128.0+56dc5a86/MODULE_15574943571739609130+df3e6f3f/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79593859715cbf4d981171f646b4d27ed9684dd9f4419707caccff6541f1a4ff
3
+ size 10271744