Devops-hestabit committed on
Commit
ec365ce
·
verified ·
1 Parent(s): 4f10fb0

Upload folder using huggingface_hub

Browse files
postprocessing/1/__pycache__/model.cpython-310.pyc CHANGED
Binary files a/postprocessing/1/__pycache__/model.cpython-310.pyc and b/postprocessing/1/__pycache__/model.cpython-310.pyc differ
 
preprocessing/1/__pycache__/model.cpython-310.pyc CHANGED
Binary files a/preprocessing/1/__pycache__/model.cpython-310.pyc and b/preprocessing/1/__pycache__/model.cpython-310.pyc differ
 
tensorrt_llm/1/config.json CHANGED
@@ -28,9 +28,9 @@
28
  "mapping": {
29
  "world_size": 2,
30
  "gpus_per_node": 8,
31
- "tp_size": 1,
32
- "pp_size": 2,
33
- "moe_tp_size": 1,
34
  "moe_ep_size": 1
35
  },
36
  "quantization": {
@@ -50,11 +50,11 @@
50
  },
51
  "build_config": {
52
  "max_input_len": 28000,
53
- "max_seq_len": 32500,
54
  "opt_batch_size": null,
55
  "max_batch_size": 16,
56
  "max_beam_width": 1,
57
- "max_num_tokens": 8192,
58
  "opt_num_tokens": 16,
59
  "max_prompt_embedding_table_size": 0,
60
  "gather_context_logits": false,
 
28
  "mapping": {
29
  "world_size": 2,
30
  "gpus_per_node": 8,
31
+ "tp_size": 2,
32
+ "pp_size": 1,
33
+ "moe_tp_size": 2,
34
  "moe_ep_size": 1
35
  },
36
  "quantization": {
 
50
  },
51
  "build_config": {
52
  "max_input_len": 28000,
53
+ "max_seq_len": 32000,
54
  "opt_batch_size": null,
55
  "max_batch_size": 16,
56
  "max_beam_width": 1,
57
+ "max_num_tokens": 32000,
58
  "opt_num_tokens": 16,
59
  "max_prompt_embedding_table_size": 0,
60
  "gather_context_logits": false,
tensorrt_llm/1/rank0.engine CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7acd8fbed6cb1b6373e7e00f78cb5910ce6deeb7f5f606ad6cb2123540049bf9
3
- size 46722172788
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b03d07bc220139d071a7d50dd42a7c67235601b1d28a2aea79db0f65ea8150b4
3
+ size 46857284148
tensorrt_llm/1/rank1.engine CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1e59d5a7bb7d8d7c87dcc81f50518d6cb7d6a0e4fde1f60ac194e02fb4ac86e
3
- size 46722181404
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1397dbb8fc710907448a5c58da6c17004b8b8fa398780b1e593b383e6b150b6f
3
+ size 46857271996
tensorrt_llm_bls/1/__pycache__/model.cpython-310.pyc CHANGED
Binary files a/tensorrt_llm_bls/1/__pycache__/model.cpython-310.pyc and b/tensorrt_llm_bls/1/__pycache__/model.cpython-310.pyc differ
 
tensorrt_llm_bls/1/lib/__pycache__/decode.cpython-310.pyc CHANGED
Binary files a/tensorrt_llm_bls/1/lib/__pycache__/decode.cpython-310.pyc and b/tensorrt_llm_bls/1/lib/__pycache__/decode.cpython-310.pyc differ
 
tensorrt_llm_bls/1/lib/__pycache__/triton_decoder.cpython-310.pyc CHANGED
Binary files a/tensorrt_llm_bls/1/lib/__pycache__/triton_decoder.cpython-310.pyc and b/tensorrt_llm_bls/1/lib/__pycache__/triton_decoder.cpython-310.pyc differ