Upload folder using huggingface_hub
Browse files
- postprocessing/1/__pycache__/model.cpython-310.pyc +0 -0
- preprocessing/1/__pycache__/model.cpython-310.pyc +0 -0
- tensorrt_llm/1/config.json +5 -5
- tensorrt_llm/1/rank0.engine +2 -2
- tensorrt_llm/1/rank1.engine +2 -2
- tensorrt_llm_bls/1/__pycache__/model.cpython-310.pyc +0 -0
- tensorrt_llm_bls/1/lib/__pycache__/decode.cpython-310.pyc +0 -0
- tensorrt_llm_bls/1/lib/__pycache__/triton_decoder.cpython-310.pyc +0 -0
postprocessing/1/__pycache__/model.cpython-310.pyc
CHANGED
Binary files a/postprocessing/1/__pycache__/model.cpython-310.pyc and b/postprocessing/1/__pycache__/model.cpython-310.pyc differ
|
|
preprocessing/1/__pycache__/model.cpython-310.pyc
CHANGED
Binary files a/preprocessing/1/__pycache__/model.cpython-310.pyc and b/preprocessing/1/__pycache__/model.cpython-310.pyc differ
|
|
tensorrt_llm/1/config.json
CHANGED
@@ -28,9 +28,9 @@
|
|
28 |
"mapping": {
|
29 |
"world_size": 2,
|
30 |
"gpus_per_node": 8,
|
31 |
-
"tp_size":
|
32 |
-
"pp_size":
|
33 |
-
"moe_tp_size":
|
34 |
"moe_ep_size": 1
|
35 |
},
|
36 |
"quantization": {
|
@@ -50,11 +50,11 @@
|
|
50 |
},
|
51 |
"build_config": {
|
52 |
"max_input_len": 28000,
|
53 |
-
"max_seq_len":
|
54 |
"opt_batch_size": null,
|
55 |
"max_batch_size": 16,
|
56 |
"max_beam_width": 1,
|
57 |
-
"max_num_tokens":
|
58 |
"opt_num_tokens": 16,
|
59 |
"max_prompt_embedding_table_size": 0,
|
60 |
"gather_context_logits": false,
|
|
|
28 |
"mapping": {
|
29 |
"world_size": 2,
|
30 |
"gpus_per_node": 8,
|
31 |
+
"tp_size": 2,
|
32 |
+
"pp_size": 1,
|
33 |
+
"moe_tp_size": 2,
|
34 |
"moe_ep_size": 1
|
35 |
},
|
36 |
"quantization": {
|
|
|
50 |
},
|
51 |
"build_config": {
|
52 |
"max_input_len": 28000,
|
53 |
+
"max_seq_len": 32000,
|
54 |
"opt_batch_size": null,
|
55 |
"max_batch_size": 16,
|
56 |
"max_beam_width": 1,
|
57 |
+
"max_num_tokens": 32000,
|
58 |
"opt_num_tokens": 16,
|
59 |
"max_prompt_embedding_table_size": 0,
|
60 |
"gather_context_logits": false,
|
tensorrt_llm/1/rank0.engine
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b03d07bc220139d071a7d50dd42a7c67235601b1d28a2aea79db0f65ea8150b4
|
3 |
+
size 46857284148
|
tensorrt_llm/1/rank1.engine
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1397dbb8fc710907448a5c58da6c17004b8b8fa398780b1e593b383e6b150b6f
|
3 |
+
size 46857271996
|
tensorrt_llm_bls/1/__pycache__/model.cpython-310.pyc
CHANGED
Binary files a/tensorrt_llm_bls/1/__pycache__/model.cpython-310.pyc and b/tensorrt_llm_bls/1/__pycache__/model.cpython-310.pyc differ
|
|
tensorrt_llm_bls/1/lib/__pycache__/decode.cpython-310.pyc
CHANGED
Binary files a/tensorrt_llm_bls/1/lib/__pycache__/decode.cpython-310.pyc and b/tensorrt_llm_bls/1/lib/__pycache__/decode.cpython-310.pyc differ
|
|
tensorrt_llm_bls/1/lib/__pycache__/triton_decoder.cpython-310.pyc
CHANGED
Binary files a/tensorrt_llm_bls/1/lib/__pycache__/triton_decoder.cpython-310.pyc and b/tensorrt_llm_bls/1/lib/__pycache__/triton_decoder.cpython-310.pyc differ
|
|