Update README.md
Browse files
README.md
CHANGED
@@ -88,7 +88,8 @@ from vllm import LLM, SamplingParams
|
|
88 |
llm = LLM(
|
89 |
model='MediaTek-Research/Breeze-7B-FC-v1_0',
|
90 |
tensor_parallel_size=num_gpu, # number of gpus
|
91 |
-
gpu_memory_utilization=0.7
|
|
|
92 |
)
|
93 |
|
94 |
turn_end_token_id = 61876 # <|im_end|>
|
|
|
88 |
llm = LLM(
|
89 |
model='MediaTek-Research/Breeze-7B-FC-v1_0',
|
90 |
tensor_parallel_size=num_gpu, # number of gpus
|
91 |
+
gpu_memory_utilization=0.7,
|
92 |
+
dtype='half'
|
93 |
)
|
94 |
|
95 |
turn_end_token_id = 61876 # <|im_end|>
|