Update tensorrt_llm/config.pbtxt
Browse files
update model path and kv cache memory utilization
tensorrt_llm/config.pbtxt
CHANGED
@@ -382,7 +382,7 @@ parameters: {
|
|
382 |
parameters: {
|
383 |
key: "gpt_model_path"
|
384 |
value: {
|
385 |
-
string_value: "/
|
386 |
}
|
387 |
}
|
388 |
parameters: {
|
@@ -418,7 +418,7 @@ parameters: {
|
|
418 |
parameters: {
|
419 |
key: "kv_cache_free_gpu_mem_fraction"
|
420 |
value: {
|
421 |
-
string_value: "0.
|
422 |
}
|
423 |
}
|
424 |
parameters: {
|
|
|
382 |
parameters: {
|
383 |
key: "gpt_model_path"
|
384 |
value: {
|
385 |
+
string_value: "/data/llama/model_repository/tensorrt_llm/1"
|
386 |
}
|
387 |
}
|
388 |
parameters: {
|
|
|
418 |
parameters: {
|
419 |
key: "kv_cache_free_gpu_mem_fraction"
|
420 |
value: {
|
421 |
+
string_value: "0.9"
|
422 |
}
|
423 |
}
|
424 |
parameters: {
|