otherhalf-dev committed on
Commit
0dd86cd
·
verified ·
1 Parent(s): 7567662

Update tensorrt_llm/config.pbtxt

Browse files

Update gpt_model_path to the new model repository location and raise kv_cache_free_gpu_mem_fraction from 0.1 to 0.9.

Files changed (1) hide show
  1. tensorrt_llm/config.pbtxt +2 -2
tensorrt_llm/config.pbtxt CHANGED
@@ -382,7 +382,7 @@ parameters: {
382
  parameters: {
383
  key: "gpt_model_path"
384
  value: {
385
- string_value: "/all_models/inflight_batcher_llm/tensorrt_llm/1"
386
  }
387
  }
388
  parameters: {
@@ -418,7 +418,7 @@ parameters: {
418
  parameters: {
419
  key: "kv_cache_free_gpu_mem_fraction"
420
  value: {
421
- string_value: "0.1"
422
  }
423
  }
424
  parameters: {
 
382
  parameters: {
383
  key: "gpt_model_path"
384
  value: {
385
+ string_value: "/data/llama/model_repository/tensorrt_llm/1"
386
  }
387
  }
388
  parameters: {
 
418
  parameters: {
419
  key: "kv_cache_free_gpu_mem_fraction"
420
  value: {
421
+ string_value: "0.9"
422
  }
423
  }
424
  parameters: {