File tree Expand file tree Collapse file tree 1 file changed +2
-1
lines changed Expand file tree Collapse file tree 1 file changed +2
-1
lines changed Original file line number Diff line number Diff line change 1111from tensorrt_llm .executor .rpc import RPCClient
1212from tensorrt_llm .executor .rpc .rpc_common import get_unique_ipc_addr
1313from tensorrt_llm .executor .rpc_worker import RpcWorker
14- from tensorrt_llm .llmapi .llm_args import TorchLlmArgs
14+ from tensorrt_llm .llmapi .llm_args import KvCacheConfig , TorchLlmArgs
1515from tensorrt_llm .llmapi .mpi_session import MpiPoolSession
1616from tensorrt_llm .sampling_params import SamplingParams
1717
@@ -33,6 +33,7 @@ def setup_method(self):
3333 tensor_parallel_size = 1 ,
3434 backend = 'pytorch' ,
3535 enable_iter_perf_stats = True ,
36+ kv_cache_config = KvCacheConfig (free_gpu_memory_fraction = 0.5 , ),
3637 )
3738 self .pool , self .addr = self .create_worker_pool ()
3839 self .client = self .create_rpc_client (self .addr )
You can’t perform that action at this time.
0 commit comments