We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e709de8, commit 1abc47f (Copy full SHA for 1abc47f)
tests/fault_tolerance/cancellation/test_trtllm.py
@@ -82,7 +82,7 @@ def __init__(
82
if mode != "prefill_and_decode":
83
with open("test_request_cancellation_trtllm_config.yaml", "w") as f:
84
f.write(
85
- "cache_transceiver_config:\n backend: DEFAULT\n max_tokens_in_buffer: 16384\n"
+ "cache_transceiver_config:\n backend: DEFAULT\n max_tokens_in_buffer: 32767\n"
86
)
87
f.write("disable_overlap_scheduler: true\n")
88
f.write("kv_cache_config:\n max_tokens: 16384\n")
0 commit comments