Skip to content

Commit 1c1c87c

Browse files
committed
fix: Remove max_tokens_in_buffer
Signed-off-by: Jacky <[email protected]>
1 parent bff07b5 commit 1c1c87c

File tree

1 file changed

+1
-3
lines changed

1 file changed

+1
-3
lines changed

tests/fault_tolerance/cancellation/test_trtllm.py

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -55,9 +55,7 @@ def __init__(self, request, mode: str = "prefill_and_decode"):
         ]
         if mode != "prefill_and_decode":
             with open("test_request_cancellation_trtllm_config.yaml", "w") as f:
-                f.write(
-                    "cache_transceiver_config:\n backend: DEFAULT\n max_tokens_in_buffer: 16384\n"
-                )
+                f.write("cache_transceiver_config:\n backend: DEFAULT\n")
                 f.write("disable_overlap_scheduler: true\n")
             command += [
                 "--extra-engine-args",

0 commit comments

Comments
 (0)