Skip to content

Commit 090f987

Browse files
committed
tmp: Test with reduced max token while keeping context length
Signed-off-by: Jacky <[email protected]>
1 parent 85621a2 commit 090f987

File tree

2 files changed

+5 -5 lines changed

2 files changed

+5 -5 lines changed

tests/fault_tolerance/cancellation/test_trtllm.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -35,7 +35,7 @@
3535
pytest.mark.gpu_1,
3636
pytest.mark.e2e,
3737
pytest.mark.model(FAULT_TOLERANCE_MODEL_NAME),
38-
pytest.mark.post_merge, # post_merge to pinpoint failure commit
38+
pytest.mark.pre_merge, # post_merge to pinpoint failure commit
3939
pytest.mark.parametrize("request_plane", ["nats", "tcp"], indirect=True),
4040
]
4141

@@ -428,7 +428,7 @@ def test_request_cancellation_trtllm_prefill_cancel(
428428
)
429429

430430

431-
@pytest.mark.xfail(reason="Test fails only on CI", strict=False)
431+
# @pytest.mark.xfail(reason="Test fails only on CI", strict=False)
432432
@pytest.mark.timeout(195) # 3x average
433433
def test_request_cancellation_trtllm_kv_transfer_cancel(
434434
request, runtime_services_dynamic_ports, predownload_models

tests/fault_tolerance/cancellation/utils.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -281,11 +281,11 @@ def send_cancellable_request(
281281
prompt += " Make sure it is" + " long" * 16000 + "!"
282282

283283
if request_type == "completion":
284-
return send_completion_request(prompt, 16384, frontend_port)
284+
return send_completion_request(prompt, 16000, frontend_port)
285285
elif request_type == "chat_completion":
286-
return send_chat_completion_request(prompt, 16384, frontend_port, stream=False)
286+
return send_chat_completion_request(prompt, 16000, frontend_port, stream=False)
287287
elif request_type == "chat_completion_stream":
288-
return send_chat_completion_request(prompt, 16384, frontend_port, stream=True)
288+
return send_chat_completion_request(prompt, 16000, frontend_port, stream=True)
289289
else:
290290
raise ValueError(f"Unknown request type: {request_type}")
291291

0 commit comments

Comments
 (0)