|
28 | 28 | pytest.mark.gpu_1, |
29 | 29 | pytest.mark.e2e, |
30 | 30 | pytest.mark.model(FAULT_TOLERANCE_MODEL_NAME), |
31 | | - pytest.mark.parametrize("request_plane", ["nats", "tcp"], indirect=True), |
32 | 31 | pytest.mark.post_merge, # post_merge to pinpoint failure commit |
33 | 32 | ] |
34 | 33 |
|
@@ -112,6 +111,17 @@ def is_ready(self, response) -> bool: |
112 | 111 |
|
113 | 112 |
|
114 | 113 | @pytest.mark.timeout(290) # 3x average |
| 114 | +@pytest.mark.parametrize( |
| 115 | + "request_plane", |
| 116 | + [ |
| 117 | + "nats", |
| 118 | + pytest.param( |
| 119 | + "tcp", |
| 120 | + marks=pytest.mark.xfail(reason="Multi-worker TCP unstable", strict=False), |
| 121 | + ), |
| 122 | + ], |
| 123 | + indirect=True, |
| 124 | +) |
115 | 125 | def test_request_migration_trtllm_worker_failure( |
116 | 126 | request, runtime_services, set_ucx_tls_no_mm |
117 | 127 | ): |
@@ -156,6 +166,17 @@ def test_request_migration_trtllm_worker_failure( |
156 | 166 |
|
157 | 167 |
|
158 | 168 | @pytest.mark.skip(reason="TRT-LLM graceful shutdown not yet implemented") |
| 169 | +@pytest.mark.parametrize( |
| 170 | + "request_plane", |
| 171 | + [ |
| 172 | + "nats", |
| 173 | + pytest.param( |
| 174 | + "tcp", |
| 175 | + marks=pytest.mark.xfail(reason="Multi-worker TCP unstable", strict=False), |
| 176 | + ), |
| 177 | + ], |
| 178 | + indirect=True, |
| 179 | +) |
159 | 180 | def test_request_migration_trtllm_graceful_shutdown( |
160 | 181 | request, runtime_services, set_ucx_tls_no_mm |
161 | 182 | ): |
@@ -204,6 +225,17 @@ def test_request_migration_trtllm_graceful_shutdown( |
204 | 225 |
|
205 | 226 |
|
206 | 227 | @pytest.mark.timeout(185) # 3x average |
| 228 | +@pytest.mark.parametrize( |
| 229 | + "request_plane", |
| 230 | + [ |
| 231 | + "nats", |
| 232 | + pytest.param( |
| 233 | + "tcp", |
| 234 | + marks=pytest.mark.xfail(reason="Multi-worker TCP unstable", strict=False), |
| 235 | + ), |
| 236 | + ], |
| 237 | + indirect=True, |
| 238 | +) |
207 | 239 | def test_no_request_migration_trtllm_worker_failure( |
208 | 240 | request, runtime_services, set_ucx_tls_no_mm |
209 | 241 | ): |
@@ -264,6 +296,17 @@ def test_no_request_migration_trtllm_worker_failure( |
264 | 296 |
|
265 | 297 |
|
266 | 298 | @pytest.mark.skip(reason="TRT-LLM graceful shutdown not yet implemented") |
| 299 | +@pytest.mark.parametrize( |
| 300 | + "request_plane", |
| 301 | + [ |
| 302 | + "nats", |
| 303 | + pytest.param( |
| 304 | + "tcp", |
| 305 | + marks=pytest.mark.xfail(reason="Multi-worker TCP unstable", strict=False), |
| 306 | + ), |
| 307 | + ], |
| 308 | + indirect=True, |
| 309 | +) |
267 | 310 | def test_no_request_migration_trtllm_graceful_shutdown( |
268 | 311 | request, runtime_services, set_ucx_tls_no_mm |
269 | 312 | ): |
|
0 commit comments