NovaSky-AI · CharlieFRuan · Feb 24, 2026 · Feb 24, 2026 · Feb 24, 2026 · Feb 24, 2026
diff --git a/skyrl-train/tests/gpu/gpu_ci/test_pause_and_continue_generation.py b/skyrl-train/tests/gpu/gpu_ci/test_pause_and_continue_generation.py
@@ -331,7 +331,7 @@ async def one_req(i: int):
                             "messages": convs[i],
                             **sampling_params,
                         }
-                        return await client.chat_completion({"json": body, "headers": {}})
+                        return await client.engines[0].chat_completion({"json": body, "headers": {}})
                     else:
                         # completions: prompt is a string
                         prompt_str = tokenizer.apply_chat_template(convs[i], add_generation_prompt=True, tokenize=False)
@@ -340,7 +340,7 @@ async def one_req(i: int):
                             "prompt": prompt_str,
                             **sampling_params,
                         }
-                        return await client.completion({"json": body, "headers": {}})
+                        return await client.engines[0].completion({"json": body, "headers": {}})
 
                 tasks = [asyncio.create_task(one_req(i)) for i in range(4)]
                 # Wait to let it run a bit, then pause generation

diff --git a/tests/backends/skyrl_train/gpu/gpu_ci/test_pause_and_continue_generation.py b/tests/backends/skyrl_train/gpu/gpu_ci/test_pause_and_continue_generation.py
@@ -331,7 +331,7 @@ async def one_req(i: int):
                             "messages": convs[i],
                             **sampling_params,
                         }
-                        return await client.chat_completion({"json": body, "headers": {}})
+                        return await client.engines[0].chat_completion({"json": body, "headers": {}})
                     else:
                         # completions: prompt is a string
                         prompt_str = tokenizer.apply_chat_template(convs[i], add_generation_prompt=True, tokenize=False)
@@ -340,7 +340,7 @@ async def one_req(i: int):
                             "prompt": prompt_str,
                             **sampling_params,
                         }
-                        return await client.completion({"json": body, "headers": {}})
+                        return await client.engines[0].completion({"json": body, "headers": {}})
 
                 tasks = [asyncio.create_task(one_req(i)) for i in range(4)]
                 # Wait to let it run a bit, then pause generation