[https://nvbugs/5409416][fix] test_openai_multi_chat_example (#7174)

Linda-Stadter · yuanjingx87 · commit 4bb01ce0a95c · 2025-08-27T18:35:35.000-07:00
Signed-off-by: Linda-Stadter <57756729+Linda-Stadter@users.noreply.github.com>
diff --git a/tests/unittest/llmapi/apps/_test_openai_multi_chat.py b/tests/unittest/llmapi/apps/_test_openai_multi_chat.py
@@ -65,7 +65,10 @@ def engine_from_fp8_quantization(model_name):
 @pytest.fixture(scope="module")
 def server(model_name: str, engine_from_fp8_quantization: str):
     model_path = get_model_path(model_name)
-    args = ["--tp_size", "2", "--tokenizer", model_path]
+    args = [
+        "--tp_size", "2", "--tokenizer", model_path, "--backend", "trt",
+        "--max_num_tokens", "20480", "--max_batch_size", "128"
+    ]
     with RemoteOpenAIServer(engine_from_fp8_quantization,
                             args) as remote_server:
         yield remote_server