Skip to content

Commit 4bb01ce

Browse files
Linda-Stadter authored and yuanjingx87 committed
[https://nvbugs/5409416][fix] test_openai_multi_chat_example (#7174)
Signed-off-by: Linda-Stadter <57756729+Linda-Stadter@users.noreply.github.com>
1 parent a690eb2 commit 4bb01ce

File tree

1 file changed

+4
-1
lines changed

1 file changed

+4
-1
lines changed

tests/unittest/llmapi/apps/_test_openai_multi_chat.py

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -65,7 +65,10 @@ def engine_from_fp8_quantization(model_name):
 @pytest.fixture(scope="module")
 def server(model_name: str, engine_from_fp8_quantization: str):
     model_path = get_model_path(model_name)
-    args = ["--tp_size", "2", "--tokenizer", model_path]
+    args = [
+        "--tp_size", "2", "--tokenizer", model_path, "--backend", "trt",
+        "--max_num_tokens", "20480", "--max_batch_size", "128"
+    ]
     with RemoteOpenAIServer(engine_from_fp8_quantization,
                             args) as remote_server:
         yield remote_server

0 commit comments

Comments
 (0)