Skip to content

Commit

Permalink
Set max_batch_size to match model's max_batch_size
Browse files (browse the repository at this point in the history)
  • Loading branch information
dagardner-nv committed Jan 12, 2024
1 parent f6eaab4 commit a973eb2
Show file tree
Hide file tree
Showing 2 changed files with 5 additions and 5 deletions.
4 changes: 2 additions & 2 deletions examples/llm/vdb_upload/run.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
-# Copyright (c) 2023, NVIDIA CORPORATION.
+# Copyright (c) 2023-2024, NVIDIA CORPORATION.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
Expand Down Expand Up @@ -46,7 +46,7 @@ def run():
)
@click.option(
"--model_max_batch_size",
-default=64,
+default=256,
type=click.IntRange(min=1),
help="Max batch size to use for the model",
)
Expand Down
6 changes: 3 additions & 3 deletions tests/llm/test_vdb_upload_pipe.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
-# SPDX-FileCopyrightText: Copyright (c) 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-FileCopyrightText: Copyright (c) 2023-2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
Expand Down Expand Up @@ -37,7 +37,7 @@
from morpheus.stages.preprocess.preprocess_nlp_stage import PreprocessNLPStage

EMBEDDING_SIZE = 384
-MODEL_MAX_BATCH_SIZE = 64
+MODEL_MAX_BATCH_SIZE = 256
MODEL_FEA_LENGTH = 512


Expand Down Expand Up @@ -116,7 +116,7 @@ def test_vdb_upload_pipe(mock_triton_client: mock.MagicMock,
"name": "output", "datatype": "FP32", "shape": [-1, EMBEDDING_SIZE]
}]
}
-mock_model_config = {"config": {"max_batch_size": 256}}
+mock_model_config = {"config": {"max_batch_size": MODEL_MAX_BATCH_SIZE}}

mock_triton_client.return_value = mock_triton_client
mock_triton_client.is_server_live.return_value = True
Expand Down

0 comments on commit a973eb2

Please sign in to comment.