diff --git a/frontend/server/src/main/java/org/pytorch/serve/wlm/ModelManager.java b/frontend/server/src/main/java/org/pytorch/serve/wlm/ModelManager.java index 28c9f9c698..4cc01972ce 100644 --- a/frontend/server/src/main/java/org/pytorch/serve/wlm/ModelManager.java +++ b/frontend/server/src/main/java/org/pytorch/serve/wlm/ModelManager.java @@ -278,6 +278,13 @@ private Model createModel( archive.getModelVersion(), Model.BATCH_SIZE, batchSize); + } else { + batchSize = + configManager.getJsonIntValue( + archive.getModelName(), + archive.getModelVersion(), + Model.BATCH_SIZE, + batchSize); } model.setBatchSize(batchSize); @@ -291,6 +298,13 @@ private Model createModel( archive.getModelVersion(), Model.MAX_BATCH_DELAY, maxBatchDelay); + } else { + maxBatchDelay = + configManager.getJsonIntValue( + archive.getModelName(), + archive.getModelVersion(), + Model.MAX_BATCH_DELAY, + maxBatchDelay); } model.setMaxBatchDelay(maxBatchDelay); @@ -304,6 +318,13 @@ private Model createModel( archive.getModelVersion(), Model.RESPONSE_TIMEOUT, responseTimeout); + } else { + responseTimeout = + configManager.getJsonIntValue( + archive.getModelName(), + archive.getModelVersion(), + Model.RESPONSE_TIMEOUT, + responseTimeout); } model.setResponseTimeout(responseTimeout); model.setWorkflowModel(isWorkflowModel);