We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a7b3254, commit ef2a8c4 (Copy full SHA for ef2a8c4)
wlm/src/main/java/ai/djl/serving/wlm/LmiConfigRecommender.java
@@ -87,7 +87,10 @@ private static void setRollingBatch(
87
lmiProperties.setProperty("option.rolling_batch", "disable");
88
return;
89
}
90
- String rollingBatch = lmiProperties.getProperty("option.rolling_batch", "auto");
+
91
+ String defaultRollingBatch = isTnxEnabled(features) ? "disable" : "auto";
92
+ String rollingBatch =
93
+ lmiProperties.getProperty("option.rolling_batch", defaultRollingBatch);
94
String modelType = modelConfig.getModelType();
95
if (!"auto".equals(rollingBatch)) {
96
0 commit comments