You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboard. Expand all lines: tensorrt_llm/llmapi/llm_args.py
+15 -1. Lines changed: 15 additions & 1 deletion
Original file line number
Diff line number
Diff line change
@@ -2098,6 +2098,12 @@ class TorchLlmArgs(BaseLlmArgs):
2098
2098
description="Print iteration logs.",
2099
2099
status="beta")
2100
2100
2101
+
batch_wait_timeout_ms: float=Field(
2102
+
default=0,
2103
+
description=
2104
+
"If greater than 0, the request queue might wait up to batch_wait_timeout_ms to receive max_batch_size requests, if fewer than max_batch_size requests are currently available. If 0, no waiting occurs.",
0 commit comments