44import torch_tensorrt
55from functools import partial
66
7- from typing import Any , Sequence
7+ from typing import Any , Optional , Sequence
88from torch_tensorrt import EngineCapability , Device
99from torch_tensorrt .fx .utils import LowerPrecision
1010
1717 WORKSPACE_SIZE ,
1818 MIN_BLOCK_SIZE ,
1919 PASS_THROUGH_BUILD_FAILURES ,
20+ MAX_AUX_STREAMS ,
21+ VERSION_COMPATIBLE ,
22+ OPTIMIZATION_LEVEL ,
2023 USE_EXPERIMENTAL_RT ,
2124)
2225
@@ -46,6 +49,9 @@ def compile(
4649 min_block_size = MIN_BLOCK_SIZE ,
4750 torch_executed_ops = [],
4851 torch_executed_modules = [],
52+ max_aux_streams = MAX_AUX_STREAMS ,
53+ version_compatible = VERSION_COMPATIBLE ,
54+ optimization_level = OPTIMIZATION_LEVEL ,
4955 use_experimental_rt = USE_EXPERIMENTAL_RT ,
5056 ** kwargs ,
5157):
@@ -93,6 +99,9 @@ def compile(
9399 workspace_size = workspace_size ,
94100 min_block_size = min_block_size ,
95101 torch_executed_ops = torch_executed_ops ,
102+ max_aux_streams = max_aux_streams ,
103+ version_compatible = version_compatible ,
104+ optimization_level = optimization_level ,
96105 use_experimental_rt = use_experimental_rt ,
97106 ** kwargs ,
98107 )
@@ -117,6 +126,9 @@ def create_backend(
117126 min_block_size : int = MIN_BLOCK_SIZE ,
118127 torch_executed_ops : Sequence [str ] = set (),
119128 pass_through_build_failures : bool = PASS_THROUGH_BUILD_FAILURES ,
129+ max_aux_streams : Optional [int ] = MAX_AUX_STREAMS ,
130+ version_compatible : bool = VERSION_COMPATIBLE ,
131+ optimization_level : Optional [int ] = OPTIMIZATION_LEVEL ,
120132 use_experimental_rt : bool = USE_EXPERIMENTAL_RT ,
121133 ** kwargs ,
122134):
@@ -129,6 +141,10 @@ def create_backend(
129141 min_block_size: Minimum number of operators per TRT-Engine Block
130142 torch_executed_ops: Sequence of operations to run in Torch, regardless of converter coverage
131143 pass_through_build_failures: Whether to fail on TRT engine build errors (True) or not (False)
144+ max_aux_streams: Maximum number of allowed auxiliary TRT streams for each engine
145+ version_compatible: Provide version forward-compatibility for engine plan files
146+ optimization_level: Builder optimization 0-5, higher levels imply longer build time,
147+ searching for more optimization options. TRT defaults to 3
132148 use_experimental_rt: Whether to use the new experimental TRTModuleNext for TRT engines
133149 Returns:
134150 Backend for torch.compile
@@ -143,6 +159,9 @@ def create_backend(
143159 min_block_size = min_block_size ,
144160 torch_executed_ops = torch_executed_ops ,
145161 pass_through_build_failures = pass_through_build_failures ,
162+ max_aux_streams = max_aux_streams ,
163+ version_compatible = version_compatible ,
164+ optimization_level = optimization_level ,
146165 use_experimental_rt = use_experimental_rt ,
147166 )
148167
0 commit comments