Skip to content

Commit 8250179

Browse files
committed
Merge branch 'main' into lluo/save_remove_inputs
2 parents 076f47a + e2a27a0 commit 8250179

File tree

183 files changed

+2945
-722
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

183 files changed

+2945
-722
lines changed

core/runtime/TRTEngine.cpp

Lines changed: 38 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -89,6 +89,12 @@ TRTEngine::TRTEngine(
8989
cuda_engine = make_trt(rt->deserializeCudaEngine(serialized_engine.c_str(), serialized_engine.size()));
9090
TORCHTRT_CHECK((cuda_engine.get() != nullptr), "Unable to deserialize the TensorRT engine");
9191

92+
if (get_streamable_device_memory_budget() > 0) {
93+
int64_t budget_bytes = get_automatic_device_memory_budget();
94+
LOG_DEBUG("Weight streaming budget set to " << budget_bytes << "B");
95+
cuda_engine->setWeightStreamingBudgetV2(budget_bytes);
96+
}
97+
9298
exec_ctx = make_trt(cuda_engine->createExecutionContext());
9399
TORCHTRT_CHECK((exec_ctx.get() != nullptr), "Unable to create TensorRT execution context");
94100

@@ -258,6 +264,38 @@ void TRTEngine::set_profiling_paths() {
258264
cuda_graph_debug_path = std::filesystem::path{profile_path_prefix + "/" + name + "_cudagraph.dot"}.string();
259265
}
260266

267+
int64_t TRTEngine::get_device_memory_budget() {
268+
return cuda_engine->getWeightStreamingBudgetV2();
269+
}
270+
271+
bool TRTEngine::set_device_memory_budget(int64_t budget) {
272+
// Recreating the context because weight streaming budget cannot be modified while there are active context.
273+
if (exec_ctx.get() != nullptr) {
274+
exec_ctx.reset();
275+
}
276+
if (profile_execution) {
277+
trt_engine_profiler.reset();
278+
}
279+
bool result = cuda_engine->setWeightStreamingBudgetV2(budget);
280+
exec_ctx = make_trt(cuda_engine->createExecutionContext());
281+
TORCHTRT_CHECK(
282+
(exec_ctx.get() != nullptr),
283+
"Unable to recreate TensorRT execution context after setting new device memory budget");
284+
if (profile_execution) {
285+
enable_profiling();
286+
}
287+
return result;
288+
}
289+
290+
// Returns 0 if BuilderFlag::kWEIGHT_STREAMING is unset during engine building.
291+
int64_t TRTEngine::get_streamable_device_memory_budget() {
292+
return cuda_engine->getStreamableWeightsSize();
293+
}
294+
295+
int64_t TRTEngine::get_automatic_device_memory_budget() {
296+
return cuda_engine->getWeightStreamingAutomaticBudget();
297+
}
298+
261299
std::string TRTEngine::to_str() const {
262300
// clang-format off
263301
std::stringstream ss;

core/runtime/TRTEngine.h

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -71,6 +71,10 @@ struct TRTEngine : torch::CustomClassHolder {
7171
std::string get_engine_layer_info();
7272
void dump_engine_layer_info_to_file(const std::string& path);
7373
void dump_engine_layer_info();
74+
int64_t get_device_memory_budget();
75+
bool set_device_memory_budget(int64_t budget);
76+
int64_t get_streamable_device_memory_budget();
77+
int64_t get_automatic_device_memory_budget();
7478
friend std::ostream& operator<<(std::ostream& os, const TRTEngine& engine);
7579
static const char BINDING_DELIM = '%';
7680

core/runtime/register_jit_hooks.cpp

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -86,6 +86,12 @@ static auto TORCHTRT_UNUSED TRTEngineTSRegistrtion =
8686
.def("dump_engine_layer_info_to_file", &TRTEngine::dump_engine_layer_info_to_file)
8787
.def("dump_engine_layer_info", &TRTEngine::dump_engine_layer_info)
8888
.def("get_engine_layer_info", &TRTEngine::get_engine_layer_info)
89+
.def_property(
90+
"device_memory_budget",
91+
&TRTEngine::get_device_memory_budget,
92+
&TRTEngine::set_device_memory_budget)
93+
.def_property("streamable_device_memory_budget", &TRTEngine::get_streamable_device_memory_budget)
94+
.def_property("automatic_device_memory_budget", &TRTEngine::get_automatic_device_memory_budget)
8995
.def_pickle(
9096
[](const c10::intrusive_ptr<TRTEngine>& self) -> std::vector<std::string> {
9197
// Serialize TensorRT engine

docs/_cpp_api/classtorch__tensorrt_1_1DataType.html

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010

1111
<meta name="viewport" content="width=device-width, initial-scale=1.0">
1212

13-
<title>Class DataType &mdash; Torch-TensorRT v2.6.0.dev0+b99d080 documentation</title>
13+
<title>Class DataType &mdash; Torch-TensorRT v2.6.0.dev0+2840531 documentation</title>
1414

1515

1616

@@ -275,7 +275,7 @@
275275

276276

277277
<div class="version">
278-
v2.6.0.dev0+b99d080
278+
v2.6.0.dev0+2840531
279279
</div>
280280

281281

@@ -330,6 +330,7 @@
330330
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/converter_overloading.html">Overloading Torch-TensorRT Converters with Custom Converters</a></li>
331331
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/custom_kernel_plugins.html">Using Custom Kernels within TensorRT Engines with Torch-TensorRT</a></li>
332332
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/mutable_torchtrt_module_example.html">Mutable Torch TensorRT Module</a></li>
333+
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/weight_streaming_example.html">Weight Streaming</a></li>
333334
</ul>
334335
<p class="caption" role="heading"><span class="caption-text">Dynamo Frontend</span></p>
335336
<ul>

docs/_cpp_api/classtorch__tensorrt_1_1Device_1_1DeviceType.html

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010

1111
<meta name="viewport" content="width=device-width, initial-scale=1.0">
1212

13-
<title>Class Device::DeviceType &mdash; Torch-TensorRT v2.6.0.dev0+b99d080 documentation</title>
13+
<title>Class Device::DeviceType &mdash; Torch-TensorRT v2.6.0.dev0+2840531 documentation</title>
1414

1515

1616

@@ -275,7 +275,7 @@
275275

276276

277277
<div class="version">
278-
v2.6.0.dev0+b99d080
278+
v2.6.0.dev0+2840531
279279
</div>
280280

281281

@@ -330,6 +330,7 @@
330330
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/converter_overloading.html">Overloading Torch-TensorRT Converters with Custom Converters</a></li>
331331
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/custom_kernel_plugins.html">Using Custom Kernels within TensorRT Engines with Torch-TensorRT</a></li>
332332
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/mutable_torchtrt_module_example.html">Mutable Torch TensorRT Module</a></li>
333+
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/weight_streaming_example.html">Weight Streaming</a></li>
333334
</ul>
334335
<p class="caption" role="heading"><span class="caption-text">Dynamo Frontend</span></p>
335336
<ul>

docs/_cpp_api/classtorch__tensorrt_1_1TensorFormat.html

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010

1111
<meta name="viewport" content="width=device-width, initial-scale=1.0">
1212

13-
<title>Class TensorFormat &mdash; Torch-TensorRT v2.6.0.dev0+b99d080 documentation</title>
13+
<title>Class TensorFormat &mdash; Torch-TensorRT v2.6.0.dev0+2840531 documentation</title>
1414

1515

1616

@@ -275,7 +275,7 @@
275275

276276

277277
<div class="version">
278-
v2.6.0.dev0+b99d080
278+
v2.6.0.dev0+2840531
279279
</div>
280280

281281

@@ -330,6 +330,7 @@
330330
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/converter_overloading.html">Overloading Torch-TensorRT Converters with Custom Converters</a></li>
331331
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/custom_kernel_plugins.html">Using Custom Kernels within TensorRT Engines with Torch-TensorRT</a></li>
332332
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/mutable_torchtrt_module_example.html">Mutable Torch TensorRT Module</a></li>
333+
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/weight_streaming_example.html">Weight Streaming</a></li>
333334
</ul>
334335
<p class="caption" role="heading"><span class="caption-text">Dynamo Frontend</span></p>
335336
<ul>

docs/_cpp_api/classtorch__tensorrt_1_1ptq_1_1Int8CacheCalibrator.html

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010

1111
<meta name="viewport" content="width=device-width, initial-scale=1.0">
1212

13-
<title>Template Class Int8CacheCalibrator &mdash; Torch-TensorRT v2.6.0.dev0+b99d080 documentation</title>
13+
<title>Template Class Int8CacheCalibrator &mdash; Torch-TensorRT v2.6.0.dev0+2840531 documentation</title>
1414

1515

1616

@@ -275,7 +275,7 @@
275275

276276

277277
<div class="version">
278-
v2.6.0.dev0+b99d080
278+
v2.6.0.dev0+2840531
279279
</div>
280280

281281

@@ -330,6 +330,7 @@
330330
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/converter_overloading.html">Overloading Torch-TensorRT Converters with Custom Converters</a></li>
331331
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/custom_kernel_plugins.html">Using Custom Kernels within TensorRT Engines with Torch-TensorRT</a></li>
332332
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/mutable_torchtrt_module_example.html">Mutable Torch TensorRT Module</a></li>
333+
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/weight_streaming_example.html">Weight Streaming</a></li>
333334
</ul>
334335
<p class="caption" role="heading"><span class="caption-text">Dynamo Frontend</span></p>
335336
<ul>

docs/_cpp_api/classtorch__tensorrt_1_1ptq_1_1Int8Calibrator.html

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010

1111
<meta name="viewport" content="width=device-width, initial-scale=1.0">
1212

13-
<title>Template Class Int8Calibrator &mdash; Torch-TensorRT v2.6.0.dev0+b99d080 documentation</title>
13+
<title>Template Class Int8Calibrator &mdash; Torch-TensorRT v2.6.0.dev0+2840531 documentation</title>
1414

1515

1616

@@ -275,7 +275,7 @@
275275

276276

277277
<div class="version">
278-
v2.6.0.dev0+b99d080
278+
v2.6.0.dev0+2840531
279279
</div>
280280

281281

@@ -330,6 +330,7 @@
330330
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/converter_overloading.html">Overloading Torch-TensorRT Converters with Custom Converters</a></li>
331331
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/custom_kernel_plugins.html">Using Custom Kernels within TensorRT Engines with Torch-TensorRT</a></li>
332332
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/mutable_torchtrt_module_example.html">Mutable Torch TensorRT Module</a></li>
333+
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/weight_streaming_example.html">Weight Streaming</a></li>
333334
</ul>
334335
<p class="caption" role="heading"><span class="caption-text">Dynamo Frontend</span></p>
335336
<ul>

docs/_cpp_api/define_macros_8h_1a18d295a837ac71add5578860b55e5502.html

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010

1111
<meta name="viewport" content="width=device-width, initial-scale=1.0">
1212

13-
<title>Define STR &mdash; Torch-TensorRT v2.6.0.dev0+b99d080 documentation</title>
13+
<title>Define STR &mdash; Torch-TensorRT v2.6.0.dev0+2840531 documentation</title>
1414

1515

1616

@@ -275,7 +275,7 @@
275275

276276

277277
<div class="version">
278-
v2.6.0.dev0+b99d080
278+
v2.6.0.dev0+2840531
279279
</div>
280280

281281

@@ -330,6 +330,7 @@
330330
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/converter_overloading.html">Overloading Torch-TensorRT Converters with Custom Converters</a></li>
331331
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/custom_kernel_plugins.html">Using Custom Kernels within TensorRT Engines with Torch-TensorRT</a></li>
332332
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/mutable_torchtrt_module_example.html">Mutable Torch TensorRT Module</a></li>
333+
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/weight_streaming_example.html">Weight Streaming</a></li>
333334
</ul>
334335
<p class="caption" role="heading"><span class="caption-text">Dynamo Frontend</span></p>
335336
<ul>

docs/_cpp_api/define_macros_8h_1a282fd3c0b1c3a215148ae372070e1268.html

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010

1111
<meta name="viewport" content="width=device-width, initial-scale=1.0">
1212

13-
<title>Define TORCH_TENSORRT_PATCH_VERSION &mdash; Torch-TensorRT v2.6.0.dev0+b99d080 documentation</title>
13+
<title>Define TORCH_TENSORRT_PATCH_VERSION &mdash; Torch-TensorRT v2.6.0.dev0+2840531 documentation</title>
1414

1515

1616

@@ -275,7 +275,7 @@
275275

276276

277277
<div class="version">
278-
v2.6.0.dev0+b99d080
278+
v2.6.0.dev0+2840531
279279
</div>
280280

281281

@@ -330,6 +330,7 @@
330330
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/converter_overloading.html">Overloading Torch-TensorRT Converters with Custom Converters</a></li>
331331
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/custom_kernel_plugins.html">Using Custom Kernels within TensorRT Engines with Torch-TensorRT</a></li>
332332
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/mutable_torchtrt_module_example.html">Mutable Torch TensorRT Module</a></li>
333+
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/weight_streaming_example.html">Weight Streaming</a></li>
333334
</ul>
334335
<p class="caption" role="heading"><span class="caption-text">Dynamo Frontend</span></p>
335336
<ul>

docs/_cpp_api/define_macros_8h_1a31398a6d4d27e28817afb0f0139e909e.html

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010

1111
<meta name="viewport" content="width=device-width, initial-scale=1.0">
1212

13-
<title>Define TORCH_TENSORRT_MAJOR_VERSION &mdash; Torch-TensorRT v2.6.0.dev0+b99d080 documentation</title>
13+
<title>Define TORCH_TENSORRT_MAJOR_VERSION &mdash; Torch-TensorRT v2.6.0.dev0+2840531 documentation</title>
1414

1515

1616

@@ -275,7 +275,7 @@
275275

276276

277277
<div class="version">
278-
v2.6.0.dev0+b99d080
278+
v2.6.0.dev0+2840531
279279
</div>
280280

281281

@@ -330,6 +330,7 @@
330330
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/converter_overloading.html">Overloading Torch-TensorRT Converters with Custom Converters</a></li>
331331
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/custom_kernel_plugins.html">Using Custom Kernels within TensorRT Engines with Torch-TensorRT</a></li>
332332
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/mutable_torchtrt_module_example.html">Mutable Torch TensorRT Module</a></li>
333+
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/weight_streaming_example.html">Weight Streaming</a></li>
333334
</ul>
334335
<p class="caption" role="heading"><span class="caption-text">Dynamo Frontend</span></p>
335336
<ul>

docs/_cpp_api/define_macros_8h_1a35703561b26b1a9d2738ad7d58b27827.html

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010

1111
<meta name="viewport" content="width=device-width, initial-scale=1.0">
1212

13-
<title>Define TORCH_TENSORRT_MINOR_VERSION &mdash; Torch-TensorRT v2.6.0.dev0+b99d080 documentation</title>
13+
<title>Define TORCH_TENSORRT_MINOR_VERSION &mdash; Torch-TensorRT v2.6.0.dev0+2840531 documentation</title>
1414

1515

1616

@@ -275,7 +275,7 @@
275275

276276

277277
<div class="version">
278-
v2.6.0.dev0+b99d080
278+
v2.6.0.dev0+2840531
279279
</div>
280280

281281

@@ -330,6 +330,7 @@
330330
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/converter_overloading.html">Overloading Torch-TensorRT Converters with Custom Converters</a></li>
331331
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/custom_kernel_plugins.html">Using Custom Kernels within TensorRT Engines with Torch-TensorRT</a></li>
332332
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/mutable_torchtrt_module_example.html">Mutable Torch TensorRT Module</a></li>
333+
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/weight_streaming_example.html">Weight Streaming</a></li>
333334
</ul>
334335
<p class="caption" role="heading"><span class="caption-text">Dynamo Frontend</span></p>
335336
<ul>

docs/_cpp_api/define_macros_8h_1abd1465eb38256d3f22cc1426b23d516b.html

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010

1111
<meta name="viewport" content="width=device-width, initial-scale=1.0">
1212

13-
<title>Define TORCHTRT_API &mdash; Torch-TensorRT v2.6.0.dev0+b99d080 documentation</title>
13+
<title>Define TORCHTRT_API &mdash; Torch-TensorRT v2.6.0.dev0+2840531 documentation</title>
1414

1515

1616

@@ -275,7 +275,7 @@
275275

276276

277277
<div class="version">
278-
v2.6.0.dev0+b99d080
278+
v2.6.0.dev0+2840531
279279
</div>
280280

281281

@@ -330,6 +330,7 @@
330330
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/converter_overloading.html">Overloading Torch-TensorRT Converters with Custom Converters</a></li>
331331
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/custom_kernel_plugins.html">Using Custom Kernels within TensorRT Engines with Torch-TensorRT</a></li>
332332
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/mutable_torchtrt_module_example.html">Mutable Torch TensorRT Module</a></li>
333+
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/weight_streaming_example.html">Weight Streaming</a></li>
333334
</ul>
334335
<p class="caption" role="heading"><span class="caption-text">Dynamo Frontend</span></p>
335336
<ul>

docs/_cpp_api/define_macros_8h_1abe87b341f562fd1cf40b7672e4d759da.html

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010

1111
<meta name="viewport" content="width=device-width, initial-scale=1.0">
1212

13-
<title>Define XSTR &mdash; Torch-TensorRT v2.6.0.dev0+b99d080 documentation</title>
13+
<title>Define XSTR &mdash; Torch-TensorRT v2.6.0.dev0+2840531 documentation</title>
1414

1515

1616

@@ -275,7 +275,7 @@
275275

276276

277277
<div class="version">
278-
v2.6.0.dev0+b99d080
278+
v2.6.0.dev0+2840531
279279
</div>
280280

281281

@@ -330,6 +330,7 @@
330330
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/converter_overloading.html">Overloading Torch-TensorRT Converters with Custom Converters</a></li>
331331
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/custom_kernel_plugins.html">Using Custom Kernels within TensorRT Engines with Torch-TensorRT</a></li>
332332
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/mutable_torchtrt_module_example.html">Mutable Torch TensorRT Module</a></li>
333+
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/weight_streaming_example.html">Weight Streaming</a></li>
333334
</ul>
334335
<p class="caption" role="heading"><span class="caption-text">Dynamo Frontend</span></p>
335336
<ul>

docs/_cpp_api/define_macros_8h_1ad19939408f7be171a74a89928b36eb59.html

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010

1111
<meta name="viewport" content="width=device-width, initial-scale=1.0">
1212

13-
<title>Define TORCHTRT_HIDDEN &mdash; Torch-TensorRT v2.6.0.dev0+b99d080 documentation</title>
13+
<title>Define TORCHTRT_HIDDEN &mdash; Torch-TensorRT v2.6.0.dev0+2840531 documentation</title>
1414

1515

1616

@@ -275,7 +275,7 @@
275275

276276

277277
<div class="version">
278-
v2.6.0.dev0+b99d080
278+
v2.6.0.dev0+2840531
279279
</div>
280280

281281

@@ -330,6 +330,7 @@
330330
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/converter_overloading.html">Overloading Torch-TensorRT Converters with Custom Converters</a></li>
331331
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/custom_kernel_plugins.html">Using Custom Kernels within TensorRT Engines with Torch-TensorRT</a></li>
332332
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/mutable_torchtrt_module_example.html">Mutable Torch TensorRT Module</a></li>
333+
<li class="toctree-l1"><a class="reference internal" href="../tutorials/_rendered_examples/dynamo/weight_streaming_example.html">Weight Streaming</a></li>
333334
</ul>
334335
<p class="caption" role="heading"><span class="caption-text">Dynamo Frontend</span></p>
335336
<ul>

0 commit comments

Comments
 (0)