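Fixed a bug due to shape_change: the persistent input buffer (C++ runtime) and the input shape (Python runtime) are now also set on first execution, i.e. when no outputs have been allocated yet, and not only when a CUDA graph needs to be recorded.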

cehongwang · cehongwang · commit d36494ac01cd · 2025-12-17T23:00:36.000Z
diff --git a/core/runtime/execute_engine.cpp b/core/runtime/execute_engine.cpp
@@ -141,7 +141,7 @@ void setup_input_tensors(
       at::Tensor contig_input = inputs[i].view(shape).contiguous();
       formatted_inputs.emplace_back(std::move(contig_input));
 
-      if (need_cudagraphs_record) {
+      if (need_cudagraphs_record or compiled_engine->allocated_outputs.size() == 0) {
         // Create a new persistent input buffer
         compiled_engine->input_buffers[i] = std::move(formatted_inputs.back().clone());
       }
diff --git a/py/torch_tensorrt/dynamo/runtime/_PythonTorchTensorRTModule.py b/py/torch_tensorrt/dynamo/runtime/_PythonTorchTensorRTModule.py
@@ -417,7 +417,9 @@ def setup_input_tensors(
                 inputs_cpu = contiguous_inputs[i].cpu().to(torch.int64).numpy().copy()
                 self.context.set_tensor_address(input_name, inputs_cpu.ctypes.data)
             else:
-                if need_cudagraphs_record:
+                if (
+                    need_cudagraphs_record or self.output_tensors is None
+                ):  # First time execution:
                     self.context.set_input_shape(
                         input_name, tuple(contiguous_inputs[i].shape)
                     )

Original file line number	Diff line number	Diff line change
`@@ -141,7 +141,7 @@ void setup_input_tensors(`
`141`	`141`	`at::Tensor contig_input = inputs[i].view(shape).contiguous();`
`142`	`142`	`formatted_inputs.emplace_back(std::move(contig_input));`
`143`	`143`
`144`		`- if (need_cudagraphs_record) {`
	`144`	`+ if (need_cudagraphs_record or compiled_engine->allocated_outputs.size() == 0) {`
`145`	`145`	`// Create a new persistent input buffer`
`146`	`146`	`compiled_engine->input_buffers[i] = std::move(formatted_inputs.back().clone());`
`147`	`147`	`}`