Skip to content

Commit a9a6923

Browse files
Speed up generation time a tiny bit.
1 parent f0c52f4 commit a9a6923

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

pyproject.toml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
1  1    [project]
2  2    name = "comfyui_tensorrt"
3  3    description = "TensorRT Node for ComfyUI\nThis node enables the best performance on NVIDIA RTX™ Graphics Cards (GPUs) for Stable Diffusion by leveraging NVIDIA TensorRT."
4     - version = "0.1.2"
   4  + version = "0.1.3"
5  5    license = "LICENSE"
6  6    dependencies = [
7  7    "tensorrt>=10.0.1",

tensorrt_loader.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -96,7 +96,7 @@ def __call__(self, x, timesteps, context, y=None, control=None, transformer_opti
96  96     x = model_inputs_converted[k]
97  97     self.context.set_tensor_address(k, x[(x.shape[0] // curr_split_batch) * i:].data_ptr())
98  98     self.context.execute_async_v3(stream_handle=stream.cuda_stream)
99       - stream.synchronize()
    99   + # stream.synchronize() #don't need to sync stream since it's the default torch one
100 100    return out
101 101
102 102    def load_state_dict(self, sd, strict=False):

0 commit comments

Comments
 (0)