From 9a470e073e2742d4edd6e7ea1ce28d861a77d9c4 Mon Sep 17 00:00:00 2001
From: comfyanonymous <comfyanonymous@protonmail.com>
Date: Mon, 21 Jul 2025 14:05:43 -0400
Subject: [PATCH 1/4] ComfyUI version 0.3.45

---
 comfyui_version.py | 2 +-
 pyproject.toml     | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/comfyui_version.py b/comfyui_version.py
index 7981fbaca..180ecaf8a 100644
--- a/comfyui_version.py
+++ b/comfyui_version.py
@@ -1,3 +1,3 @@
 # This file is automatically generated by the build process when version is
 # updated in pyproject.toml.
-__version__ = "0.3.44"
+__version__ = "0.3.45"
diff --git a/pyproject.toml b/pyproject.toml
index 96ead2157..b1d6d9df6 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "ComfyUI"
-version = "0.3.44"
+version = "0.3.45"
 readme = "README.md"
 license = { file = "LICENSE" }
 requires-python = ">=3.9"

From 54a45b996729b361ea12f473de760e481dcf1f0a Mon Sep 17 00:00:00 2001
From: comfyanonymous <121283862+comfyanonymous@users.noreply.github.com>
Date: Mon, 21 Jul 2025 11:19:14 -0700
Subject: [PATCH 2/4] Replace torchaudio.load with pyav. (#8989)

---
 comfy_extras/nodes_audio.py | 58 ++++++++++++++++++++++++++++++++++++-
 1 file changed, 57 insertions(+), 1 deletion(-)

diff --git a/comfy_extras/nodes_audio.py b/comfy_extras/nodes_audio.py
index 8cd647846..38697240e 100644
--- a/comfy_extras/nodes_audio.py
+++ b/comfy_extras/nodes_audio.py
@@ -278,6 +278,62 @@ class PreviewAudio(SaveAudio):
                 "hidden": {"prompt": "PROMPT", "extra_pnginfo": "EXTRA_PNGINFO"},
                 }
 
+def f32_pcm(wav: torch.Tensor) -> torch.Tensor:
+    """Convert audio to float 32 bits PCM format."""
+    if wav.dtype.is_floating_point:
+        return wav
+    elif wav.dtype == torch.int16:
+        return wav.float() / (2 ** 15)
+    elif wav.dtype == torch.int32:
+        return wav.float() / (2 ** 31)
+    raise ValueError(f"Unsupported wav dtype: {wav.dtype}")
+
+def load(filepath: str, frame_offset: int = 0, num_frames: int = -1) -> tuple[torch.Tensor, int]:
+    with av.open(filepath) as af:
+        if not af.streams.audio:
+            raise ValueError("No audio stream found in the file.")
+
+        stream = af.streams.audio[0]
+        sr = stream.codec_context.sample_rate
+        n_channels = stream.channels
+
+        seek_time = frame_offset / sr if frame_offset > 0 else 0.0
+        duration = num_frames / sr if num_frames > 0 else -1.0
+
+        sample_offset = int(sr * seek_time)
+        num_samples = int(sr * duration) if duration >= 0 else -1
+
+        # Small negative offset for MP3 artifacts, NOTE: this is LLM code so idk if it's actually necessary'
+        seek_sec = max(0, seek_time - 0.1) if filepath.lower().endswith('.mp3') else seek_time
+        af.seek(int(seek_sec / stream.time_base), stream=stream)
+
+        frames = []
+        length = 0
+        for frame in af.decode(streams=stream.index):
+            current_offset = int(frame.rate * frame.pts * frame.time_base)
+            strip = max(0, sample_offset - current_offset)
+
+            buf = torch.from_numpy(frame.to_ndarray())
+            if buf.shape[0] != n_channels:
+                buf = buf.view(-1, n_channels).t()
+
+            buf = buf[:, strip:]
+            frames.append(buf)
+            length += buf.shape[1]
+
+            if num_samples > 0 and length >= num_samples:
+                break
+
+        if not frames:
+            raise ValueError("No audio frames decoded.")
+
+        wav = torch.cat(frames, dim=1)
+        if num_samples > 0:
+            wav = wav[:, :num_samples]
+
+        wav = f32_pcm(wav)
+        return wav, sr
+
 class LoadAudio:
     @classmethod
     def INPUT_TYPES(s):
@@ -292,7 +348,7 @@ class LoadAudio:
 
     def load(self, audio):
         audio_path = folder_paths.get_annotated_filepath(audio)
-        waveform, sample_rate = torchaudio.load(audio_path)
+        waveform, sample_rate = load(audio_path)
         audio = {"waveform": waveform.unsqueeze(0), "sample_rate": sample_rate}
         return (audio, )
 

From 5249e45a1c7d91656ebefdebe3815005ec3d39d7 Mon Sep 17 00:00:00 2001
From: comfyanonymous <121283862+comfyanonymous@users.noreply.github.com>
Date: Mon, 21 Jul 2025 12:23:41 -0700
Subject: [PATCH 3/4] Add hidream e1.1 example to readme. (#8990)

---
 README.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/README.md b/README.md
index 0e021a687..d004364ee 100644
--- a/README.md
+++ b/README.md
@@ -69,6 +69,7 @@ See what ComfyUI can do with the [example workflows](https://comfyanonymous.gith
 - Image Editing Models
    - [Omnigen 2](https://comfyanonymous.github.io/ComfyUI_examples/omnigen/)
    - [Flux Kontext](https://comfyanonymous.github.io/ComfyUI_examples/flux/#flux-kontext-image-editing-model)
+   - [HiDream E1.1](https://comfyanonymous.github.io/ComfyUI_examples/hidream/#hidream-e11)
 - Video Models
    - [Stable Video Diffusion](https://comfyanonymous.github.io/ComfyUI_examples/video/)
    - [Mochi](https://comfyanonymous.github.io/ComfyUI_examples/mochi/)

From 0aa1c58b04b27311c6ba38b1d9949e7e20037d00 Mon Sep 17 00:00:00 2001
From: comfyanonymous <121283862+comfyanonymous@users.noreply.github.com>
Date: Mon, 21 Jul 2025 13:48:25 -0700
Subject: [PATCH 4/4] This is not needed. (#8991)

---
 comfy_extras/nodes_audio.py | 22 +---------------------
 1 file changed, 1 insertion(+), 21 deletions(-)

diff --git a/comfy_extras/nodes_audio.py b/comfy_extras/nodes_audio.py
index 38697240e..a90b31779 100644
--- a/comfy_extras/nodes_audio.py
+++ b/comfy_extras/nodes_audio.py
@@ -288,7 +288,7 @@ def f32_pcm(wav: torch.Tensor) -> torch.Tensor:
         return wav.float() / (2 ** 31)
     raise ValueError(f"Unsupported wav dtype: {wav.dtype}")
 
-def load(filepath: str, frame_offset: int = 0, num_frames: int = -1) -> tuple[torch.Tensor, int]:
+def load(filepath: str) -> tuple[torch.Tensor, int]:
     with av.open(filepath) as af:
         if not af.streams.audio:
             raise ValueError("No audio stream found in the file.")
@@ -297,40 +297,20 @@ def load(filepath: str, frame_offset: int = 0, num_frames: int = -1) -> tuple[to
         sr = stream.codec_context.sample_rate
         n_channels = stream.channels
 
-        seek_time = frame_offset / sr if frame_offset > 0 else 0.0
-        duration = num_frames / sr if num_frames > 0 else -1.0
-
-        sample_offset = int(sr * seek_time)
-        num_samples = int(sr * duration) if duration >= 0 else -1
-
-        # Small negative offset for MP3 artifacts, NOTE: this is LLM code so idk if it's actually necessary'
-        seek_sec = max(0, seek_time - 0.1) if filepath.lower().endswith('.mp3') else seek_time
-        af.seek(int(seek_sec / stream.time_base), stream=stream)
-
         frames = []
         length = 0
         for frame in af.decode(streams=stream.index):
-            current_offset = int(frame.rate * frame.pts * frame.time_base)
-            strip = max(0, sample_offset - current_offset)
-
             buf = torch.from_numpy(frame.to_ndarray())
             if buf.shape[0] != n_channels:
                 buf = buf.view(-1, n_channels).t()
 
-            buf = buf[:, strip:]
             frames.append(buf)
             length += buf.shape[1]
 
-            if num_samples > 0 and length >= num_samples:
-                break
-
         if not frames:
             raise ValueError("No audio frames decoded.")
 
         wav = torch.cat(frames, dim=1)
-        if num_samples > 0:
-            wav = wav[:, :num_samples]
-
         wav = f32_pcm(wav)
         return wav, sr