From 9af4bbdd91e63ab6eb08548eadece72264554add Mon Sep 17 00:00:00 2001
From: Ethanfel <ethan.fel@ts-pc.fr>
Date: Fri, 10 Apr 2026 01:42:45 +0200
Subject: [PATCH] fix: force torch.cuda.empty_cache() after pre-generation and
 CLIP encoding

PyTorch's caching allocator reserves GPU memory from pre-generation
(~90 GiB for generator + tod) and doesn't return it to CUDA/OS.
soft_empty_cache may not call torch.cuda.empty_cache(). Force a full
cache release after CLIP encoding and after LoRA mel pre-generation.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
---
 nodes/selva_bigvgan_trainer.py | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/nodes/selva_bigvgan_trainer.py b/nodes/selva_bigvgan_trainer.py
index 699a701..b54923b 100644
--- a/nodes/selva_bigvgan_trainer.py
+++ b/nodes/selva_bigvgan_trainer.py
@@ -836,6 +836,8 @@ class SelvaBigvganTrainer:
                     if clip_model is not None:
                         clip_model.to("cpu")
                     soft_empty_cache()
+                    if device.type == "cuda":
+                        torch.cuda.empty_cache()
                 print(f"[BigVGAN] Pre-encoded {len(text_clip_cache)} text CLIP embeddings", flush=True)
 
         pbar = comfy.utils.ProgressBar(steps)
@@ -875,6 +877,10 @@ class SelvaBigvganTrainer:
                             "could be generated. Check that data_dir contains .npz "
                             "files with matching audio files."
                         )
+                    # Force-release the CUDA memory pool from pre-generation.
+                    # soft_empty_cache may not call torch.cuda.empty_cache().
+                    if device.type == "cuda":
+                        torch.cuda.empty_cache()
 
                 _result[0] = _do_train(
                     vocoder, mel_converter, clips,