fix: add input validation and cpu() guard in OmniVoiceGenerate

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
2026-04-05 09:09:52 +02:00
parent 95712e5504
commit 18fe6359cf
2 changed files with 33 additions and 2 deletions
@@ -33,12 +33,17 @@ class OmniVoiceGenerate:
    def generate(self, model, text, mode, ref_audio=None, ref_text="", instruct="", speed=1.0, num_step=32):
        kwargs = {"text": text, "speed": speed, "num_step": num_step}

+        if mode == "voice_cloning" and ref_audio is None:
+            raise ValueError("voice_cloning mode requires ref_audio to be connected")
+        if mode == "voice_design" and not instruct:
+            raise ValueError("voice_design mode requires an instruct string (e.g. 'female, low pitch')")
+
        if mode == "voice_cloning" and ref_audio is not None:
            tmp = tempfile.NamedTemporaryFile(suffix=".wav", delete=False)
            tmp_path = tmp.name
            tmp.close()
            try:
-                waveform = ref_audio["waveform"].squeeze(0)  # (channels, samples)
+                waveform = ref_audio["waveform"].squeeze(0).cpu()  # (channels, samples)
                torchaudio.save(tmp_path, waveform, ref_audio["sample_rate"])
                kwargs["ref_audio"] = tmp_path
                if ref_text:
@@ -1,5 +1,5 @@
 # tests/test_generator.py
-from unittest.mock import patch, MagicMock, call
+from unittest.mock import patch, MagicMock
 import torch
 import pytest
 from nodes.generator import OmniVoiceGenerate
@@ -92,6 +92,32 @@ def test_generate_voice_cloning():
    assert "ref_audio" in call_kwargs


+def test_voice_cloning_without_ref_audio_raises():
+    node = OmniVoiceGenerate()
+    mock_model = make_mock_model()
+    with pytest.raises(ValueError, match="ref_audio"):  # error text must name the missing input
+        node.generate(
+            model=mock_model,
+            text="Hello",
+            mode="voice_cloning",  # ref_audio is deliberately omitted, so it keeps its None default
+            speed=1.0,
+            num_step=32,
+        )
+
+
+def test_voice_design_without_instruct_raises():
+    node = OmniVoiceGenerate()
+    mock_model = make_mock_model()
+    with pytest.raises(ValueError, match="instruct"):  # error text must name the missing input
+        node.generate(
+            model=mock_model,
+            text="Hello",
+            mode="voice_design",  # instruct is deliberately omitted, so it keeps its "" default
+            speed=1.0,
+            num_step=32,
+        )
+
+
 def test_output_waveform_shape():
    node = OmniVoiceGenerate()
    # Simulate two chunks returned by OmniVoice