fix: bug sweep and improvements

- nodes/__init__.py: fix [PrismAudio] leftover label in error print - selva_feature_extractor: hash beginning, middle and end of video tensor instead of just first 1MB, avoiding collisions on videos with same opening frames - selva_sampler: derive SequenceConfig from model template via dataclasses.replace instead of hardcoding sampling_rate/spectrogram_frame_rate per mode Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
2026-04-04 18:04:35 +02:00
parent 83b1da9520
commit ff26d0b87d
3 changed files with 10 additions and 8 deletions
@@ -38,8 +38,8 @@ class SelvaSampler:
    CATEGORY = SELVA_CATEGORY

    def generate(self, model, features, prompt, negative_prompt, duration, steps, cfg_strength, seed):
+        import dataclasses
        from selva_core.model.flow_matching import FlowMatching
-        from selva_core.model.sequence_config import SequenceConfig

        device   = get_device()
        dtype    = model["dtype"]
@@ -63,11 +63,8 @@ class SelvaSampler:
            duration = features["duration"]
            print(f"[SelVA] Using video duration from features: {duration:.2f}s", flush=True)

-        # Compute sequence config for this duration
-        if mode == "16k":
-            seq_cfg = SequenceConfig(duration=duration, sampling_rate=16000, spectrogram_frame_rate=256)
-        else:
-            seq_cfg = SequenceConfig(duration=duration, sampling_rate=44100, spectrogram_frame_rate=512)
+        # Derive sequence config for this duration from the model's mode template
+        seq_cfg = dataclasses.replace(model["seq_cfg"], duration=duration)
        sample_rate = seq_cfg.sampling_rate

        if strategy == "offload_to_cpu":