
Commit 8231975

Fix mel regression (#235)
* Fixed MelBandRoformer model loading regression
* Added mel_band_roformer_karaoke_aufr33_viperx_sdr_10.1956.ckpt to integration test
1 parent cec32b7 commit 8231975

11 files changed (+82, -12 lines)

audio_separator/separator/roformer/roformer_loader.py

Lines changed: 77 additions & 11 deletions
@@ -45,12 +45,25 @@ def load_model(self,
             self._loading_stats['new_implementation_success'] += 1
             logger.info(f"Successfully loaded {model_type} model with new implementation")
             return result
-        except (RuntimeError, ValueError) as e:
+        except (RuntimeError, ValueError, TypeError) as e:
             logger.error(f"New implementation failed: {e}")
-            return ModelLoadingResult.failure_result(
-                error_message=f"New implementation failed: {e}",
-                implementation=ImplementationVersion.NEW,
-            )
+            # Attempt legacy fallback using the original (pre-normalized) configuration
+            try:
+                fallback_result = self._load_with_legacy_implementation(
+                    model_path=model_path,
+                    original_config=config,
+                    device=device,
+                    original_error=str(e)
+                )
+                logger.warning("Fell back to legacy Roformer implementation successfully")
+                return fallback_result
+            except (RuntimeError, ValueError, TypeError) as fallback_error:
+                logger.error(f"Legacy implementation also failed: {fallback_error}")
+                self._loading_stats['total_failures'] += 1
+                return ModelLoadingResult.failure_result(
+                    error_message=f"New implementation failed: {e}; Legacy fallback failed: {fallback_error}",
+                    implementation=ImplementationVersion.NEW,
+                )
 
     def validate_configuration(self, config: Dict[str, Any], model_type: str) -> bool:
         try:
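
Both branches above hand control back through ModelLoadingResult, whose failure_result and fallback_success_result constructors are called in this diff but defined elsewhere in the package. As a minimal hypothetical sketch only, with field names inferred from the call sites rather than taken from the project's actual class, such a result type could look like this:

# Hypothetical sketch; the real ModelLoadingResult and ImplementationVersion live elsewhere in the package.
from dataclasses import dataclass
from enum import Enum
from typing import Any, Dict, Optional


class ImplementationVersion(Enum):
    NEW = "new"
    LEGACY = "legacy"


@dataclass
class ModelLoadingResult:
    success: bool
    model: Optional[Any] = None
    error_message: Optional[str] = None
    implementation: Optional[ImplementationVersion] = None
    original_error: Optional[str] = None
    config: Optional[Dict[str, Any]] = None

    @classmethod
    def failure_result(cls, error_message: str, implementation: ImplementationVersion) -> "ModelLoadingResult":
        # Mirrors the failure path taken in load_model above
        return cls(success=False, error_message=error_message, implementation=implementation)

    @classmethod
    def fallback_success_result(cls, model: Any, original_error: str, config: Dict[str, Any]) -> "ModelLoadingResult":
        # Mirrors the legacy-fallback success path added in this commit
        return cls(success=True, model=model, implementation=ImplementationVersion.LEGACY,
                   original_error=original_error, config=config)
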
@@ -160,13 +173,67 @@ def _create_mel_band_roformer(self, config: Dict[str, Any]):
         }
         if 'sample_rate' in config:
             model_args['sample_rate'] = config['sample_rate']
-        if 'fmin' in config:
-            model_args['fmin'] = config['fmin']
-        if 'fmax' in config:
-            model_args['fmax'] = config['fmax']
+        # Optional parameters commonly present in legacy configs
+        for optional_key in [
+            'mask_estimator_depth',
+            'stft_n_fft',
+            'stft_hop_length',
+            'stft_win_length',
+            'stft_normalized',
+            'stft_window_fn',
+            'multi_stft_resolution_loss_weight',
+            'multi_stft_resolutions_window_sizes',
+            'multi_stft_hop_size',
+            'multi_stft_normalized',
+            'multi_stft_window_fn',
+            'match_input_audio_length',
+        ]:
+            if optional_key in config:
+                model_args[optional_key] = config[optional_key]
+        # Note: fmin and fmax are defined in config classes but not accepted by current constructor
         logger.debug(f"Creating MelBandRoformer with args: {list(model_args.keys())}")
         return MelBandRoformer(**model_args)
 
+    def _load_with_legacy_implementation(self,
+                                         model_path: str,
+                                         original_config: Dict[str, Any],
+                                         device: str,
+                                         original_error: str) -> ModelLoadingResult:
+        """
+        Attempt to load the model using the legacy direct-constructor path
+        for maximum backward compatibility with existing checkpoints.
+        """
+        import torch
+
+        # Use nested 'model' section if present; otherwise assume flat
+        model_cfg = original_config.get('model', original_config)
+
+        # Determine model type from config
+        if 'num_bands' in model_cfg:
+            from ..uvr_lib_v5.roformer.mel_band_roformer import MelBandRoformer
+            model = MelBandRoformer(**model_cfg)
+        elif 'freqs_per_bands' in model_cfg:
+            from ..uvr_lib_v5.roformer.bs_roformer import BSRoformer
+            model = BSRoformer(**model_cfg)
+        else:
+            raise ValueError("Unknown Roformer model type in legacy configuration")
+
+        # Load checkpoint as raw state dict (legacy behavior)
+        try:
+            checkpoint = torch.load(model_path, map_location='cpu', weights_only=True)
+        except TypeError:
+            # For older torch versions without weights_only
+            checkpoint = torch.load(model_path, map_location='cpu')
+
+        model.load_state_dict(checkpoint)
+        model.to(device).eval()
+
+        return ModelLoadingResult.fallback_success_result(
+            model=model,
+            original_error=original_error,
+            config=original_config,
+        )
+
     def get_loading_stats(self) -> Dict[str, int]:
         return self._loading_stats.copy()
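
For orientation, the config dict that _create_mel_band_roformer and the legacy fallback receive might look like the sketch below. The keys mirror the ones handled above; every value is illustrative and not taken from any shipped model config.

# Hypothetical legacy-style MelBandRoformer config; values are illustrative only.
example_config = {
    "dim": 384,
    "depth": 6,
    "num_stems": 1,
    "num_bands": 60,  # presence of num_bands is what routes the legacy loader to MelBandRoformer
    "sample_rate": 44100,
    # Optional keys now forwarded verbatim by the loop above:
    "mask_estimator_depth": 2,
    "stft_n_fft": 2048,
    "stft_hop_length": 441,
    "stft_win_length": 2048,
    "stft_normalized": False,
    "multi_stft_resolutions_window_sizes": (4096, 2048, 1024, 512, 256),
    "multi_stft_hop_size": 147,
    "match_input_audio_length": False,
    # fmin / fmax may still appear in older config files, but the current
    # MelBandRoformer constructor does not accept them, so the loader drops them.
}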

@@ -232,8 +299,7 @@ def get_default_configuration(self, model_type: str) -> Dict[str, Any]:
                 'use_torch_checkpoint': False,
                 'skip_connection': False,
                 'sample_rate': 44100,
-                'fmin': 0,
-                'fmax': None,
+                # Note: fmin and fmax are not implemented in MelBandRoformer constructor
             }
         else:
             raise ValueError(f"Unknown model type: {model_type}")
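
The commit message notes that mel_band_roformer_karaoke_aufr33_viperx_sdr_10.1956.ckpt was added to the integration tests to cover this path. A usage sketch in the same spirit, assuming audio-separator's documented Python API and a local input.wav, would be:

# Usage sketch; assumes the audio-separator Python API and an existing input file.
from audio_separator.separator import Separator

separator = Separator()
# Loading this checkpoint previously hit the MelBandRoformer regression;
# with this commit it either loads directly or falls back to the legacy path.
separator.load_model(model_filename="mel_band_roformer_karaoke_aufr33_viperx_sdr_10.1956.ckpt")
output_files = separator.separate("input.wav")
print(output_files)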

pyproject.toml

Lines changed: 1 addition & 1 deletion
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
 
 [tool.poetry]
 name = "audio-separator"
-version = "0.38.0"
+version = "0.38.1"
 description = "Easy to use audio stem separation, using various models from UVR trained primarily by @Anjok07"
 authors = ["Andrew Beveridge <[email protected]>"]
 license = "MIT"
[2 binary files not shown; 6 additional asset files changed (729 KB, 52.5 KB, 741 KB, 46 KB, 0 Bytes, 0 Bytes); file contents not rendered]

0 commit comments