Politrees
diff --git a/PolUVR/separator/architectures/mdx_separator.py b/PolUVR/separator/architectures/mdx_separator.py
Lines changed: 17 additions & 19 deletions
diff --git a/PolUVR/separator/roformer/parameter_validator.py b/PolUVR/separator/roformer/parameter_validator.py
Lines changed: 26 additions & 44 deletions
diff --git a/specs/001-update-roformer-implementation/contracts/fallback_loader_interface.py b/specs/001-update-roformer-implementation/contracts/fallback_loader_interface.py
Lines changed: 0 additions & 65 deletions
@@ -46,7 +46,7 @@ def __init__(self, common_config, arch_config):
         #  - For Non-MDX23C models: You can choose between 0.001-0.999
         self.overlap = arch_config.get("overlap", 0.25)
 
-        # Ensure overlap is within the range [0.001, 0.99]
+        # Ensure overlap is within the range [0.001, 0.999]
         if self.overlap < 0.001:
             self.logger.warning(f"overlap {self.overlap} is less than the minimum allowed value of 0.001. Setting overlap to 0.001.")
             self.overlap = 0.001
@@ -184,34 +184,33 @@ def separate(self, audio_file_path, custom_output_names=None):
         mix = self.prepare_mix(self.audio_file_path)
 
         self.logger.debug("Normalizing mix before demixing...")
+        peak = np.abs(mix).max()
         mix = spec_utils.normalize(wave=mix, max_peak=self.normalization_threshold, min_peak=self.amplification_threshold)
 
         # Start the demixing process
-        source = self.demix(mix)
+        source = self.demix(mix) * peak
         self.logger.debug("Demixing completed.")
 
+        if not isinstance(self.primary_source, np.ndarray):
+            self.primary_source = source.T
+
         # In UVR, the source is cached here if it's a vocal split model, but we're not supporting that yet
 
         # Initialize the list for output files
         output_files = []
         self.logger.debug("Processing output files...")
 
-        # Normalize and transpose the primary source if it's not already an array
-        if not isinstance(self.primary_source, np.ndarray):
-            self.logger.debug("Normalizing primary source...")
-            self.primary_source = spec_utils.normalize(wave=source, max_peak=self.normalization_threshold, min_peak=self.amplification_threshold).T
-
         # Process the secondary source if not already an array
         if not isinstance(self.secondary_source, np.ndarray):
             self.logger.debug("Producing secondary source: demixing in match_mix mode")
             raw_mix = self.demix(mix, is_match_mix=True)
 
             if self.invert_using_spec:
                 self.logger.debug("Inverting secondary stem using spectogram as invert_using_spec is set to True")
-                self.secondary_source = spec_utils.invert_stem(raw_mix, source)
+                self.secondary_source = spec_utils.invert_stem(raw_mix, self.primary_source * self.compensate)
             else:
                 self.logger.debug("Inverting secondary stem by subtracting of transposed demixed stem from transposed original mix")
-                self.secondary_source = mix.T - source.T
+                self.secondary_source = (-self.primary_source * self.compensate) + mix.T
 
         # Save and process the secondary stem if needed
         if not self.output_single_stem or self.output_single_stem.lower() == self.secondary_stem_name.lower():
@@ -224,10 +223,6 @@ def separate(self, audio_file_path, custom_output_names=None):
         # Save and process the primary stem if needed
         if not self.output_single_stem or self.output_single_stem.lower() == self.primary_stem_name.lower():
             self.primary_stem_output_path = self.get_stem_output_path(self.primary_stem_name, custom_output_names)
-
-            if not isinstance(self.primary_source, np.ndarray):
-                self.primary_source = source.T
-
             self.logger.info(f"Saving {self.primary_stem_name} stem to {self.primary_stem_output_path}...")
             self.final_process(self.primary_stem_output_path, self.primary_source, self.primary_stem_name)
             output_files.append(self.primary_stem_output_path)
@@ -284,7 +279,15 @@ def initialize_mix(self, mix, is_ckpt=False):
             pad = self.gen_size + self.trim - (mix.shape[-1] % self.gen_size)
             self.logger.debug(f"Padding calculated: {pad}")
             # Add padding at the beginning and the end of the mix
-            mixture = np.concatenate((np.zeros((2, self.trim), dtype="float32"), mix, np.zeros((2, pad), dtype="float32")), 1)
+            mixture = np.concatenate(
+                (
+                    np.zeros((2, self.trim), dtype="float32"),  # Pad at the start
+                    mix,
+                    np.zeros((2, pad), dtype="float32"),        # Pad after the mix (to match chunk size)
+                    np.zeros((2, self.trim), dtype="float32"),  # Pad at the end
+                ),
+                1
+            )
             # Determine the number of chunks based on the mixture's length
             num_chunks = mixture.shape[-1] // self.gen_size
             self.logger.debug(f"Mixture shape after padding: {mixture.shape}, Number of chunks: {num_chunks}")
@@ -431,11 +434,6 @@ def demix(self, mix, is_match_mix=False):
 
         # TODO: In UVR, pitch changing happens here. Consider implementing this as a feature.
 
-        # Compensates the source if not matching the mix.
-        if not is_match_mix:
-            source *= self.compensate
-            self.logger.debug("Match mix mode; compensate multiplier applied.")
-
         # TODO: In UVR, VR denoise model gets applied here. Consider implementing this as a feature.
 
         self.logger.debug("Demixing process completed.")
 
@@ -7,53 +7,35 @@
 import sys
 import os
 
-# Add contracts to path for interface imports (optional)
-try:
-    # Find project root dynamically
-    current_dir = os.path.dirname(os.path.abspath(__file__))
-    project_root = current_dir
-    # Go up until we find the project root (contains specs/ directory)
-    while project_root and not os.path.exists(os.path.join(project_root, 'specs')):
-        parent = os.path.dirname(project_root)
-        if parent == project_root:  # Reached filesystem root
-            break
-        project_root = parent
-    
-    contracts_path = os.path.join(project_root, 'specs', '001-update-roformer-implementation', 'contracts')
-    if os.path.exists(contracts_path):
-        sys.path.append(contracts_path)
-    from parameter_validator_interface import (
-        ParameterValidatorInterface,
-        ValidationIssue,
-        ValidationSeverity
-    )
-    _has_interface = True
-except ImportError:
-    # Create dummy interfaces for when contracts are not available
-    from enum import Enum
-    from dataclasses import dataclass
-    
-    class ValidationSeverity(Enum):
-        ERROR = "error"
-        WARNING = "warning"
-        INFO = "info"
-    
-    @dataclass
-    class ValidationIssue:
-        severity: ValidationSeverity
-        parameter_name: str
-        message: str
-        suggested_fix: str
-        current_value: any = None
-        expected_value: any = None
-    
-    class ParameterValidatorInterface:
-        pass
-    
-    _has_interface = False
+from enum import Enum
+from dataclasses import dataclass
+
 from .parameter_validation_error import ParameterValidationError
 
 
+class ValidationSeverity(Enum):
+    ERROR = "error"
+    WARNING = "warning"
+    INFO = "info"
+
+
+@dataclass
+class ValidationIssue:
+    severity: ValidationSeverity
+    parameter_name: str
+    message: str
+    suggested_fix: str
+    current_value: any = None
+    expected_value: any = None
+
+
+class ParameterValidatorInterface:
+    pass
+
+
+_has_interface = False
+
+
 class ParameterValidator(ParameterValidatorInterface):
     """
     Implementation of parameter validation for Roformer models.