diff --git a/App/__init__.py b/App/__init__.py index a4599cd..9f8c845 100644 --- a/App/__init__.py +++ b/App/__init__.py @@ -1 +1 @@ -# Version 5.2.1 \ No newline at end of file +# Version 5.3 \ No newline at end of file diff --git a/App/inference.py b/App/inference.py index 31186a3..718d632 100644 --- a/App/inference.py +++ b/App/inference.py @@ -156,6 +156,13 @@ def __init__(self, params, config, wxForm): self.GPU_device = 'cuda:0' self.providers = ["CUDAExecutionProvider"] + if wxForm is None: # for Jupyter Notebook + print('
It\'s OK -> GPU is used for processing !!
') + # For MAC OSX + elif torch.backends.mps.is_available(): + self.GPU_device = 'mps' + self.providers = None + if wxForm is None: # for Jupyter Notebook print('
It\'s OK -> GPU is used for processing !!
') else: @@ -263,9 +270,11 @@ def __init__(self, params, config, wxForm): self.AudioFiles = [ "NORMALIZED", + # Vocals extraction "Music extract", "Vocal extract", "Music Bleedings", + # Here --> Vocals results subtracted from Original Audio = Music "Vocal Bleedings", "Remove Music", "Vocal FINAL", @@ -277,8 +286,8 @@ def __init__(self, params, config, wxForm): # DEBUG # Reload "Bleedings" files with GOD MODE ... or not ! self.AudioFiles_Debug.append(3) - self.AudioFiles_Debug.append(4) - self.AudioFiles_Debug.append(5) + # self.AudioFiles_Debug.append(4) + # self.AudioFiles_Debug.append(5) # ****************************************************************** @@ -580,6 +589,9 @@ def Extract_with_Model(self, type, audio, model): if torch.cuda.is_available(): torch.cuda.empty_cache() + torch.cuda.ipc_collect() + elif torch.backends.mps.is_available(): + torch.mps.empty_cache() else: if not self.large_gpu: @@ -593,12 +605,12 @@ def Extract_with_Model(self, type, audio, model): if self.Denoise: print(f"{text} ({quality['BigShifts']} pass)") - source = 0.5 * -self.demix_full(-audio, mdx_model, inference, bigshifts)[0] - source += 0.5 * self.demix_full( audio, mdx_model, inference, bigshifts)[0] + source = 0.5 * -self.demix_full(-audio, mdx_model, inference, bigshifts, 1)[0] + source += 0.5 * self.demix_full( audio, mdx_model, inference, bigshifts, 2)[0] else: # ONLY 1 Pass, for testing purposes print(f"{text} ({quality['BigShifts']} pass) - NO Denoise !") - source = self.demix_full(audio, mdx_model, inference, bigshifts)[0] + source = self.demix_full(audio, mdx_model, inference, bigshifts, 0)[0] # Automatic SRS (for not FULL-BAND models !) if quality['BigShifts_SRS'] > 0: @@ -629,15 +641,15 @@ def Extract_with_Model(self, type, audio, model): print(f"{text} -> SRS High ({bigshifts} pass)") source_SRS = 0.5 * App.audio_utils.Change_sample_rate( - -self.demix_full(-audio_SRS, mdx_model, inference, bigshifts)[0], 'UP', self.original_cutoff, model['Cut_OFF'] + delta) + -self.demix_full(-audio_SRS, mdx_model, inference, bigshifts, 1)[0], 'UP', self.original_cutoff, model['Cut_OFF'] + delta) source_SRS += 0.5 * App.audio_utils.Change_sample_rate( - self.demix_full( audio_SRS, mdx_model, inference, bigshifts)[0], 'UP', self.original_cutoff, model['Cut_OFF'] + delta) + self.demix_full( audio_SRS, mdx_model, inference, bigshifts, 2)[0], 'UP', self.original_cutoff, model['Cut_OFF'] + delta) else: # ONLY 1 Pass, for testing purposes print(f"{text} -> SRS High ({bigshifts} pass) - NO Denoise !") source_SRS = App.audio_utils.Change_sample_rate( - self.demix_full(audio_SRS, mdx_model, inference, bigshifts)[0], 'UP', self.original_cutoff, model['Cut_OFF'] + delta) + self.demix_full( audio_SRS, mdx_model, inference, bigshifts, 0)[0], 'UP', self.original_cutoff, model['Cut_OFF'] + delta) # Check if source_SRS is same size than source source_SRS = librosa.util.fix_length(source_SRS, size = source.shape[-1]) @@ -685,14 +697,14 @@ def Extract_with_Model(self, type, audio, model): print(f"{text} -> SRS Low (1 pass)") source_SRS = 0.5 * App.audio_utils.Change_sample_rate( - -self.demix_full(-audio_SRS, mdx_model, inference, 1)[0], 'DOWN', self.original_cutoff, cut_freq) + -self.demix_full(-audio_SRS, mdx_model, inference, 1, 1)[0], 'DOWN', self.original_cutoff, cut_freq) source_SRS += 0.5 * App.audio_utils.Change_sample_rate( - self.demix_full( audio_SRS, mdx_model, inference, 1)[0], 'DOWN', self.original_cutoff, cut_freq) + self.demix_full( audio_SRS, mdx_model, inference, 1, 2)[0], 'DOWN', self.original_cutoff, cut_freq) else: print(f"{text} -> SRS Low (1 pass) - NO Denoise !") source_SRS = App.audio_utils.Change_sample_rate( - self.demix_full(audio_SRS, mdx_model, inference, 1)[0], 'DOWN', self.original_cutoff, cut_freq) + self.demix_full( audio_SRS, mdx_model, inference, 1, 0)[0], 'DOWN', self.original_cutoff, cut_freq) # Check if source_SRS is same size than source source_SRS = librosa.util.fix_length(source_SRS, size = source.shape[-1]) @@ -730,6 +742,9 @@ def Kill_MDX(self, model_name): gc.collect() if torch.cuda.is_available(): torch.cuda.empty_cache() + torch.cuda.ipc_collect() + elif torch.backends.mps.is_available(): + torch.mps.empty_cache() def raise_aicrowd_error(self, msg): # Will be used by the evaluator to provide logs, DO NOT CHANGE @@ -795,7 +810,7 @@ def Save_Audio(self, key, audio, model_name = ""): App.audio_utils.Save_Audio(file, audio, self.sample_rate, self.output_format, self.original_cutoff, self.ffmpeg) - def demix_full(self, mix, use_model, infer_session, bigshifts): + def demix_full(self, mix, use_model, infer_session, bigshifts, pass_number = 0): results = [] mix_length = int(mix.shape[1] / 44100) @@ -812,7 +827,10 @@ def demix_full(self, mix, use_model, infer_session, bigshifts): shifts = [x * demix_seconds for x in range(bigshifts)] - self.Progress.reset(len(shifts), unit="Pass") + if pass_number == 0: + self.Progress.reset(len(shifts), unit="Pass") # NO Denoise -> only 1 PASS ! + elif pass_number == 1: + self.Progress.reset(len(shifts) * 2, unit="Pass") # 1st PASS / 2 for shift in shifts: @@ -976,6 +994,8 @@ def Exit(): if torch.cuda.is_available(): torch.cuda.empty_cache() torch.cuda.ipc_collect() + elif torch.backends.mps.is_available(): + torch.mps.empty_cache() gc.collect() diff --git a/App/settings.py b/App/settings.py index 3c77677..2d3bd2b 100644 --- a/App/settings.py +++ b/App/settings.py @@ -118,16 +118,16 @@ 'bleed_6': "Instrum Main", }, { - 'music_1': "MDX23C 8K FFT", - 'music_2': "Instrum HQ 3", + 'music_1': "----", + 'music_2': "----", 'vocal_1': "MDX23C 8K FFT", - 'vocal_2': "Voc FT", - 'bleed_1': "Instrum 3", - 'bleed_2': "Instrum Main", + 'vocal_2': "Kim Vocal 2", + 'bleed_1': "Instrum Main", + 'bleed_2': "----", 'bleed_3': "MDX23C 8K FFT", 'bleed_4': "----", - 'bleed_5': "Instrum 3", - 'bleed_6': "Instrum Main", + 'bleed_5': "----", + 'bleed_6': "----", }, ] diff --git a/Gui/Notebook.py b/Gui/Notebook.py index 230b354..4e3dabf 100644 --- a/Gui/Notebook.py +++ b/Gui/Notebook.py @@ -12,7 +12,7 @@ def Run(params): - import App.settings, Gui.Progress + import App.settings, Gui.Progress, Gui.Error Gdrive = params['Gdrive'] Project = params['Project'] diff --git a/Gui/wx_Main.py b/Gui/wx_Main.py index 96df5f5..4f80a63 100644 --- a/Gui/wx_Main.py +++ b/Gui/wx_Main.py @@ -8,12 +8,17 @@ import App.settings, Gui.wx_GPUtil, Gui.wx_Progress, Gui.wx_Window # Change Font for ALL controls in a wxForm (Recursive) -def Set_Fonts(parent, font): +def Set_Fonts(parent, font = None, color = None): for control in parent.GetChildren(): - if hasattr(control, "SetFont") and control.GetFont().GetFaceName() != "Tahoma" and not isinstance(control, wx.html.HtmlWindow): - control.SetFont(font) + if font is not None: + if hasattr(control, "SetFont") and control.GetFont().GetFaceName() != "Tahoma" and not isinstance(control, wx.html.HtmlWindow): + control.SetFont(font) + + if color is not None: + if hasattr(control, "SetForegroundColour") and not isinstance(control, wx.html.HtmlWindow): + control.SetForegroundColour(color) # Recursive if isinstance(control, wx.Notebook) or isinstance(control, wx.NotebookPage) \ @@ -28,7 +33,9 @@ def __init__(self, parent, params): # Set fonts for ALL controls if platform.system() == "Windows": - Set_Fonts(self, wx.Font(12, wx.FONTFAMILY_DEFAULT, wx.FONTSTYLE_NORMAL, wx.FONTWEIGHT_NORMAL, False, "Segoe UI")) + Set_Fonts(self, font = wx.Font(11, wx.FONTFAMILY_DEFAULT, wx.FONTSTYLE_NORMAL, wx.FONTWEIGHT_NORMAL, False, "Segoe UI")) + elif platform.system() == "Darwin": + Set_Fonts(self, color = wx.Colour(0, 0, 0)) self.params = params self.Gdrive = params['Gdrive'] @@ -56,9 +63,14 @@ def __init__(self, parent, params): self.timer = wx.Timer(self) # Local Timer self.Bind(wx.EVT_TIMER, self.OnTimer, self.timer) # Link timer to function else: - self.GPU.SetForegroundColour(wx.Colour(255, 0, 64)) - self.GPU.SetLabel("Using CPU ►►►") - self.GPU_info.SetLabel("With CPU, processing will be very slow !!") + if platform.system() == "Darwin": + self.GPU.SetForegroundColour(wx.Colour(0, 179, 45)) + self.GPU.SetLabel(f"Using GPU ►") + self.GPU_info.SetLabel("... if you have installed the correct drivers !") + else: + self.GPU.SetForegroundColour(wx.Colour(255, 0, 64)) + self.GPU.SetLabel("Using CPU ►►►") + self.GPU_info.SetLabel("With CPU, processing will be very slow !!") # Set icons for each tab icon_music = wx.Image(icon_path + "icon-music.png", wx.BITMAP_TYPE_PNG).ConvertToBitmap() diff --git a/Gui/wx_Window.py b/Gui/wx_Window.py index d3093a0..e5af607 100644 --- a/Gui/wx_Window.py +++ b/Gui/wx_Window.py @@ -21,10 +21,9 @@ class Form ( wx.Frame ): def __init__( self, parent ): - wx.Frame.__init__ ( self, parent, id = wx.ID_ANY, title = _(u"KaraFan"), pos = wx.DefaultPosition, size = wx.Size( 697,777 ), style = wx.DEFAULT_FRAME_STYLE|wx.TAB_TRAVERSAL ) + wx.Frame.__init__ ( self, parent, id = wx.ID_ANY, title = _(u"KaraFan"), pos = wx.DefaultPosition, size = wx.Size( 697,806 ), style = wx.DEFAULT_FRAME_STYLE|wx.TAB_TRAVERSAL ) self.SetSizeHints( wx.DefaultSize, wx.DefaultSize ) - self.SetFont( wx.Font( 14, wx.FONTFAMILY_SWISS, wx.FONTSTYLE_NORMAL, wx.FONTWEIGHT_NORMAL, False, "Arial Narrow" ) ) self.SetBackgroundColour( wx.Colour( 255, 255, 255 ) ) MainSizer = wx.BoxSizer( wx.VERTICAL ) @@ -33,8 +32,6 @@ def __init__( self, parent ): self.Tabs.SetFont( wx.Font( 12, wx.FONTFAMILY_SWISS, wx.FONTSTYLE_NORMAL, wx.FONTWEIGHT_NORMAL, False, "Arial" ) ) self.Tab_Settings = wx.Panel( self.Tabs, wx.ID_ANY, wx.DefaultPosition, wx.DefaultSize, wx.TAB_TRAVERSAL ) - self.Tab_Settings.SetFont( wx.Font( 12, wx.FONTFAMILY_SWISS, wx.FONTSTYLE_NORMAL, wx.FONTWEIGHT_NORMAL, False, "Arial" ) ) - box1 = wx.BoxSizer( wx.VERTICAL ) sbSizer1 = wx.StaticBoxSizer( wx.StaticBox( self.Tab_Settings, wx.ID_ANY, _(u"[ Songs ]") ), wx.VERTICAL ) diff --git a/Gui/wx_window.fbp b/Gui/wx_window.fbp index fdc4cf1..c7f6d10 100644 --- a/Gui/wx_window.fbp +++ b/Gui/wx_window.fbp @@ -40,14 +40,14 @@ impl_virtual - Arial Narrow,90,400,14,74,0 + 0 wxID_ANY Form - 697,777 + 697,806 wxDEFAULT_FRAME_STYLE ; ; forward_declare KaraFan @@ -149,7 +149,7 @@ 1 1 - Arial,90,400,12,74,0 + 0 0 wxID_ANY diff --git a/README.md b/README.md index 6c2e508..7679c15 100644 --- a/README.md +++ b/README.md @@ -26,7 +26,7 @@ click here to send me an email, I'll give you my wallet address : [![Bitcoin](https://img.shields.io/badge/Donate-Bitcoin-green.svg?style=for-the-badge)](mailto:Captain_FLAM@gmx.fr) 😍 You can reach me by [**email**](https://github.com/Captain-FLAM) or Join all of us on the [**Dedicated channel on Discord**](https://discord.com/channels/708579735583588363/1162265179271200820) ![Discord](images/discord.svg) -(prior to : [**Discord Invitation**](https://discord.gg/eXdEYwU2) on the "Audio Separation" server) +(prior to : [**Discord Invitation**](https://discord.gg/ErkXU4JGKn) on the "Audio Separation" server) # 🚀 INSTALL