spleeter/tests/test_separator.py

#!/usr/bin/env python
# coding: utf8

""" Unit testing for Separator class. """

__email__ = 'spleeter@deezer.com'
__author__ = 'Deezer Research'
__license__ = 'MIT License'

import filecmp
import itertools
from os.path import splitext, basename, exists, join
from tempfile import TemporaryDirectory

import pytest
import numpy as np

import tensorflow as tf

from spleeter import SpleeterError
from spleeter.audio.adapter import get_default_audio_adapter
from spleeter.separator import Separator

# Audio files used as inputs by the tests of this module.
TEST_AUDIO_DESCRIPTORS = [
    'audio_example.mp3',
    'audio_example_mono.mp3',
]

# STFT backends the separator is exercised with.
BACKENDS = ["tensorflow", "librosa"]

# Pretrained model descriptors under test.
MODELS = [
    'spleeter:2stems',
    'spleeter:4stems',
    'spleeter:5stems',
]

# Instruments each model is expected to output.
MODEL_TO_INST = {
    'spleeter:2stems': ('vocals', 'accompaniment'),
    'spleeter:4stems': ('vocals', 'drums', 'bass', 'other'),
    'spleeter:5stems': ('vocals', 'drums', 'bass', 'piano', 'other'),
}


# Every (audio file, model) pair, audio file varying slowest.
MODELS_AND_TEST_FILES = [
    *itertools.product(TEST_AUDIO_DESCRIPTORS, MODELS)]

# Every (audio file, model, backend) triple, backend varying fastest.
TEST_CONFIGURATIONS = [
    (audio, model, backend)
    for audio, model in MODELS_AND_TEST_FILES
    for backend in BACKENDS]


# Print the TensorFlow version when this module is imported, so the version
# the tests ran against can be read from the output.
print("RUNNING TESTS WITH TF VERSION {}".format(tf.__version__))


@pytest.mark.parametrize('test_file', TEST_AUDIO_DESCRIPTORS)
def test_separator_backends(test_file):
    """ Test that librosa and tensorflow backends give matching results.

    For the 2 stems model, checks that:

    - the librosa STFT followed by its inverse reconstructs the waveform
      (up to an absolute tolerance),
    - the librosa STFT magnitude, once its first and last frames are
      dropped, matches the tensorflow spectrogram,
    - both backends return the same instruments, with non null and
      close separated signals.

    :param test_file: Audio descriptor of the file to load and separate.
    """
    adapter = get_default_audio_adapter()
    waveform, _ = adapter.load(test_file)

    # Use multiprocess=False like every other test of this module; this test
    # never writes files, so presumably no worker pool is needed here.
    separator_lib = Separator(
        "spleeter:2stems", stft_backend="librosa", multiprocess=False)
    separator_tf = Separator(
        "spleeter:2stems", stft_backend="tensorflow", multiprocess=False)

    # Test that the stft and inverse stft reconstruct the input waveform
    # (within atol, so not bit exact).
    stft_matrix = separator_lib._stft(waveform)
    reconstructed = separator_lib._stft(
        stft_matrix, inverse=True, length=waveform.shape[0])
    assert np.allclose(reconstructed, waveform, atol=1e-2)

    # Now also test that tensorflow and librosa STFT provide same results.
    from spleeter.audio.spectrogram import compute_spectrogram_tf
    tf_waveform = tf.convert_to_tensor(waveform, tf.float32)
    spectrogram_tf = compute_spectrogram_tf(
        tf_waveform,
        separator_tf._params['frame_length'],
        separator_tf._params['frame_step'],)
    with tf.Session() as sess:
        # Evaluate through the session explicitly instead of relying on the
        # implicit default session.
        spectrogram_tf_eval = sess.run(spectrogram_tf)

    # Check that stfts are equivalent up to the padding in the librosa case:
    # librosa output has two extra frames along the first axis.
    assert stft_matrix.shape[0] == spectrogram_tf_eval.shape[0] + 2
    assert stft_matrix.shape[1:] == spectrogram_tf_eval.shape[1:]
    assert np.allclose(
        np.abs(stft_matrix[1:-1]), spectrogram_tf_eval, atol=1e-2)

    # Compare both separations, they should be close.
    out_tf = separator_tf._separate_tensorflow(waveform, test_file)
    out_lib = separator_lib._separate_librosa(waveform, test_file)

    # Both backends must return exactly the same set of instruments.
    assert set(out_tf) == set(out_lib)

    for instrument in out_lib:
        # Test that both outputs are not null.
        assert np.sum(np.abs(out_tf[instrument])) > 1000
        assert np.sum(np.abs(out_lib[instrument])) > 1000
        assert np.allclose(out_tf[instrument], out_lib[instrument], atol=0.1)


@pytest.mark.parametrize('test_file, configuration, backend', TEST_CONFIGURATIONS)
def test_separate(test_file, configuration, backend):
    """ Check in-memory separation of a loaded waveform.

    The prediction must hold exactly the instruments expected for the
    model, and each separated track must share the waveform leading
    dimensions while differing from the input and from every other track.
    """
    expected = MODEL_TO_INST[configuration]
    waveform, _ = get_default_audio_adapter().load(test_file)
    separator = Separator(
        configuration,
        stft_backend=backend,
        multiprocess=False)
    prediction = separator.separate(waveform, test_file)

    # One entry per expected instrument, and nothing else.
    assert len(prediction) == len(expected)
    for name in expected:
        assert name in prediction

    for name in expected:
        track = prediction[name]
        assert waveform.shape[:-1] == track.shape[:-1]
        assert not np.allclose(waveform, track)
        # Compare against every other instrument, in both orders overall.
        others = [other for other in expected if other != name]
        for other in others:
            assert not np.allclose(track, prediction[other])
    

@pytest.mark.parametrize('test_file, configuration, backend', TEST_CONFIGURATIONS)
def test_separate_to_file(test_file, configuration, backend):
    """ Check that file based separation writes one wav per instrument. """
    expected = MODEL_TO_INST[configuration]
    separator = Separator(
        configuration,
        stft_backend=backend,
        multiprocess=False)
    # Input file name without directory nor extension.
    stem, _ = splitext(basename(test_file))
    with TemporaryDirectory() as output_dir:
        separator.separate_to_file(test_file, output_dir)
        for instrument in expected:
            relative_path = '{}/{}.wav'.format(stem, instrument)
            assert exists(join(output_dir, relative_path))


@pytest.mark.parametrize('test_file, configuration, backend', TEST_CONFIGURATIONS)
def test_filename_format(test_file, configuration, backend):
    """ Check that a custom filename format drives the output layout. """
    expected = MODEL_TO_INST[configuration]
    separator = Separator(
        configuration,
        stft_backend=backend,
        multiprocess=False)
    # Input file name without directory nor extension.
    stem, _ = splitext(basename(test_file))
    with TemporaryDirectory() as output_dir:
        separator.separate_to_file(
            test_file,
            output_dir,
            filename_format='export/{filename}/{instrument}.{codec}')
        for instrument in expected:
            relative_path = 'export/{}/{}.wav'.format(stem, instrument)
            assert exists(join(output_dir, relative_path))


@pytest.mark.parametrize('test_file, configuration', MODELS_AND_TEST_FILES)
def test_filename_conflict(test_file, configuration):
    """ Check that a static filename pattern raises a SpleeterError. """
    separator = Separator(configuration, multiprocess=False)
    # The pattern below has no placeholder at all.
    static_pattern = 'I wanna be your lover'
    with TemporaryDirectory() as output_dir, pytest.raises(SpleeterError):
        separator.separate_to_file(
            test_file, output_dir, filename_format=static_pattern)
test: add unit test for Separator class 2019-11-08 18:35:02 -05:00			`#!/usr/bin/env python`
			`# coding: utf8`

			`""" Unit testing for Separator class. """`

replace mail 2020-07-17 13:30:42 +02:00			`__email__ = 'spleeter@deezer.com'`
test: add unit test for Separator class 2019-11-08 18:35:02 -05:00			`__author__ = 'Deezer Research'`
			`__license__ = 'MIT License'`

refactor: Makefile test: improve separator test test: start pypi dist test 2019-11-14 14:44:19 -05:00			`import filecmp`
Adding support for mono files with librosa backend 2020-03-26 14:23:41 +01:00			`import itertools`
Fix file naming tuple bug 2019-11-23 15:42:40 -08:00			`from os.path import splitext, basename, exists, join`
test: add unit test for Separator class 2019-11-08 18:35:02 -05:00			`from tempfile import TemporaryDirectory`

fix: test parameters 2019-11-08 20:03:16 -05:00			`import pytest`
Updating tests to test for librosa backend 2020-02-27 15:38:46 +01:00			`import numpy as np`
fix: test parameters 2019-11-08 20:03:16 -05:00
Fixing tests when running in single process 2020-03-27 11:12:05 +01:00			`import tensorflow as tf`

test: add filename format tests 2019-11-20 15:18:53 +01:00			`from spleeter import SpleeterError`
test: add unit test for Separator class 2019-11-08 18:35:02 -05:00			`from spleeter.audio.adapter import get_default_audio_adapter`
			`from spleeter.separator import Separator`

Adding support for mono files with librosa backend 2020-03-26 14:23:41 +01:00			`TEST_AUDIO_DESCRIPTORS = ['audio_example.mp3', 'audio_example_mono.mp3']`
			`BACKENDS = ["tensorflow", "librosa"]`
			`MODELS = ['spleeter:2stems', 'spleeter:4stems', 'spleeter:5stems']`
Fixing tests when running in single process 2020-03-27 11:12:05 +01:00
Adding support for mono files with librosa backend 2020-03-26 14:23:41 +01:00			`MODEL_TO_INST = {`
			`'spleeter:2stems': ('vocals', 'accompaniment'),`
			`'spleeter:4stems': ('vocals', 'drums', 'bass', 'other'),`
			`'spleeter:5stems': ('vocals', 'drums', 'bass', 'piano', 'other'),`
			`}`


Fixing tests when running in single process 2020-03-27 11:12:05 +01:00			`MODELS_AND_TEST_FILES = list(itertools.product(TEST_AUDIO_DESCRIPTORS, MODELS))`
Adding support for mono files with librosa backend 2020-03-26 14:23:41 +01:00			`TEST_CONFIGURATIONS = list(itertools.product(TEST_AUDIO_DESCRIPTORS, MODELS, BACKENDS))`
test: add unit test for Separator class 2019-11-08 18:35:02 -05:00

Fixing tests when running in single process 2020-03-27 11:12:05 +01:00			`print("RUNNING TESTS WITH TF VERSION {}".format(tf.__version__))`

pep8 2020-06-18 18:12:43 +02:00
Fixing gltches issues with Istft 2020-06-18 18:01:03 +02:00			`@pytest.mark.parametrize('test_file', TEST_AUDIO_DESCRIPTORS)`
			`def test_separator_backends(test_file):`
			`adapter = get_default_audio_adapter()`
			`waveform, _ = adapter.load(test_file)`

			`separator_lib = Separator("spleeter:2stems", stft_backend="librosa")`
			`separator_tf = Separator("spleeter:2stems", stft_backend="tensorflow")`

			`# Test the stft and inverse stft provides exact reconstruction`
			`stft_matrix = separator_lib._stft(waveform)`
pep8 2020-06-18 18:12:43 +02:00			`reconstructed = separator_lib._stft(`
			`stft_matrix, inverse=True, length=waveform.shape[0])`
Fixing gltches issues with Istft 2020-06-18 18:01:03 +02:00			`assert np.allclose(reconstructed, waveform, atol=1e-2)`

			`# # now also test that tensorflow and librosa STFT provide same results`
			`from spleeter.audio.spectrogram import compute_spectrogram_tf`
			`tf_waveform = tf.convert_to_tensor(waveform, tf.float32)`
			`spectrogram_tf = compute_spectrogram_tf(tf_waveform,`
pep8 2020-06-18 18:12:43 +02:00			`separator_tf._params['frame_length'],`
			`separator_tf._params['frame_step'],)`
Fixing gltches issues with Istft 2020-06-18 18:01:03 +02:00			`with tf.Session() as sess:`
			`spectrogram_tf_eval = spectrogram_tf.eval()`

			`# check that stfts are equivalent up to the padding in the librosa case`
			`assert stft_matrix.shape[0] == spectrogram_tf_eval.shape[0] + 2`
			`assert stft_matrix.shape[1:] == spectrogram_tf_eval.shape[1:]`
pep8 2020-06-18 18:12:43 +02:00			`assert np.allclose(`
			`np.abs(stft_matrix[1:-1]), spectrogram_tf_eval, atol=1e-2)`
Fixing gltches issues with Istft 2020-06-18 18:01:03 +02:00
			`# compare both separation, it should be close`
			`out_tf = separator_tf._separate_tensorflow(waveform, test_file)`
			`out_lib = separator_lib._separate_librosa(waveform, test_file)`

			`for instrument in out_lib.keys():`
			`# test that both outputs are not null`
			`assert np.sum(np.abs(out_tf[instrument])) > 1000`
			`assert np.sum(np.abs(out_lib[instrument])) > 1000`
			`assert np.allclose(out_tf[instrument], out_lib[instrument], atol=0.1)`
Fixing tests when running in single process 2020-03-27 11:12:05 +01:00
pep8 2020-06-18 18:12:43 +02:00
correct fixtures 2020-03-26 14:27:19 +01:00			`@pytest.mark.parametrize('test_file, configuration, backend', TEST_CONFIGURATIONS)`
			`def test_separate(test_file, configuration, backend):`
test: add unit test for Separator class 2019-11-08 18:35:02 -05:00			`""" Test separation from raw data. """`
need to force flush the RAM in between pytest calls and avoid multiprocess 2020-06-26 11:03:41 +02:00			`instruments = MODEL_TO_INST[configuration]`
			`adapter = get_default_audio_adapter()`
			`waveform, _ = adapter.load(test_file)`
			`separator = Separator(configuration, stft_backend=backend, multiprocess=False)`
			`prediction = separator.separate(waveform, test_file)`
			`assert len(prediction) == len(instruments)`
			`for instrument in instruments:`
			`assert instrument in prediction`
			`for instrument in instruments:`
			`track = prediction[instrument]`
			`assert waveform.shape[:-1] == track.shape[:-1]`
			`assert not np.allclose(waveform, track)`
			`for compared in instruments:`
			`if instrument != compared:`
			`assert not np.allclose(track, prediction[compared])`

test: add unit test for Separator class 2019-11-08 18:35:02 -05:00

correct fixtures 2020-03-26 14:27:19 +01:00			`@pytest.mark.parametrize('test_file, configuration, backend', TEST_CONFIGURATIONS)`
			`def test_separate_to_file(test_file, configuration, backend):`
test: add unit test for Separator class 2019-11-08 18:35:02 -05:00			`""" Test file based separation. """`
need to force flush the RAM in between pytest calls and avoid multiprocess 2020-06-26 11:03:41 +02:00			`instruments = MODEL_TO_INST[configuration]`
			`separator = Separator(configuration, stft_backend=backend, multiprocess=False)`
			`name = splitext(basename(test_file))[0]`
			`with TemporaryDirectory() as directory:`
			`separator.separate_to_file(`
			`test_file,`
			`directory)`
			`for instrument in instruments:`
			`assert exists(join(`
			`directory,`
			`'{}/{}.wav'.format(name, instrument)))`
test: add filename format tests 2019-11-20 15:18:53 +01:00

correct fixtures 2020-03-26 14:27:19 +01:00			`@pytest.mark.parametrize('test_file, configuration, backend', TEST_CONFIGURATIONS)`
			`def test_filename_format(test_file, configuration, backend):`
test: add filename format tests 2019-11-20 15:18:53 +01:00			`""" Test custom filename format. """`
need to force flush the RAM in between pytest calls and avoid multiprocess 2020-06-26 11:03:41 +02:00			`instruments = MODEL_TO_INST[configuration]`
			`separator = Separator(configuration, stft_backend=backend, multiprocess=False)`
			`name = splitext(basename(test_file))[0]`
			`with TemporaryDirectory() as directory:`
			`separator.separate_to_file(`
			`test_file,`
			`directory,`
			`filename_format='export/{filename}/{instrument}.{codec}')`
			`for instrument in instruments:`
			`assert exists(join(`
test: add filename format tests 2019-11-20 15:18:53 +01:00			`directory,`
need to force flush the RAM in between pytest calls and avoid multiprocess 2020-06-26 11:03:41 +02:00			`'export/{}/{}.wav'.format(name, instrument)))`
test: add filename format tests 2019-11-20 15:18:53 +01:00

Fixing tests when running in single process 2020-03-27 11:12:05 +01:00			`@pytest.mark.parametrize('test_file, configuration', MODELS_AND_TEST_FILES)`
			`def test_filename_conflict(test_file, configuration):`
test: add filename format tests 2019-11-20 15:18:53 +01:00			`""" Test error handling with static pattern. """`
need to force flush the RAM in between pytest calls and avoid multiprocess 2020-06-26 11:03:41 +02:00			`separator = Separator(configuration, multiprocess=False)`
			`with TemporaryDirectory() as directory:`
			`with pytest.raises(SpleeterError):`
			`separator.separate_to_file(`
			`test_file,`
			`directory,`
			`filename_format='I wanna be your lover')`