REPETSIM

Rafii, Zafar, and Bryan Pardo. “Online REPET-SIM for real-time speech enhancement.” 2013 IEEE International Conference on Acoustics, Speech and Signal Processing. IEEE, 2013.

@inproceedings{rafii2013online,
  author       = {Rafii, Zafar and Pardo, Bryan},
  title        = {Online {REPET-SIM} for real-time speech enhancement},
  booktitle    = {2013 {IEEE} International Conference on Acoustics, Speech and Signal Processing},
  pages        = {848--852},
  year         = {2013},
  organization = {IEEE}
}
[1]:
import nussl
import matplotlib.pyplot as plt
import time

# Start the wall-clock timer; a later cell reads start_time to report the elapsed time.
start_time = time.time()

# Resolve the example mixture by name and wrap it in an AudioSignal.
audio_path = nussl.efz_utils.download_audio_file('historyrepeating_7olLrex.wav')
audio_signal = nussl.AudioSignal(audio_path)

# Configure RepetSim with binary masks, then call the separator to get the estimates.
separator = nussl.separation.primitive.RepetSim(audio_signal, mask_type='binary')
estimates = separator()

# Label the first two estimates once; both plots below use the same mapping.
sources = {'Background': estimates[0], 'Foreground': estimates[1]}

plt.figure(figsize=(10, 6))

# Top panel: the sources drawn as masks on a mel-scaled axis.
plt.subplot(2, 1, 1)
nussl.utils.visualize_sources_as_masks(
    sources, y_axis='mel', db_cutoff=-60, alpha_amount=2.0)

# Bottom panel: the sources drawn as waveforms, legend suppressed.
plt.subplot(2, 1, 2)
nussl.utils.visualize_sources_as_waveform(sources, show_legend=False)
plt.show()

# Embed a multitrack player for the separated estimates.
nussl.play_utils.multitrack(estimates, ['Background', 'Foreground'])
Matching file found at /home/pseetharaman/.nussl/audio/historyrepeating_7olLrex.wav, skipping download.
../../_images/examples_primitives_repet_sim_1_1.png
[2]:
# Report the wall-clock seconds elapsed since start_time was recorded.
time_taken = time.time() - start_time
print(f'Time taken: {time_taken:.4f} seconds')
Time taken: 3.1563 seconds