REPETSIM

Rafii, Zafar, and Bryan Pardo. “Online REPET-SIM for real-time speech enhancement.” 2013 IEEE International Conference on Acoustics, Speech and Signal Processing. IEEE, 2013.

@inproceedings{rafii2013online,
  title={Online REPET-SIM for real-time speech enhancement},
  author={Rafii, Zafar and Pardo, Bryan},
  booktitle={2013 IEEE International Conference on Acoustics, Speech and Signal Processing},
  pages={848--852},
  year={2013},
  organization={IEEE}
}

[1]:

import nussl
import matplotlib.pyplot as plt
import time

# Start the wall-clock timer; a later cell reads `start_time` to report the
# total elapsed time for this example.
start_time = time.time()

# Fetch the example mixture (the download is skipped when a matching file is
# already present locally) and load it as an AudioSignal.
audio_path = nussl.efz_utils.download_audio_file('historyrepeating_7olLrex.wav')
audio_signal = nussl.AudioSignal(audio_path)

# Configure REPET-SIM to use binary masks, then run the separation.
# The result is indexed below as [0] -> background, [1] -> foreground.
separator = nussl.separation.primitive.RepetSim(
    audio_signal,
    mask_type='binary',
)
estimates = separator()

# Two stacked panels in one figure: source masks on top, waveforms below.
plt.figure(figsize=(10, 6))

plt.subplot(2, 1, 1)
nussl.utils.visualize_sources_as_masks(
    {'Background': estimates[0], 'Foreground': estimates[1]},
    y_axis='mel',
    db_cutoff=-60,
    alpha_amount=2.0,
)

plt.subplot(2, 1, 2)
nussl.utils.visualize_sources_as_waveform(
    {'Background': estimates[0], 'Foreground': estimates[1]},
    show_legend=False,
)

plt.show()

# Hand both estimates to nussl's multitrack utility, labelled in the same
# order as the estimates list.
nussl.play_utils.multitrack(estimates, ['Background', 'Foreground'])

Matching file found at /home/pseetharaman/.nussl/audio/historyrepeating_7olLrex.wav, skipping download.

../../_images/examples_primitives_repet_sim_1_1.png

[2]:

# Stop the timer started in the first cell. The measured span therefore
# covers everything that ran between the two time.time() calls.
end_time = time.time()
time_taken = end_time - start_time

# Report the elapsed wall-clock time with four decimal places.
elapsed_message = f'Time taken: {time_taken:.4f} seconds'
print(elapsed_message)

Time taken: 3.1563 seconds