REPETSIM¶
Rafii, Zafar, and Bryan Pardo. “Online REPET-SIM for real-time speech enhancement.” 2013 IEEE International Conference on Acoustics, Speech and Signal Processing. IEEE, 2013.
@inproceedings{rafii2013online,
title={Online REPET-SIM for real-time speech enhancement},
author={Rafii, Zafar and Pardo, Bryan},
booktitle={2013 IEEE International Conference on Acoustics, Speech and Signal Processing},
pages={848--852},
year={2013},
organization={IEEE}
}
[1]:
import nussl
import matplotlib.pyplot as plt
import time
start_time = time.time()
audio_path = nussl.efz_utils.download_audio_file(
'historyrepeating_7olLrex.wav')
audio_signal = nussl.AudioSignal(audio_path)
separator = nussl.separation.primitive.RepetSim(
audio_signal, mask_type='binary')
estimates = separator()
plt.figure(figsize=(10, 6))
plt.subplot(211)
nussl.utils.visualize_sources_as_masks({
'Background': estimates[0], 'Foreground': estimates[1]},
y_axis='mel', db_cutoff=-60, alpha_amount=2.0)
plt.subplot(212)
nussl.utils.visualize_sources_as_waveform({
'Background': estimates[0], 'Foreground': estimates[1]},
show_legend=False)
plt.show()
nussl.play_utils.multitrack(estimates, ['Background', 'Foreground'])
Matching file found at /home/pseetharaman/.nussl/audio/historyrepeating_7olLrex.wav, skipping download.
[2]:
end_time = time.time()
time_taken = end_time - start_time
print(f'Time taken: {time_taken:.4f} seconds')
Time taken: 3.1563 seconds