This repository covers expectation-maximization (EM) algorithms to separate speech sources in multi-channel recordings.
In particular, the repository contains methods to integrate Deep Clustering (a neural network-based source separation algorithm) with a probabilistic spatial mixture model, as proposed in the paper "Tight integration of spatial and spectral features for BSS with Deep Clustering embeddings", presented at Interspeech 2017 in Stockholm.
@InProceedings{Drude2017DeepClusteringIntegration,
Title = {Tight integration of spatial and spectral features for {BSS} with {Deep Clustering} embeddings},
Author = {Drude, Lukas and Haeb-Umbach, Reinhold},
Booktitle = {INTERSPEECH 2017, Stockholm, Sweden},
Year = {2017},
Month = aug
}