{"citation":{"bibtex":"@inproceedings{Boeddeker_Rautenberg_Haeb-Umbach_2021, title={A Comparison and Combination of Unsupervised Blind Source Separation Techniques}, booktitle={ITG Conference on Speech Communication}, author={Boeddeker, Christoph and Rautenberg, Frederik and Haeb-Umbach, Reinhold}, year={2021} }","apa":"Boeddeker, C., Rautenberg, F., & Haeb-Umbach, R. (2021). A Comparison and Combination of Unsupervised Blind Source Separation Techniques. ITG Conference on Speech Communication. ITG Conference on Speech Communication, Kiel.","short":"C. Boeddeker, F. Rautenberg, R. Haeb-Umbach, in: ITG Conference on Speech Communication, 2021.","mla":"Boeddeker, Christoph, et al. “A Comparison and Combination of Unsupervised Blind Source Separation Techniques.” ITG Conference on Speech Communication, 2021.","ieee":"C. Boeddeker, F. Rautenberg, and R. Haeb-Umbach, “A Comparison and Combination of Unsupervised Blind Source Separation Techniques,” presented at the ITG Conference on Speech Communication, Kiel, 2021.","ama":"Boeddeker C, Rautenberg F, Haeb-Umbach R. A Comparison and Combination of Unsupervised Blind Source Separation Techniques. In: ITG Conference on Speech Communication. ; 2021.","chicago":"Boeddeker, Christoph, Frederik Rautenberg, and Reinhold Haeb-Umbach. “A Comparison and Combination of Unsupervised Blind Source Separation Techniques.” In ITG Conference on Speech Communication, 2021."},"main_file_link":[{"open_access":"1","url":"https://arxiv.org/pdf/2106.05627.pdf"}],"publication":"ITG Conference on Speech Communication","ddc":["000"],"file_date_updated":"2023-11-15T15:29:32Z","has_accepted_license":"1","_id":"44843","user_id":"40767","year":"2021","file":[{"date_created":"2023-05-16T08:37:31Z","content_type":"application/pdf","relation":"main_file","creator":"frra","file_size":295972,"access_level":"open_access","file_name":"2106.05627.pdf","date_updated":"2023-11-15T15:29:32Z","file_id":"44856"}],"author":[{"full_name":"Boeddeker, Christoph","id":"40767","last_name":"Boeddeker","first_name":"Christoph"},{"first_name":"Frederik","last_name":"Rautenberg","id":"72602","full_name":"Rautenberg, Frederik"},{"last_name":"Haeb-Umbach","full_name":"Haeb-Umbach, Reinhold","id":"242","first_name":"Reinhold"}],"abstract":[{"text":"Unsupervised blind source separation methods do not require a training phase\r\nand thus cannot suffer from a train-test mismatch, which is a common concern in\r\nneural network based source separation. The unsupervised techniques can be\r\ncategorized in two classes, those building upon the sparsity of speech in the\r\nShort-Time Fourier transform domain and those exploiting non-Gaussianity or\r\nnon-stationarity of the source signals. In this contribution, spatial mixture\r\nmodels which fall in the first category and independent vector analysis (IVA)\r\nas a representative of the second category are compared w.r.t. their separation\r\nperformance and the performance of a downstream speech recognizer on a\r\nreverberant dataset of reasonable size. Furthermore, we introduce a serial\r\nconcatenation of the two, where the result of the mixture model serves as\r\ninitialization of IVA, which achieves significantly better WER performance than\r\neach algorithm individually and even approaches the performance of a much more\r\ncomplex neural network based technique.","lang":"eng"}],"title":"A Comparison and Combination of Unsupervised Blind Source Separation Techniques","language":[{"iso":"eng"}],"conference":{"name":"ITG Conference on Speech Communication","location":"Kiel"},"date_created":"2023-05-15T07:59:33Z","department":[{"_id":"54"}],"oa":"1","status":"public","external_id":{"arxiv":["2106.05627"]},"type":"conference","date_updated":"2023-11-15T15:29:32Z"}