[{"status":"public","type":"conference","publication":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","language":[{"iso":"eng"}],"user_id":"72602","department":[{"_id":"54"},{"_id":"660"}],"project":[{"name":"TRR 318 - C06: TRR 318 - Technisch unterstütztes Erklären von Stimmcharakteristika (Teilprojekt C06)","_id":"129","grant_number":"438445824"}],"_id":"59999","citation":{"ama":"Rautenberg F, Kuhlmann M, Seebauer F, Wiechmann J, Wagner P, Haeb-Umbach R. Speech Synthesis along Perceptual Voice Quality Dimensions. In: <i>ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)</i>. IEEE; 2025. doi:<a href=\"https://doi.org/10.1109/icassp49660.2025.10888012\">10.1109/icassp49660.2025.10888012</a>","ieee":"F. Rautenberg, M. Kuhlmann, F. Seebauer, J. Wiechmann, P. Wagner, and R. Haeb-Umbach, “Speech Synthesis along Perceptual Voice Quality Dimensions,” presented at the IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), Hyderabad, India , 2025, doi: <a href=\"https://doi.org/10.1109/icassp49660.2025.10888012\">10.1109/icassp49660.2025.10888012</a>.","chicago":"Rautenberg, Frederik, Michael Kuhlmann, Fritz Seebauer, Jana Wiechmann, Petra Wagner, and Reinhold Haeb-Umbach. “Speech Synthesis along Perceptual Voice Quality Dimensions.” In <i>ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)</i>. IEEE, 2025. <a href=\"https://doi.org/10.1109/icassp49660.2025.10888012\">https://doi.org/10.1109/icassp49660.2025.10888012</a>.","short":"F. Rautenberg, M. Kuhlmann, F. Seebauer, J. Wiechmann, P. Wagner, R. Haeb-Umbach, in: ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), IEEE, 2025.","mla":"Rautenberg, Frederik, et al. “Speech Synthesis along Perceptual Voice Quality Dimensions.” <i>ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)</i>, IEEE, 2025, doi:<a href=\"https://doi.org/10.1109/icassp49660.2025.10888012\">10.1109/icassp49660.2025.10888012</a>.","bibtex":"@inproceedings{Rautenberg_Kuhlmann_Seebauer_Wiechmann_Wagner_Haeb-Umbach_2025, title={Speech Synthesis along Perceptual Voice Quality Dimensions}, DOI={<a href=\"https://doi.org/10.1109/icassp49660.2025.10888012\">10.1109/icassp49660.2025.10888012</a>}, booktitle={ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)}, publisher={IEEE}, author={Rautenberg, Frederik and Kuhlmann, Michael and Seebauer, Fritz and Wiechmann, Jana and Wagner, Petra and Haeb-Umbach, Reinhold}, year={2025} }","apa":"Rautenberg, F., Kuhlmann, M., Seebauer, F., Wiechmann, J., Wagner, P., &#38; Haeb-Umbach, R. (2025). Speech Synthesis along Perceptual Voice Quality Dimensions. <i>ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)</i>. IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), Hyderabad, India . <a href=\"https://doi.org/10.1109/icassp49660.2025.10888012\">https://doi.org/10.1109/icassp49660.2025.10888012</a>"},"year":"2025","publication_status":"published","conference":{"end_date":"2025-04-11","location":"Hyderabad, India ","name":"IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start_date":"2025-04-06"},"doi":"10.1109/icassp49660.2025.10888012","title":"Speech Synthesis along Perceptual Voice Quality Dimensions","author":[{"first_name":"Frederik","full_name":"Rautenberg, Frederik","id":"72602","last_name":"Rautenberg"},{"first_name":"Michael","full_name":"Kuhlmann, Michael","id":"49871","last_name":"Kuhlmann"},{"first_name":"Fritz","full_name":"Seebauer, Fritz","last_name":"Seebauer"},{"first_name":"Jana","last_name":"Wiechmann","full_name":"Wiechmann, Jana"},{"last_name":"Wagner","full_name":"Wagner, Petra","first_name":"Petra"},{"first_name":"Reinhold","full_name":"Haeb-Umbach, Reinhold","id":"242","last_name":"Haeb-Umbach"}],"date_created":"2025-05-20T08:17:22Z","publisher":"IEEE","date_updated":"2025-05-26T11:09:56Z"},{"conference":{"end_date":"2025-08-21","location":"Rotterdam","name":"Interspeech","start_date":"2025-08-17"},"doi":"10.21437/Interspeech.2025-1443","title":"Synthesizing Speech with Selected Perceptual Voice Qualities – A Case Study with Creaky Voice","author":[{"id":"72602","full_name":"Rautenberg, Frederik","last_name":"Rautenberg","first_name":"Frederik"},{"full_name":"Seebauer, Fritz","last_name":"Seebauer","first_name":"Fritz"},{"last_name":"Wiechmann","full_name":"Wiechmann, Jana","first_name":"Jana"},{"full_name":"Kuhlmann, Michael","id":"49871","last_name":"Kuhlmann","first_name":"Michael"},{"first_name":"Petra","full_name":"Wagner, Petra","last_name":"Wagner"},{"last_name":"Haeb-Umbach","id":"242","full_name":"Haeb-Umbach, Reinhold","first_name":"Reinhold"}],"date_created":"2025-08-28T08:39:01Z","date_updated":"2025-08-28T08:56:49Z","publisher":"ISCA","citation":{"ama":"Rautenberg F, Seebauer F, Wiechmann J, Kuhlmann M, Wagner P, Haeb-Umbach R. Synthesizing Speech with Selected Perceptual Voice Qualities – A Case Study with Creaky Voice. In: <i>Interspeech 2025</i>. ISCA; 2025. doi:<a href=\"https://doi.org/10.21437/Interspeech.2025-1443\">10.21437/Interspeech.2025-1443</a>","ieee":"F. Rautenberg, F. Seebauer, J. Wiechmann, M. Kuhlmann, P. Wagner, and R. Haeb-Umbach, “Synthesizing Speech with Selected Perceptual Voice Qualities – A Case Study with Creaky Voice,” presented at the Interspeech, Rotterdam, 2025, doi: <a href=\"https://doi.org/10.21437/Interspeech.2025-1443\">10.21437/Interspeech.2025-1443</a>.","chicago":"Rautenberg, Frederik, Fritz Seebauer, Jana Wiechmann, Michael Kuhlmann, Petra Wagner, and Reinhold Haeb-Umbach. “Synthesizing Speech with Selected Perceptual Voice Qualities – A Case Study with Creaky Voice.” In <i>Interspeech 2025</i>. ISCA, 2025. <a href=\"https://doi.org/10.21437/Interspeech.2025-1443\">https://doi.org/10.21437/Interspeech.2025-1443</a>.","apa":"Rautenberg, F., Seebauer, F., Wiechmann, J., Kuhlmann, M., Wagner, P., &#38; Haeb-Umbach, R. (2025). Synthesizing Speech with Selected Perceptual Voice Qualities – A Case Study with Creaky Voice. <i>Interspeech 2025</i>. Interspeech, Rotterdam. <a href=\"https://doi.org/10.21437/Interspeech.2025-1443\">https://doi.org/10.21437/Interspeech.2025-1443</a>","bibtex":"@inproceedings{Rautenberg_Seebauer_Wiechmann_Kuhlmann_Wagner_Haeb-Umbach_2025, title={Synthesizing Speech with Selected Perceptual Voice Qualities – A Case Study with Creaky Voice}, DOI={<a href=\"https://doi.org/10.21437/Interspeech.2025-1443\">10.21437/Interspeech.2025-1443</a>}, booktitle={Interspeech 2025}, publisher={ISCA}, author={Rautenberg, Frederik and Seebauer, Fritz and Wiechmann, Jana and Kuhlmann, Michael and Wagner, Petra and Haeb-Umbach, Reinhold}, year={2025} }","mla":"Rautenberg, Frederik, et al. “Synthesizing Speech with Selected Perceptual Voice Qualities – A Case Study with Creaky Voice.” <i>Interspeech 2025</i>, ISCA, 2025, doi:<a href=\"https://doi.org/10.21437/Interspeech.2025-1443\">10.21437/Interspeech.2025-1443</a>.","short":"F. Rautenberg, F. Seebauer, J. Wiechmann, M. Kuhlmann, P. Wagner, R. Haeb-Umbach, in: Interspeech 2025, ISCA, 2025."},"year":"2025","language":[{"iso":"eng"}],"department":[{"_id":"54"},{"_id":"660"}],"user_id":"72602","_id":"61047","project":[{"name":"TRR 318; TP C06: Technisch unterstütztes Erklären von Stimmcharakteristika","_id":"129"}],"status":"public","publication":"Interspeech 2025","type":"conference"},{"year":"2024","citation":{"apa":"Xie, Y., Kuhlmann, M., Rautenberg, F., Tan, Z.-H., &#38; Häb-Umbach, R. (2024). Speaker and Style Disentanglement of Speech Based on Contrastive Predictive Coding Supported Factorized Variational Autoencoder. <i>2024 32nd European Signal Processing Conference (EUSIPCO)</i>, 436–440.","short":"Y. Xie, M. Kuhlmann, F. Rautenberg, Z.-H. Tan, R. Häb-Umbach, in: 2024 32nd European Signal Processing Conference (EUSIPCO), 2024, pp. 436–440.","bibtex":"@inproceedings{Xie_Kuhlmann_Rautenberg_Tan_Häb-Umbach_2024, title={Speaker and Style Disentanglement of Speech Based on Contrastive Predictive Coding Supported Factorized Variational Autoencoder}, booktitle={2024 32nd European Signal Processing Conference (EUSIPCO)}, author={Xie, Yuying and Kuhlmann, Michael and Rautenberg, Frederik and Tan, Zheng-Hua and Häb-Umbach, Reinhold}, year={2024}, pages={436–440} }","mla":"Xie, Yuying, et al. “Speaker and Style Disentanglement of Speech Based on Contrastive Predictive Coding Supported Factorized Variational Autoencoder.” <i>2024 32nd European Signal Processing Conference (EUSIPCO)</i>, 2024, pp. 436–440.","chicago":"Xie, Yuying, Michael Kuhlmann, Frederik Rautenberg, Zheng-Hua Tan, and Reinhold Häb-Umbach. “Speaker and Style Disentanglement of Speech Based on Contrastive Predictive Coding Supported Factorized Variational Autoencoder.” In <i>2024 32nd European Signal Processing Conference (EUSIPCO)</i>, 436–440, 2024.","ieee":"Y. Xie, M. Kuhlmann, F. Rautenberg, Z.-H. Tan, and R. Häb-Umbach, “Speaker and Style Disentanglement of Speech Based on Contrastive Predictive Coding Supported Factorized Variational Autoencoder,” in <i>2024 32nd European Signal Processing Conference (EUSIPCO)</i>, 2024, pp. 436–440.","ama":"Xie Y, Kuhlmann M, Rautenberg F, Tan Z-H, Häb-Umbach R. Speaker and Style Disentanglement of Speech Based on Contrastive Predictive Coding Supported Factorized Variational Autoencoder. In: <i>2024 32nd European Signal Processing Conference (EUSIPCO)</i>. ; 2024:436–440."},"page":"436–440","title":"Speaker and Style Disentanglement of Speech Based on Contrastive Predictive Coding Supported Factorized Variational Autoencoder","date_updated":"2024-11-15T06:54:40Z","author":[{"first_name":"Yuying","full_name":"Xie, Yuying","last_name":"Xie"},{"first_name":"Michael","last_name":"Kuhlmann","full_name":"Kuhlmann, Michael","id":"49871"},{"id":"72602","full_name":"Rautenberg, Frederik","last_name":"Rautenberg","first_name":"Frederik"},{"first_name":"Zheng-Hua","full_name":"Tan, Zheng-Hua","last_name":"Tan"},{"id":"242","full_name":"Häb-Umbach, Reinhold","last_name":"Häb-Umbach","first_name":"Reinhold"}],"date_created":"2024-11-15T06:52:54Z","status":"public","type":"conference","publication":"2024 32nd European Signal Processing Conference (EUSIPCO)","language":[{"iso":"eng"}],"_id":"57099","user_id":"49871","department":[{"_id":"54"}]},{"external_id":{"arxiv":["2310.12599"]},"ddc":["000"],"language":[{"iso":"eng"}],"publication":"ITG Conference on Speech Communication","abstract":[{"text":"Unsupervised speech disentanglement aims at separating fast varying from\r\nslowly varying components of a speech signal. In this contribution, we take a\r\ncloser look at the embedding vector representing the slowly varying signal\r\ncomponents, commonly named the speaker embedding vector. We ask, which\r\nproperties of a speaker's voice are captured and investigate to which extent do\r\nindividual embedding vector components sign responsible for them, using the\r\nconcept of Shapley values. Our findings show that certain speaker-specific\r\nacoustic-phonetic properties can be fairly well predicted from the speaker\r\nembedding, while the investigated more abstract voice quality features cannot.","lang":"eng"}],"file":[{"date_updated":"2023-10-20T08:20:58Z","date_created":"2023-10-20T08:20:58Z","creator":"frra","file_size":272390,"file_id":"48359","access_level":"closed","file_name":"arxiv.pdf","content_type":"application/pdf","success":1,"relation":"main_file"}],"date_created":"2023-10-20T08:04:46Z","title":"On Feature Importance and Interpretability of Speaker Representations","year":"2023","project":[{"_id":"129","name":"TRR 318 - C06: TRR 318 - Technisch unterstütztes Erklären von Stimmcharakteristika (Teilprojekt C06)","grant_number":"438445824"}],"_id":"48355","user_id":"72602","department":[{"_id":"54"},{"_id":"660"}],"file_date_updated":"2023-10-20T08:20:58Z","type":"conference","status":"public","date_updated":"2023-11-22T13:44:33Z","oa":"1","author":[{"last_name":"Rautenberg","id":"72602","full_name":"Rautenberg, Frederik","first_name":"Frederik"},{"last_name":"Kuhlmann","id":"49871","full_name":"Kuhlmann, Michael","first_name":"Michael"},{"last_name":"Wiechmann","full_name":"Wiechmann, Jana","first_name":"Jana"},{"first_name":"Fritz","last_name":"Seebauer","full_name":"Seebauer, Fritz"},{"first_name":"Petra","last_name":"Wagner","full_name":"Wagner, Petra"},{"last_name":"Haeb-Umbach","id":"242","full_name":"Haeb-Umbach, Reinhold","first_name":"Reinhold"}],"main_file_link":[{"url":"https://arxiv.org/abs/2310.12599","open_access":"1"}],"conference":{"name":"ITG Conference on Speech Communication","start_date":"2023-09-20","end_date":"2023-09-22","location":"Aachen"},"has_accepted_license":"1","citation":{"apa":"Rautenberg, F., Kuhlmann, M., Wiechmann, J., Seebauer, F., Wagner, P., &#38; Haeb-Umbach, R. (2023). On Feature Importance and Interpretability of Speaker Representations. <i>ITG Conference on Speech Communication</i>. ITG Conference on Speech Communication, Aachen.","mla":"Rautenberg, Frederik, et al. “On Feature Importance and Interpretability of Speaker Representations.” <i>ITG Conference on Speech Communication</i>, 2023.","short":"F. Rautenberg, M. Kuhlmann, J. Wiechmann, F. Seebauer, P. Wagner, R. Haeb-Umbach, in: ITG Conference on Speech Communication, 2023.","bibtex":"@inproceedings{Rautenberg_Kuhlmann_Wiechmann_Seebauer_Wagner_Haeb-Umbach_2023, title={On Feature Importance and Interpretability of Speaker Representations}, booktitle={ITG Conference on Speech Communication}, author={Rautenberg, Frederik and Kuhlmann, Michael and Wiechmann, Jana and Seebauer, Fritz and Wagner, Petra and Haeb-Umbach, Reinhold}, year={2023} }","ieee":"F. Rautenberg, M. Kuhlmann, J. Wiechmann, F. Seebauer, P. Wagner, and R. Haeb-Umbach, “On Feature Importance and Interpretability of Speaker Representations,” presented at the ITG Conference on Speech Communication, Aachen, 2023.","chicago":"Rautenberg, Frederik, Michael Kuhlmann, Jana Wiechmann, Fritz Seebauer, Petra Wagner, and Reinhold Haeb-Umbach. “On Feature Importance and Interpretability of Speaker Representations.” In <i>ITG Conference on Speech Communication</i>, 2023.","ama":"Rautenberg F, Kuhlmann M, Wiechmann J, Seebauer F, Wagner P, Haeb-Umbach R. On Feature Importance and Interpretability of Speaker Representations. In: <i>ITG Conference on Speech Communication</i>. ; 2023."}},{"language":[{"iso":"eng"}],"file_date_updated":"2023-10-24T08:03:27Z","ddc":["040"],"department":[{"_id":"54"},{"_id":"660"}],"user_id":"72602","_id":"48410","project":[{"name":"TRR 318 - C06: TRR 318 - Technisch unterstütztes Erklären von Stimmcharakteristika (Teilprojekt C06)","_id":"129","grant_number":"438445824"}],"status":"public","file":[{"date_updated":"2023-10-24T08:03:27Z","date_created":"2023-10-24T08:03:27Z","creator":"frra","file_size":209980,"file_id":"48413","file_name":"188.pdf","access_level":"closed","content_type":"application/pdf","success":1,"relation":"main_file"}],"publication":"20th International Congress of the Phonetic Sciences (ICPhS) ","type":"conference","conference":{"start_date":"2023-08-07","end_date":"2023-08-11"},"main_file_link":[{"open_access":"1"}],"title":"Explaining voice characteristics to novice voice practitioners-How successful is it?","date_created":"2023-10-24T08:05:40Z","author":[{"first_name":"Jana","last_name":"Wiechmann","full_name":"Wiechmann, Jana"},{"first_name":"Frederik","full_name":"Rautenberg, Frederik","id":"72602","last_name":"Rautenberg"},{"first_name":"Petra","full_name":"Wagner, Petra","last_name":"Wagner"},{"full_name":"Haeb-Umbach, Reinhold","id":"242","last_name":"Haeb-Umbach","first_name":"Reinhold"}],"oa":"1","date_updated":"2023-11-22T13:44:59Z","citation":{"chicago":"Wiechmann, Jana, Frederik Rautenberg, Petra Wagner, and Reinhold Haeb-Umbach. “Explaining Voice Characteristics to Novice Voice Practitioners-How Successful Is It?” In <i>20th International Congress of the Phonetic Sciences (ICPhS) </i>, 2023.","ieee":"J. Wiechmann, F. Rautenberg, P. Wagner, and R. Haeb-Umbach, “Explaining voice characteristics to novice voice practitioners-How successful is it?,” 2023.","ama":"Wiechmann J, Rautenberg F, Wagner P, Haeb-Umbach R. Explaining voice characteristics to novice voice practitioners-How successful is it? In: <i>20th International Congress of the Phonetic Sciences (ICPhS) </i>. ; 2023.","mla":"Wiechmann, Jana, et al. “Explaining Voice Characteristics to Novice Voice Practitioners-How Successful Is It?” <i>20th International Congress of the Phonetic Sciences (ICPhS) </i>, 2023.","bibtex":"@inproceedings{Wiechmann_Rautenberg_Wagner_Haeb-Umbach_2023, title={Explaining voice characteristics to novice voice practitioners-How successful is it?}, booktitle={20th International Congress of the Phonetic Sciences (ICPhS) }, author={Wiechmann, Jana and Rautenberg, Frederik and Wagner, Petra and Haeb-Umbach, Reinhold}, year={2023} }","short":"J. Wiechmann, F. Rautenberg, P. Wagner, R. Haeb-Umbach, in: 20th International Congress of the Phonetic Sciences (ICPhS) , 2023.","apa":"Wiechmann, J., Rautenberg, F., Wagner, P., &#38; Haeb-Umbach, R. (2023). Explaining voice characteristics to novice voice practitioners-How successful is it? <i>20th International Congress of the Phonetic Sciences (ICPhS) </i>."},"year":"2023","has_accepted_license":"1"},{"publication_status":"published","has_accepted_license":"1","year":"2023","citation":{"ama":"Rautenberg F, Kuhlmann M, Ebbers J, et al. Speech Disentanglement for Analysis and Modification of Acoustic and Perceptual Speaker Characteristics. In: <i>Fortschritte Der Akustik - DAGA 2023</i>. ; 2023:1409-1412.","chicago":"Rautenberg, Frederik, Michael Kuhlmann, Janek Ebbers, Jana Wiechmann, Fritz Seebauer, Petra Wagner, and Reinhold Haeb-Umbach. “Speech Disentanglement for Analysis and Modification of Acoustic and Perceptual Speaker Characteristics.” In <i>Fortschritte Der Akustik - DAGA 2023</i>, 1409–12, 2023.","ieee":"F. Rautenberg <i>et al.</i>, “Speech Disentanglement for Analysis and Modification of Acoustic and Perceptual Speaker Characteristics,” in <i>Fortschritte der Akustik - DAGA 2023</i>, Hamburg, 2023, pp. 1409–1412.","apa":"Rautenberg, F., Kuhlmann, M., Ebbers, J., Wiechmann, J., Seebauer, F., Wagner, P., &#38; Haeb-Umbach, R. (2023). Speech Disentanglement for Analysis and Modification of Acoustic and Perceptual Speaker Characteristics. <i>Fortschritte Der Akustik - DAGA 2023</i>, 1409–1412.","bibtex":"@inproceedings{Rautenberg_Kuhlmann_Ebbers_Wiechmann_Seebauer_Wagner_Haeb-Umbach_2023, title={Speech Disentanglement for Analysis and Modification of Acoustic and Perceptual Speaker Characteristics}, booktitle={Fortschritte der Akustik - DAGA 2023}, author={Rautenberg, Frederik and Kuhlmann, Michael and Ebbers, Janek and Wiechmann, Jana and Seebauer, Fritz and Wagner, Petra and Haeb-Umbach, Reinhold}, year={2023}, pages={1409–1412} }","mla":"Rautenberg, Frederik, et al. “Speech Disentanglement for Analysis and Modification of Acoustic and Perceptual Speaker Characteristics.” <i>Fortschritte Der Akustik - DAGA 2023</i>, 2023, pp. 1409–12.","short":"F. Rautenberg, M. Kuhlmann, J. Ebbers, J. Wiechmann, F. Seebauer, P. Wagner, R. Haeb-Umbach, in: Fortschritte Der Akustik - DAGA 2023, 2023, pp. 1409–1412."},"page":"1409-1412","date_updated":"2024-02-29T17:05:16Z","oa":"1","author":[{"last_name":"Rautenberg","full_name":"Rautenberg, Frederik","id":"72602","first_name":"Frederik"},{"first_name":"Michael","id":"49871","full_name":"Kuhlmann, Michael","last_name":"Kuhlmann"},{"full_name":"Ebbers, Janek","id":"34851","last_name":"Ebbers","first_name":"Janek"},{"first_name":"Jana","full_name":"Wiechmann, Jana","last_name":"Wiechmann"},{"last_name":"Seebauer","full_name":"Seebauer, Fritz","first_name":"Fritz"},{"full_name":"Wagner, Petra","last_name":"Wagner","first_name":"Petra"},{"first_name":"Reinhold","full_name":"Haeb-Umbach, Reinhold","id":"242","last_name":"Haeb-Umbach"}],"date_created":"2023-05-15T08:48:54Z","title":"Speech Disentanglement for Analysis and Modification of Acoustic and Perceptual Speaker Characteristics","main_file_link":[{"open_access":"1","url":"https://pub.dega-akustik.de/DAGA_2023/data/articles/000105.pdf"}],"conference":{"start_date":"2023-03-06","name":"DAGA 2023 - 49. Jahrestagung für Akustik","location":"Hamburg","end_date":"2023-03-09"},"type":"conference","publication":"Fortschritte der Akustik - DAGA 2023","file":[{"relation":"main_file","content_type":"application/pdf","file_size":289493,"file_name":"Daga_2023_Rautenberg_Paper.pdf","access_level":"open_access","file_id":"52221","date_updated":"2024-02-29T16:15:12Z","creator":"frra","date_created":"2024-02-29T16:15:12Z"}],"status":"public","project":[{"name":"TRR 318 - C06: TRR 318 - Technisch unterstütztes Erklären von Stimmcharakteristika (Teilprojekt C06)","_id":"129","grant_number":"438445824"}],"_id":"44849","user_id":"72602","department":[{"_id":"54"},{"_id":"660"}],"ddc":["000"],"language":[{"iso":"eng"}],"file_date_updated":"2024-02-29T16:15:12Z"},{"citation":{"chicago":"Wiechmann, Jana, Thomas Glarner, Frederik Rautenberg, Petra Wagner, and Reinhold Haeb-Umbach. “Technically Enabled Explaining of Voice Characteristics.” In <i>18. Phonetik Und Phonologie Im Deutschsprachigen Raum (P&#38;P)</i>, 2022.","ieee":"J. Wiechmann, T. Glarner, F. Rautenberg, P. Wagner, and R. Haeb-Umbach, “Technically enabled explaining of voice characteristics,” Bielefeld, 2022.","ama":"Wiechmann J, Glarner T, Rautenberg F, Wagner P, Haeb-Umbach R. Technically enabled explaining of voice characteristics. In: <i>18. Phonetik Und Phonologie Im Deutschsprachigen Raum (P&#38;P)</i>. ; 2022.","apa":"Wiechmann, J., Glarner, T., Rautenberg, F., Wagner, P., &#38; Haeb-Umbach, R. (2022). Technically enabled explaining of voice characteristics. <i>18. Phonetik Und Phonologie Im Deutschsprachigen Raum (P&#38;P)</i>.","short":"J. Wiechmann, T. Glarner, F. Rautenberg, P. Wagner, R. Haeb-Umbach, in: 18. Phonetik Und Phonologie Im Deutschsprachigen Raum (P&#38;P), 2022.","mla":"Wiechmann, Jana, et al. “Technically Enabled Explaining of Voice Characteristics.” <i>18. Phonetik Und Phonologie Im Deutschsprachigen Raum (P&#38;P)</i>, 2022.","bibtex":"@inproceedings{Wiechmann_Glarner_Rautenberg_Wagner_Haeb-Umbach_2022, title={Technically enabled explaining of voice characteristics}, booktitle={18. Phonetik und Phonologie im deutschsprachigen Raum (P&#38;P)}, author={Wiechmann, Jana and Glarner, Thomas and Rautenberg, Frederik and Wagner, Petra and Haeb-Umbach, Reinhold}, year={2022} }"},"year":"2022","has_accepted_license":"1","conference":{"end_date":"2022-10-07","location":"Bielefeld","start_date":"2022-10-06"},"title":"Technically enabled explaining of voice characteristics","date_created":"2022-10-12T07:10:03Z","author":[{"first_name":"Jana","last_name":"Wiechmann","full_name":"Wiechmann, Jana"},{"first_name":"Thomas","full_name":"Glarner, Thomas","last_name":"Glarner"},{"first_name":"Frederik","last_name":"Rautenberg","full_name":"Rautenberg, Frederik","id":"72602"},{"first_name":"Petra","last_name":"Wagner","full_name":"Wagner, Petra"},{"first_name":"Reinhold","last_name":"Haeb-Umbach","id":"242","full_name":"Haeb-Umbach, Reinhold"}],"date_updated":"2023-11-22T13:45:30Z","oa":"1","file":[{"content_type":"application/pdf","relation":"main_file","date_created":"2022-10-12T07:09:26Z","creator":"huesera","date_updated":"2022-10-12T07:09:26Z","access_level":"open_access","file_name":"PP_2022_paper_8911.pdf","file_id":"33697","file_size":109294}],"status":"public","type":"conference","publication":"18. Phonetik und Phonologie im deutschsprachigen Raum (P&P)","file_date_updated":"2022-10-12T07:09:26Z","language":[{"iso":"eng"}],"ddc":["000"],"user_id":"72602","department":[{"_id":"54"},{"_id":"660"}],"project":[{"name":"TRR 318 - C06: TRR 318 - Technisch unterstütztes Erklären von Stimmcharakteristika (Teilprojekt C06)","_id":"129","grant_number":"438445824"}],"_id":"33696"},{"type":"conference","status":"public","_id":"44843","user_id":"40767","department":[{"_id":"54"}],"file_date_updated":"2023-11-15T15:29:32Z","has_accepted_license":"1","citation":{"ieee":"C. Boeddeker, F. Rautenberg, and R. Haeb-Umbach, “A Comparison and Combination of Unsupervised Blind Source Separation  Techniques,” presented at the ITG Conference on Speech Communication, Kiel, 2021.","chicago":"Boeddeker, Christoph, Frederik Rautenberg, and Reinhold Haeb-Umbach. “A Comparison and Combination of Unsupervised Blind Source Separation  Techniques.” In <i>ITG Conference on Speech Communication</i>, 2021.","ama":"Boeddeker C, Rautenberg F, Haeb-Umbach R. A Comparison and Combination of Unsupervised Blind Source Separation  Techniques. In: <i>ITG Conference on Speech Communication</i>. ; 2021.","apa":"Boeddeker, C., Rautenberg, F., &#38; Haeb-Umbach, R. (2021). A Comparison and Combination of Unsupervised Blind Source Separation  Techniques. <i>ITG Conference on Speech Communication</i>. ITG Conference on Speech Communication, Kiel.","bibtex":"@inproceedings{Boeddeker_Rautenberg_Haeb-Umbach_2021, title={A Comparison and Combination of Unsupervised Blind Source Separation  Techniques}, booktitle={ITG Conference on Speech Communication}, author={Boeddeker, Christoph and Rautenberg, Frederik and Haeb-Umbach, Reinhold}, year={2021} }","mla":"Boeddeker, Christoph, et al. “A Comparison and Combination of Unsupervised Blind Source Separation  Techniques.” <i>ITG Conference on Speech Communication</i>, 2021.","short":"C. Boeddeker, F. Rautenberg, R. Haeb-Umbach, in: ITG Conference on Speech Communication, 2021."},"date_updated":"2023-11-15T15:29:32Z","oa":"1","author":[{"last_name":"Boeddeker","full_name":"Boeddeker, Christoph","id":"40767","first_name":"Christoph"},{"id":"72602","full_name":"Rautenberg, Frederik","last_name":"Rautenberg","first_name":"Frederik"},{"last_name":"Haeb-Umbach","full_name":"Haeb-Umbach, Reinhold","id":"242","first_name":"Reinhold"}],"main_file_link":[{"open_access":"1","url":"https://arxiv.org/pdf/2106.05627.pdf"}],"conference":{"location":"Kiel","name":"ITG Conference on Speech Communication"},"publication":"ITG Conference on Speech Communication","abstract":[{"text":"Unsupervised blind source separation methods do not require a training phase\r\nand thus cannot suffer from a train-test mismatch, which is a common concern in\r\nneural network based source separation. The unsupervised techniques can be\r\ncategorized in two classes, those building upon the sparsity of speech in the\r\nShort-Time Fourier transform domain and those exploiting non-Gaussianity or\r\nnon-stationarity of the source signals. In this contribution, spatial mixture\r\nmodels which fall in the first category and independent vector analysis (IVA)\r\nas a representative of the second category are compared w.r.t. their separation\r\nperformance and the performance of a downstream speech recognizer on a\r\nreverberant dataset of reasonable size. Furthermore, we introduce a serial\r\nconcatenation of the two, where the result of the mixture model serves as\r\ninitialization of IVA, which achieves significantly better WER performance than\r\neach algorithm individually and even approaches the performance of a much more\r\ncomplex neural network based technique.","lang":"eng"}],"file":[{"relation":"main_file","content_type":"application/pdf","file_size":295972,"file_name":"2106.05627.pdf","access_level":"open_access","file_id":"44856","date_updated":"2023-11-15T15:29:32Z","creator":"frra","date_created":"2023-05-16T08:37:31Z"}],"external_id":{"arxiv":["2106.05627"]},"ddc":["000"],"language":[{"iso":"eng"}],"year":"2021","date_created":"2023-05-15T07:59:33Z","title":"A Comparison and Combination of Unsupervised Blind Source Separation  Techniques"}]
