@article {Krawczyk-Becker1603_2016, year = {2016}, author = {Krawczyk-Becker, Martin and Gerkmann, Timo}, title = {Fundamental Frequency Informed Speech Enhancement in a Flexible Statistical Framework}, journal = {IEEE Trans. Aud. Sp. Lang. Proc.}, volume = {24}, number = {5}, DOI = {10.1109/TASLP.2016.2533867}, ISSN = {2329-9290 }, abstract = {Conventional statistical clean speech estimators, like the Wiener filter, are frequently used for the spectro-temporal enhancement of noise corrupted speech. Most of these approaches estimate the clean speech independently for each time-frequency point, neglecting the structure of the underlying speech sound. In this work, we derive a statistical estimator that explicitly takes into account information about the characteristic structure of voiced speech by means of a harmonic signal model. To this end, we also present a way to estimate a harmonic model-based clean speech representation and the corresponding error variance directly in the short-time Fourier transform domain. The resulting estimator is optimal in the minimum-mean-squared error sense and can conveniently be formulated in terms of a multichannel Wiener filter. The proposed estimator outperforms several reference algorithms in terms of speech quality and intelligibility as predicted by instrumental measures. }, note = {INSPEC Accession Number: 15874620 } }