Citation

BibTeX format

% Journal article: Green et al. (2022), Trends in Hearing, volume 26.
@article{Green:2022:10.1177/23312165211068629,
  author  = {Green, T and Hilkhuysen, G and Huckvale, M and Rosen, S and Brookes, M and Moore, A and Naylor, P and Lightburn, L and Xue, W},
  title   = {Speech recognition with a hearing-aid processing scheme combining beamforming with mask-informed speech enhancement},
  journal = {Trends in Hearing},
  volume  = {26},
  pages   = {1--16},
  year    = {2022},
  issn    = {2331-2165},
  doi     = {10.1177/23312165211068629},
  url     = {https://doi.org/10.1177/23312165211068629},
}

RIS format (EndNote, RefMan)

TY  - JOUR
AB  - A signal processing approach combining beamforming with mask-informed speech enhancement was assessed by measuring sentence recognition in listeners with mild-to-moderate hearing impairment in adverse listening conditions that simulated the output of behind-the-ear hearing aids in a noisy classroom. Two types of beamforming were compared: binaural, with the two microphones of each aid treated as a single array, and bilateral, where independent left and right beamformers were derived. Binaural beamforming produces a narrower beam, maximising improvement in signal-to-noise ratio (SNR), but eliminates the spatial diversity that is preserved in bilateral beamforming. Each beamformer type was optimised for the true target position and implemented with and without additional speech enhancement in which spectral features extracted from the beamformer output were passed to a deep neural network trained to identify time-frequency regions dominated by target speech. Additional conditions comprising binaural beamforming combined with speech enhancement implemented using Wiener filtering or modulation-domain Kalman filtering were tested in normally-hearing (NH) listeners. Both beamformer types gave substantial improvements relative to no processing, with significantly greater benefit for binaural beamforming. Performance with additional mask-informed enhancement was poorer than with beamforming alone, for both beamformer types and both listener groups. In NH listeners the addition of mask-informed enhancement produced significantly poorer performance than both other forms of enhancement, neither of which differed from the beamformer alone. In summary, the additional improvement in SNR provided by binaural beamforming appeared to outweigh loss of spatial information, while speech understanding was not further improved by the mask-informed enhancement method implemented here.
AU  - Green,T
AU  - Hilkhuysen,G
AU  - Huckvale,M
AU  - Rosen,S
AU  - Brookes,M
AU  - Moore,A
AU  - Naylor,P
AU  - Lightburn,L
AU  - Xue,W
DO  - 10.1177/23312165211068629
EP  - 16
PY  - 2022///
SN  - 2331-2165
SP  - 1
TI  - Speech recognition with a hearing-aid processing scheme combining beamforming with mask-informed speech enhancement
T2  - Trends in Hearing
UR  - http://dx.doi.org/10.1177/23312165211068629
UR  - http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2&SrcApp=PARTNER_APP&SrcAuth=LinksAMR&KeyUT=WOS:000740680100001&DestLinkType=FullRecord&DestApp=ALL_WOS&UsrCustomerID=1ba7043ffcc86c417c072aa74d649202
UR  - https://journals.sagepub.com/doi/10.1177/23312165211068629
UR  - http://hdl.handle.net/10044/1/93637
VL  - 26
ER  - 

Contact us

Address

Speech and Audio Processing Lab
CSP Group, EEE Department
Imperial College London

Exhibition Road, London, SW7 2AZ, United Kingdom

Email

p.naylor@imperial.ac.uk