C. Herff, G. Johnson, L. Diener, J. Shih, D. Krusienski, T. Schultz
Reference:
Towards direct speech synthesis from ECoG: A pilot study (C. Herff, G. Johnson, L. Diener, J. Shih, D. Krusienski, T. Schultz), at EMBC 2016 - 38th Annual International Conference of the IEEE Engineering in Medicine and Biology Society, August 2016
Bibtex Entry:
@inproceedings{herff2016towards,
title = {Towards direct speech synthesis from ECoG: A pilot study},
author = {Herff, C. and Johnson, G. and Diener, L. and Shih, J. and Krusienski, D. and
Schultz, T.},
year = 2016,
month = aug,
booktitle = {{EMBC} 2016 - 38th Annual International Conference of the IEEE Engineering in
Medicine and Biology Society},
doi = {0.1109/EMBC.2016.7591004},
abstract = {Most current Brain-Computer Interfaces (BCIs) achieve high information transfer
rates using spelling paradigms based on stimulus-evoked potentials. Despite the success of this
interfaces, this mode of communication can be cumbersome and unnatural. Direct synthesis of
speech from neural activity represents a more natural mode of communi- cation that would enable
users to convey verbal messages in real-time. In this pilot study with one participant, we
demonstrate that electrocoticography (ECoG) intracranial activity from temporal areas can be
used to resynthesize speech in real-time. This is accomplished by reconstructing the audio
magnitude spectrogram from neural activity and subsequently creating the audio waveform from
these reconstructed spectrograms. We show that significant correlations between the original and
reconstructed spectrograms and temporal waveforms can be achieved. While this pilot study uses
audibly spoken speech for the models, it represents a first step towards speech synthesis from
speech imagery.},
url = {https://halcy.de/cites/pdf/herff2016towards.pdf},
poster = {https://halcy.de/cites/pdf/herff2016towards_poster.pdf},
}