% Conference paper from IberSPEECH 2016, published in the LNCS series (volume 10077).
% The note field carries the funding identifiers and the conference dates from the
% original export; the hash and percent signs in it are escaped so that the field
% can be typeset by LaTeX without breaking the bibliography.
@inproceedings{6d497813f1e44587bbd81ba52dca6a55,
  author    = {Miranda, Jo{\~a}o and Astudillo, Ram{\'o}n and Costa, {\^A}ngela and Silva, Andr{\'e} and Silva, Hugo and Gra{\c{c}}a, Jo{\~a}o and Raj, Bhiksha},
  title     = {Crowdsourced Video Subtitling with Adaptation Based on User-Corrected Lattices},
  editor    = {Abad, Alberto},
  booktitle = {International Conference on Advances in Speech and Language Technologies for {Iberian} Languages},
  series    = {Lecture Notes in Computer Science},
  volume    = {10077},
  pages     = {138--147},
  publisher = {Springer},
  year      = {2016},
  isbn      = {978-3-319-49168-4},
  doi       = {10.1007/978-3-319-49169-1_14},
  language  = {English},
  keywords  = {Automatic Speech Recognition, Error Analysis},
  note      = {info:eu-repo/grantAgreement/FCT/5876/147282/PT\# info:eu-repo/grantAgreement/FCT/SFRH/SFRH\%2FBPD\%2F68428\%2F2010/PT\# info:eu-repo/grantAgreement/FCT/5665-PICT/137166/PT\# info:eu-repo/grantAgreement/FCT/SFRH/SFRH\%2FBD\%2F85737\%2F2012/PT\#; International Conference on Advances in Speech and Language Technologies for Iberian Languages, IberSPEECH 2016; Conference date: 23-11-2016 through 25-11-2016},
  abstract  = {This paper investigates an approach for fast hybrid human and machine video subtitling based on lattice disambiguation and posterior model adaptation. The approach aims at correcting Automatic Speech Recognition (ASR) transcriptions requiring minimal effort from the user and facilitating user corrections from smart-phone devices. Our approach is based on three key concepts. Firstly, only a portion of the data is sent to the user for correction. Secondly, user action is limited to selecting from a fixed set of options extracted from the ASR word lattice. Thirdly, user feedback is used to update the ASR parameters and further enhance performance. To investigate the potential and limitations of this approach, we carry out experiments employing simulated and real user corrections of TED talks videos. Simulated corrections include both the true reference and the best combination of the options shown to the user. Real corrections are obtained from 30 editors through a special purpose web-interface displaying the options for small video segments. We analyze the fixed option approach and the trade-off between model adaptation and increasing the amount of corrected data.},
}