{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T16:44:58Z","timestamp":1755794698230,"version":"3.28.0"},"reference-count":36,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,3]]},"DOI":"10.1109\/icassp.2016.7472804","type":"proceedings-article","created":{"date-parts":[[2016,6,24]],"date-time":"2016-06-24T01:58:30Z","timestamp":1466733510000},"page":"5875-5879","source":"Crossref","is-referenced-by-count":5,"title":["Data selection from multiple ASR systems' hypotheses for unsupervised acoustic model training"],"prefix":"10.1109","author":[{"given":"Sheng","family":"Li","sequence":"first","affiliation":[]},{"given":"Yuya","family":"Akita","sequence":"additional","affiliation":[]},{"given":"Tatsuya","family":"Kawahara","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.2307\/2006193"},{"key":"ref32","article-title":"Fast speaker normalization and adaptation based on BIC for meeting speech recognition","author":"mimura","year":"2011","journal-title":"Proc APSIPA ASC"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/P14-2042"},{"key":"ref30","article-title":"Discriminative Joint Modeling of Lexical Variation and Acoustic Confusion for Automated Narrative Retelling Assessment","author":"lehr","year":"2013","journal-title":"Proc NAACL"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1121\/1.4768800"},{"key":"ref35","article-title":"Modeling Characters versus Words for Mandarin Speech Recognition","author":"luo","year":"2009","journal-title":"Proc ICASSP"},{"key":"ref34","first-page":"1022","article-title":"Multi-interval discretization of continuous attributes for classification learning","author":"fayyad","year":"1993","journal-title":"Proc IJCAI"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/89.906002"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2004.1326105"},{"key":"ref12","first-page":"495","article-title":"Finding Consensus Among Words: Lattice-Based Word Error Minimization","author":"mangu","year":"0","journal-title":"Proc Eurospeech'99"},{"key":"ref13","article-title":"Posterior probability decoding, confidence estimation and system combination","author":"evermann","year":"2000","journal-title":"NIST Speech Transcription Workshop"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2014.2303295"},{"key":"ref15","article-title":"Ensemble deep learning for speech recognition","author":"deng","year":"2014","journal-title":"Proc INTERSPEECH"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.1997.659110"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2004.1326105"},{"key":"ref18","article-title":"Conditional random fields: Probabilistic models for segmenting and labeling sequence data","author":"lafferty","year":"2001","journal-title":"Proc ICML"},{"key":"ref19","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2011-352","article-title":"Combining Information Sources for Confidence Estimation with CRF Models","author":"seigel","year":"2011","journal-title":"Proc INTERSPEECH"},{"key":"ref28","article-title":"The Kaldi speech recognition toolkit","author":"povey","year":"2011","journal-title":"ASRU IEEE"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2013.6707741"},{"key":"ref27","first-page":"3526","article-title":"Discriminative data selection for lightly supervised training of acoustic model using closed caption texts","author":"li","year":"2015","journal-title":"Proc INTERSPEECH"},{"key":"ref3","first-page":"2360","article-title":"Semi-supervised GMM and DNN acoustic model training with multi-system combination and confidence re-calibration","author":"huang","year":"2013","journal-title":"Proc INTERSPEECH"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6854214"},{"key":"ref29","article-title":"ASR error dection in a conversational spoken language translation system","author":"chen","year":"2013","journal-title":"Proc ICASSP"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6854014"},{"key":"ref8","first-page":"455","volume":"45","author":"jiang","year":"2005","journal-title":"Confidence measures for speech recognition a survey Speech Communication"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2009.03.004"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2013.6707758"},{"key":"ref9","doi-asserted-by":"crossref","first-page":"827","DOI":"10.21437\/Eurospeech.1997-281","article-title":"Estimating confidence using word lattices","volume":"2","author":"kemp","year":"1997","journal-title":"Proc EUROSPEECH"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2010.02.014"},{"key":"ref20","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2010-96","article-title":"CRF-based combination of contextual features to improve a posteriori wordlevel confidence measures","author":"fayolle","year":"2010","journal-title":"Proc INTERSPEECH"},{"key":"ref22","doi-asserted-by":"crossref","first-page":"232","DOI":"10.21437\/Interspeech.2008-71","article-title":"iCNC and iROVER: The Limits of Improving System Combination with Classification?","author":"hoffmeister","year":"2008","journal-title":"Proc INTERSPEECH"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.3115\/1614108.1614125"},{"key":"ref24","first-page":"2781","article-title":"A Comparative Study on Speech Summarization of Broadcast News and Lecture Speech","author":"zhang","year":"2007","journal-title":"Proc INTERSPEECH"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ISCSLP.2014.6936595"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1006\/csla.2001.0186"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2009.4960682"}],"event":{"name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2016,3,20]]},"location":"Shanghai","end":{"date-parts":[[2016,3,25]]}},"container-title":["2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7465907\/7471614\/07472804.pdf?arnumber=7472804","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,6,17]],"date-time":"2024-06-17T21:27:17Z","timestamp":1718659637000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7472804\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,3]]},"references-count":36,"URL":"https:\/\/doi.org\/10.1109\/icassp.2016.7472804","relation":{},"subject":[],"published":{"date-parts":[[2016,3]]}}}