{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,8]],"date-time":"2025-09-08T05:56:31Z","timestamp":1757310991866,"version":"3.28.0"},"reference-count":32,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,11]]},"DOI":"10.1109\/iscslp.2018.8706700","type":"proceedings-article","created":{"date-parts":[[2019,5,20]],"date-time":"2019-05-20T22:58:35Z","timestamp":1558393115000},"page":"270-274","source":"Crossref","is-referenced-by-count":6,"title":["Formosa Speech Recognition Challenge 2018: Data, Plan and Baselines"],"prefix":"10.1109","author":[{"given":"Yuan-Fu","family":"Liao","sequence":"first","affiliation":[]},{"given":"Wu-Hua","family":"Hsu","sequence":"additional","affiliation":[]},{"given":"Yu-Chen","family":"Lin","sequence":"additional","affiliation":[]},{"given":"Yung-Hsiang Shawn","family":"Chang","sequence":"additional","affiliation":[]},{"given":"Matus","family":"Pleva","sequence":"additional","affiliation":[]},{"given":"Jozef","family":"Juhar","sequence":"additional","affiliation":[]},{"given":"Guang-Feng","family":"Deng","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref32","first-page":"1","article-title":"Low latency acoustic modeling using temporal convolution and LSTMs","author":"peddinti","year":"2017","journal-title":"IEEE Signal Process Lett"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2011.03.001"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-595"},{"key":"ref10","first-page":"687","article-title":"The MGB challenge: Evaluating multi-genre broadcast media recognition","author":"bell","year":"2016","journal-title":"2015 IEEE Work Autom Speech Recognit Understanding ASRU 2015 - Proc"},{"journal-title":"National Education Radio","year":"2018","key":"ref11"},{"journal-title":"PTS","year":"2018","key":"ref12"},{"journal-title":"OpenCourseWare (OCW) National Chiao Tung University of Technology","year":"2018","key":"ref13"},{"year":"2018","key":"ref14"},{"journal-title":"Junyi Academy","year":"2018","key":"ref15"},{"journal-title":"Formosa Grand Challenge Talk to AI","year":"2018","key":"ref16"},{"journal-title":"Formosa Speech in the Wild Corpus","year":"0","author":"liao","key":"ref17"},{"key":"ref18","article-title":"Computer-coding the IPA: a proposed extension of SAMPA","author":"wells","year":"0","journal-title":"UCL Phonetics Linguist"},{"key":"ref19","first-page":"54","article-title":"Phonetic modeling in the Philips Chinese continuous-speech recognition system","author":"seide","year":"1998","journal-title":"ISCSLP 1998"},{"key":"ref28","first-page":"2","article-title":"A time delay neural network architecture for efficient modeling of long temporal contexts","author":"peddinti","year":"2015","journal-title":"InterSpeech"},{"journal-title":"Exploring neural transducers for end-to-end speech recognition","year":"2017","author":"battenberg","key":"ref4"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2010.2064307"},{"journal-title":"Cold Fusion Training Seq2Seq Models Together with Language Models","year":"2017","author":"sriram","key":"ref3"},{"journal-title":"Achieving human parity in conversational speech recognition","year":"2016","author":"xiong","key":"ref6"},{"key":"ref29","first-page":"3","volume":"2","author":"ko","year":"0","journal-title":"Audio augmentation for speech recognition"},{"journal-title":"The Microsoft 2017 conversational speech recognition system","year":"2017","author":"xiong","key":"ref5"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1768"},{"key":"ref7","doi-asserted-by":"crossref","first-page":"1183","DOI":"10.21437\/Interspeech.2017-721","article-title":"Deep Clustering-based Beamforming for Separation with Unknown Number of Sources","volume":"2017","author":"higuchi","year":"2017","journal-title":"Proc Interspeech 2017"},{"key":"ref2","first-page":"3","author":"chiu","year":"2017","journal-title":"State-of-the-art speech recognition with sequence-to-sequence models"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2017.8268952"},{"journal-title":"ACLCLP Database HomePage","year":"2018","key":"ref1"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICSDA.2017.8384450"},{"key":"ref22","first-page":"1","article-title":"The Kaldi speech recognition toolkit","author":"povey","year":"2011","journal-title":"IEEE Workshop Automatic Speech Recognition Understanding"},{"journal-title":"Praat Doing phonetics by computer","year":"2018","key":"ref21"},{"journal-title":"Kaldi Speech Recognition Toolkit GitHub Pull Request #2474","year":"0","key":"ref24"},{"journal-title":"The demo recipes of the Formosa Speech Recognition Challenge 2018","year":"0","author":"liao","key":"ref23"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICSDA.2017.8384449"},{"journal-title":"Word List with Accumulated Word Frequency in Sinica Corpus","year":"2018","key":"ref25"}],"event":{"name":"2018 11th International Symposium on Chinese Spoken Language Processing (ISCSLP)","start":{"date-parts":[[2018,11,26]]},"location":"Taipei City, Taiwan","end":{"date-parts":[[2018,11,29]]}},"container-title":["2018 11th International Symposium on Chinese Spoken Language Processing (ISCSLP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8701133\/8706262\/08706700.pdf?arnumber=8706700","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,8,24]],"date-time":"2020-08-24T06:15:37Z","timestamp":1598249737000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8706700\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,11]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/iscslp.2018.8706700","relation":{},"subject":[],"published":{"date-parts":[[2018,11]]}}}