% Workshop paper (WLSI/OIAF4HLT 2016) on a Kaldi recipe for Vietnamese ASR.
% Proper nouns and acronyms are brace-protected so sentence-casing styles keep
% their capitals; month uses the predefined macro so styles can abbreviate or
% localize it. The abstract wording is left unchanged (only re-wrapped).
@inproceedings{luong-vu:2016:WLSI-OIAF4HLT2016,
  author    = {Luong, Hieu-Thi and Vu, Hai-Quan},
  title     = {A non-expert {Kaldi} recipe for {Vietnamese} Speech Recognition System},
  booktitle = {Proceedings of the Third International Workshop on Worldwide Language Service Infrastructure and Second Workshop on Open Infrastructures and Analysis Frameworks for Human Language Technologies ({WLSI/OIAF4HLT2016})},
  month     = dec,
  year      = {2016},
  address   = {Osaka, Japan},
  publisher = {The COLING 2016 Organizing Committee},
  pages     = {51--55},
  abstract  = {In this paper we describe a non-expert setup for Vietnamese speech
               recognition system using Kaldi toolkit. We collected a speech corpus
               over fifteen hours from about fifty Vietnamese native speakers and
               using it to test the feasibility of our setup. The essential
               linguistic components for the Automatic Speech Recognition (ASR)
               system was prepared basing on the written form of the language
               instead of expertise knowledge on linguistic and phonology as
               commonly seen in rich resource languages like English. The modeling
               of tones by integrating them into the phoneme and using the phonetic
               decision tree is also discussed. Experimental results showed this
               setup for ASR systems does yield competitive results while still
               have potentials for further improvements.},
  url       = {http://aclweb.org/anthology/W16-5207},
}

