@InProceedings{schulz-aziz-cohn:2018:Long,
  author    = {Schulz, Philip  and  Aziz, Wilker  and  Cohn, Trevor},
  title     = {A Stochastic Decoder for Neural Machine Translation},
  booktitle = {Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
  month     = {July},
  year      = {2018},
  address   = {Melbourne, Australia},
  publisher = {Association for Computational Linguistics},
  pages     = {1243--1252},
  abstract  = {The process of translation is ambiguous, in that there are typically many valid translations for a given sentence. This gives rise to significant variation in parallel corpora, however, most current models of machine translation do not account for this variation, instead treating the problem as a deterministic process. To this end, we present a deep generative model of machine translation which incorporates a chain of latent variables, in order to account for local lexical and syntactic variation in parallel corpora. We provide an in-depth analysis of the pitfalls encountered in variational inference for training deep generative models. Experiments on several different language pairs demonstrate that the model consistently improves over strong baselines.},
  url       = {http://www.aclweb.org/anthology/P18-1115}
}

