Neural machine translation is a relatively new approach to statistical machine translation based purely on neural networks. The neural machine translation models often consist of an encoder and a decoder. The encoder extracts a fixed-length representation from a variable-length input sentence, and the decoder generates a correct translation from this representation. In this paper, we focus on analyzing the properties of the neural machine translation using two models; RNN Encoder--Decoder and a newly proposed gated recursive convolutional neural network. We show that the neural machine translation performs relatively well on short sentences without unknown words, but its performance degrades rapidly as the length of the sentence and the number of unknown words increase. Furthermore, we find that the proposed gated recursive convolutional network learns a grammatical structure of a sentence automatically.
:C$\backslash$:/Users/Usuario/AppData/Local/Mendeley Ltd./Mendeley Desktop/Downloaded/Cho et al. - 2014 - On the Properties of Neural Machine Translation Encoder-Decoder Approaches.pdf:pdf
%0 Journal Article
%1 Cho2014
%A Cho, Kyunghyun
%A van Merrienboer, Bart
%A Bahdanau, Dzmitry
%A Bengio, Yoshua
%D 2014
%J CoRR
%K final thema:personalized_top-n
%T On the Properties of Neural Machine Translation: Encoder-Decoder Approaches
%U http://arxiv.org/abs/1409.1259
%X Neural machine translation is a relatively new approach to statistical machine translation based purely on neural networks. The neural machine translation models often consist of an encoder and a decoder. The encoder extracts a fixed-length representation from a variable-length input sentence, and the decoder generates a correct translation from this representation. In this paper, we focus on analyzing the properties of the neural machine translation using two models; RNN Encoder--Decoder and a newly proposed gated recursive convolutional neural network. We show that the neural machine translation performs relatively well on short sentences without unknown words, but its performance degrades rapidly as the length of the sentence and the number of unknown words increase. Furthermore, we find that the proposed gated recursive convolutional network learns a grammatical structure of a sentence automatically.
% arXiv preprint 1409.1259 (Cho, van Merrienboer, Bahdanau, Bengio; 2014).
% The title is stored without terminal punctuation so the bibliography style supplies it.
@article{Cho2014,
  abstract      = {Neural machine translation is a relatively new approach to statistical machine translation based purely on neural networks. The neural machine translation models often consist of an encoder and a decoder. The encoder extracts a fixed-length representation from a variable-length input sentence, and the decoder generates a correct translation from this representation. In this paper, we focus on analyzing the properties of the neural machine translation using two models; RNN Encoder--Decoder and a newly proposed gated recursive convolutional neural network. We show that the neural machine translation performs relatively well on short sentences without unknown words, but its performance degrades rapidly as the length of the sentence and the number of unknown words increase. Furthermore, we find that the proposed gated recursive convolutional network learns a grammatical structure of a sentence automatically.},
  added-at      = {2021-01-20T22:50:15.000+0100},
  archiveprefix = {arXiv},
  arxivid       = {1409.1259v2},
  author        = {Cho, Kyunghyun and van Merrienboer, Bart and Bahdanau, Dzmitry and Bengio, Yoshua},
  biburl        = {https://www.bibsonomy.org/bibtex/23c5e897e8d06d579ba82b22464279c91/helenaf},
  eprint        = {1409.1259v2},
  file          = {:C$\backslash$:/Users/Usuario/AppData/Local/Mendeley Ltd./Mendeley Desktop/Downloaded/Cho et al. - 2014 - On the Properties of Neural Machine Translation Encoder-Decoder Approaches.pdf:pdf},
  interhash     = {762b86f271d539b0c572e58174401369},
  intrahash     = {3c5e897e8d06d579ba82b22464279c91},
  journal       = {CoRR},
  keywords      = {final thema:personalized_top-n},
  mendeley-tags = {MTM16,ciencia{\_}computacional,traducci{\'{o}}n{\_}autom{\'{a}}tica{\_}neuronal},
  month         = oct,
  timestamp     = {2021-01-20T22:50:15.000+0100},
  title         = {On the Properties of Neural Machine Translation: Encoder-Decoder Approaches},
  url           = {http://arxiv.org/abs/1409.1259},
  year          = {2014},
}