Recently, multilingual question answering became a crucial research topic,
and it is receiving increased interest in the NLP community. However, the
unavailability of large-scale datasets makes it challenging to train
multilingual QA systems with performance comparable to the English ones. In
this work, we develop the Translate Align Retrieve (TAR) method to
automatically translate the Stanford Question Answering Dataset (SQuAD) v1.1 to
Spanish. We then used this dataset to train Spanish QA systems by fine-tuning a
Multilingual-BERT model. Finally, we evaluated our QA models with the recently
proposed MLQA and XQuAD benchmarks for cross-lingual Extractive QA.
Experimental results show that our models outperform the previous
Multilingual-BERT baselines achieving the new state-of-the-art value of 68.1 F1
points on the Spanish MLQA corpus and 77.6 F1 and 61.8 Exact Match points on
the Spanish XQuAD corpus. The resulting, synthetically generated SQuAD-es v1.1
corpora, with almost 100\% of data contained in the original English version, to
the best of our knowledge, is the first large-scale QA training resource for
Spanish.
Description
[1912.05200] Automatic Spanish Translation of the SQuAD Dataset for Multilingual Question Answering
%0 Generic
%1 carrino2019automatic
%A Carrino, Casimiro Pio
%A Costa jussà, Marta R.
%A Fonollosa, José A. R.
%D 2019
%K dataset masterthesis qna squad
%T Automatic Spanish Translation of the SQuAD Dataset for Multilingual
Question Answering
%U http://arxiv.org/abs/1912.05200
%X Recently, multilingual question answering became a crucial research topic,
and it is receiving increased interest in the NLP community. However, the
unavailability of large-scale datasets makes it challenging to train
multilingual QA systems with performance comparable to the English ones. In
this work, we develop the Translate Align Retrieve (TAR) method to
automatically translate the Stanford Question Answering Dataset (SQuAD) v1.1 to
Spanish. We then used this dataset to train Spanish QA systems by fine-tuning a
Multilingual-BERT model. Finally, we evaluated our QA models with the recently
proposed MLQA and XQuAD benchmarks for cross-lingual Extractive QA.
Experimental results show that our models outperform the previous
Multilingual-BERT baselines achieving the new state-of-the-art value of 68.1 F1
points on the Spanish MLQA corpus and 77.6 F1 and 61.8 Exact Match points on
the Spanish XQuAD corpus. The resulting, synthetically generated SQuAD-es v1.1
corpora, with almost 100\% of data contained in the original English version, to
the best of our knowledge, is the first large-scale QA training resource for
Spanish.
@misc{carrino2019automatic,
abstract = {Recently, multilingual question answering became a crucial research topic,
and it is receiving increased interest in the NLP community. However, the
unavailability of large-scale datasets makes it challenging to train
multilingual QA systems with performance comparable to the English ones. In
this work, we develop the Translate Align Retrieve (TAR) method to
automatically translate the Stanford Question Answering Dataset (SQuAD) v1.1 to
Spanish. We then used this dataset to train Spanish QA systems by fine-tuning a
Multilingual-BERT model. Finally, we evaluated our QA models with the recently
proposed MLQA and XQuAD benchmarks for cross-lingual Extractive QA.
Experimental results show that our models outperform the previous
Multilingual-BERT baselines achieving the new state-of-the-art value of 68.1 F1
points on the Spanish MLQA corpus and 77.6 F1 and 61.8 Exact Match points on
the Spanish XQuAD corpus. The resulting, synthetically generated SQuAD-es v1.1
corpora, with almost 100\% of data contained in the original English version, to
the best of our knowledge, is the first large-scale QA training resource for
Spanish.},
added-at = {2020-12-19T15:45:30.000+0100},
author = {Carrino, Casimiro Pio and Costa jussà, Marta R. and Fonollosa, José A. R.},
biburl = {https://www.bibsonomy.org/bibtex/2f36a4d65cf37a253a447e7db2a9a97c5/festplatte},
description = {[1912.05200] Automatic Spanish Translation of the SQuAD Dataset for Multilingual Question Answering},
interhash = {4a509dbd6552cb3d2d8df15c4604cc90},
intrahash = {f36a4d65cf37a253a447e7db2a9a97c5},
keywords = {dataset masterthesis qna squad},
note = {cite arxiv:1912.05200Comment: Submitted to LREC 2020},
timestamp = {2020-12-19T15:48:37.000+0100},
title = {Automatic Spanish Translation of the SQuAD Dataset for Multilingual
Question Answering},
url = {http://arxiv.org/abs/1912.05200},
year = 2019
}