% Conference paper (BRACIS 2021 proceedings); entry cleaned up from an automated export.
% The citation key is kept unchanged so that existing citations keep resolving.
% NOTE(review): address should ideally be the publisher's city, not a country -- TODO confirm and replace.
@inproceedings{a0d95c87c1eb46ec9798af37e1eeaada,
  author    = {Jos{\'e}, Marcelo Archanjo and Cozman, Fabio Gagliardi},
  title     = {{mRAT-SQL+GAP}: A {Portuguese} {Text-to-SQL} Transformer},
  booktitle = {Intelligent Systems - 10th {Brazilian} Conference, {BRACIS} 2021, Proceedings, Part 2},
  editor    = {Britto, Andr{\'e} and Valdivia Delgado, Karina},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  address   = {Germany},
  year      = {2021},
  pages     = {511--525},
  doi       = {10.1007/978-3-030-91699-2_35},
  isbn      = {9783030916985},
  language  = {English},
  keywords  = {BART, BERTimbau, Deep learning, NL2SQL, RAT-SQL+GAP, Spider dataset},
  note      = {Publisher Copyright: {\textcopyright} 2021, Springer Nature Switzerland AG.; Conference date: 29-11-2021 Through 03-12-2021},
  abstract  = {The translation of natural language questions to SQL queries has attracted growing attention, in particular in connection with transformers and similar language models. A large number of techniques are geared towards the English language; in this work, we thus investigated translation to SQL when input questions are given in the Portuguese language. To do so, we properly adapted state-of-the-art tools and resources. We changed the RAT-SQL+GAP system by relying on a multilingual BART model (we report tests with other language models), and we produced a translated version of the Spider dataset. Our experiments expose interesting phenomena that arise when non-English languages are targeted; in particular, it is better to train with original and translated training datasets together, even if a single target language is desired. This multilingual BART model fine-tuned with a double-size training dataset (English and Portuguese) achieved 83\% of the baseline, making inferences for the Portuguese test dataset. This investigation can help other researchers to produce results in Machine Learning in a language different from English. Our multilingual ready version of RAT-SQL+GAP and the data are available, open-sourced as mRAT-SQL+GAP at: https://github.com/C4AI/gap-text2sql.},
}