We present work on the automatic generation of question-answer pairs in Portuguese, useful, for instance, for populating the knowledge base of question-answering systems. This includes: (i) a new corpus of close to 600 factoid sentences, manually created from an existing corpus of questions and answers, used as our benchmark; (ii) two approaches for the automatic generation of question-answer pairs, which can be seen as baselines; (iii) results of those approaches on the corpus.
% Conference paper in SLATE 2020 (OASIcs volume 83), published by Schloss Dagstuhl.
% Accents use the brace-wrapped "special character" form so classic BibTeX sorts
% and labels the names correctly; only case-sensitive words in titles are braced.
@inproceedings{ferreira_et_al:OASIcs.SLATE.2020.16,
  author    = {Ferreira, Jo{\~a}o and Rodrigues, Ricardo and Gon{\c{c}}alo Oliveira, Hugo},
  title     = {Assessing Factoid Question-Answer Generation for {Portuguese}},
  booktitle = {9th Symposium on Languages, Applications and Technologies ({SLATE} 2020)},
  editor    = {Sim{\~o}es, Alberto and Henriques, Pedro Rangel and Queir{\'o}s, Ricardo},
  series    = {Open Access Series in Informatics ({OASIcs})},
  volume    = {83},
  pages     = {16:1--16:9},
  publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
  address   = {Dagstuhl, Germany},
  year      = {2020},
  isbn      = {978-3-95977-165-8},
  issn      = {2190-6807},
  doi       = {10.4230/OASIcs.SLATE.2020.16},
  url       = {https://drops.dagstuhl.de/entities/document/10.4230/OASIcs.SLATE.2020.16},
  urn       = {urn:nbn:de:0030-drops-130298},
  annote    = {Keywords: Question-Answer Generation, Corpus, NLP, Portuguese},
}
Feedback for Dagstuhl Publishing