Parallel text alignment is a key procedure in the area of automated translation. A large number of aligners have been presented over the years, but these require that the target resources have been prepared for alignment in advance (either manually or automatically). It is quite common to encounter mixed-language documents, that is, documents where the same information is written in many languages (e.g., manuals of electronic devices, tourist information, and PhD theses with dual-language abstracts). In this article we present MLT-prealigner: a tool aimed at helping those who need to process mixed texts in order to feed alignment tools and other related language systems.
@comment{
  Conference paper, pages 283--290 of OASIcs volume 38.
  Accented letters use the brace-wrapped special-character form so that
  classic BibTeX sorts and labels the names correctly. Only the tool name
  in the title is brace-protected; the style decides the remaining casing.
}
@inproceedings{carvalho_et_al:OASIcs.SLATE.2014.283,
  author    = {Carvalho, Pedro and Almeida, Jos{\'e} Jo{\~a}o},
  title     = {{MLT-prealigner}: a Tool for Multilingual Text Alignment},
  booktitle = {3rd Symposium on Languages, Applications and Technologies},
  editor    = {Pereira, Maria Jo{\~a}o Varanda and Leal, Jos{\'e} Paulo and Sim{\~o}es, Alberto},
  series    = {Open Access Series in Informatics (OASIcs)},
  volume    = {38},
  pages     = {283--290},
  year      = {2014},
  publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
  address   = {Dagstuhl, Germany},
  isbn      = {978-3-939897-68-2},
  issn      = {2190-6807},
  doi       = {10.4230/OASIcs.SLATE.2014.283},
  url       = {https://drops.dagstuhl.de/entities/document/10.4230/OASIcs.SLATE.2014.283},
  urn       = {urn:nbn:de:0030-drops-45776},
  annote    = {Keywords: parallel corpora, multilingual text alignment, language detection, Perl, automated translation},
}
Feedback for Dagstuhl Publishing