In this paper we describe the methodology and evaluation of the expansion of Galnet - the Galician wordnet - using a multilingual Bible through lexical alignment and semantic annotation. For this experiment we used the Galician, Portuguese, Spanish, Catalan and English versions of the Bible. They were annotated with part-of-speech tags and WordNet senses using FreeLing. The resulting synsets were aligned, and new variants for the Galician language were extracted. After manual evaluation, the approach achieved an accuracy of 96.8%.
@comment{Conference paper in the SLATE 2018 proceedings (OASIcs volume 62). Accents use the brace-wrapped special-character form so classic BibTeX sorts and labels names correctly. Only proper nouns in the title are brace-protected so styles can still apply their own casing. NOTE(review): the second author and fourth editor are entered with the compound surname "Gomez Guinovart" (given name "Xavier"); confirm against the author line of the paper.}
@inproceedings{simoes_et_al:OASIcs.SLATE.2018.14,
  author    = {Sim{\~o}es, Alberto and G{\'o}mez Guinovart, Xavier},
  title     = {Extending the {Galician} {Wordnet} Using a Multilingual {Bible} Through Lexical Alignment and Semantic Annotation},
  booktitle = {7th Symposium on Languages, Applications and Technologies ({SLATE} 2018)},
  pages     = {14:1--14:13},
  series    = {Open Access Series in Informatics ({OASIcs})},
  isbn      = {978-3-95977-072-9},
  issn      = {2190-6807},
  year      = {2018},
  volume    = {62},
  editor    = {Henriques, Pedro Rangel and Leal, Jos{\'e} Paulo and Leit{\~a}o, Ant{\'o}nio Menezes and G{\'o}mez Guinovart, Xavier},
  publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
  address   = {Dagstuhl, Germany},
  url       = {https://drops.dagstuhl.de/entities/document/10.4230/OASIcs.SLATE.2018.14},
  urn       = {urn:nbn:de:0030-drops-92726},
  doi       = {10.4230/OASIcs.SLATE.2018.14},
  annote    = {Keywords: WordNet, lexical acquisition, parallel corpora, semantic annotation},
}
Feedback for Dagstuhl Publishing