In today’s media and in the Web of Data, non-Western people still suffer from a lack of representation. In our work, we address this issue by presenting a pipeline for collecting and semantically encoding Wikipedia biographies of writers who are under-represented due to their non-Western origins or their legal status in a country. The two main components of the ontology will be described, together with a framework for mapping textual biographies to their corresponding semantic representations. A description of the data set and some examples of the conversion of biographical texts to the ontology classes will be provided.
% Conference paper from LDK 2021, published in the OASIcs series (volume 93); article number 7, pages 7:1--7:14.
@inproceedings{stranisci_et_al:OASIcs.LDK.2021.7,
  author    = {Stranisci, Marco Antonio and Patti, Viviana and Damiano, Rossana},
  title     = {Representing the Under-Represented: a Dataset of Post-Colonial, and Migrant Writers},
  booktitle = {3rd Conference on Language, Data and Knowledge ({LDK} 2021)},
  editor    = {Gromann, Dagmar and S{\'e}rasset, Gilles and Declerck, Thierry and McCrae, John P. and Gracia, Jorge and Bosque-Gil, Julia and Bobillo, Fernando and Heinisch, Barbara},
  series    = {Open Access Series in Informatics ({OASIcs})},
  volume    = {93},
  pages     = {7:1--7:14},
  year      = {2021},
  publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
  address   = {Dagstuhl, Germany},
  isbn      = {978-3-95977-199-3},
  issn      = {2190-6807},
  doi       = {10.4230/OASIcs.LDK.2021.7},
  url       = {https://drops.dagstuhl.de/entities/document/10.4230/OASIcs.LDK.2021.7},
  urn       = {urn:nbn:de:0030-drops-145431},
  annote    = {Keywords: Ontologies, Knowledge Graph, Language Resources, Migrations},
}
Feedback for Dagstuhl Publishing