Reproducibility is a key principle of the modern scientific method. Maps, as an important means of communicating scientific results in GIScience and across disciplines, should be reproducible. Currently, map reproducibility assessment is done manually, which makes the assessment process tedious and time-consuming, ultimately limiting its efficiency. Hence, this work explores the extent to which Visual Question-Answering (VQA) can be used to automate some tasks relevant to map reproducibility assessment. We selected five state-of-the-art vision language models (VLMs) and followed a three-step approach to evaluate their ability to discriminate between maps and other images, interpret map content, and compare two map images using VQA. Our results show that current VLMs already possess map-reading capabilities and demonstrate understanding of spatial concepts, such as cardinal directions, geographic scope, and legend interpretation. Our paper demonstrates the potential of using VQA to support reproducibility assessment and highlights the outstanding issues that need to be addressed to achieve accurate, trustworthy map descriptions, thereby reducing the time and effort required by human evaluators.
@InProceedings{koukouraki_et_al:LIPIcs.GIScience.2025.13, author = {Koukouraki, Eftychia and Degbelo, Auriol and Kray, Christian}, title = {{Assessing Map Reproducibility with Visual Question-Answering: An Empirical Evaluation}}, booktitle = {13th International Conference on Geographic Information Science (GIScience 2025)}, pages = {13:1--13:12}, series = {Leibniz International Proceedings in Informatics (LIPIcs)}, ISBN = {978-3-95977-378-2}, ISSN = {1868-8969}, year = {2025}, volume = {346}, editor = {Sila-Nowicka, Katarzyna and Moore, Antoni and O'Sullivan, David and Adams, Benjamin and Gahegan, Mark}, publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik}, address = {Dagstuhl, Germany}, URL = {https://drops.dagstuhl.de/entities/document/10.4230/LIPIcs.GIScience.2025.13}, URN = {urn:nbn:de:0030-drops-238426}, doi = {10.4230/LIPIcs.GIScience.2025.13}, annote = {Keywords: map comparison, computational reproducibility, visual question answering, large language models, GeoAI} }
Feedback for Dagstuhl Publishing