Learning programming boils down to the practice of solving exercises. However, although good and diverse exercises exist, they are held in proprietary systems, which hinders their interoperability. This article presents a simple scraping tool, called ScraPE, which, through a navigation, interaction, and data extraction script expressed in a domain-specific language, extracts the necessary data from Web pages (typically online judges) to compose programming exercises in a standard language. The tool is validated by extracting exercises from a specific online judge. This tool is part of a larger project whose main objective is to provide programming exercises through a simple GraphQL API.
@comment{Conference paper on the ScraPE scraping tool (SLATE 2022, OASIcs volume 104). Accented letters use the brace-wrapped special-character form so classic BibTeX sorts and labels names correctly. Only the tool name in the title is brace-protected, leaving the rest of the casing to the bibliography style.}
@inproceedings{queiros:OASIcs.SLATE.2022.18,
  author    = {Queir{\'o}s, Ricardo},
  title     = {{ScraPE} - An Automated Tool for Programming Exercises Scraping},
  booktitle = {11th Symposium on Languages, Applications and Technologies ({SLATE} 2022)},
  editor    = {Cordeiro, Jo{\~a}o and Pereira, Maria Jo{\~a}o and Rodrigues, Nuno F. and Pais, Sebasti{\~a}o},
  series    = {Open Access Series in Informatics ({OASIcs})},
  volume    = {104},
  pages     = {18:1--18:7},
  publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
  address   = {Dagstuhl, Germany},
  year      = {2022},
  isbn      = {978-3-95977-245-7},
  issn      = {2190-6807},
  doi       = {10.4230/OASIcs.SLATE.2022.18},
  url       = {https://drops.dagstuhl.de/entities/document/10.4230/OASIcs.SLATE.2022.18},
  urn       = {urn:nbn:de:0030-drops-167646},
  annote    = {Keywords: Web scrapping, crawling, programming exercises, online judges, DOM},
}
Feedback for Dagstuhl Publishing