Querying data is core to databases and data science. However, the two communities have seemingly different concepts and use cases. As a result, both designers and users of query languages disagree on whether the core abstractions - dataframes (data science) and tables (databases) - and their operations are the same. To investigate the difference from a PL-HCI perspective, we identify the basic affordances provided by tables and dataframes and examine how programming experiences over tables and dataframes differ. We show that the data structures nudge programmers to query and store their data in different ways. We hope this case study can clarify confusion, dispel misinformation, increase cross-pollination between the two communities, and identify open PL-HCI questions.
% Workshop paper record (OASIcs volume 76). The title is single-braced so the
% bibliography style controls its casing; only acronyms are brace-protected.
@inproceedings{wu:OASIcs.PLATEAU.2019.6,
  author    = {Wu, Yifan},
  title     = {Is a Dataframe Just a Table?},
  booktitle = {10th Workshop on Evaluation and Usability of Programming Languages and Tools ({PLATEAU} 2019)},
  editor    = {Chasins, Sarah and Glassman, Elena L. and Sunshine, Joshua},
  series    = {Open Access Series in Informatics ({OASIcs})},
  volume    = {76},
  pages     = {6:1--6:10},
  publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
  address   = {Dagstuhl, Germany},
  year      = {2020},
  isbn      = {978-3-95977-135-1},
  issn      = {2190-6807},
  doi       = {10.4230/OASIcs.PLATEAU.2019.6},
  url       = {https://drops.dagstuhl.de/entities/document/10.4230/OASIcs.PLATEAU.2019.6},
  urn       = {urn:nbn:de:0030-drops-119600},
  annote    = {Keywords: Usability of Programming Languages},
}