SQLShare is a database service aimed at removing the obstacles to using relational databases: installation, configuration, schema design, tuning, data ingest, and even application design. You simply upload your data and immediately start querying it. One of the main lessons from SQLShare is that a relatively minor set of changes to how existing database technology is packaged and delivered is sufficient to convince science and data science users to adopt SQL in their day-to-day data manipulation and analysis tasks, potentially displacing script-and-file-based approaches.
We analyzed the handwritten SQL queries and found that the features of SQLShare were instrumental in attracting new kinds of ad hoc queries, that the SQLShare workload is demonstrably more diverse than a comparable public workload in science, and that users are writing very complex queries by hand. The query log can be downloaded from the SQLShare data release page.
Current
Past
% Conference paper in the SSDBM '15 proceedings; record exported from DBLP.
% NOTE(review): the crossref parent DBLP:conf/ssdbm/2015 is not visible in this
% part of the file -- confirm it is defined (after this entry for classic BibTeX).
@inproceedings{alawini2015relationships,
  author    = {Alawini, Abdussalam and Maier, David and Tufte, Kristin and Howe, Bill and Nandikur, Rashmi},
  title     = {Towards automated prediction of relationships among scientific datasets},
  booktitle = {Proceedings of the 27th International Conference on Scientific and Statistical Database Management, {SSDBM} '15, La Jolla, CA, USA, June 29 - July 1, 2015},
  year      = {2015},
  pages     = {35:1--35:5},
  doi       = {10.1145/2791347.2791358},
  url       = {http://doi.acm.org/10.1145/2791347.2791358},
  crossref  = {DBLP:conf/ssdbm/2015},
  timestamp = {Tue, 08 Sep 2015 16:21:54 +0200},
  biburl    = {http://dblp.uni-trier.de/rec/bib/conf/ssdbm/AlawiniMTHN15},
  bibsource = {dblp computer science bibliography, http://dblp.org},
}
% Conference paper in the 26th SSDBM proceedings (2014).
% ACM is recorded as the publisher: the original export placed it in
% `organization`, which denotes the sponsoring body rather than the publisher.
% `pages` holds the single value given by the source record.
@inproceedings{alawini2014helping,
  author    = {Alawini, Abdussalam and Maier, David and Tufte, Kristin and Howe, Bill},
  title     = {Helping scientists reconnect their datasets},
  booktitle = {Proceedings of the 26th International Conference on Scientific and Statistical Database Management},
  year      = {2014},
  pages     = {29},
  publisher = {ACM},
}
% Journal article, Computing in Science and Engineering 15(3), 2013.
% The acronym SQL is brace-protected so sentence-casing bibliography styles
% do not lowercase it; the initial "E." carries its period so that styles
% printing full given names render it correctly.
@article{howe2013collaborative,
  author    = {Howe, Bill and Halperin, Daniel and Ribalet, Francois and Chitnis, Sagar and Armbrust, E. Virginia},
  title     = {Collaborative science workflows in {SQL}},
  journal   = {Computing in Science and Engineering},
  volume    = {15},
  number    = {3},
  pages     = {22--31},
  year      = {2013},
  publisher = {AIP Publishing},
}
% Conference paper in the SIGMOD 2011 proceedings; record exported from DBLP.
% NOTE(review): the crossref parent DBLP:conf/sigmod/2011 is not visible in this
% part of the file -- confirm it is defined (after this entry for classic BibTeX).
@inproceedings{howe2011example,
  author    = {Howe, Bill and Cole, Garrett and Khoussainova, Nodira and Battle, Leilani},
  title     = {Automatic example queries for ad hoc databases},
  booktitle = {Proceedings of the {ACM} {SIGMOD} International Conference on Management of Data, {SIGMOD} 2011, Athens, Greece, June 12-16, 2011},
  year      = {2011},
  pages     = {1319--1322},
  doi       = {10.1145/1989323.1989487},
  url       = {http://doi.acm.org/10.1145/1989323.1989487},
  crossref  = {DBLP:conf/sigmod/2011},
  timestamp = {Thu, 16 Jun 2011 17:14:38 +0200},
  biburl    = {http://dblp.uni-trier.de/rec/bib/conf/sigmod/HoweCKB11},
  bibsource = {dblp computer science bibliography, http://dblp.org},
}
% Conference paper in Scientific and Statistical Database Management (2011).
% Springer is recorded as the publisher: the original export placed it in
% `organization`, which denotes the sponsoring body rather than the publisher.
% NOTE(review): "Cole, Garret" here differs from "Cole, Garrett" in
% howe2011example -- confirm the correct spelling and make the entries agree.
@inproceedings{howe2011database,
  author    = {Howe, Bill and Cole, Garret and Souroush, Emad and Koutris, Paraschos and Key, Alicia and Khoussainova, Nodira and Battle, Leilani},
  title     = {Database-as-a-service for long-tail science},
  booktitle = {Scientific and Statistical Database Management},
  year      = {2011},
  pages     = {480--489},
  publisher = {Springer},
}
% Workshop paper, 4th Microsoft eScience Workshop (2010).
% Both occurrences of SQL in the title are brace-protected; without the braces
% a sentence-casing style would print "Sql is dead; long live sql".
% Microsoft and eScience are protected in the booktitle for the same reason.
% NOTE(review): "Cole, Garret" here differs from "Cole, Garrett" in
% howe2011example -- confirm the correct spelling and make the entries agree.
@inproceedings{howe2010sql,
  author    = {Howe, Bill and Cole, Garret},
  title     = {{SQL} is dead; long live {SQL}: Lightweight query services for ad hoc research data},
  booktitle = {4th {Microsoft} {eScience} Workshop},
  year      = {2010},
}