Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

First draft of data analysis environments #13

Open
wants to merge 6 commits into
base: trunk
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Binary file added images/dsjs.gif
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added images/insitu.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added images/jupyter.gif
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
98 changes: 98 additions & 0 deletions src/data-analysis-environments.bib
Original file line number Diff line number Diff line change
@@ -0,0 +1,98 @@
@inproceedings{muller:2019,
  author    = {Muller, Michael and Lange, Ingrid and Wang, Dakuo and Piorkowski, David and Tsay, Jason and Liao, Q. Vera and Dugan, Casey and Erickson, Thomas},
  title     = {How Data Science Workers Work with Data: Discovery, Capture, Curation, Design, Creation},
  booktitle = {Proceedings of the 2019 CHI Conference on Human Factors in Computing Systems},
  year      = {2019},
  pages     = {126:1--126:15},
  publisher = {ACM},
  doi       = {10.1145/3290605.3300356},
}

% The ampersand in the publisher name is escaped so LaTeX does not read it as an alignment tab.
@article{donoho:2017,
  author    = {Donoho, David},
  title     = {50 Years of Data Science},
  journal   = {Journal of Computational and Graphical Statistics},
  volume    = {26},
  number    = {4},
  pages     = {745--766},
  year      = {2017},
  publisher = {Taylor \& Francis},
  doi       = {10.1080/10618600.2017.1384734},
}

% Publication date is given once, as year plus the month macro (October 2017).
@inproceedings{kery:2017:exploring,
  author    = {Kery, Mary Beth and Myers, Brad A.},
  title     = {Exploring Exploratory Programming},
  booktitle = {2017 {IEEE} Symposium on Visual Languages and Human-Centric Computing ({VL}/{HCC})},
  year      = {2017},
  month     = oct,
  doi       = {10.1109/VLHCC.2017.8103446},
}

% The braces keep the tool name's casing ("DS.js") under sentence-casing styles.
@inproceedings{zhang:2017,
  author    = {Zhang, Xiong and Guo, Philip J.},
  title     = {{DS.js}: Turn Any Webpage into an Example-Centric Live Programming Environment for Learning Data Science},
  booktitle = {Proceedings of the 30th Annual ACM Symposium on User Interface Software and Technology},
  series    = {UIST '17},
  year      = {2017},
  publisher = {ACM},
  doi       = {10.1145/3126594.3126663},
}

@inproceedings{zhang:2019,
  author    = {Zhang, Xiong and Guo, Philip J.},
  title     = {Mallard: Turn the Web into a Contextualized Prototyping Environment for Machine Learning},
  booktitle = {Proceedings of the 32nd Annual ACM Symposium on User Interface Software and Technology},
  series    = {UIST '19},
  year      = {2019},
  pages     = {605--618},
  numpages  = {14},
  publisher = {ACM},
  doi       = {10.1145/3332165.3347936},
}

@inproceedings{gulwani:2011,
  title     = {Automating String Processing in Spreadsheets Using Input-output Examples},
  author    = {Gulwani, Sumit},
  booktitle = {Proceedings of the 38th Annual ACM SIGPLAN-SIGACT Symposium on Principles of Programming Languages},
  series    = {POPL '11},
  publisher = {ACM},
  year      = {2011},
  pages     = {317--330},
  numpages  = {14},
  doi       = {10.1145/1926385.1926423},
}

% The braces keep the camelCase system name intact under sentence-casing styles.
@article{wang:2012,
  author     = {Wang, Jiannan and Kraska, Tim and Franklin, Michael J. and Feng, Jianhua},
  title      = {{CrowdER}: Crowdsourcing Entity Resolution},
  journal    = {Proceedings of the VLDB Endowment},
  volume     = {5},
  number     = {11},
  year       = {2012},
  month      = jul,
  pages      = {1483--1494},
  numpages   = {12},
  issue_date = {July 2012},
  publisher  = {VLDB Endowment},
  doi        = {10.14778/2350229.2350263},
}

@inproceedings{kandel:2011,
  title     = {Wrangler: Interactive Visual Specification of Data Transformation Scripts},
  author    = {Kandel, Sean and Paepcke, Andreas and Hellerstein, Joseph and Heer, Jeffrey},
  booktitle = {Proceedings of the SIGCHI Conference on Human Factors in Computing Systems},
  series    = {CHI '11},
  publisher = {ACM},
  year      = {2011},
  pages     = {3363--3372},
  numpages  = {10},
  doi       = {10.1145/1978942.1979444},
}

% The braces keep the capital "L" in the system name under sentence-casing styles.
@article{satyanarayan:2017,
  author  = {Satyanarayan, Arvind and Moritz, Dominik and Wongsuphasawat, Kanit and Heer, Jeffrey},
  title   = {{Vega-Lite}: A Grammar of Interactive Graphics},
  journal = {IEEE Transactions on Visualization and Computer Graphics},
  year    = {2017},
  volume  = {23},
  number  = {1},
  pages   = {341--350},
  doi     = {10.1109/TVCG.2016.2599030},
}
117 changes: 117 additions & 0 deletions src/data-analysis-environments2.bib
Original file line number Diff line number Diff line change
@@ -0,0 +1,117 @@
@inproceedings{hoffswell:2018,
  title     = {Augmenting Code with In Situ Visualizations to Aid Program Understanding},
  author    = {Hoffswell, Jane and Satyanarayan, Arvind and Heer, Jeffrey},
  booktitle = {Proceedings of the 2018 CHI Conference on Human Factors in Computing Systems},
  series    = {CHI '18},
  publisher = {ACM},
  year      = {2018},
  articleno = {532},
  pages     = {532:1--532:12},
  numpages  = {12},
  doi       = {10.1145/3173574.3174106},
}

@inproceedings{xia:2018,
  title     = {{DataInk}: Direct and Creative Data-Oriented Drawing},
  author    = {Xia, Haijun and Henry Riche, Nathalie and Chevalier, Fanny and De Araujo, Bruno and Wigdor, Daniel},
  booktitle = {Proceedings of the 2018 CHI Conference on Human Factors in Computing Systems},
  series    = {CHI '18},
  publisher = {ACM},
  year      = {2018},
  articleno = {223},
  pages     = {223:1--223:13},
  numpages  = {13},
  doi       = {10.1145/3173574.3173797},
}

@inproceedings{jun:2019,
  author    = {Jun, Eunice and Daum, Maureen and Roesch, Jared and Chasins, Sarah and Berger, Emery and Just, Rene and Reinecke, Katharina},
  title     = {Tea: A High-level Language and Runtime System for Automating Statistical Analysis},
  booktitle = {Proceedings of the 32nd Annual ACM Symposium on User Interface Software and Technology},
  series    = {UIST '19},
  year      = {2019},
  pages     = {591--603},
  numpages  = {13},
  publisher = {ACM},
  doi       = {10.1145/3332165.3347940},
}

@inproceedings{chasins:2018,
  title     = {Rousillon: Scraping Distributed Hierarchical Web Data},
  author    = {Chasins, Sarah E. and Mueller, Maria and Bodik, Rastislav},
  booktitle = {Proceedings of the 31st Annual ACM Symposium on User Interface Software and Technology},
  series    = {UIST '18},
  publisher = {ACM},
  year      = {2018},
  pages     = {963--975},
  numpages  = {13},
  acmid     = {3242661},
  doi       = {10.1145/3242587.3242661},
}

@inproceedings{rule:2018,
  title     = {Exploration and Explanation in Computational Notebooks},
  author    = {Rule, Adam and Tabard, Aur{\'e}lien and Hollan, James D.},
  booktitle = {Proceedings of the 2018 CHI Conference on Human Factors in Computing Systems},
  series    = {CHI '18},
  publisher = {ACM},
  year      = {2018},
  articleno = {32},
  pages     = {32:1--32:12},
  numpages  = {12},
  doi       = {10.1145/3173574.3173606},
}

@inproceedings{kery:2018,
  title     = {The Story in the Notebook: Exploratory Data Science Using a Literate Programming Tool},
  author    = {Kery, Mary Beth and Radensky, Marissa and Arya, Mahima and John, Bonnie E. and Myers, Brad A.},
  booktitle = {Proceedings of the 2018 CHI Conference on Human Factors in Computing Systems},
  series    = {CHI '18},
  publisher = {ACM},
  year      = {2018},
  articleno = {174},
  pages     = {174:1--174:11},
  numpages  = {11},
  acmid     = {3173748},
  doi       = {10.1145/3173574.3173748},
}

% The last author's name matches the "Myers, Brad A." spelling used by the other Kery entries.
@inproceedings{kery:2017,
  author    = {Kery, Mary Beth and Horvath, Amber and Myers, Brad A.},
  title     = {Variolite: Supporting Exploratory Programming by Data Scientists},
  booktitle = {Proceedings of the 2017 CHI Conference on Human Factors in Computing Systems},
  series    = {CHI '17},
  year      = {2017},
  pages     = {1265--1276},
  numpages  = {12},
  acmid     = {3025626},
  publisher = {ACM},
  doi       = {10.1145/3025453.3025626},
}

@inproceedings{kery:2019,
  title     = {Towards Effective Foraging by Data Scientists to Find Past Analysis Choices},
  author    = {Kery, Mary Beth and John, Bonnie E. and O'Flaherty, Patrick and Horvath, Amber and Myers, Brad A.},
  booktitle = {Proceedings of the 2019 CHI Conference on Human Factors in Computing Systems},
  series    = {CHI '19},
  publisher = {ACM},
  year      = {2019},
  articleno = {92},
  pages     = {92:1--92:13},
  numpages  = {13},
  doi       = {10.1145/3290605.3300322},
}

@inproceedings{head:2019,
  title     = {Managing Messes in Computational Notebooks},
  author    = {Head, Andrew and Hohman, Fred and Barik, Titus and Drucker, Steven M. and DeLine, Robert},
  booktitle = {Proceedings of the 2019 CHI Conference on Human Factors in Computing Systems},
  series    = {CHI '19},
  publisher = {ACM},
  year      = {2019},
  articleno = {270},
  pages     = {270:1--270:12},
  numpages  = {12},
  doi       = {10.1145/3290605.3300500},
}

11 changes: 11 additions & 0 deletions src/data-analysis-environments3.bib
Original file line number Diff line number Diff line change
@@ -0,0 +1,11 @@
% Authors use full names in "Last, First" form; the braces keep "IPython" intact under sentence-casing styles.
@article{perez:2007,
  author  = {P{\'e}rez, Fernando and Granger, Brian E.},
  title   = {{IPython}: A System for Interactive Scientific Computing},
  journal = {Computing in Science \& Engineering},
  year    = {2007},
  month   = may,
  volume  = {9},
  number  = {3},
  pages   = {21--29},
  doi     = {10.1109/MCSE.2007.53},
  issn    = {1558-366X},
}
Loading