-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathground.bib
332 lines (299 loc) · 10.4 KB
/
ground.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
% "The Basel iii Accord" web site, cited by URL together with its retrieval date.
@misc{basel3,
  author = {{The Basel Committee}},
  title  = {{The Basel iii Accord}},
  year   = 2016,
  note   = {\url{http://www.basel-iii-accord.com}, retrieved November, 2016.},
  key    = {Basel},
}
% Book: "Provenance in Databases" by Cheney, Chiticariu and Tan (2009).
@book{cheney2009provenance,
  author    = {Cheney, James and Chiticariu, Laura and Tan, Wang-Chiew},
  title     = {Provenance in Databases},
  publisher = {Now Publishers Inc},
  year      = {2009},
}
% Book: Inmon's "Building the data warehouse" (2005 edition, Wiley).
@book{inmon2005building,
  author    = {Inmon, William H},
  title     = {Building the data warehouse},
  publisher = {John Wiley \& Sons},
  year      = {2005},
}
% Gartner newsroom item 2208015 (October 2012), cited by URL.
% The note value is closed on the same line as the URL so that no trailing
% whitespace ends up inside the field for parsers that do not strip it.
@misc{gartner,
  author = {Gartner},
  title  = {Gartner Says Every Budget is Becoming an {IT} Budget},
  month  = oct,
  year   = 2012,
  number = 2208015,
  note   = {\url{http://www.gartner.com/newsroom/id/2208015}},
}
% Book: DJ Patil's "Data Jujitsu" (O'Reilly, 2012).
@book{patil2012data,
  author    = {Patil, DJ},
  title     = {Data Jujitsu: The Art of Turning Data into Product},
  publisher = {O'Reilly Media},
  year      = {2012},
}
% Zeldovich, Boyd-Wickizer and Mazieres: information flow control for
% distributed systems, NSDI 2008.
% No `volume`: conference proceedings are identified by venue and year.
@inproceedings{zeldovich2008securing,
  author    = {Zeldovich, Nickolai and Boyd-Wickizer, Silas and Mazi{\`e}res, David},
  title     = {Securing Distributed Systems with Information Flow Control},
  booktitle = {NSDI},
  pages     = {293--308},
  year      = {2008},
}
% Web page "Star Wars Kid: The Data Dump" on waxy.org, cited by URL.
% The entry has no author field and supplies `key` instead.
@misc{starwarskid,
  title = {{Star Wars Kid: The Data Dump}},
  year  = 2008,
  note  = {\url{http://waxy.org/2008/05/star_wars_kid_the_data_dump/}, retrieved June, 2008.},
  key   = {star wars},
}
% Stonebraker's paper on the Postgres storage system, a conference paper in the
% VLDB 1987 proceedings (not a standalone book).
@inproceedings{stonebraker1987design,
  author    = {Stonebraker, Michael},
  title     = {The design of the {Postgres} storage system},
  booktitle = {VLDB},
  pages     = {289--300},
  publisher = {Morgan Kaufmann},
  year      = {1987},
}
% Book: Loshin's "Master Data Management" (Morgan Kaufmann).
@book{loshin2010master,
  author    = {Loshin, David},
  title     = {Master Data Management},
  publisher = {Morgan Kaufmann},
  year      = {2010},
}
% Whole proceedings volume of the GRADES 2016 workshop (editors only, no
% authors), hence @proceedings rather than @book.
@proceedings{grades16,
  editor    = {Peter Boncz and Josep{-}Lluis Larriba{-}Pey},
  title     = {International Workshop on Graph Data Management Experiences and Systems {(GRADES)}},
  publisher = {{ACM}},
  year      = 2016,
}
% McSherry, Isard and Murray, HotOS XV (2015).
% The title is fully brace-protected, so styles leave its capitalisation alone.
@inproceedings{mcsherry2015scalability,
  author    = {McSherry, Frank and Isard, Michael and Murray, Derek G},
  title     = {{Scalability! But at what COST?}},
  booktitle = {HotOS XV},
  year      = {2015},
}
% LabBook paper, IEEE Big Data 2015.
% The booktitle is written in natural reading order rather than the inverted
% "..., 2015 IEEE International Conference on" export form.
@inproceedings{kandogan2015labbook,
  author       = {Kandogan, Eser and Roth, Mary and Schwarz, Peter and Hui, Joshua and Terrizzano, Ignacio and Christodoulakis, Christina and Miller, Ren{\'e}e J},
  title        = {Lab{B}ook: {M}etadata-driven social collaborative data analysis},
  booktitle    = {2015 {IEEE} International Conference on Big Data (Big Data)},
  pages        = {431--440},
  organization = {IEEE},
  year         = {2015},
}
% The Clio project overview article, SIGMOD Record 30(1), 2001.
@article{clio,
  author  = {Miller, Ren{\'e}e J and Hern{\'a}ndez, Mauricio A and Haas, Laura M and Yan, Ling-Ling and Ho, CT Howard and Fagin, Ronald and Popa, Lucian},
  title   = {The {C}lio project: {M}anaging heterogeneity},
  journal = {SIGMOD Record},
  volume  = {30},
  number  = {1},
  pages   = {78--83},
  year    = {2001},
}
% Goods (Google dataset organisation) paper, 2016 International Conference on
% Management of Data.
@inproceedings{goods,
  author       = {Halevy, Alon and Korn, Flip and Noy, Natalya F and Olston, Christopher and Polyzotis, Neoklis and Roy, Sudip and Whang, Steven Euijong},
  title        = {Goods: {O}rganizing {G}oogle's Datasets},
  booktitle    = {Proceedings of the 2016 International Conference on Management of Data},
  pages        = {795--806},
  organization = {ACM},
  year         = {2016},
}
% VisTrails paper, ACM SIGMOD 2006.
@inproceedings{vistrails,
  author       = {Callahan, Steven P and Freire, Juliana and Santos, Emanuele and Scheidegger, Carlos E and Silva, Cl{\'a}udio T and Vo, Huy T},
  title        = {Vis{T}rails: {V}isualization meets data management},
  booktitle    = {Proceedings of the 2006 ACM SIGMOD international conference on Management of data},
  pages        = {745--747},
  organization = {ACM},
  year         = {2006},
}
% DataHub paper, CIDR 2015.
@inproceedings{datahub,
  author    = {Bhardwaj, Anant and Bhattacherjee, Souvik and Chavan, Amit and Deshpande, Amol and Elmore, Aaron J and Madden, Samuel and Parameswaran, Aditya G},
  title     = {Data{H}ub: {C}ollaborative data science \& dataset version management at scale},
  booktitle = {CIDR},
  year      = {2015},
}
% Decibel (relational dataset branching) article, Proceedings of the VLDB
% Endowment 9(9), 2016.
@article{decibel,
  author    = {Maddox, Michael and Goehring, David and Elmore, Aaron J and Madden, Samuel and Parameswaran, Aditya and Deshpande, Amol},
  title     = {Decibel: {T}he relational dataset branching system},
  journal   = {Proceedings of the VLDB Endowment},
  volume    = {9},
  number    = {9},
  pages     = {624--635},
  publisher = {VLDB Endowment},
  year      = {2016},
}
% ProvDB preprint (2016). The arXiv identifier is carried in the `journal`
% field, which is how this entry gets it printed.
@article{provdb,
  author  = {Miao, Hui and Chavan, Amit and Deshpande, Amol},
  title   = {Prov{DB}: {A} System for Lifecycle Management of Collaborative Analysis Workflows},
  journal = {arXiv preprint arXiv:1610.04963},
  year    = {2016},
}
% BURRITO paper, TaPP workshop 2012.
% The title carries no terminal period; the bibliography style adds punctuation.
@inproceedings{burrito,
  author    = {Guo, Philip J and Seltzer, Margo},
  title     = {{BURRITO}: {W}rapping Your Lab Notebook in Computational Infrastructure},
  booktitle = {Workshop on the Theory and Practice of Provenance (TaPP)},
  year      = {2012},
}
% ReproZip paper, TaPP workshop 2013.
@inproceedings{reprozip,
  author    = {Fernando Seabra Chirigati and Dennis E. Shasha and Juliana Freire},
  title     = {Repro{Z}ip: {U}sing Provenance to Support Computational Reproducibility},
  booktitle = {Workshop on the Theory and Practice of Provenance (TaPP)},
  year      = {2013},
}
% Data Tamer system paper, CIDR 2013.
% The title carries no terminal period; the bibliography style adds punctuation.
@inproceedings{datatamer,
  author    = {Stonebraker, Michael and Bruckner, Daniel and Ilyas, Ihab F and Beskales, George and Cherniack, Mitch and Zdonik, Stanley B and Pagan, Alexander and Xu, Shan},
  title     = {Data Curation at Scale: {T}he Data Tamer System},
  booktitle = {CIDR},
  year      = {2013},
}
% DeepDive paper from the VLDS 2012 workshop. VLDS is a workshop, so this is
% an @inproceedings entry with the venue in `booktitle` and no `volume`.
@inproceedings{deepdive,
  author    = {Niu, Feng and Zhang, Ce and R{\'e}, Christopher and Shavlik, Jude W},
  title     = {Deep{D}ive: {W}eb-scale Knowledge-base Construction using Statistical Learning and Inference},
  booktitle = {VLDS},
  pages     = {25--28},
  year      = {2012},
}
% Yago paper, 16th international conference on World Wide Web (2007).
@inproceedings{yago,
  author       = {Suchanek, Fabian M and Kasneci, Gjergji and Weikum, Gerhard},
  title        = {Yago: {A} core of semantic knowledge},
  booktitle    = {Proceedings of the 16th international conference on World Wide Web},
  pages        = {697--706},
  organization = {ACM},
  year         = {2007},
}
% Myers' JFlow paper, 26th ACM SIGPLAN-SIGACT symposium on Principles of
% programming languages (1999).
@inproceedings{myers1999jflow,
  author       = {Myers, Andrew C},
  title        = {J{F}low: {P}ractical mostly-static information flow control},
  booktitle    = {Proceedings of the 26th ACM SIGPLAN-SIGACT symposium on Principles of programming languages},
  pages        = {228--241},
  organization = {ACM},
  year         = {1999},
}
% WebTables article, Proceedings of the VLDB Endowment 1(1), 2008.
@article{webtables,
  author    = {Cafarella, Michael J and Halevy, Alon and Wang, Daisy Zhe and Wu, Eugene and Zhang, Yang},
  title     = {Web{T}ables: {E}xploring the power of tables on the web},
  journal   = {Proceedings of the VLDB Endowment},
  volume    = {1},
  number    = {1},
  pages     = {538--549},
  publisher = {VLDB Endowment},
  year      = {2008},
}
% Adelfio and Samet on schema extraction for web tables, Proceedings of the
% VLDB Endowment 6(6), 2013.
@article{adelfio2013schema,
  author    = {Adelfio, Marco D and Samet, Hanan},
  title     = {Schema extraction for tabular data on the web},
  journal   = {Proceedings of the VLDB Endowment},
  volume    = {6},
  number    = {6},
  pages     = {421--432},
  publisher = {VLDB Endowment},
  year      = {2013},
}
% Wrangler paper, SIGCHI Conference on Human Factors in Computing Systems (2011).
@inproceedings{wrangler,
  author       = {Kandel, Sean and Paepcke, Andreas and Hellerstein, Joseph and Heer, Jeffrey},
  title        = {Wrangler: {I}nteractive visual specification of data transformation scripts},
  booktitle    = {Proceedings of the SIGCHI Conference on Human Factors in Computing Systems},
  pages        = {3363--3372},
  organization = {ACM},
  year         = {2011},
}
% FlashExtract paper as published in ACM SIGPLAN Notices 49(6). SIGPLAN Notices
% is a periodical, so the venue belongs in `journal` of an @article (with the
% issue number) rather than in `booktitle` of an @inproceedings.
@article{flashextract,
  author    = {Le, Vu and Gulwani, Sumit},
  title     = {Flash{E}xtract: {A} framework for data extraction by examples},
  journal   = {ACM SIGPLAN Notices},
  volume    = {49},
  number    = {6},
  pages     = {542--553},
  publisher = {ACM},
  year      = {2014},
}
% ManyEyes article, IEEE Transactions on Visualization and Computer Graphics
% 13(6), 2007.
% Author names carry their accent (Viegas) and lowercase particle (van Ham);
% the journal name is given in its proper capitalisation.
@article{manyeyes,
  author    = {Vi{\'e}gas, Fernanda B and Wattenberg, Martin and van Ham, Frank and Kriss, Jesse and McKeon, Matt},
  title     = {Many{E}yes: {A} site for visualization at internet scale},
  journal   = {{IEEE} Transactions on Visualization and Computer Graphics},
  volume    = {13},
  number    = {6},
  pages     = {1121--1128},
  publisher = {IEEE},
  year      = {2007},
}
% CommentSpace paper, SIGCHI Conference on Human Factors in Computing Systems
% (2011). The booktitle is spelled the same way as in the `wrangler` entry,
% which cites the same proceedings.
@inproceedings{willett,
  author       = {Willett, Wesley and Heer, Jeffrey and Hellerstein, Joseph and Agrawala, Maneesh},
  title        = {Comment{S}pace: {S}tructured support for collaborative visual analysis},
  booktitle    = {Proceedings of the SIGCHI Conference on Human Factors in Computing Systems},
  pages        = {3131--3140},
  organization = {ACM},
  year         = {2011},
}
% Dresner Advisory Services market study on end-user data preparation (2016).
@techreport{dresnerdataprep,
  author      = {Howard Dresner},
  title       = {{2016 End User Data Preparation Market Study}},
  institution = {Dresner Advisory Services, LLC},
  year        = {2016},
}
% Dresner Advisory Services "Collective Insights" market study report (2016).
@techreport{dresnercollectiveinsights,
  author      = {Howard Dresner},
  title       = {{2016 Collective Insights Market Study Report}},
  institution = {Dresner Advisory Services, LLC},
  year        = {2016},
}
% Gartner Magic Quadrant report on metadata management solutions (2016).
% "De Simoni" is a two-word surname, so it is written in "Last, First" form;
% otherwise BibTeX would take "De" as a given name and "Simoni" as the surname.
@techreport{gartnermetadata,
  author      = {De Simoni, Guido and Edjlali, Roxane},
  title       = {{Magic Quadrant for Metadata Management Solutions}},
  institution = {Gartner, Inc.},
  year        = {2016},
}
% Gartner market guide for self-service data preparation (2016).
@techreport{gartnerdataprep,
  author      = {Rita L. Sallam and Paddy Forry and Ehtisham Zaidi and Shubhangi Vashisth},
  title       = {{Market Guide for Self-Service Data Preparation}},
  institution = {Gartner, Inc.},
  year        = {2016},
}
% Gartner report on information catalogs for chief data officers (2016).
% "De Simoni" is a two-word surname, so it is written in "Last, First" form;
% otherwise BibTeX would take "De" as a given name and "Simoni" as the surname.
@techreport{gartnerdatacatalog,
  author      = {Duncan, Alan D. and Laney, Douglas and De Simoni, Guido},
  title       = {How Chief Data Officers Can Use an Information Catalog to Maximize Business Value From Information Assets},
  institution = {Gartner, Inc.},
  year        = {2016},
}
% Sculley et al. on machine-learning technical debt, SE4ML workshop at NIPS 2014.
@inproceedings{sculley2,
  author    = {D. Sculley and Gary Holt and Daniel Golovin and Eugene Davydov and Todd Phillips and Dietmar Ebner and Vinay Chaudhary and Michael Young},
  title     = {Machine Learning: The High Interest Credit Card of Technical Debt},
  booktitle = {SE4ML: Software Engineering for Machine Learning (NIPS 2014 Workshop)},
  year      = 2014,
}
% Velox model-management and serving paper, CIDR 2015.
% The system name is brace-protected so sentence-casing styles keep its
% capital, and the conference name is given in full ("... Data Systems Research").
@inproceedings{Crankshaw15,
  author    = {Daniel Crankshaw and
               Peter Bailis and
               Joseph E. Gonzalez and
               Haoyuan Li and
               Zhao Zhang and
               Michael J. Franklin and
               Ali Ghodsi and
               Michael I. Jordan},
  title     = {The Missing Piece in Complex Analytics: Low Latency, Scalable Model Management and Serving with {Velox}},
  booktitle = {{CIDR} 2015, Seventh Biennial Conference on Innovative Data Systems Research},
  year      = {2015},
}
% TensorFlow Serving project page, cited by URL.
% The entry has no author or year and supplies `key` instead.
@misc{tfserving,
  title        = {{TensorFlow Serving}},
  howpublished = {\url{https://tensorflow.github.io/serving}},
  key          = {tfserving},
}
% Bernstein and Dayal's overview of repository technology, VLDB 1994.
% No `volume`: conference proceedings are identified by venue and year.
@inproceedings{bernstein1994overview,
  author    = {Bernstein, Philip A and Dayal, Umeshwar},
  title     = {An overview of repository technology},
  booktitle = {VLDB},
  pages     = {705--713},
  year      = {1994},
}
% Bernstein et al. on Microsoft Repository version 2 and the Open Information
% Model, Information Systems 24(2), 1999.
@article{bernstein1999microsoft,
  author    = {Bernstein, Philip A and Bergstraesser, Thomas and Carlson, Jason and Pal, Shankar and Sanders, Paul and Shutt, David},
  title     = {Microsoft repository version 2 and the open information model},
  journal   = {Information Systems},
  volume    = {24},
  number    = {2},
  pages     = {71--98},
  publisher = {Elsevier},
  year      = {1999},
}