In the context of the contemporary push for “big data” in many fields, we review recent experiences building large databases for turbulence research. We consider data from direct numerical simulations (DNS) of various canonical flows and from experimental studies and related numerical simulations of wall-bounded turbulence, where the data storage needs are particularly challenging due to the very large range of length and time scales that exists in these flows at high Reynolds numbers. The focus is on a move from the traditional approach of data-handling and analysis where datasets are moved to individual computers, to one where much of the analysis is moved to the hosting system that stores these data. In this context we give a summary of a unique open numerical laboratory that archives over 200 Terabytes of DNS data, including full spatio-temporal flow fields of various canonical flows. Particular attention is given to the unique access requirements for large datasets to become open to the research community and the success the system has had in democratizing access to large datasets.
%0 Book Section
%1 meneveau2017turbulence
%A Meneveau, Charles
%A Marusic, Ivan
%B Whither turbulence and big data in the 21st century?
%C Switzerland
%D 2017
%E Pollard, Andrew
%E Castillo, Luciano
%E Danaila, Luminita
%E Glauser, Mark
%I Springer
%K bigdata engineering forschungsdaten iag obib
%P 497-507
%R http://dx.doi.org/10.1007/978-3-319-41217-7
%T Turbulence in the Era of Big Data: Recent Experiences with Sharing Large Datasets
%X In the context of the contemporary push for “big data” in many fields, we review recent experiences building large databases for turbulence research. We consider data from direct numerical simulations (DNS) of various canonical flows and from experimental studies and related numerical simulations of wall-bounded turbulence, where the data storage needs are particularly challenging due to the very large range of length and time scales that exists in these flows at high Reynolds numbers. The focus is on a move from the traditional approach of data-handling and analysis where datasets are moved to individual computers, to one where much of the analysis is moved to the hosting system that stores these data. In this context we give a summary of a unique open numerical laboratory that archives over 200 Terabytes of DNS data, including full spatio-temporal flow fields of various canonical flows. Particular attention is given to the unique access requirements for large datasets to become open to the research community and the success the system has had in democratizing access to large datasets.
%& 27
%@ 978-3-319-41217-7
@inbook{meneveau2017turbulence,
abstract = {In the context of the contemporary push for “big data” in many fields, we review recent experiences building large databases for turbulence research. We consider data from direct numerical simulations (DNS) of various canonical flows and from experimental studies and related numerical simulations of wall-bounded turbulence, where the data storage needs are particularly challenging due to the very large range of length and time scales that exists in these flows at high Reynolds numbers. The focus is on a move from the traditional approach of data-handling and analysis where datasets are moved to individual computers, to one where much of the analysis is moved to the hosting system that stores these data. In this context we give a summary of a unique open numerical laboratory that archives over 200 Terabytes of DNS data, including full spatio-temporal flow fields of various canonical flows. Particular attention is given to the unique access requirements for large datasets to become open to the research community and the success the system has had in democratizing access to large datasets.},
added-at = {2017-07-18T09:41:03.000+0200},
address = {Switzerland},
author = {Meneveau, Charles and Marusic, Ivan},
biburl = {https://puma.ub.uni-stuttgart.de/bibtex/28e03b4aeb58ea1b36ed9a9a6c72d54d1/diglezakis},
booktitle = {Whither turbulence and big data in the 21st century?},
chapter = 27,
doi = {http://dx.doi.org/10.1007/978-3-319-41217-7},
editor = {Pollard, Andrew and Castillo, Luciano and Danaila, Luminita and Glauser, Mark},
interhash = {bfc959092e0f6966f300d2ac25215c25},
intrahash = {8e03b4aeb58ea1b36ed9a9a6c72d54d1},
isbn = {978-3-319-41217-7},
keywords = {bigdata engineering forschungsdaten iag obib},
pages = {497-507},
publisher = {Springer},
timestamp = {2018-02-16T08:37:20.000+0100},
title = {Turbulence in the Era of Big Data: Recent Experiences with Sharing Large Datasets},
year = 2017
}