@inproceedings{174c618b3077497dba94c6484b266f5c,
title = "Light-weight parallel Python tools for earth system modeling workflows",
abstract = "In the last 30 years, earth system modeling has become increasingly data-intensive. The Community Earth System Model (CESM) response to the next Intergovernmental Panel on Climate Change (IPCC) assessment report (AR6) may require close to 1 Billion CPU hours of computation and generate up to 12 PB of raw data for post-processing. Existing post-processing tools are serial-only and impossibly slow with this much data. To improve the post-processing performance, our team has adopted a strategy of targeted replacement of the «bottleneck software» with light-weight parallel Python alternatives. This allows maximum impact with the least disruption to the CESM community and the shortest delivery time. We developed two light-weight parallel Python tools: one to convert model output from time-slice to time-series format, and one to perform fast time-averaging of time-series data. We present the motivation, approach, and results of these two tools, and our plans for future research and development.",
keywords = "Data processing, High performance computing, Parallel processing, Scientific computing",
author = "Kevin Paul and Sheri Mickelson and Dennis, \{John M.\} and Haiying Xu and David Brown",
note = "Publisher Copyright: {\textcopyright} 2015 IEEE.; 3rd IEEE International Conference on Big Data, Big Data 2015 ; Conference date: 29-10-2015 Through 01-11-2015",
year = "2015",
month = dec,
day = "22",
doi = "10.1109/BigData.2015.7363979",
language = "English",
series = "Proceedings - 2015 IEEE International Conference on Big Data, IEEE Big Data 2015",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "1985--1994",
editor = "Howard Ho and Ooi, \{Beng Chin\} and Zaki, \{Mohammed J.\} and Xiaohua Hu and Laura Haas and Vipin Kumar and Sudarsan Rachuri and Shipeng Yu and Hsiao, \{Morris Hui-I\} and Jian Li and Feng Luo and Saumyadipta Pyne and Kemafor Ogan",
booktitle = "Proceedings - 2015 IEEE International Conference on Big Data, Big Data 2015",
address = "United States",
}