You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
author={Abernathey, Ryan P. and Augspurger, Tom and Banihirwe, Anderson and Blackmon-Luca, Charles C. and Crone, Timothy J. and Gentemann, Chelle L. and Hamman, Joseph J. and Henderson, Naomi and Lepore, Chiara and McCaie, Theo A. and Robinson, Niall H. and Signell, Richard P.},
3
+
journal={Computing in Science & Engineering},
4
+
title={Cloud-Native Repositories for Big Scientific Data},
5
+
year={2021},
6
+
volume={23},
7
+
number={2},
8
+
pages={26-35},
9
+
keywords={Cloud computing;Training data;Computational modeling;Reproducibility of results;Collaboration;Reliability;Distributed databases},
10
+
doi={10.1109/MCSE.2021.3059437}}
11
+
12
+
@article{appel_2019_ondemand,
13
+
title = {On-{{Demand Processing}} of {{Data Cubes}} from {{Satellite Image Collections}} with the Gdalcubes {{Library}}},
14
+
author = {Appel, Marius and Pebesma, Edzer},
15
+
year = {2019},
16
+
month = jun,
17
+
journal = {Data},
18
+
volume = {4},
19
+
number = {3},
20
+
pages = {92},
21
+
issn = {2306-5729},
22
+
doi = {10.3390/data4030092},
23
+
urldate = {2025-03-10},
24
+
abstract = {Earth observation data cubes are increasingly used as a data structure to make large collections of satellite images easily accessible to scientists. They hide complexities in the data such that data users can concentrate on the analysis rather than on data management. However, the construction of data cubes is not trivial and involves decisions that must be taken with regard to any particular analyses. This paper proposes on-demand data cubes, which are constructed on the fly when data users process the data. We introduce the open-source C++ library and R package gdalcubes for the construction and processing of on-demand data cubes from satellite image collections, and show how it supports interactive method development workflows where data users can initially try methods on small subsamples before running analyses on high resolution and/or large areas. Two study cases, one on processing Sentinel-2 time series and the other on combining vegetation, land surface temperature, and precipitation data, demonstrate and evaluate this implementation. While results suggest that on-demand data cubes implemented in gdalcubes support interactivity and allow for combining multiple data products, the speed-up effect also strongly depends on how original data products are organized. The potential for cloud deployment is discussed.},
file = {/home/emmamarshall/Desktop/Zotero/storage/SPSU55IR/Appel and Pebesma - 2019 - On-Demand Processing of Data Cubes from Satellite Image Collections with the gdalcubes Library.pdf}
28
+
}
29
+
30
+
@article{baumann2017datacube,
31
+
title={The datacube manifesto},
32
+
author={Baumann, Peter},
33
+
journal={Retrieved from EarthServer website: http://earthserver. eu/tech/datacube-manifesto},
author={Gil, Yolanda and David, Cédric H. and Demir, Ibrahim and Essawy, Bakinam T. and Fulweiler, Robinson W. and Goodall, Jonathan L. and Karlstrom, Leif and Lee, Huikyo and Mills, Heath J. and Oh, Ji‐Hyun and Pierce, Suzanne A. and Pope, Allen and Tzeng, Mimi W. and Villamizar, Sandra R. and Yu, Xuan},
25
-
year={2016}, month=oct,
26
-
pages={388–415},
27
-
language={en} }
28
-
29
-
@article{guo_big_2017,
53
+
@article{giuliani_2019_EarthObservationOpen,
54
+
title = {Earth {{Observation Open Science}}: {{Enhancing Reproducible Science Using Data Cubes}}},
55
+
shorttitle = {Earth {{Observation Open Science}}},
56
+
author = {Giuliani, Gregory and Camara, Gilberto and Killough, Brian and Minchin, Stuart},
57
+
year = {2019},
58
+
month = nov,
59
+
journal = {Data},
60
+
volume = {4},
61
+
number = {4},
62
+
pages = {147},
63
+
issn = {2306-5729},
64
+
doi = {10.3390/data4040147},
65
+
urldate = {2025-03-09},
66
+
abstract = {Earth Observation Data Cubes (EODC) have emerged as a promising solution to efficiently and effectively handle Big Earth Observation (EO) Data generated by satellites and made freely and openly available from different data repositories. The aim of this Special Issue, ``Earth Observation Data Cube'', in Data, is to present the latest advances in EODC development and implementation, including innovative approaches for the exploitation of satellite EO data using multi-dimensional (e.g., spatial, temporal, spectral) approaches. This Special Issue contains 14 articles covering a wide range of topics such as Synthetic Aperture Radar (SAR), Analysis Ready Data (ARD), interoperability, thematic applications (e.g., land cover, snow cover mapping), capacity development, semantics, processing techniques, as well as national implementations and best practices. These papers made significant contributions to the advancement of a more Open and Reproducible Earth Observation Science, reducing the gap between users' expectations for decision-ready products and current Big Data analytical capabilities, and ultimately unlocking the information power of EO data by transforming them into actionable knowledge.},
file = {/home/emmamarshall/Desktop/Zotero/storage/VHCMH3GQ/Giuliani et al. - 2019 - Earth Observation Open Science Enhancing Reproducible Science Using Data Cubes.pdf}
70
+
}
71
+
72
+
@article{guo_2017_big,
30
73
title = {Big {Earth} data: {A} new frontier in {Earth} and information sciences},
31
74
volume = {1},
32
75
issn = {2096-4471, 2574-5417},
@@ -42,8 +85,54 @@ @article{guo_big_2017
42
85
year = {2017},
43
86
pages = {4--20},
44
87
}
88
+
@inproceedings{lewis_2018_CEOSAnalysisReady,
89
+
title = {{{CEOS Analysis Ready Data}} for {{Land}} ({{CARD4L}}) {{Overview}}},
90
+
booktitle = {{{IGARSS}} 2018 - 2018 {{IEEE International Geoscience}} and {{Remote Sensing Symposium}}},
91
+
author = {Lewis, Adam and Lacey, Jennifer and Mecklenburg, Susanne and Ross, Jonathon and Siqueira, Andreia and Killough, Brian and Szantoi, Zoltan and Tadono, Takeo and Rosenavist, Ake and Goryl, Philippe and Miranda, Nuno and Hosford, Steven},
92
+
year = {2018},
93
+
month = jul,
94
+
pages = {7407--7410},
95
+
publisher = {IEEE},
96
+
address = {Valencia},
97
+
doi = {10.1109/IGARSS.2018.8519255},
98
+
urldate = {2025-03-10},
99
+
abstract = {For many land monitoring applications using remote sensing, lack of data is no longer an issue, as it may have been in the past. Programs, such as Copernicus by the European Commission and the Landsat Missions by the United States Geological Survey, have adopted systematic acquisition strategies, and distribute vast amounts of satellite data under open licenses. In parallel, storage and computing capability have evolved to make it cost-effective and practical to process and analyze these data at various scales. Data architecture solutions, such as the Open Data Cube (ODC) and the Copernicus Data and Information Access Services (DIAS), are providing frameworks that make [scientific] analysis much simpler and straightforward.},
100
+
isbn = {978-1-5386-7150-4},
101
+
langid = {english},
102
+
file = {/home/emmamarshall/Desktop/Zotero/storage/UXZSAALM/Lewis et al. - 2018 - CEOS Analysis Ready Data for Land (CARD4L) Overview.pdf}
103
+
}
104
+
45
105
46
-
@article{mathieu_esas_2017,
106
+
@article{lund_2020_snowmelt,
107
+
title = {Mapping Snowmelt Progression in the Upper Indus Basin with Synthetic Aperture Radar},
108
+
author = {Lund, Jewell and Forster, Richard R. and Rupper, Summer B. and Deeb, Elias J. and Marshall, H. P. and Hashmi, Muhammad Zia and Burgess, Evan},
109
+
year = {2020},
110
+
journal = {Frontiers in Earth Science},
111
+
volume = {7},
112
+
issn = {2296-6463},
113
+
doi = {10.3389/feart.2019.00318},
114
+
abstract = {{\textexclamdown}p{\textquestiondown}The Indus River is a vital resource for food security, ecosystem services, hydropower, and economy for millions of people living in Pakistan, India, China, and Afghanistan. Glacier and snowmelt from the high altitude Himalaya, Karakoram, and Hindu Kush mountain ranges are the largest drivers of discharge in the upper Indus Basin (UIB), and contribute significantly to Indus flows. Complex climatology and topography, coupled with the challenges of field study and meteorological measurement in these rugged ranges, elicit notable uncertainties in predicting seasonal runoff as well as cryospheric response to changes in climate. Here we utilize Sentinel-1 synthetic aperture radar (SAR) imagery to track ablation season development of wet snow in the Shigar Watershed of the Karakoram Mountains in Pakistan from 2015 to 2018. We exploit opportune local image acquisition times to highlight diurnal differences in radar indications of wet snow, and examine the spatial and temporal contexts of radar diurnal differences for 2015, 2017, and 2018 ablation seasons. Radar classifications for each ablation season show spatial and temporal patterns that indicate a dry winter snowpack undergoing diurnal surface melt-refreeze cycles, transitioning to surface snow that remains wet both day and night, and finally snow free conditions following melt out. Diurnally differing SAR signals may offer insights into important snowpack energy balance processes that precede melt out, which could provide useful constraints for both glacier mass balance modeling and runoff forecasting in remote alpine watersheds.{\textexclamdown}/p{\textquestiondown}}
115
+
}
116
+
@article{mahecha_2020_EarthSystemData,
117
+
title = {Earth System Data Cubes Unravel Global Multivariate Dynamics},
118
+
author = {Mahecha, Miguel D. and Gans, Fabian and Brandt, Gunnar and Christiansen, Rune and Cornell, Sarah E. and Fomferra, Normann and Kraemer, Guido and Peters, Jonas and Bodesheim, Paul and {Camps-Valls}, Gustau and Donges, Jonathan F. and Dorigo, Wouter and {Estupinan-Suarez}, Lina M. and {Gutierrez-Velez}, Victor H. and Gutwin, Martin and Jung, Martin and Londo{\~n}o, Maria C. and Miralles, Diego G. and Papastefanou, Phillip and Reichstein, Markus},
119
+
year = {2020},
120
+
month = feb,
121
+
journal = {Earth System Dynamics},
122
+
volume = {11},
123
+
number = {1},
124
+
pages = {201--234},
125
+
issn = {2190-4987},
126
+
doi = {10.5194/esd-11-201-2020},
127
+
urldate = {2025-03-10},
128
+
abstract = {Abstract. Understanding Earth system dynamics in light of ongoing human intervention and dependency remains a major scientific challenge. The unprecedented availability of data streams describing different facets of the Earth now offers fundamentally new avenues to address this quest. However, several practical hurdles, especially the lack of data interoperability, limit the joint potential of these data streams. Today, many initiatives within and beyond the Earth system sciences are exploring new approaches to overcome these hurdles and meet the growing interdisciplinary need for data-intensive research; using data cubes is one promising avenue. Here, we introduce the concept of Earth system data cubes and how to operate on them in a formal way. The idea is that treating multiple data dimensions, such as spatial, temporal, variable, frequency, and other grids alike, allows effective application of user-defined functions to co-interpret Earth observations and/or model--data integration. An implementation of this concept combines analysis-ready data cubes with a suitable analytic interface. In three case studies, we demonstrate how the concept and its implementation facilitate the execution of complex workflows for research across multiple variables, and spatial and temporal scales: (1)~summary statistics for ecosystem and climate dynamics; (2)~intrinsic dimensionality analysis on multiple timescales; and (3)~model--data integration. We discuss the emerging perspectives for investigating global interacting and coupled phenomena in observed or simulated data. In particular, we see many emerging perspectives of this approach for interpreting large-scale model ensembles. The latest developments in machine learning, causal inference, and model--data integration can be seamlessly implemented in the proposed framework, supporting rapid progress in data-intensive research across disciplinary boundaries.},
title = {Earth {{System Data Cubes}}: {{Avenues}} for Advancing {{Earth}} System Research},
152
+
shorttitle = {Earth {{System Data Cubes}}},
153
+
author = {Montero, David and Kraemer, Guido and Anghelea, Anca and Aybar, C{\'e}sar and Brandt, Gunnar and {Camps-Valls}, Gustau and Cremer, Felix and Flik, Ida and Gans, Fabian and Habershon, Sarah and Ji, Chaonan and Kattenborn, Teja and {Mart{\'i}nez-Ferrer}, Laura and Martinuzzi, Francesco and Reinhardt, Martin and S{\"o}chting, Maximilian and Teber, Khalil and Mahecha, Miguel D.},
154
+
year = {2024},
155
+
journal = {Environmental Data Science},
156
+
volume = {3},
157
+
pages = {e27},
158
+
issn = {2634-4602},
159
+
doi = {10.1017/eds.2024.22},
160
+
urldate = {2025-03-08},
161
+
abstract = {Recent advancements in Earth system science have been marked by the exponential increase in the availability of diverse, multivariate datasets characterised by moderate to high spatio-temporal resolutions. Earth System Data Cubes (ESDCs) have emerged as one suitable solution for transforming this flood of data into a simple yet robust data structure. ESDCs achieve this by organising data into an analysis-ready format aligned with a spatiotemporal grid, facilitating user-friendly analysis and diminishing the need for extensive technical data processing knowledge. Despite these significant benefits, the completion of the entire ESDC life cycle remains a challenging task. Obstacles are not only of a technical nature but also relate to domain-specific problems in Earth system research. There exist barriers to realising the full potential of data collections in light of novel cloudbased technologies, particularly in curating data tailored for specific application domains. These include transforming data to conform to a spatio-temporal grid with minimum distortions and managing complexities such as spatio-temporal autocorrelation issues. Addressing these challenges is pivotal for the effective application of Artificial Intelligence (AI) approaches. Furthermore, adhering to open science principles for data dissemination, reproducibility, visualisation, and reuse is crucial for fostering sustainable research. Overcoming these challenges offers a substantial opportunity to advance data-driven Earth system research, unlocking the full potential of an integrated, multidimensional view of Earth system processes. This is particularly true when such research is coupled with innovative research paradigms and technological progress.},
file = {/home/emmamarshall/Desktop/Zotero/storage/PRF46R2L/Montero et al. - 2024 - Earth System Data Cubes Avenues for advancing Earth system research.pdf}
165
+
}
61
166
62
-
@article{palumbo_building_2017,
167
+
168
+
@article{palumbo_2017_building,
63
169
title = {Building capacity in remote sensing for conservation: present and future challenges},
64
170
volume = {3},
65
171
issn = {2056-3485, 2056-3485},
@@ -76,7 +182,7 @@ @article{palumbo_building_2017
76
182
year = {2017},
77
183
pages = {21--29},
78
184
}
79
-
@article{radocaj_global_2020,
185
+
@article{radocaj_2020_global,
80
186
title = {Global {Open} {Data} {Remote} {Sensing} {Satellite} {Missions} for {Land} {Monitoring} and {Conservation}: {A} {Review}},
title = {Towards {{Sentinel-1 SAR Analysis-Ready Data}}: {{A Best Practices Assessment}} on {{Preparing Backscatter Data}} for the {{Cube}}},
233
+
shorttitle = {Towards {{Sentinel-1 SAR Analysis-Ready Data}}},
234
+
author = {Truckenbrodt, John and Freemantle, Terri and Williams, Chris and Jones, Tom and Small, David and Dubois, Cl{\'e}mence and Thiel, Christian and Rossi, Cristian and Syriou, Asimina and Giuliani, Gregory},
235
+
year = {2019},
236
+
month = jul,
237
+
journal = {Data},
238
+
volume = {4},
239
+
number = {3},
240
+
pages = {93},
241
+
issn = {2306-5729},
242
+
doi = {10.3390/data4030093},
243
+
urldate = {2025-03-09},
244
+
abstract = {This study aims at assessing the feasibility of automatically producing analysis-ready radiometrically terrain-corrected (RTC) Synthetic Aperture Radar (SAR) gamma nought backscatter data for ingestion into a data cube for use in a large spatio-temporal data environment. As such, this study investigates the analysis readiness of different openly available digital elevation models (DEMs) and the capability of the software solutions SNAP and GAMMA in terms of overall usability as well as backscatter data quality. To achieve this, the study builds on the Python library pyroSAR for providing the workflow implementation test bed and provides a Jupyter notebook for transparency and future reproducibility of performed analyses. Two test sites were selected, over the Alps and Fiji, to be able to assess regional differences and support the establishment of the Swiss and Common Sensing Open Data cubes respectively.},
file = {/home/emmamarshall/Desktop/Zotero/storage/Q7XR23EU/Truckenbrodt et al. - 2019 - Towards Sentinel-1 SAR Analysis-Ready Data A Best Practices Assessment on Preparing Backscatter Dat.pdf}
248
+
}
249
+
250
+
251
+
@article{wagemann_2021_user,
112
252
title = {A user perspective on future cloud-based services for {Big} {Earth} data},
0 commit comments