% Bibliography entries for journal articles and for the corresponding
% secondary publications in the Universitaet Potsdam series
% (Zweitveroeffentlichungen / Postprints).
%
% Citation keys: several entries originally shared one key. The first
% occurrence keeps the original key, so existing citations resolve to the
% same entry as before (BibTeX reports later repeats as "repeated entry"
% and skips them). Later occurrences carry an a/b suffix so that they can
% be cited at all.
%
% NOTE(review): the two KumarHesseRaoetal.2020 entries list the second
% author as "Hesse, Fabienne", while every other entry in this file has
% "Hesse, Falk" -- confirm against the publication before citing.

@article{SchweppeThoberMuelleretal.2022,
  author    = {Schweppe, Robert and Thober, Stephan and M{\"u}ller, Sebastian and Kelbling, Matthias and Kumar, Rohini and Attinger, Sabine and Samaniego, Luis},
  title     = {{MPR} 1.0: a stand-alone multiscale parameter regionalization tool for improved parameter estimation of land surface models},
  journal   = {Geoscientific model development : an interactive open access journal of the European Geosciences Union},
  volume    = {15},
  number    = {2},
  publisher = {Copernicus},
  address   = {G{\"o}ttingen},
  issn      = {1991-959X},
  doi       = {10.5194/gmd-15-859-2022},
  pages     = {859--882},
  year      = {2022},
  abstract  = {Distributed environmental models such as land surface models (LSMs) require model parameters in each spatial modeling unit (e.g., grid cell), thereby leading to a high-dimensional parameter space. One approach to decrease the dimensionality of the parameter space in these models is to use regularization techniques. One such highly efficient technique is the multiscale parameter regionalization (MPR) framework that translates high-resolution predictor variables (e.g., soil textural properties) into model parameters (e.g., porosity) via transfer functions (TFs) and upscaling operators that are suitable for every modeled process. This framework yields seamless model parameters at multiple scales and locations in an effective manner. However, integration of MPR into existing modeling workflows has been hindered thus far by hard-coded configurations and non-modular software designs. For these reasons, we redesigned MPR as a model-agnostic, stand-alone tool. It is a useful software for creating graphs of NetCDF variables, wherein each node is a variable and the links consist of TFs and/or upscaling operators. In this study, we present and verify our tool against a previous version, which was implemented in the mesoscale hydrologic model (mHM; https://www.ufz.de/mhm, last access: 16 January 2022). By using this tool for the generation of continental-scale soil hydraulic parameters applicable to different models (Noah-MP and HTESSEL), we showcase its general functionality and flexibility. Further, using model parameters estimated by the MPR tool leads to significant changes in long-term estimates of evapotranspiration, as compared to their default parameterizations. For example, a change of up to 25 \% in long-term evapotranspiration flux is observed in Noah-MP and HTESSEL in the Mississippi River basin. We postulate that use of the stand-alone MPR tool will considerably increase the transparency and reproducibility of the parameter estimation process in distributed (environmental) models. It will also allow a rigorous uncertainty estimation related to the errors of the predictors (e.g., soil texture fields), transfer function and its parameters, and remapping (or upscaling) algorithms.},
  language  = {en}
}

@article{SchmidtHesseAttingeretal.2020,
  author    = {Schmidt, Lennart and Hesse, Falk and Attinger, Sabine and Kumar, Rohini},
  title     = {Challenges in applying machine learning models for hydrological inference},
  journal   = {Water resources research},
  volume    = {56},
  number    = {5},
  publisher = {American Geophysical Union},
  address   = {Washington},
  issn      = {0043-1397},
  doi       = {10.1029/2019WR025924},
  pages     = {10},
  year      = {2020},
  abstract  = {Machine learning (ML) algorithms are being increasingly used in Earth and Environmental modeling studies owing to the ever-increasing availability of diverse data sets and computational resources as well as advancement in ML algorithms. Despite advances in their predictive accuracy, the usefulness of ML algorithms for inference remains elusive. In this study, we employ two popular ML algorithms, artificial neural networks and random forest, to analyze a large data set of flood events across Germany with the goals to analyze their predictive accuracy and their usability to provide insights to hydrologic system functioning. The results of the ML algorithms are contrasted against a parametric approach based on multiple linear regression. For analysis, we employ a model-agnostic framework named Permuted Feature Importance to derive the influence of models' predictors. This allows us to compare the results of different algorithms for the first time in the context of hydrology. Our main findings are that (1) the ML models achieve higher prediction accuracy than linear regression, (2) the results reflect basic hydrological principles, but (3) further inference is hindered by the heterogeneity of results across algorithms. Thus, we conclude that the problem of equifinality as known from classical hydrological modeling also exists for ML and severely hampers its potential for inference. To account for the observed problems, we propose that when employing ML for inference, this should be made by using multiple algorithms and multiple methods, of which the latter should be embedded in a cross-validation routine.},
  language  = {en}
}

@misc{JingKumarHesseetal.2020,
  author    = {Jing, Miao and Kumar, Rohini and He{\ss}e, Falk and Thober, Stephan and Rakovec, Oldrich and Samaniego, Luis and Attinger, Sabine},
  title     = {Assessing the response of groundwater quantity and travel time distribution to 1.5, 2, and 3 {$^{\circ}$C} global warming in a mesoscale central {German} basin},
  series    = {Zweitver{\"o}ffentlichungen der Universit{\"a}t Potsdam : Mathematisch-Naturwissenschaftliche Reihe},
  journal   = {Zweitver{\"o}ffentlichungen der Universit{\"a}t Potsdam : Mathematisch-Naturwissenschaftliche Reihe},
  number    = {3},
  issn      = {1866-8372},
  doi       = {10.25932/publishup-50934},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-509343},
  pages     = {18},
  year      = {2020},
  abstract  = {Groundwater is the biggest single source of high-quality freshwater worldwide, which is also continuously threatened by the changing climate. In this paper, we investigate the response of the regional groundwater system to climate change under three global warming levels (1.5, 2, and 3 $^{\circ}$C) in a central German basin (N{\"a}gelstedt). This investigation is conducted by deploying an integrated modeling workflow that consists of a mesoscale hydrologic model (mHM) and a fully distributed groundwater model, OpenGeoSys (OGS). mHM is forced with climate simulations of five general circulation models under three representative concentration pathways. The diffuse recharges estimated by mHM are used as boundary forcings to the OGS groundwater model to compute changes in groundwater levels and travel time distributions. Simulation results indicate that groundwater recharges and levels are expected to increase slightly under future climate scenarios. Meanwhile, the mean travel time is expected to decrease compared to the historical average. However, the ensemble simulations do not all agree on the sign of relative change. Changes in mean travel time exhibit a larger variability than those in groundwater levels. The ensemble simulations do not show a systematic relationship between the projected change (in both groundwater levels and travel times) and the warming level, but they indicate an increased variability in projected changes with adjusting the enhanced warming level from 1.5 to 3 $^{\circ}$C. Correspondingly, it is highly recommended to restrain the trend of global warming.},
  language  = {en}
}

% Postprint-series record; originally shared the key
% SchmidtHesseAttingeretal.2020 with the first journal-article entry.
@misc{SchmidtHesseAttingeretal.2020a,
  author    = {Schmidt, Lennart and He{\ss}e, Falk and Attinger, Sabine and Kumar, Rohini},
  title     = {Challenges in applying machine learning models for hydrological inference: a case study for flooding events across {Germany}},
  series    = {Postprints der Universit{\"a}t Potsdam : Mathematisch-Naturwissenschaftliche Reihe},
  journal   = {Postprints der Universit{\"a}t Potsdam : Mathematisch-Naturwissenschaftliche Reihe},
  number    = {5},
  issn      = {1866-8372},
  doi       = {10.25932/publishup-52384},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-523843},
  pages     = {12},
  year      = {2020},
  abstract  = {Machine learning (ML) algorithms are being increasingly used in Earth and Environmental modeling studies owing to the ever-increasing availability of diverse data sets and computational resources as well as advancement in ML algorithms. Despite advances in their predictive accuracy, the usefulness of ML algorithms for inference remains elusive. In this study, we employ two popular ML algorithms, artificial neural networks and random forest, to analyze a large data set of flood events across Germany with the goals to analyze their predictive accuracy and their usability to provide insights to hydrologic system functioning. The results of the ML algorithms are contrasted against a parametric approach based on multiple linear regression. For analysis, we employ a model-agnostic framework named Permuted Feature Importance to derive the influence of models' predictors. This allows us to compare the results of different algorithms for the first time in the context of hydrology. Our main findings are that (1) the ML models achieve higher prediction accuracy than linear regression, (2) the results reflect basic hydrological principles, but (3) further inference is hindered by the heterogeneity of results across algorithms. Thus, we conclude that the problem of equifinality as known from classical hydrological modeling also exists for ML and severely hampers its potential for inference. To account for the observed problems, we propose that when employing ML for inference, this should be made by using multiple algorithms and multiple methods, of which the latter should be embedded in a cross-validation routine.},
  language  = {en}
}

% NOTE(review): same journal, volume, number and year as
% SchmidtHesseAttingeretal.2020 above -- presumably a second record of the
% same article (different publisher data, no DOI); confirm and merge.
@article{SchmidtHesseAttingeretal.2020b,
  author    = {Schmidt, Lennart and He{\ss}e, Falk and Attinger, Sabine and Kumar, Rohini},
  title     = {Challenges in applying machine learning models for hydrological inference: a case study for flooding events across {Germany}},
  journal   = {Water Resources Research},
  volume    = {56},
  number    = {5},
  publisher = {John Wiley \& Sons, Inc.},
  address   = {New Jersey},
  pages     = {10},
  year      = {2020},
  abstract  = {Machine learning (ML) algorithms are being increasingly used in Earth and Environmental modeling studies owing to the ever-increasing availability of diverse data sets and computational resources as well as advancement in ML algorithms. Despite advances in their predictive accuracy, the usefulness of ML algorithms for inference remains elusive. In this study, we employ two popular ML algorithms, artificial neural networks and random forest, to analyze a large data set of flood events across Germany with the goals to analyze their predictive accuracy and their usability to provide insights to hydrologic system functioning. The results of the ML algorithms are contrasted against a parametric approach based on multiple linear regression. For analysis, we employ a model-agnostic framework named Permuted Feature Importance to derive the influence of models' predictors. This allows us to compare the results of different algorithms for the first time in the context of hydrology. Our main findings are that (1) the ML models achieve higher prediction accuracy than linear regression, (2) the results reflect basic hydrological principles, but (3) further inference is hindered by the heterogeneity of results across algorithms. Thus, we conclude that the problem of equifinality as known from classical hydrological modeling also exists for ML and severely hampers its potential for inference. To account for the observed problems, we propose that when employing ML for inference, this should be made by using multiple algorithms and multiple methods, of which the latter should be embedded in a cross-validation routine.},
  language  = {en}
}

% Journal-article record; originally shared the key JingKumarHesseetal.2020
% with the secondary-publication entry above.
@article{JingKumarHesseetal.2020a,
  author    = {Jing, Miao and Kumar, Rohini and He{\ss}e, Falk and Thober, Stephan and Rakovec, Oldrich and Samaniego, Luis and Attinger, Sabine},
  title     = {Assessing the response of groundwater quantity and travel time distribution to 1.5, 2, and 3 {$^{\circ}$C} global warming in a mesoscale central {German} basin},
  journal   = {Hydrology and Earth System Sciences},
  volume    = {24},
  number    = {3},
  publisher = {Copernicus Publ.},
  address   = {G{\"o}ttingen},
  issn      = {1607-7938},
  doi       = {10.5194/hess-24-1511-2020},
  pages     = {1511--1526},
  year      = {2020},
  abstract  = {Groundwater is the biggest single source of high-quality freshwater worldwide, which is also continuously threatened by the changing climate. In this paper, we investigate the response of the regional groundwater system to climate change under three global warming levels (1.5, 2, and 3 $^{\circ}$C) in a central German basin (N{\"a}gelstedt). This investigation is conducted by deploying an integrated modeling workflow that consists of a mesoscale hydrologic model (mHM) and a fully distributed groundwater model, OpenGeoSys (OGS). mHM is forced with climate simulations of five general circulation models under three representative concentration pathways. The diffuse recharges estimated by mHM are used as boundary forcings to the OGS groundwater model to compute changes in groundwater levels and travel time distributions. Simulation results indicate that groundwater recharges and levels are expected to increase slightly under future climate scenarios. Meanwhile, the mean travel time is expected to decrease compared to the historical average. However, the ensemble simulations do not all agree on the sign of relative change. Changes in mean travel time exhibit a larger variability than those in groundwater levels. The ensemble simulations do not show a systematic relationship between the projected change (in both groundwater levels and travel times) and the warming level, but they indicate an increased variability in projected changes with adjusting the enhanced warming level from 1.5 to 3 $^{\circ}$C. Correspondingly, it is highly recommended to restrain the trend of global warming.},
  language  = {en}
}

@misc{KumarHesseRaoetal.2020,
  author    = {Kumar, Rohini and Hesse, Fabienne and Rao, P. Srinivasa and Musolff, Andreas and Jawitz, James and Sarrazin, Francois and Samaniego, Luis and Fleckenstein, Jan H. and Rakovec, Oldrich and Thober, Stephan and Attinger, Sabine},
  title     = {Strong hydroclimatic controls on vulnerability to subsurface nitrate contamination across {Europe}},
  series    = {Zweitver{\"o}ffentlichungen der Universit{\"a}t Potsdam : Mathematisch-Naturwissenschaftliche Reihe},
  journal   = {Zweitver{\"o}ffentlichungen der Universit{\"a}t Potsdam : Mathematisch-Naturwissenschaftliche Reihe},
  number    = {1},
  issn      = {1866-8372},
  doi       = {10.25932/publishup-54987},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-549875},
  pages     = {12},
  year      = {2020},
  abstract  = {Subsurface contamination due to excessive nutrient surpluses is a persistent and widespread problem in agricultural areas across Europe. The vulnerability of a particular location to pollution from reactive solutes, such as nitrate, is determined by the interplay between hydrologic transport and biogeochemical transformations. Current studies on the controls of subsurface vulnerability do not consider the transient behaviour of transport dynamics in the root zone. Here, using state-of-the-art hydrologic simulations driven by observed hydroclimatic forcing, we demonstrate the strong spatiotemporal heterogeneity of hydrologic transport dynamics and reveal that these dynamics are primarily controlled by the hydroclimatic gradient of the aridity index across Europe. Contrasting the space-time dynamics of transport times with reactive timescales of denitrification in soil indicate that $\sim$75\% of the cultivated areas across Europe are potentially vulnerable to nitrate leaching for at least one-third of the year. We find that neglecting the transient nature of transport and reaction timescale results in a great underestimation of the extent of vulnerable regions by almost 50\%. Therefore, future vulnerability and risk assessment studies must account for the transient behaviour of transport and biogeochemical transformation processes.},
  language  = {en}
}

% Journal-article record; originally shared the key KumarHesseRaoetal.2020
% with the secondary-publication entry above.
@article{KumarHesseRaoetal.2020a,
  author    = {Kumar, Rohini and Hesse, Fabienne and Rao, P. Srinivasa and Musolff, Andreas and Jawitz, James and Sarrazin, Francois and Samaniego, Luis and Fleckenstein, Jan H. and Rakovec, Oldrich and Thober, Stephan and Attinger, Sabine},
  title     = {Strong hydroclimatic controls on vulnerability to subsurface nitrate contamination across {Europe}},
  journal   = {Nature Communications},
  volume    = {11},
  number    = {1},
  publisher = {Nature Publishing Group UK},
  address   = {London},
  issn      = {2041-1723},
  doi       = {10.1038/s41467-020-19955-8},
  pages     = {1--10},
  year      = {2020},
  abstract  = {Subsurface contamination due to excessive nutrient surpluses is a persistent and widespread problem in agricultural areas across Europe. The vulnerability of a particular location to pollution from reactive solutes, such as nitrate, is determined by the interplay between hydrologic transport and biogeochemical transformations. Current studies on the controls of subsurface vulnerability do not consider the transient behaviour of transport dynamics in the root zone. Here, using state-of-the-art hydrologic simulations driven by observed hydroclimatic forcing, we demonstrate the strong spatiotemporal heterogeneity of hydrologic transport dynamics and reveal that these dynamics are primarily controlled by the hydroclimatic gradient of the aridity index across Europe. Contrasting the space-time dynamics of transport times with reactive timescales of denitrification in soil indicate that $\sim$75\% of the cultivated areas across Europe are potentially vulnerable to nitrate leaching for at least one-third of the year. We find that neglecting the transient nature of transport and reaction timescale results in a great underestimation of the extent of vulnerable regions by almost 50\%. Therefore, future vulnerability and risk assessment studies must account for the transient behaviour of transport and biogeochemical transformation processes.},
  language  = {en}
}

@article{BaroniSchalgeRakovecetal.2019,
  author    = {Baroni, Gabriele and Schalge, Bernd and Rakovec, Oldrich and Kumar, Rohini and Sch{\"u}ler, Lennart and Samaniego, Luis and Simmer, Clemens and Attinger, Sabine},
  title     = {A Comprehensive Distributed Hydrological Modeling Intercomparison to Support Process Representation and Data Collection Strategies},
  journal   = {Water resources research},
  volume    = {55},
  number    = {2},
  publisher = {American Geophysical Union},
  address   = {Washington},
  issn      = {0043-1397},
  doi       = {10.1029/2018WR023941},
  pages     = {990--1010},
  year      = {2019},
  abstract  = {The improvement of process representations in hydrological models is often only driven by the modelers' knowledge and data availability. We present a comprehensive comparison between two hydrological models of different complexity that is developed to support (1) the understanding of the differences between model structures and (2) the identification of the observations needed for model assessment and improvement. The comparison is conducted on both space and time and by aggregating the outputs at different spatiotemporal scales. In the present study, mHM, a process-based hydrological model, and ParFlow-CLM, an integrated subsurface-surface hydrological model, are used. The models are applied in a mesoscale catchment in Germany. Both models agree in the simulated river discharge at the outlet and the surface soil moisture dynamics, lending their supports for some model applications (drought monitoring). Different model sensitivities are, however, found when comparing evapotranspiration and soil moisture at different soil depths. The analysis supports the need of observations within the catchment for model assessment, but it indicates that different strategies should be considered for the different variables. Evapotranspiration measurements are needed at daily resolution across several locations, while highly resolved spatially distributed observations with lower temporal frequency are required for soil moisture. Finally, the results show the impact of the shallow groundwater system simulated by ParFlow-CLM and the need to account for the related soil moisture redistribution. Our comparison strategy can be applied to other models types and environmental conditions to strengthen the dialog between modelers and experimentalists for improving process representations in Earth system models.},
  language  = {en}
}

@article{JingHesseKumaretal.2019,
  author    = {Jing, Miao and Hesse, Falk and Kumar, Rohini and Kolditz, Olaf and Kalbacher, Thomas and Attinger, Sabine},
  title     = {Influence of input and parameter uncertainty on the prediction of catchment-scale groundwater travel time distributions},
  journal   = {Hydrology and earth system sciences : HESS},
  volume    = {23},
  number    = {1},
  publisher = {Copernicus},
  address   = {G{\"o}ttingen},
  issn      = {1027-5606},
  doi       = {10.5194/hess-23-171-2019},
  pages     = {171--190},
  year      = {2019},
  abstract  = {Groundwater travel time distributions (TTDs) provide a robust description of the subsurface mixing behavior and hydrological response of a subsurface system. Lagrangian particle tracking is often used to derive the groundwater TTDs. The reliability of this approach is subjected to the uncertainty of external forcings, internal hydraulic properties, and the interplay between them. Here, we evaluate the uncertainty of catchment groundwater TTDs in an agricultural catchment using a 3-D groundwater model with an overall focus on revealing the relationship between external forcing, internal hydraulic properties, and TTD predictions. Eight recharge realizations are sampled from a high-resolution dataset of land surface fluxes and states. Calibration-constrained hydraulic conductivity fields (Ks fields) are stochastically generated using the null-space Monte Carlo (NSMC) method for each recharge realization. The random walk particle tracking (RWPT) method is used to track the pathways of particles and compute travel times. Moreover, an analytical model under the random sampling (RS) assumption is fit against the numerical solutions, serving as a reference for the mixing behavior of the model domain. The StorAge Selection (SAS) function is used to interpret the results in terms of quantifying the systematic preference for discharging young/old water. The simulation results reveal the primary effect of recharge on the predicted mean travel time (MTT). The different realizations of calibration-constrained Ks fields moderately magnify or attenuate the predicted MTTs. The analytical model does not properly replicate the numerical solution, and it underestimates the mean travel time. Simulated SAS functions indicate an overall preference for young water for all realizations. The spatial pattern of recharge controls the shape and breadth of simulated TTDs and SAS functions by changing the spatial distribution of particles' pathways. In conclusion, overlooking the spatial nonuniformity and uncertainty of input (forcing) will result in biased travel time predictions. We also highlight the worth of reliable observations in reducing predictive uncertainty and the good interpretability of SAS functions in terms of understanding catchment transport processes.},
  language  = {en}
}