We propose a statistical learning framework based on group-sparse regression that can be used to (i) enforce conservation laws, (ii) ensure model equivalence, and (iii) guarantee symmetries when learning or inferring differential-equation models from data. Directly learning interpretable mathematical models from data has emerged as a valuable modeling approach. However, in areas such as biology, high noise levels, sensor-induced correlations, and strong intersystem variability can render data-driven models nonsensical or physically inconsistent without additional constraints on the model structure. Hence, it is important to leverage prior knowledge from physical principles to learn biologically plausible and physically consistent models rather than models that simply fit the data best. We present the group iterative hard thresholding algorithm and use stability selection to infer physically consistent models with minimal parameter tuning. We show several applications from systems biology that demonstrate the benefits of enforcing priors in data-driven modeling.
%0 Journal Article
%1 08160aa735004254a4f84c6e5549379f
%A Maddu, Suryanarayana
%A Cheeseman, Bevan L.
%A Müller, Christian L.
%A Sbalzarini, Ivo F.
%D 2021
%I American Physical Society, College Park
%J Physical Review E
%K FIS_scads imported
%N 4
%R 10.1103/PhysRevE.103.042310
%T Learning physically consistent differential equation models from data using group sparsity
%V 103
%X We propose a statistical learning framework based on group-sparse regression that can be used to (i) enforce conservation laws, (ii) ensure model equivalence, and (iii) guarantee symmetries when learning or inferring differential-equation models from data. Directly learning interpretable mathematical models from data has emerged as a valuable modeling approach. However, in areas such as biology, high noise levels, sensor-induced correlations, and strong intersystem variability can render data-driven models nonsensical or physically inconsistent without additional constraints on the model structure. Hence, it is important to leverage prior knowledge from physical principles to learn biologically plausible and physically consistent models rather than models that simply fit the data best. We present the group iterative hard thresholding algorithm and use stability selection to infer physically consistent models with minimal parameter tuning. We show several applications from systems biology that demonstrate the benefits of enforcing priors in data-driven modeling.
@article{08160aa735004254a4f84c6e5549379f,
abstract = {We propose a statistical learning framework based on group-sparse regression that can be used to (i) enforce conservation laws, (ii) ensure model equivalence, and (iii) guarantee symmetries when learning or inferring differential-equation models from data. Directly learning interpretable mathematical models from data has emerged as a valuable modeling approach. However, in areas such as biology, high noise levels, sensor-induced correlations, and strong intersystem variability can render data-driven models nonsensical or physically inconsistent without additional constraints on the model structure. Hence, it is important to leverage prior knowledge from physical principles to learn biologically plausible and physically consistent models rather than models that simply fit the data best. We present the group iterative hard thresholding algorithm and use stability selection to infer physically consistent models with minimal parameter tuning. We show several applications from systems biology that demonstrate the benefits of enforcing priors in data-driven modeling.},
added-at = {2024-11-28T16:27:18.000+0100},
author = {Maddu, Suryanarayana and Cheeseman, {Bevan L.} and M{\"u}ller, {Christian L.} and Sbalzarini, {Ivo F.}},
biburl = {https://puma.scadsai.uni-leipzig.de/bibtex/25c1191f2db021d14fc71a975ebc42844/scadsfct},
doi = {10.1103/PhysRevE.103.042310},
interhash = {aef0487607d91f90191444fb870d0224},
intrahash = {5c1191f2db021d14fc71a975ebc42844},
issn = {2470-0045},
journal = {Physical Review E},
keywords = {FIS_scads imported},
language = {English},
month = apr,
note = {Publisher Copyright: {\textcopyright} 2021 authors.},
number = 4,
publisher = {American Physical Society, College Park},
timestamp = {2024-11-28T16:27:18.000+0100},
title = {Learning physically consistent differential equation models from data using group sparsity},
volume = 103,
year = 2021
}