@article { , title = {BHPMF - a hierarchical Bayesian approach to gap-filling and trait prediction for macroecology and functional biogeography: Gap-filling in trait databases}, abstract = {Aim: Functional traits of organisms are key to understanding and predicting biodiversity and ecological change, which motivates continuous collection of traits and their integration into global databases. Such trait matrices are inherently sparse, severely limiting their usefulness for further analyses. On the other hand, traits are characterized by the phylogenetic trait signal, trait–trait correlations and environmental constraints, all of which provide information that could be used to statistically fill gaps. We propose the application of probabilistic models which, for the first time, utilize all three characteristics to fill gaps in trait databases and predict trait values at larger spatial scales. Innovation For this purpose we introduce BHPMF, a ierarchical Bayesian extension of probabilistic matrix actorization (PMF). PMF is a machine learning technique which exploits the correlation structure of sparse matrices to impute missing entries. BHPMF additionally utilizes the taxonomic hierarchy for trait prediction and provides uncertainty estimates for each imputation. In combination with multiple regression against environmental information, BHPMF allows for extrapolation frompoint measurements to larger spatial scales.We demonstrate the applicability of BHPMF in ecological contexts, using different plant functional trait datasets, also comparing results to taking the species mean and PMF. Main conclusions Sensitivity analyses validate the robustness and accuracy of BHPMF: our method captures the correlation structure of the trait matrix as well as the phylogenetic trait signal – also for extremely sparse trait matrices – and provides a robust measure of confidence in prediction accuracy for each missing entry. The combination of BHPMF with environmental constraints provides a promising concept to extrapolate traits beyond sampled regions, accounting for intraspecific trait variability. We conclude that BHPMF and its derivatives have a high potential to support future trait-based research in macroecology and functional biogeography.}, doi = {10.1111/geb.12335}, eissn = {1466-8238}, issn = {1466-822X}, issue = {12}, journal = {Global Ecology and Biogeography}, note = {Published version submitted. If AAM received will need to add set statement "This is the peer reviewed version of the following article: [FULL CITE], which has been published in final form at [Link to final article using the DOI]. This article may be used for non-commercial purposes in accordance with Wiley Terms and Conditions for Self-Archiving." KJB 31.10.2017 Contacted Wiley permissions to confirm if published version can be used as this article is "free access" confirmation from Wiley on 14.11.2017 that the published version can be used. KJB 15.11.2017}, pages = {1510-1521}, publicationstatus = {Published}, publisher = {Wiley}, url = {https://nottingham-repository.worktribe.com/output/767539}, volume = {24}, keyword = {Bayesian hierarchical model, Gap-filling, Imputation, Machine learning, Matrix factorization, PFT, Plant functional trait, Sparse matrix, Spatial extrapolation, TRY}, year = {2015}, author = {Schrodt, Franziska and Kattge, Jens and Shan, Hanhuai and Fazayeli, Farideh and Joswig, Julia and Banerjee, Arindam and Reichstein, Markus and Bönisch, Gerhard and Diaz, Sandra and Dickie, John and Gillison, Andy and Karpatne, Anuj and Lavorel, Sandra and Leadley, Paul and Wirth, Christian B. and Wright, Ian J. and Wright, S. Joseph and Reich, Peter B.} }