BibTeX
% arXiv preprint, version 1, primary class astro-ph.IM. Typed as misc because
% no journal is recorded for it; the eprint fields carry the arXiv identifier.
% The month uses the standard three-letter macro so styles can localize it.
@misc{2211.03747v1,
  author        = {Wang, Bingjie and Leja, Joel and Villar, Ashley and Speagle, Joshua S.},
  title         = {{Monte Carlo} Techniques for Addressing Large Errors and Missing Data in Simulation-based Inference},
  year          = {2022},
  month         = nov,
  eprint        = {2211.03747v1},
  archiveprefix = {arXiv},
  primaryclass  = {astro-ph.IM},
  url           = {https://arxiv.org/abs/2211.03747v1},
  file          = {2211.03747v1.pdf},
  abstract      = {Upcoming astronomical surveys will observe billions of galaxies across cosmic
time, providing a unique opportunity to map the many pathways of galaxy
assembly to an incredibly high resolution. However, the huge amount of data
also poses an immediate computational challenge: current tools for inferring
parameters from the light of galaxies take $\gtrsim 10$ hours per fit. This is
prohibitively expensive. Simulation-based Inference (SBI) is a promising
solution. However, it requires simulated data with identical characteristics to
the observed data, whereas real astronomical surveys are often highly
heterogeneous, with missing observations and variable uncertainties determined
by sky and telescope conditions. Here we present a Monte Carlo technique for
treating out-of-distribution measurement errors and missing data using standard
SBI tools. We show that out-of-distribution measurement errors can be
approximated by using standard SBI evaluations, and that missing data can be
marginalized over using SBI evaluations over nearby data realizations in the
training set. While these techniques slow the inference process from $\sim 1$
sec to $\sim 1.5$ min per object, this is still significantly faster than
standard approaches while also dramatically expanding the applicability of SBI.
This expanded regime has broad implications for future applications to
astronomical surveys.},
}