@misc{10876e3b8a3e4865ab460749b27b3e6f,
title = "Surrogate Model Based Optimization for Finding Robust Deep Learning Model Architectures",
abstract = "Deep Learning (DL) models are increasingly used throughout the sciences. However, their performance and usefulness depend greatly on their architecture which is defined by hyperparameters such as the number of nodes, layers, the learning rate, etc. Tuning these hyperparameters is time-consuming because evaluating their performance requires a lengthy training step. Stochastic optimizers used in training lead to performance variability and potentially prediction reliability issues. In this talk, we will describe an automated optimization method based on surrogate models and active learning strategies for tuning DL model architectures. We take into account the prediction variability with the goal to identify architectures that make reliable and robust predictions. We demonstrate our developments on an application arising in particle physics.",
keywords = "deep learning, high energy physics, hyperparameter optimization, surrogate modeling",
author = "Juliane Mueller and Vincent Dumont and Xiangyang Ju",
year = "2022",
language = "American English",
series = "Presented at the 2022 INFORMS Annual Meeting, 16-19 October 2022, Indianapolis, Indiana",
type = "Other",
}