@inproceedings{2244d288b12341248b425698e783ef4d,
title = "Shrink-Perturb Improves Architecture Mixing During Population Based Training for Neural Architecture Search",
abstract = "In this work, we show that simultaneously training and mixing neural networks is a promising way to conduct Neural Architecture Search (NAS). For hyperparameter optimization, reusing the partially trained weights allows for efficient search, as was previously demonstrated by the Population Based Training (PBT) algorithm. We propose PBT-NAS, an adaptation of PBT to NAS where architectures are improved during training by replacing poorly-performing networks in a population with the result of mixing well-performing ones and inheriting the weights using the shrink-perturb technique. After PBT-NAS terminates, the created networks can be directly used without retraining. PBT-NAS is highly parallelizable and effective: on challenging tasks (image generation and reinforcement learning) PBT-NAS achieves superior performance compared to baselines (random search and mutation-based PBT).",
author = "Alexander Chebykin and Arkadiy Dushatskiy and Tanja Alderliesten and Peter Bosman",
year = "2023",
doi = "10.3233/FAIA230294",
language = "English",
series = "Frontiers in Artificial Intelligence and Applications",
publisher = "IOS Press",
pages = "381--388",
editor = "Kobi Gal and Kobi Gal and Ann Nowe and Nalepa, {Grzegorz J.} and Roy Fairstein and Roxana Radulescu",
booktitle = "ECAI 2023 - 26th European Conference on Artificial Intelligence, including 12th Conference on Prestigious Applications of Intelligent Systems, PAIS 2023 - Proceedings",
address = "Netherlands",
note = "26th European Conference on Artificial Intelligence, ECAI 2023 ; Conference date: 30-09-2023 Through 04-10-2023",
}