@inbook{b085c27972834f4fa2a0b1e65a55be38,
title = "On the biological plausibility of orthogonal initialisation for solving gradient instability in deep neural networks",
abstract = "Initialising the synaptic weights of artificial neural networks (ANNs) with orthogonal matrices is known to alleviate vanishing and exploding gradient problems. A major objection against such initialisation schemes is that they are deemed biologically implausible as they mandate factorization techniques that are difficult to attribute to a neurobiological process. This paper presents two initialisation schemes that allow a network to naturally evolve its weights to form orthogonal matrices, provides theoretical analysis that pre-training orthogonalisation always converges, and empirically confirms that the proposed schemes outperform randomly initialised recurrent and feedforward networks. ",
keywords = "cs.NE, cs.AI, cs.LG",
author = "Nikolay Manchev and Michael Spratling",
note = "9 pages, 3 figures, to be published in ISCMI2022 conference proceedings",
year = "2023",
month = mar,
day = "21",
doi = "10.1109/ISCMI56532.2022.10068489",
language = "English",
series = "2022 9th International Conference on Soft Computing and Machine Intelligence, ISCMI 2022",
publisher = "IEEE",
pages = "47--55",
booktitle = "2022 9th International Conference on Soft Computing and Machine Intelligence, ISCMI 2022",
}