diff options
Diffstat (limited to 'topology.bib')
-rw-r--r-- | topology.bib | 28 |
1 files changed, 28 insertions, 0 deletions
diff --git a/topology.bib b/topology.bib
index bb46305..5fc6836 100644
--- a/topology.bib
+++ b/topology.bib
@@ -675,3 +675,31 @@
 eprinttype = {arxiv}
 }
+@inproceedings{Mannelli_2019_Who,
+  author    = {Sarao Mannelli, Stefano and Biroli, Giulio and Cammarota, Chiara and Krzakala, Florent and Zdeborová, Lenka},
+  title     = {Who is Afraid of Big Bad Minima? Analysis of gradient-flow in spiked matrix-tensor models},
+  publisher = {Curran Associates, Inc.},
+  year      = {2019},
+  volume    = {32},
+  pages     = {},
+  url       = {https://proceedings.neurips.cc/paper_files/paper/2019/file/fbad540b2f3b5638a9be9aa6a4d8e450-Paper.pdf},
+  booktitle = {Advances in Neural Information Processing Systems},
+  editor    = {Wallach, H. and Larochelle, H. and Beygelzimer, A. and d'Alché-Buc, F. and Fox, E. and Garnett, R.}
+}
+
+@inproceedings{Mannelli_2019_Passed,
+  author    = {Sarao Mannelli, Stefano and Krzakala, Florent and Urbani, Pierfrancesco and Zdeborová, Lenka},
+  title     = {Passed \& Spurious: Descent Algorithms and Local Minima in Spiked Matrix-Tensor Models},
+  publisher = {PMLR},
+  year      = {2019},
+  month     = jun,
+  volume    = {97},
+  pages     = {4333--4342},
+  url       = {https://proceedings.mlr.press/v97/mannelli19a.html},
+  abstract  = {In this work we analyse quantitatively the interplay between the loss landscape and performance of descent algorithms in a prototypical inference problem, the spiked matrix-tensor model. We study a loss function that is the negative log-likelihood of the model. We analyse the number of local minima at a fixed distance from the signal/spike with the Kac-Rice formula, and locate trivialization of the landscape at large signal-to-noise ratios. We evaluate analytically the performance of a gradient flow algorithm using integro-differential PDEs as developed in physics of disordered systems for the Langevin dynamics. We analyze the performance of an approximate message passing algorithm estimating the maximum likelihood configuration via its state evolution. We conclude by comparing the above results: while we observe a drastic slow down of the gradient flow dynamics even in the region where the landscape is trivial, both the analyzed algorithms are shown to perform well even in the part of the region of parameters where spurious local minima are present.},
+  booktitle = {Proceedings of the 36th International Conference on Machine Learning},
+  editor    = {Chaudhuri, Kamalika and Salakhutdinov, Ruslan},
+  pdf       = {http://proceedings.mlr.press/v97/mannelli19a/mannelli19a.pdf},
+  series    = {Proceedings of Machine Learning Research}
+}
+