summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorJaron Kent-Dobias <jaron@kent-dobias.com>2025-03-11 14:19:52 -0300
committerJaron Kent-Dobias <jaron@kent-dobias.com>2025-03-11 14:19:52 -0300
commit596e488214dcaaea47fa42149067fb50604ae988 (patch)
tree3e0e2be85166bef1885281af4e89e584033f038e
parent65cf33acfe0594e95f75c2840a9a020e5a4324f1 (diff)
downloadSciPostPhys_18_158-596e488214dcaaea47fa42149067fb50604ae988.tar.gz
SciPostPhys_18_158-596e488214dcaaea47fa42149067fb50604ae988.tar.bz2
SciPostPhys_18_158-596e488214dcaaea47fa42149067fb50604ae988.zip
Many small wording tweaks
-rw-r--r--topology.bib92
-rw-r--r--topology.tex36
2 files changed, 84 insertions, 44 deletions
diff --git a/topology.bib b/topology.bib
index bf5b2e8..70d053d 100644
--- a/topology.bib
+++ b/topology.bib
@@ -8,7 +8,7 @@
number = {1},
volume = {99},
pages = {010401},
- url = {http://dx.doi.org/10.1103/PhysRevE.99.010401},
+ url = {https://dx.doi.org/10.1103/PhysRevE.99.010401},
doi = {10.1103/physreve.99.010401},
issn = {2470-0053}
}
@@ -23,7 +23,7 @@
number = {22},
volume = {131},
pages = {227301},
- url = {http://dx.doi.org/10.1103/PhysRevLett.131.227301},
+ url = {https://dx.doi.org/10.1103/PhysRevLett.131.227301},
doi = {10.1103/physrevlett.131.227301},
issn = {1079-7114}
}
@@ -86,7 +86,7 @@
title = {The Spherical $p+s$ Spin Glass At Zero Temperature},
year = {2022},
month = {9},
- url = {http://arxiv.org/abs/2209.03866},
+ url = {https://arxiv.org/abs/2209.03866},
note = {arXiv preprint},
date = {2022-09-08T15:08:26Z},
eprint = {2209.03866},
@@ -104,7 +104,7 @@
number = {48},
volume = {113},
pages = {E7655--E7662},
- url = {http://dx.doi.org/10.1073/pnas.1608103113},
+ url = {https://dx.doi.org/10.1073/pnas.1608103113},
doi = {10.1073/pnas.1608103113},
issn = {1091-6490}
}
@@ -133,7 +133,7 @@
number = {2},
volume = {108},
pages = {024310},
- url = {http://dx.doi.org/10.1103/PhysRevE.108.024310},
+ url = {https://dx.doi.org/10.1103/PhysRevE.108.024310},
doi = {10.1103/physreve.108.024310},
issn = {2470-0053}
}
@@ -157,7 +157,7 @@
title = {On the Trajectories of {SGD} Without Replacement},
year = {2023},
month = {dec},
- url = {http://arxiv.org/abs/2312.16143},
+ url = {https://arxiv.org/abs/2312.16143},
note = {arXiv preprint},
archiveprefix = {arXiv},
eprint = {2312.16143},
@@ -271,7 +271,7 @@
number = {8},
volume = {2024},
pages = {083302},
- url = {http://dx.doi.org/10.1088/1742-5468/ad685a},
+ url = {https://dx.doi.org/10.1088/1742-5468/ad685a},
doi = {10.1088/1742-5468/ad685a},
issn = {1742-5468}
}
@@ -329,7 +329,7 @@
number = {14},
volume = {49},
pages = {145001},
- url = {http://dx.doi.org/10.1088/1751-8113/49/14/145001},
+ url = {https://dx.doi.org/10.1088/1751-8113/49/14/145001},
doi = {10.1088/1751-8113/49/14/145001},
issn = {1751-8121}
}
@@ -344,7 +344,7 @@
number = {3},
volume = {2},
pages = {019},
- url = {http://dx.doi.org/10.21468/SciPostPhys.2.3.019},
+ url = {https://dx.doi.org/10.21468/SciPostPhys.2.3.019},
doi = {10.21468/scipostphys.2.3.019},
issn = {2542-4653}
}
@@ -359,7 +359,7 @@
number = {11},
volume = {123},
pages = {115702},
- url = {http://dx.doi.org/10.1103/PhysRevLett.123.115702},
+ url = {https://dx.doi.org/10.1103/PhysRevLett.123.115702},
doi = {10.1103/physrevlett.123.115702},
issn = {1079-7114}
}
@@ -401,7 +401,7 @@
number = {7},
volume = {51},
pages = {1663},
- url = {http://dx.doi.org/10.5506/APhysPolB.51.1663},
+ url = {https://dx.doi.org/10.5506/APhysPolB.51.1663},
doi = {10.5506/aphyspolb.51.1663},
issn = {1509-5770}
}
@@ -416,7 +416,7 @@
number = {24},
volume = {55},
pages = {244008},
- url = {http://dx.doi.org/10.1088/1751-8121/ac6d8e},
+ url = {https://dx.doi.org/10.1088/1751-8121/ac6d8e},
doi = {10.1088/1751-8121/ac6d8e},
issn = {1751-8121}
}
@@ -454,7 +454,7 @@
number = {5},
volume = {15},
pages = {219},
- url = {http://dx.doi.org/10.21468/SciPostPhys.15.5.219},
+ url = {https://dx.doi.org/10.21468/SciPostPhys.15.5.219},
doi = {10.21468/scipostphys.15.5.219},
issn = {2542-4653}
}
@@ -464,7 +464,7 @@
title = {Stochastic Gradient Descent outperforms Gradient Descent in recovering a high-dimensional signal in a glassy energy landscape},
year = {2023},
month = {sep},
- url = {http://arxiv.org/abs/2309.04788},
+ url = {https://arxiv.org/abs/2309.04788},
note = {arXiv preprint},
archiveprefix = {arXiv},
eprint = {2309.04788},
@@ -521,7 +521,7 @@
number = {1},
volume = {16},
pages = {001},
- url = {http://dx.doi.org/10.21468/SciPostPhys.16.1.001},
+ url = {https://dx.doi.org/10.21468/SciPostPhys.16.1.001},
doi = {10.21468/scipostphys.16.1.001},
issn = {2542-4653}
}
@@ -536,7 +536,7 @@
number = {6},
volume = {110},
pages = {064148},
- url = {http://dx.doi.org/10.1103/PhysRevE.110.064148},
+ url = {https://dx.doi.org/10.1103/PhysRevE.110.064148},
doi = {10.1103/physreve.110.064148},
issn = {2470-0053}
}
@@ -551,7 +551,7 @@
number = {1–2},
volume = {103},
pages = {107--113},
- url = {http://dx.doi.org/10.1016/j.jphysparis.2009.05.013},
+ url = {https://dx.doi.org/10.1016/j.jphysparis.2009.05.013},
doi = {10.1016/j.jphysparis.2009.05.013},
issn = {0928-4257}
}
@@ -561,7 +561,7 @@
title = {Solving overparametrized systems of random equations: I. Model and algorithms for approximate solutions},
year = {2023},
month = {jun},
- url = {http://arxiv.org/abs/2306.13326},
+ url = {https://arxiv.org/abs/2306.13326},
note = {arXiv preprint},
archiveprefix = {arXiv},
eprint = {2306.13326},
@@ -574,7 +574,7 @@
title = {On {Smale}'s 17th problem over the reals},
year = {2024},
month = {may},
- url = {http://arxiv.org/abs/2405.01735},
+ url = {https://arxiv.org/abs/2405.01735},
note = {arXiv preprint},
archiveprefix = {arXiv},
eprint = {2405.01735},
@@ -629,7 +629,7 @@
number = {11},
volume = {56},
pages = {115003},
- url = {http://dx.doi.org/10.1088/1751-8121/acb742},
+ url = {https://dx.doi.org/10.1088/1751-8121/acb742},
doi = {10.1088/1751-8121/acb742},
issn = {1751-8121}
}
@@ -644,7 +644,7 @@
number = {8},
volume = {2024},
pages = {083301},
- url = {http://dx.doi.org/10.1088/1742-5468/ad0635},
+ url = {https://dx.doi.org/10.1088/1742-5468/ad0635},
doi = {10.1088/1742-5468/ad0635},
issn = {1742-5468}
}
@@ -654,7 +654,7 @@
title = {Statistical physics of complex systems: glasses, spin glasses, continuous constraint satisfaction problems, high-dimensional inference and neural networks},
year = {2024},
month = {may},
- url = {http://arxiv.org/abs/2405.06384},
+ url = {https://arxiv.org/abs/2405.06384},
note = {arXiv preprint},
archiveprefix = {arXiv},
eprint = {2405.06384},
@@ -667,7 +667,7 @@
title = {Random Linear Systems with Quadratic Constraints: from Random Matrix Theory to replicas and back},
year = {2024},
month = {jan},
- url = {http://arxiv.org/abs/2401.03209},
+ url = {https://arxiv.org/abs/2401.03209},
note = {arXiv preprint},
archiveprefix = {arXiv},
eprint = {2401.03209},
@@ -699,7 +699,51 @@
abstract = {In this work we analyse quantitatively the interplay between the loss landscape and performance of descent algorithms in a prototypical inference problem, the spiked matrix-tensor model. We study a loss function that is the negative log-likelihood of the model. We analyse the number of local minima at a fixed distance from the signal/spike with the Kac-Rice formula, and locate trivialization of the landscape at large signal-to-noise ratios. We evaluate analytically the performance of a gradient flow algorithm using integro-differential PDEs as developed in physics of disordered systems for the Langevin dynamics. We analyze the performance of an approximate message passing algorithm estimating the maximum likelihood configuration via its state evolution. We conclude by comparing the above results: while we observe a drastic slow down of the gradient flow dynamics even in the region where the landscape is trivial, both the analyzed algorithms are shown to perform well even in the part of the region of parameters where spurious local minima are present.},
booktitle = {Proceedings of the 36th International Conference on Machine Learning},
editor = {Chaudhuri, Kamalika and Salakhutdinov, Ruslan},
- pdf = {http://proceedings.mlr.press/v97/mannelli19a/mannelli19a.pdf},
+ pdf = {https://proceedings.mlr.press/v97/mannelli19a/mannelli19a.pdf},
series = {Proceedings of Machine Learning Research}
}
+@unpublished{ElAlaoui_2020_Algorithmic,
+ author = {El Alaoui, Ahmed and Montanari, Andrea},
+ title = {Algorithmic Thresholds in Mean Field Spin Glasses},
+ year = {2020},
+ month = {Sept},
+ url = {https://arxiv.org/abs/2009.11481},
+ archiveprefix = {arXiv},
+ date = {2020-09-24T04:22:42Z},
+ eprint = {2009.11481},
+ eprintclass = {cond-mat.stat-mech},
+ eprinttype = {arxiv},
+ note = {ArXiv preprint},
+ primaryclass = {cond-mat.stat-mech}
+}
+
+@article{ElAlaoui_2021_Optimization,
+ author = {El Alaoui, Ahmed and Montanari, Andrea and Sellke, Mark},
+ title = {Optimization of mean-field spin glasses},
+ journal = {The Annals of Probability},
+ publisher = {Institute of Mathematical Statistics},
+ year = {2021},
+ month = {11},
+ number = {6},
+ volume = {49},
+ pages = {2922--2960},
+ url = {https://doi.org/10.1214%2F21-aop1519},
+ doi = {10.1214/21-aop1519}
+}
+
+@article{Gamarnik_2021-10_The,
+ author = {Gamarnik, David},
+ title = {The overlap gap property: A topological barrier to optimizing over random structures},
+ journal = {Proceedings of the National Academy of Sciences},
+ publisher = {Proceedings of the National Academy of Sciences},
+ year = {2021},
+ month = {October},
+ number = {41},
+ volume = {118},
+ pages = {e2108492118},
+ url = {https://dx.doi.org/10.1073/pnas.2108492118},
+ doi = {10.1073/pnas.2108492118},
+ issn = {1091-6490}
+}
+
diff --git a/topology.tex b/topology.tex
index cb95e01..6fb6bce 100644
--- a/topology.tex
+++ b/topology.tex
@@ -676,7 +676,7 @@ When $M=1$ the solution manifold corresponds to the energy
level set of a spherical spin glass with energy density $E=V_0/\sqrt N$. All the
results from the previous sections follow, and can be translated to the spin
glasses by taking the limit $\alpha\to0$ while keeping $E=V_0\alpha^{1/2}$ fixed.\footnote{
- It is plausible that the limits of $N\to\infty$ implicit in the saddle point expansion and the limit of $\alpha\to0$ taken here do not commute, and that $M=1$ should be taken from the beginning of the calculation. However, in this case the two procedures do commute. The $\alpha\to0$ limit accomplishes only the elimination of the first term from the effective action \eqref{eq:S.m}, while following Appendix~\ref{sec:euler} with $M=1$ from the outset results in the same term not appearing in the effective action because it is of subleading order in $N$.
+ It is plausible that the limit of $N\to\infty$ implicit in the saddle point expansion and the limit of $\alpha\to0$ taken here do not commute, and that $M=1$ should be set from the beginning of the calculation. However, in this case the two procedures do commute. The $\alpha\to0$ limit accomplishes only the elimination of the first term from the effective action \eqref{eq:S.m}, while following Appendix~\ref{sec:euler} with $M=1$ from the outset results in the same term not appearing in the effective action because it is of subleading order in $N$.
} With a little algebra this procedure yields
\begin{align}
E_\text{on}=\pm\sqrt{2f(1)}
@@ -776,37 +776,33 @@ descent from a uniformly random initial condition, but other algorithms find
minima at other energies. Optimal message passing algorithms were shown to find
configurations at an energy level where another topological property---the
overlap gap property---transitions, and this energy level is believed to bound from below
-all polynomial-time algorithms. On the other hand, physically inspired
+all polynomial-time algorithms \cite{ElAlaoui_2020_Algorithmic, ElAlaoui_2021_Optimization, Gamarnik_2021-10_The}. On the other hand, physically inspired
modifications of gradient descent---notably, drawing the initial condition from
a nonuniform distribution like the Boltzmann distribution with a finite
-temperature---can find energy configurations with energies lower than those
-found with gradient descent from a uniform initial condition. If the
+temperature---find energy configurations with energies lower than those
+found with gradient descent from a uniform initial condition \cite{Folena_2020_Rethinking, Folena_2021_Gradient}. If the
topological transition described in this paper does predict the asymptotic
performance of gradient descent from a uniform initial condition, then it
provides a topological bound from above for the performance of reasonable
-algorithms that terminate in minima. Whether the performance of gradient
+algorithms that terminate in minima. It is unknown whether the performance of gradient
descent from better initial conditions, or of other algorithms like simulated
-annealing, can be predicted with a similar method is not known.
+annealing, can be predicted with a topological property.
Finally, a common extension of the spherical spin glasses is to add a
deterministic piece to the energy, sometimes called a signal or a spike. Recent
-work argued that gradient descent can avoid being trapped in marginal minima
-and reach the vicinity of the signal if the set of trapping marginal minima has
+work argued that gradient descent can avoid being trapped by the minima that typically trap dynamics
+and reach the vicinity of the signal if the set of typically trapping minima has
been destabilized by the presence of the signal \cite{SaraoMannelli_2019_Passed,
SaraoMannelli_2019_Who}. The authors of Ref.~\cite{SaraoMannelli_2019_Who}
conjecture based on \textsc{dmft} data for $2+3$ mixed spherical spin glasses that the
-trapping marginal minima are those at the traditional threshold energy
-$E_\text{th}$. However, Ref.~\cite{Folena_2023_On} demonstrated that in mixed
-$p+s$ spherical spin glasses with small $p$ and $s$, the difference between
-$E_\text{th}$ and the true trapping energy is difficult to resolve with the
-current precision of \textsc{dmft} integration schemes. Therefore,
-the authors of Ref.~\cite{SaraoMannelli_2019_Who} may have incorrectly conflated the
-threshold with the trapping marginal minima, and that the correct set of
-marginal minima that must be destabilized to reach a signal might be the same set
-that trap dynamics in the signal-free model. This paper conjectures that the important trapping minima
-are those at the shattering energy. Comparing the predictions of
+typically trapping minima are those at the threshold energy
+$E_\text{th}$. However, as discussed above, Ref.~\cite{Folena_2023_On} demonstrated that in signal-free mixed
+$p+s$ spherical spin glasses $E_\text{th}$ is not the energy of typical trapping minima, and furthermore that, when $p$ and $s$ are small, the difference between
+$E_\text{th}$ and the energy of the actual trapping minima is difficult to resolve with the
+current precision of \textsc{dmft} integration schemes. Therefore, it is plausible that the picture described in Ref.~\cite{SaraoMannelli_2019_Who} is correct except that the set of minima that must be destabilised to reach the signal is that at the typical trapping energy of the isotropic problem and not the threshold energy $E_\text{th}$. If the conjecture made in this paper is true, then this typical trapping energy is the shattering energy $E_\text{sh}$.
+Comparing the predictions of
Ref.~\cite{SaraoMannelli_2019_Who} to \textsc{dmft} simulations of a model with
-better separation between $p$ and $s$ would help resolve this issue.
+better separation between $p$ and $s$ would help resolve this question.
\section{Conclusion}
\label{sec:conclusion}
@@ -1155,7 +1151,7 @@ $\frac12\log\det(\mathbb Q-\mathbb M\mathbb M^T)$ in the effective action from
=1
\end{equation}
where the final superdeterminant is identically 1 for any superoperator $\tilde{\mathbb Q}$, not just its saddle-point value.\footnote{
- The subscript notation in \eqref{eq:supermatrix.saddle} indicates which superindices of the four-index superoperator associated with the Hessian belong to the domain and codomain, analogous to writing $\det A=\det_{ij}A_{ij}$ for a two-index complex-valued matrix. In this case, the domain is indexed by $\{3,4\}$ and the codomain is indexed by $\{1,2\}$.
+ The subscript notation in \eqref{eq:supermatrix.saddle} indicates which superindices of the four-index superoperator associated with the Hessian belong to the domain and codomain, analogous to writing $\det A=\det_{ij}A_{ij}$ for a two-index complex-valued operator. In this case, the domain is indexed by $\{3,4\}$ and the codomain is indexed by $\{1,2\}$.
}
The Hubbard--Stratonovich transformation therefore contributes a factor of
\begin{equation}