summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--figs/phases_34.pdfbin37589 -> 37679 bytes
-rw-r--r--when_annealed.bib140
-rw-r--r--when_annealed.tex288
3 files changed, 298 insertions, 130 deletions
diff --git a/figs/phases_34.pdf b/figs/phases_34.pdf
index ee6afae..ad8deb9 100644
--- a/figs/phases_34.pdf
+++ b/figs/phases_34.pdf
Binary files differ
diff --git a/when_annealed.bib b/when_annealed.bib
index d13ddf8..42c2e31 100644
--- a/when_annealed.bib
+++ b/when_annealed.bib
@@ -1,3 +1,17 @@
+@article{Altieri_2021_Properties,
+ author = {Altieri, Ada and Roy, Felix and Cammarota, Chiara and Biroli, Giulio},
+ title = {Properties of Equilibria and Glassy Phases of the Random {Lotka}-{Volterra} Model with Demographic Noise},
+ journal = {Physical Review Letters},
+ publisher = {American Physical Society (APS)},
+ year = {2021},
+ month = {6},
+ number = {25},
+ volume = {126},
+ pages = {258301},
+ url = {https://doi.org/10.1103%2Fphysrevlett.126.258301},
+ doi = {10.1103/physrevlett.126.258301}
+}
+
@article{Auffinger_2022_The,
author = {Auffinger, Antonio and Zhou, Yuxin},
title = {The Spherical {$p+s$} Spin Glass At Zero Temperature},
@@ -24,6 +38,48 @@
doi = {10.1002/cpa.21875}
}
+@article{Bray_2007_Statistics,
+ author = {Bray, Alan J. and Dean, David S.},
+ title = {Statistics of Critical Points of {Gaussian} Fields on Large-Dimensional Spaces},
+ journal = {Physical Review Letters},
+ publisher = {American Physical Society (APS)},
+ year = {2007},
+ month = {4},
+ number = {15},
+ volume = {98},
+ pages = {150201},
+ url = {https://doi.org/10.1103%2Fphysrevlett.98.150201},
+ doi = {10.1103/physrevlett.98.150201}
+}
+
+@article{Cavagna_1998_Stationary,
+ author = {Cavagna, Andrea and Giardina, Irene and Parisi, Giorgio},
+ title = {Stationary points of the {Thouless}-{Anderson}-{Palmer} free energy},
+ journal = {Physical Review B},
+ publisher = {American Physical Society (APS)},
+ year = {1998},
+ month = {5},
+ number = {18},
+ volume = {57},
+ pages = {11251--11257},
+ url = {https://doi.org/10.1103%2Fphysrevb.57.11251},
+ doi = {10.1103/physrevb.57.11251}
+}
+
+@article{Crisanti_1992_The,
+ author = {Crisanti, A. and Sommers, H.-J.},
+ title = {The spherical $p$-spin interaction spin glass model: the statics},
+ journal = {Zeitschrift für Physik B Condensed Matter},
+ publisher = {Springer Science and Business Media LLC},
+ year = {1992},
+ month = {10},
+ number = {3},
+ volume = {87},
+ pages = {341--354},
+ url = {https://doi.org/10.1007%2Fbf01309287},
+ doi = {10.1007/bf01309287}
+}
+
@article{Crisanti_2004_Spherical,
author = {Crisanti, A. and Leuzzi, L.},
title = {Spherical $2+p$ Spin-Glass Model: An Exactly Solvable Model for Glass to Spin-Glass Transition},
@@ -95,6 +151,20 @@
numpages = {26}
}
+@article{Folena_2021_Gradient,
+ author = {Folena, Giampaolo and Franz, Silvio and Ricci-Tersenghi, Federico},
+ title = {Gradient descent dynamics in the mixed $p$-spin spherical model: finite-size simulations and comparison with mean-field integration},
+ journal = {Journal of Statistical Mechanics: Theory and Experiment},
+ publisher = {IOP Publishing},
+ year = {2021},
+ month = {3},
+ number = {3},
+ volume = {2021},
+ pages = {033302},
+ url = {https://doi.org/10.1088%2F1742-5468%2Fabe29f},
+ doi = {10.1088/1742-5468/abe29f}
+}
+
@article{Folena_2023_On,
author = {Folena, Giampaolo and Zamponi, Francesco},
title = {On weak ergodicity breaking in mean-field spin glasses},
@@ -121,6 +191,20 @@
doi = {10.1103/physrevlett.92.240601}
}
+@article{Fyodorov_2007_Density,
+ author = {Fyodorov, Y. V. and Sommers, H.-J. and Williams, I.},
+ title = {Density of stationary points in a high dimensional random energy landscape and the onset of glassy behavior},
+ journal = {JETP Letters},
+ publisher = {Pleiades Publishing Ltd},
+ year = {2007},
+ month = {5},
+ number = {5},
+ volume = {85},
+ pages = {261--266},
+ url = {https://doi.org/10.1134%2Fs0021364007050098},
+ doi = {10.1134/s0021364007050098}
+}
+
@article{Fyodorov_2012_Critical,
author = {Fyodorov, Yan V. and Nadal, Celine},
title = {Critical Behavior of the Number of Minima of a Random Landscape at the Glass Transition Point and the Tracy-Widom Distribution},
@@ -149,6 +233,20 @@
doi = {10.1103/physrevlett.130.237103}
}
+@article{Kent-Dobias_2021_Complex,
+ author = {Kent-Dobias, Jaron and Kurchan, Jorge},
+ title = {Complex complex landscapes},
+ journal = {Physical Review Research},
+ publisher = {American Physical Society (APS)},
+ year = {2021},
+ month = {4},
+ number = {2},
+ volume = {3},
+ pages = {023064},
+ url = {https://doi.org/10.1103%2Fphysrevresearch.3.023064},
+ doi = {10.1103/physrevresearch.3.023064}
+}
+
@article{Kent-Dobias_2023_How,
author = {Kent-Dobias, Jaron and Kurchan, Jorge},
title = {How to count in hierarchical landscapes: a full solution to mean-field complexity},
@@ -163,6 +261,20 @@
doi = {10.1103/PhysRevE.107.064111}
}
+@article{Krzakala_2007_Landscape,
+ author = {Krzakala, Florent and Kurchan, Jorge},
+ title = {Landscape analysis of constraint satisfaction problems},
+ journal = {Physical Review E},
+ publisher = {American Physical Society (APS)},
+ year = {2007},
+ month = {8},
+ number = {2},
+ volume = {76},
+ pages = {021122},
+ url = {https://doi.org/10.1103%2Fphysreve.76.021122},
+ doi = {10.1103/physreve.76.021122}
+}
+
@article{Muller_2006_Marginal,
author = {Müller, Markus and Leuzzi, Luca and Crisanti, Andrea},
title = {Marginal states in mean-field glasses},
@@ -230,6 +342,20 @@ interactions: the typical number of equilibria},
eprinttype = {arxiv}
}
+@article{Stein_1995_Broken,
+ author = {Stein, D. L. and Newman, C. M.},
+ title = {Broken ergodicity and the geometry of rugged landscapes},
+ journal = {Physical Review E},
+ publisher = {American Physical Society (APS)},
+ year = {1995},
+ month = {6},
+ number = {6},
+ volume = {51},
+ pages = {5228--5238},
+ url = {https://doi.org/10.1103%2Fphysreve.51.5228},
+ doi = {10.1103/physreve.51.5228}
+}
+
@article{Wainrib_2013_Topological,
author = {Wainrib, Gilles and Touboul, Jonathan},
title = {Topological and Dynamical Complexity of Random Neural Networks},
@@ -244,3 +370,17 @@ interactions: the typical number of equilibria},
doi = {10.1103/physrevlett.110.118101}
}
+@article{Yang_2023_Stochastic,
+ author = {Yang, Ning and Tang, Chao and Tu, Yuhai},
+ title = {Stochastic Gradient Descent Introduces an Effective Landscape-Dependent Regularization Favoring Flat Solutions},
+ journal = {Physical Review Letters},
+ publisher = {American Physical Society (APS)},
+ year = {2023},
+ month = {6},
+ number = {23},
+ volume = {130},
+ pages = {237101},
+ url = {https://doi.org/10.1103%2Fphysrevlett.130.237101},
+ doi = {10.1103/physrevlett.130.237101}
+}
+
diff --git a/when_annealed.tex b/when_annealed.tex
index 6e63ded..2d50dd2 100644
--- a/when_annealed.tex
+++ b/when_annealed.tex
@@ -36,32 +36,33 @@
A common measure of a function's complexity is the count of its stationary
points. For complicated functions, this count grows exponentially with the
volume and dimension of their domain. In practice, the count is averaged over
- a class of such functions (the annealed average), but the large numbers
- involved can result in averages biased by extremely rare samples. Typical
+ a class of functions (the annealed average), but the large numbers
+ involved can produce averages biased by extremely rare samples. Typical
counts are reliably found by taking the average of the logarithm (the
quenched average), which is more difficult and not often done in practice.
When most stationary points are uncorrelated with each other, quenched and
- anneals averages are equal. There are heuristics from equilibrium
- calculations that guarantee when most of the lowest minima will be
- uncorrelated. Here, we show that these equilibrium heuristics cannot be used
- to draw conclusions about other minima and saddles. We produce examples among
- Gaussian-correlated functions on the hypersphere where the count of certain
- saddles and minima has different quenched and annealed averages, despite
- being guaranteed `safe' in the equilibrium setting. We determine conditions
- for the emergence of nontrivial correlations between saddles, and discuss the
- implications for the geometry of those functions and what out-of-equilibrium
- settings might be affected.
+ annealed averages are equal. Equilibrium heuristics can guarantee when most of
+ the lowest minima will be uncorrelated. We show that these equilibrium
+ heuristics cannot be used to draw conclusions about other minima and saddles
+ by producing examples among Gaussian-correlated functions on the hypersphere
+ where the count of certain saddles and minima has different quenched and
+ annealed averages, despite being guaranteed `safe' in the equilibrium
+ setting. We determine conditions for the emergence of nontrivial correlations
+ between saddles, and discuss the implications for the geometry of those
+ functions and what out-of-equilibrium settings might be affected.
\end{abstract}
-Random high-dimensional energies, cost functions, and interaction networks are important in many fields. The energy landscape of glasses, the likelihood
-landscape of machine learning and inference, and the
-interactions between organisms in an ecosystem are just a few examples. A
-traditional tool for making sense of their behavior is to analyze the
-statistics of points where their dynamics are stationary. For energy or cost
-landscapes, these correspond to the minima, maxima, and saddles, while for
-ecosystems and other non-gradient dynamical systems these correspond to
-equilibria of the dynamics. When many stationary points are present, the system
-is considered complex.
+Random high-dimensional energies, cost functions, and interaction networks are
+important in many fields. The energy landscape of glasses, the likelihood
+landscape of machine learning and inference, and the interactions between
+organisms in an ecosystem are just a few examples \cite{Stein_1995_Broken, Krzakala_2007_Landscape, Altieri_2021_Properties, Yang_2023_Stochastic}. A traditional tool for
+making sense of their behavior is to analyze the statistics of points where
+their dynamics are stationary \cite{Cavagna_1998_Stationary,
+Fyodorov_2004_Complexity, Fyodorov_2007_Density, Bray_2007_Statistics}. For
+energy or cost landscapes, these correspond to the minima, maxima, and saddles,
+while for ecosystems and other non-gradient dynamical systems these correspond
+to equilibria of the dynamics. When many stationary points are present, the
+system is considered complex.
Despite the importance of stationary point statistics for understanding complex
behavior, they are often calculated using an uncontrolled approximation.
@@ -69,59 +70,62 @@ Because their number is so large, it cannot be reliably averaged. The annealed
approximation takes this average anyway, risking a systematic bias by rare and
atypical samples. The annealed approximation is known to be exact for certain
models and in certain circumstances, but it is used outside those circumstances
-without much reflection \cite{Wainrib_2013_Topological, Gershenzon_2023_On-Site}. In a few cases researches have made instead the
+without much reflection \cite{Wainrib_2013_Topological, Kent-Dobias_2021_Complex,
+Gershenzon_2023_On-Site}. In a few cases researchers have instead made the
better-controlled quenched average, which averages the logarithm of the number
of stationary points, and found deviations from the annealed approximation with
-important implications for the system's behavior \cite{Muller_2006_Marginal, Ros_2019_Complexity,
-Kent-Dobias_2023_How, Ros_2023_Quenched}. Generically, the annealed
-approximation to the complexity is wrong when a nonvanishing fraction of pairs
-of stationary points have nontrivial correlations in their mutual position.
+important implications for the behavior \cite{Muller_2006_Marginal,
+Ros_2019_Complex, Kent-Dobias_2023_How, Ros_2023_Quenched}. Generically,
+the annealed approximation to the complexity is wrong when a nonvanishing
+fraction of pairs of stationary points have nontrivial correlations in their
+mutual position.
A heuristic line of reasoning for the appropriateness of the annealed
approximation is sometimes made when the approximation is correct for an
equilibrium calculation on the same system. The argument goes like this: since
-the limit of zero temperature or noise in an equilibrium calculation
-concentrates the measure onto the lowest set of minima, the equilibrium free
-energy in the limit to zero temperature should be governed by the same
-statistics as the count of that lowest set of minima. This argument is valid,
-but only for the lowest set of minima, which at least in glassy problems are
+the limit of zero temperature in an equilibrium calculation
+concentrates the Boltzmann measure onto the lowest set of minima, the equilibrium free
+energy in the limit of zero temperature will be governed by the same
+statistics as the count of that lowest set of minima. This argument is strictly
+valid only for the lowest minima, which at least in glassy problems are
rarely relevant to dynamical behavior. What about the \emph{rest} of the
stationary points?
In this paper, we show that the behavior of the ground state, or \emph{any}
equilibrium behavior, does not govern whether stationary points will have a
correct annealed average. In a prototypical family of models of random
-functions, we calculate a condition for determining when annealed averages should fail
-and stationary points should have nontrivial correlations in their mutual
-position. We produce examples of models whose equilibrium is guaranteed to
-never see such correlations between thermodynamic states, but where a
+functions, we calculate a condition for determining when annealed averages
+should fail and stationary points should have nontrivial correlations in their
+mutual position. We produce examples of models whose equilibrium is guaranteed
+to never see such correlations between thermodynamic states, but where a
population of saddle points is nevertheless correlated.
We study the mixed spherical models, which are models of Gaussian-correlated
random functions with isotropic statistics on the $(N-1)$-sphere. Each model
consists of a class of functions $H:S^{N-1}\to\mathbb R$ defined by the
-covariance between the function evaluated at two different points
+covariance between the functions evaluated at two different points
$\pmb\sigma_1,\pmb\sigma_2\in S^{N-1}$, which is a function of the scalar
product (or overlap) between the two configurations:
\begin{equation} \label{eq:covariance}
\overline{H(\pmb\sigma_1)H(\pmb\sigma_2)}=\frac1Nf\bigg(\frac{\pmb\sigma_1\cdot\pmb\sigma_2}N\bigg)
\end{equation}
-Specifying the covariance function $f$ uniquely specifies the model. The
-series coefficients of $f$ need to be nonnnegative in order for $f$ to be a
+Specifying the covariance function $f$ uniquely specifies the model. The series
+coefficients of $f$ need to be nonnegative in order for $f$ to be a
well-defined covariance. The case where $f$ is a homogeneous polynomial has
been extensively studied, and corresponds to the pure spherical models of glass
physics or the spiked tensor models of statistical inference. Here we will
study cases where $f(q)=\frac12\big(\lambda q^3+(1-\lambda)q^s\big)$ for
-$\lambda\in(0,1)$, called $3+s$ models. These are examples of \emph{mixed} spherical models, which
-have been studied in the physics and statistics literature and host a zoo of
-complex orders and phase transitions \cite{Crisanti_2004_Spherical,
-Crisanti_2006_Spherical, Crisanti_2011_Statistical}.
+$\lambda\in(0,1)$, called $3+s$ models. These are examples of \emph{mixed}
+spherical models, which have been studied in the physics and statistics
+literature and host a zoo of complex orders and phase transitions
+\cite{Crisanti_2004_Spherical, Crisanti_2006_Spherical,
+Crisanti_2011_Statistical}.
There are several well-established results on the equilibrium of this model.
-First, if the function $f$ is convex then it is not possible for the
+First, if the function $\chi(q)=f''(q)^{-1/2}$ is convex then it is not possible for the
equilibrium solution to have nontrivial correlations between states at any
-temperature.\footnote{
- More specifically, convex $f$ cannot have an equilibrium order with more than
+temperature \cite{Crisanti_1992_The}.\footnote{
+ More specifically, convex $\chi$ cannot have an equilibrium order with more than
{\oldstylenums1\textsc{rsb}} order among the configurations. In equilibrium,
{\oldstylenums1\textsc{rsb}} corresponds to trivial correlations between
thermodynamic states, but nontrivial correlations exist \emph{within} a state
@@ -132,33 +136,35 @@ temperature.\footnote{
equilibrium trivial because it does not imply any nontrivial correlations
between states.
}
-This is a very strong condition on the form of equilibrium order. Note that
-non-convex $f$ does not imply that you will see nontrivial correlations between
+This is a strong condition on the form of equilibrium order. Note that
+non-convex $\chi$ does not imply that you will see nontrivial correlations between
states at some temperature. In the $3+s$ models we consider here, models with
-$s>8$ have non-convex $f$ and those with $s\geq8$ have convex $f$ independent
+$s>8$ have non-convex $\chi$ and those with $s\leq8$ have convex $\chi$ independent
of $\lambda$. Second, the characterization of the ground state has been made
\cite{Crisanti_2004_Spherical, Crisanti_2006_Spherical,
Crisanti_2011_Statistical, Auffinger_2022_The}. In the $3+s$ models we
-consider, for $s>12.430\ldots$ nontrivial ground state configurations appear in
-certain ranges of $\lambda$. These bounds on equilibrium order are shown in
-Fig.~\ref{fig:phases}, along with our result in this paper for where the
-complexity has nontrivial \textsc{rsb}. As evidenced in that figure,
-\textsc{rsb} among saddles is possible well outside the bounds from
+consider, for $s>12.430...$ nontrivial ground state configurations appear in
+a range of $\lambda$. These bounds on equilibrium order are shown in
+Fig.~\ref{fig:phases}, along with our result for where the complexity has
+nontrivial correlations between some stationary points. As evidenced in that
+figure, \textsc{rsb} among saddles is possible well outside the bounds from
equilibrium.
-There are two important features which differentiate stationary points $\pmb\sigma^*$ in the
-spherical models: their \emph{energy density} $E=\frac1NH(\pmb\sigma^*)$ and
-their \emph{stability}
+There are two important features which differentiate stationary points
+$\pmb\sigma^*$ in the spherical models: their \emph{energy density}
+$E=\frac1NH(\pmb\sigma^*)$ and their \emph{stability}
$\mu=\frac1N\operatorname{\mathrm{Tr}}\operatorname{\mathrm{Hess}}H(\pmb\sigma^*)$.
-The energy density should be familiar, as the `height' in the landscape. The
-stability is so-called because it governs the spectrum of the stationary point.
+The energy density gives the `height' in the landscape, while the
+stability governs the spectrum of the stationary point.
In each spherical model, the spectrum of every stationary point is a Wigner
semicircle of the same width $\mu_\mathrm m=\sqrt{4f''(1)}$, but shifted by
a constant. The stability $\mu$ sets this constant shift. When $\mu<\mu_\mathrm
m$, the spectrum still has support over zero and we have saddles with an
extensive number of downward directions. When $\mu>\mu_\mathrm m$ the spectrum
-has support only over positive eigenvalues, and we have stable minima. When
-$\mu=\mu_\mathrm m$, the spectrum has a pseudogap, and we have marginal minima.
+has support only over positive eigenvalues, and we have stable minima.\footnote{
+ Saddle points with a subextensive number of downward directions also exist
+ via large deviations of some number of eigenvalues from the average spectrum.
+} When $\mu=\mu_\mathrm m$, the spectrum has a pseudogap, and we have marginal minima.
\begin{figure}
\centering
@@ -166,30 +172,33 @@ $\mu=\mu_\mathrm m$, the spectrum has a pseudogap, and we have marginal minima.
\caption{
A phase diagram of the boundaries we discuss in this paper for the $3+s$
model with $f=\frac12\big(\lambda q^3+(1-\lambda)q^s\big)$. The blue region
- shows where there exist some stationary points whose complexity is
- {\oldstylenums1}\textsc{rsb}, and is given by $G_f>0$ where $G_f$ is found
- in \eqref{eq:condition}. The yellow region shows where $f$ is not convex
- and therefore \textsc{rsb} solutions are possible in equilibrium. The green
- region shows where \textsc{rsb} solutions are correct at the ground state,
- adapted from \cite{Auffinger_2022_The}.
+ shows models which have some stationary points with nontrivially correlated
+ (\textsc{rsb}) structure, and is given by $G_f>0$ where $G_f$ is found in
+ \eqref{eq:condition}. The yellow region shows where $\chi(q)=f''(q)^{-1/2}$
+ is not convex and therefore nontrivial correlations between states are
+ possible in equilibrium. The green region shows where nontrivial
+ solutions are correct at the ground state, adapted from
+ \cite{Auffinger_2022_The}. We find that models where correlations between
+ equilibrium states are forbidden can nonetheless harbor
+ correlated stationary points.
} \label{fig:phases}
\end{figure}
The number $\mathcal N(E,\mu)$ of stationary points with energy density $E$ and
-stability $\mu$ is exponential in $N$ for these models. Their complexity $\Sigma(E,\mu)$ is
-defined by the average of the logarithm of their number, or
-$\Sigma(E,\mu)=\frac1N\overline{\log\mathcal N(E,\mu)}$. More often the annealed
-complexity is calculated, where the average is taken before the logarithm:
-$\Sigma_\mathrm a(E,\mu)=\frac1N\log\overline{\mathcal N(E,\mu)}$. The annealed
-complexity has been computed for these models \cite{BenArous_2019_Geometry,
-Folena_2020_Rethinking}, and the quenched complexity has been computed for a
-couple examples which have correlations among ground-state minima
-\cite{Kent-Dobias_2023_How}.
+stability $\mu$ is exponential in $N$. Their complexity
+$\Sigma(E,\mu)$ is defined by the average of the logarithm of their number:
+$\Sigma(E,\mu)=\frac1N\overline{\log\mathcal N(E,\mu)}$. More often the
+annealed complexity is calculated, where the average is taken before the
+logarithm: $\Sigma_\mathrm a(E,\mu)=\frac1N\log\overline{\mathcal N(E,\mu)}$.
+The annealed complexity has been computed for these models
+\cite{BenArous_2019_Geometry, Folena_2020_Rethinking}, and the quenched
+complexity has been computed for a couple examples which have nontrivial ground
+states \cite{Kent-Dobias_2023_How}.
In these models, trivial correlations between stationary points correspond with
zero overlap: almost all stationary points are orthogonal to each other. This
corresponds with \emph{replica symmetric} (\textsc{rs}) order. The emergence of
-nontrivial correlations, and the invalidity of the anneal approximation, occurs
+nontrivial correlations, and the invalidity of the annealed approximation, occurs
when some non-vanishing fraction of stationary point pairs have a nonzero
overlap. This corresponds to some kind of \emph{replica symmetry breaking}
(\textsc{rsb}). Here we restrict ourselves to a {\oldstylenums1}\textsc{rsb}
@@ -197,21 +206,22 @@ ansatz, which corresponds to two kinds of pairs of stationary point: a fraction
$x$ of pairs have the trivial zero overlap, and the remaining fraction $1-x$
have a nontrivial overlap $q_1$. In the annealed or replica-symmetric case,
$x=1$ and all but a vanishing fraction of stationary points are uncorrelated
-with each other. Since other kinds of \textsc{rsb} order encompass {\oldstylenums1}\textsc{rsb}, we are guaranteed that
-$\Sigma\leq\Sigma_{\oldstylenums1\textsc{rsb}}\leq\Sigma_\mathrm a$. We
-will discuss later in what settings the {\oldstylenums1}\textsc{rsb} complexity
-is correct.
+with each other. Since other kinds of \textsc{rsb} order encompass
+{\oldstylenums1}\textsc{rsb}, we are guaranteed that
+$\Sigma\leq\Sigma_{\oldstylenums1\textsc{rsb}}\leq\Sigma_\mathrm a$. We will
+discuss later in what settings the {\oldstylenums1}\textsc{rsb} complexity is
+correct.
When the complexity is calculated using the Kac--Rice formula and a physicists'
tool set, the problem is reduced to the evaluation of an integral by the saddle
-point method for large $N$ \cite{Kent-Dobias_2023_How}.
-The complexity is given by extremizing an effective action,
+point method for large $N$ \cite{Kent-Dobias_2023_How}. The complexity is given
+by extremizing an effective action,
\begin{equation}
\Sigma_{\oldstylenums1\textsc{rsb}}(E,\mu)
=\lim_{n\to0}\int dq_1\,dx\,\mathcal S_{\oldstylenums1\textsc{rsb}}(q_1,x\mid E,\mu)e^{nN\mathcal S_{\oldstylenums1\textsc{rsb}}(q_1,x\mid E,\mu)}
=\mathop{\mathrm{extremum}}_{q_1,x}\mathcal S_{\oldstylenums1\textsc{rsb}}(q_1,x\mid E,\mu)
\end{equation}
-for the action $\mathcal S$ given by
+for the action $\mathcal S_{\oldstylenums1\textsc{rsb}}$ given by
\begin{equation}
\begin{aligned}
&\mathcal S_{\oldstylenums1\textsc{rsb}}(q_1,x\mid E,\mu)
@@ -245,14 +255,13 @@ where $\Delta x=1-x$ and
-\log\left(\left|\frac{\mu}{\mu_\text m}\right|-\sqrt{\big(\frac\mu{\mu_\text m}\big)^2-1}\right) & \mu^2>\mu_\text m^2
\end{cases}
\end{equation}
+The details of the derivation of these expressions can be found in \cite{Kent-Dobias_2023_How}.
The extremal problem in $\hat\beta$, $r_\mathrm d$, $r_1$, $d_\mathrm d$, and
$d_1$ has a unique solution and can be found explicitly, but the resulting
-formula is much more complicated so we do not include it here. There can be
-multiple extrema at which to evaluate $\mathcal
-S_{\oldstylenums1\textsc{rsb}}$, in this case the one for which $\Sigma$ is
+formula is unwieldy. The action can have multiple extrema, but the one for which the complexity is
\emph{smallest} gives the correct solution. There is always a solution for
-$x=1$ which is independent of $q_1$, which corresponds to the replica symmetric
-case and which is equal to the annealed calculation, so $\Sigma_\mathrm
+$x=1$ which is independent of $q_1$, corresponding to the replica symmetric
+case, and with $\Sigma_\mathrm
a(E,\mu)=\mathcal S_{\oldstylenums1\textsc{rsb}}(q_1,1\mid E,\mu)$. The crux of
this paper will be to determine when this solution is not the global one.
@@ -261,24 +270,25 @@ It isn't accurate to say that a solution to the saddle point equations is
not a variational problem, so there is nothing to be maximized or minimized,
and in general global solutions are not even local minima of the action.
However, the stability of the action can still tell us something about the
-emergence of new solutions: when another solution bifurcates from an existing
-one, the action will have a flat direction. Unfortunately this is a difficult
-procedure to apply in general, since one must know the parameters of the new
-solution, and some parameters, e.g., $q_1$, are unconstrained and can take any
-value in the old solution.
+emergence of new solutions: when a new solution bifurcates from an existing
+one, the action will have a flat direction. Unfortunately this is difficult to
+search out, since one must know the parameters of the new solution, and $q_1$
+is unconstrained and can take any value in the old solution.
There is one place where we can consistently search for a bifurcating solution
-to the saddle point equations: along the zero complexity line
-$\Sigma_\mathrm a(E,\mu)=0$. Going along this line in the replica symmetric solution, the
+to the saddle point equations: along the zero complexity line $\Sigma_\mathrm
+a(E,\mu)=0$. Going along this line in the replica symmetric solution, the
{\oldstylenums1}\textsc{rsb} complexity transitions at a critical point where
$x=q_1=1$ \cite{Kent-Dobias_2023_How}. Since all the parameters in the
bifurcating solution are known at this point, we can search for it by looking
-for a flat direction in the way described above. In the annealed
-solution for points describing saddles ($\mu<\mu_\mathrm m$), this line is
+for a flat direction. In the annealed solution for
+points describing saddles ($\mu<\mu_\mathrm m$), this line is
\begin{equation} \label{eq:extremal.line}
\mu_0=-\frac1{z_f}\left(2Ef'f''+\sqrt{2f''u_f\bigg(\log\frac{f''}{f'}z_f-E^2(f''-f')\bigg)}\right)
\end{equation}
-where we define for brevity (here and elsewhere) the constants
+where we have chosen the lower branch as a convention (see
+Fig.~\ref{fig:complexity_35}) and where we define for brevity (here and
+elsewhere) the constants
\begin{align}
u_f&=f(f'+f'')-f'^2
&&
@@ -294,14 +304,16 @@ these constants are positive. We also define $E_\textrm{min}$, the minimum
energy at which saddle points with an extensive number of downward directions
are found, as the energy for which $\mu_0(E_\mathrm{min})=\mu_\mathrm m$.
-Let $M$ be the matrix of double partial derivatives of $\mathcal S$ with
+Let $M$ be the matrix of double partial derivatives of the action with
respect to $q_1$ and $x$. We evaluate $M$ at the replica symmetric saddle point
$x=1$ with the additional constraint that $q_1=1$ and along the extremal
complexity line \eqref{eq:extremal.line}. We determine when a zero eigenvalue
appears, indicating the presence of a bifurcating {\oldstylenums1}\textsc{rsb}
solution, by solving $0=\det M$. We find
\begin{equation}
- \det M=-\bigg(\frac{\partial^2\mathcal S}{\partial q_1\partial x}\bigg|_{\substack{x=1\\q_1=1}}\bigg)^2\propto(ay^2+bE^2+2cyE-d)^2
+ \det M
+ =-\bigg(\frac{\partial^2\mathcal S_{\oldstylenums1\textsc{rsb}}}{\partial q_1\partial x}\bigg|_{\substack{x=1\\q_1=1}}\bigg)^2
+ \propto(ay^2+bE^2+2cyE-d)^2
\end{equation}
where $y=-\frac12z_f\mu-f'f''E$ is proportional to the square-root term in
\eqref{eq:extremal.line} and the constants $a$, $b$, $c$, and $d$ are defined
@@ -315,11 +327,11 @@ by
\qquad
d=\frac{w_f}{f'f''}
\end{equation}
-Changing variables to $y$ from $\mu$ is a
-convenient choice because the branch of \eqref{eq:extremal.line} is chosen
-by the sign of $y$ (the lower-energy branch we are interested in corresponds
-with $y>0$) and the relationship between $y$ and $E$ on the extremal line is
-$g=2hy^2+eE^2$, where the constants $e$, $g$, and $h$ are given by
+Changing variables from $\mu$ to $y$ is convenient because the branch
+of \eqref{eq:extremal.line} is chosen by the sign of $y$ (the lower-energy
+branch we are interested in corresponds with $y>0$). The relationship
+between $y$ and $E$ on the extremal line is $g=2hy^2+eE^2$, where the constants
+$e$, $g$, and $h$ are given by
\begin{equation}
e=f''-f'
\qquad
@@ -335,8 +347,8 @@ $g=2hy^2+eE^2$, where the constants $e$, $g$, and $h$ are given by
\caption{
Stationary point statistics as a function of energy density $E$ and
stability $\mu$ for a $3+5$ model with $\lambda=\frac12$. The dashed black
- line shows the line of zero complexity, where stationary points vanish, and
- enclosed inside they are found in exponential number. The red region (blown
+ line shows the line of zero annealed complexity, where stationary points vanish, and
+ enclosed inside they are found in exponential number. The solid black line (only visible in the inset) gives the line of zero {\oldstylenums1\textsc{rsb}} complexity. The red region (blown
up in the inset) shows where the annealed complexity gives the wrong count
and a {\oldstylenums1}\textsc{rsb} complexity is necessary. The red points
show where $\det M=0$. The left point, which is only an upper bound on the
@@ -358,7 +370,7 @@ energies that satisfy
\end{equation}
This predicts two points where a {\oldstylenums1}\textsc{rsb} solution can
bifurcate from the annealed one. The remainder of the transition line can be
-found by trying to solve the extremal problem for the action very close to one
+found by solving the extremal problem for the action very close to one
of these solutions, and then taking small steps in the parameters $E$ and $\mu$
until it terminates. In many cases considered here, the line of transitions in
the complexity that begins at $E_{\oldstylenums1\textsc{rsb}}^+$, the higher
@@ -367,7 +379,8 @@ energy point, so that these two points give the precise range of energies at
which \textsc{rsb} saddles are found. An example that conforms with this
picture for a $3+5$ mixed model is shown in Fig.~\ref{fig:complexity_35}.
-The expression inside the inner square root of \eqref{eq:energies} is proportional to
+The expression inside the inner square root of \eqref{eq:energies} is
+proportional to
\begin{equation} \label{eq:condition}
G_f
=
@@ -377,8 +390,8 @@ The expression inside the inner square root of \eqref{eq:energies} is proportion
-2(f''-f')u_fw_f
-2\log^2\frac{f''}{f'}f'^2f''v_f
\end{equation}
-If $G_f>0$, then the bifurcating solutions exist, and there is someplace where
-the annealed solution is corrected by a {\oldstylenums1\textsc{rsb}} solution.
+If $G_f>0$, then the bifurcating solutions exist, and there are some saddles whose
+complexity is corrected by a {\oldstylenums1\textsc{rsb}} solution.
Therefore, $G_f>0$ is a condition to see {\oldstylenums1}\textsc{rsb} in the
complexity. If $G_f<0$, then there is nowhere along the extremal line where
saddles can be described by such a complexity. The range of $3+s$ models where
@@ -408,15 +421,15 @@ $G_f$ is positive is shown in Fig.~\ref{fig:phases}.
$E_\textrm{min}$, the minimum energy where saddles are found, and in the
bottom row this energy is subtracted away to emphasize when the
\textsc{rsb} region crosses into minima. For most $s$, both the top and
- bottom lines are given by $E_{\oldstylenums1\textsc{rsb}}$, but for $s=14$
+ bottom lines are given by $E_{\oldstylenums1\textsc{rsb}}^\pm$, but for $s=14$
there is a portion where the low-energy boundary has $q_1<1$. In that plot,
- the continuation of the $E_{\oldstylenums1\textsc{rsb}}$ line is shown
+ the continuation of the $E_{\oldstylenums1\textsc{rsb}}^-$ line is shown
dashed. Also marked is the range of $\lambda$ for which the ground state
minima are characterized by nontrivial \textsc{rsb}.
} \label{fig:energy_ranges}
\end{figure}
-Fig.~\ref{fig:energy_ranges} shows the range of energies at which nontrivial
+Fig.~\ref{fig:energy_ranges} shows the range of energies where nontrivial
correlations are found between stationary points in several $3+s$ models as
$\lambda$ is varied. For models with smaller $s$, such correlations are found
only among saddles, with the boundary never dipping beneath the minimum energy
@@ -428,7 +441,7 @@ $s$, the range passes into minima, which is excepted as these models have
nontrivial complexity of their ground states. This also seems to correspond
with the decoupling of the \textsc{rsb} solutions connected to
$E_{\oldstylenums1\textsc{rsb}}^+$ and $E_{\oldstylenums1\textsc{rsb}}^-$, with
-the two phase boundaries not corresponding, as in Fig.~\ref{fig:order}. In
+the two phase boundaries no longer corresponding, as in Fig.~\ref{fig:order}. In
these cases, $E_{\oldstylenums1\textsc{rsb}}^-$ sometimes gives the lower
bound, but sometimes it is given by the termination of the phase boundary
extended from $E_{\oldstylenums1\textsc{rsb}}^+$.
@@ -461,15 +474,15 @@ extended from $E_{\oldstylenums1\textsc{rsb}}^+$.
} \label{fig:order}
\end{figure}
-There are implications for the emergence of \textsc{rsb} in equilibrium. Consider a specific $H$ with
+There are implications for the emergence of \textsc{rsb} in equilibrium.
+Consider a specific $H$ with
\begin{equation}
H(\pmb\sigma)
- =\frac{\sqrt\lambda}{p!}\sum_{i_1\cdots i_p}J^{(p)}_{i_1\cdots i_p}\sigma_{i_1}\cdots\sigma_{i_2}
+ =\frac{\sqrt\lambda}{p!}\sum_{i_1\cdots i_p}J^{(p)}_{i_1\cdots i_p}\sigma_{i_1}\cdots\sigma_{i_p}
+\frac{\sqrt{1-\lambda}}{s!}\sum_{i_1\cdots i_s}J^{(s)}_{i_1\cdots i_s}\sigma_{i_1}\cdots\sigma_{i_s}
\end{equation}
where the interaction tensors $J$ are drawn from zero-mean normal distributions
-with $\overline{(J^{(p)})^2}=p!/2N^{p-1}$ and likewise for $J^{(s)}$. It is
-straightforward to confirm that $H$ defined this way has the covariance
+with $\overline{(J^{(p)})^2}=p!/2N^{p-1}$ and likewise for $J^{(s)}$. Functions $H$ defined this way have the covariance
property \eqref{eq:covariance} with $f(q)=\frac12\big(\lambda
q^p+(1-\lambda)q^s\big)$. With the $J$s drawn in this way and fixed for $p=3$
and $s=14$, we can vary $\lambda$, and according to Fig.~\ref{fig:phases} we
@@ -482,10 +495,10 @@ uncorrelated low-lying states splitting apart into correlated clusters. Where
existing stationary points do appear to split apart, when $\lambda$ is
decreased from large values, is among saddles, not minima.
-Similar reasoning can be made for other mixed models, like the $2+s$, which
+A similar analysis can be made for other mixed models, like the $2+s$, which
should see complexities with other forms of \textsc{rsb}. For instance, in
\cite{Kent-Dobias_2023_How} we show that the complexity transitions from
-\textsc{rs} to full \textsc{rsb} when
+\textsc{rs} to full \textsc{rsb} (\textsc{frsb}) along the line
\begin{equation}
\mu
=-\frac{(f'+f''(0))u_f}{(2f-f')f'f''(0)^{1/2}}
@@ -493,29 +506,44 @@ should see complexities with other forms of \textsc{rsb}. For instance, in
\end{equation}
which can only be realized when $f''(0)\neq0$, as in the $2+s$ models. For
$s>2$, this transition line \emph{always} intersects the extremal line
-\eqref{eq:extremal.line}, and so \textsc{rsb} complexity should always be found
+\eqref{eq:extremal.line}, and so \textsc{rsb} complexity will always be found
among some population of stationary points. However, it is likely that for much
of the parameter space the so-called one-full \textsc{rsb}
-({\oldstylenums1\textsc{frsb}}) is the correct solution, as it likely is for
-large $s$ in the $3+s$ model at hand. Further work to find the conditions for
-transitions of the complexity to these forms of order is necessary.
+({\oldstylenums1\textsc{frsb}}), rather than \textsc{frsb}, is the correct solution, as it likely is for
+large $s$ and certain $\lambda$ in the $3+s$ models studied here. Further work to find the conditions for
+transitions of the complexity to {\oldstylenums1\textsc{frsb}} and {\oldstylenums2\textsc{frsb}} is necessary. For values
+of $s$ where there is no \textsc{rsb} of any kind in the ground state, we
+expect that the {\oldstylenums1\textsc{rsb}} complexity is correct.
What are the implications for dynamics? We find that nontrivial correlations
-tend to exist among saddle points with the maximum or minimum index possible at
+tend to exist among saddle points with the largest or smallest possible index at
a given energy density, which are quite atypical in the landscape. However,
these strangely correlated saddle points must descend to uncorrelated minima,
which raises questions about whether structure on the boundary of a basin of
-attraction is influential to the dynamics that descends into that basin. These saddles might act as early-time separatrices for descent trajectories. With
-large open problems in even the gradient decent dynamics on these models, it
+attraction is influential to the dynamics that descends into that basin. These
+saddles might act as early-time separatrices for descent trajectories. With
+open problems in even the gradient descent dynamics on these models (itself attracted to an atypical subset of marginal minima), it
remains to be seen whether such structures could be influential
-\cite{Folena_2020_Rethinking, Folena_2023_On}.
+\cite{Folena_2020_Rethinking, Folena_2021_Gradient, Folena_2023_On}. This structure among saddles
+cannot be the only influence, since it seems that the $3+4$ model is `safe'
+from nontrivial \textsc{rsb} among saddles.
We have determined the conditions under which the complexity of the mixed $3+s$
spherical models has different quenched and annealed averages, as the result of
nontrivial correlations between stationary points. We saw that these conditions
can arise among certain populations of saddle points even when the model is
guaranteed to lack such correlations between equilibrium states, and exist for
-saddle points at a wide range of energies.
+saddle points at a wide range of energies. This suggests that studies using
+complexity calculations cannot reliably use equilibrium behavior to defend
+making the annealed approximation. Our result has direct implications for the
+geometry of these landscapes, and perhaps could be influential to certain
+out-of-equilibrium dynamics.
+
+
+\paragraph{Funding information}
+
+JK-D is supported by a \textsc{DynSysMath} Specific Initiative of the
+INFN.
\printbibliography