\documentclass[reqno]{amsart}
\usepackage{hyperref}

\AtBeginDocument{{\noindent\small
\emph{Electronic Journal of Differential Equations},
Vol. 2017 (2017), No. 189, pp. 1--40.\newline
ISSN: 1072-6691. URL: http://ejde.math.txstate.edu or http://ejde.math.unt.edu}
\thanks{\copyright 2017 Texas State University.}
\vspace{8mm}}

\begin{document}
\title[\hfilneg EJDE-2017/189\hfil Galerkin approximations of optimal control problems]
{Galerkin approximations of nonlinear optimal control problems in Hilbert spaces}

\author[M. D. Chekroun, A. Kr\"oner, H. Liu \hfil EJDE-2017/189\hfilneg]
{Micka\"el D. Chekroun, Axel Kr\"oner, Honghu Liu}

\address{Micka\"el D. Chekroun \newline
Department of Atmospheric \& Oceanic Sciences,
University of California, Los Angeles, CA 90095-1565, USA}
\email{mchekroun@atmos.ucla.edu}

\address{Axel Kr\"oner \newline
Institut f\"ur Mathematik, Humbolt-Universit\"at Berlin,
10099 Berlin, Germany. \newline
INRIA and CMAP, \'Ecole Polytechnique,
CNRS, Universit\'e, Paris Saclay, \newline
91128 Palaiseau, France}
\email{axel.kroener@inria.fr}

\address{Honghu Liu \newline
Department of Mathematics,
Virginia Polytechnic Institute and State University,\newline
Blacksburg, Virginia 24061, USA}
\email{hhliu@vt.edu}

\dedicatory{Communicated by Jesus Ildefonso Diaz}

\thanks{Submitted April 2, 2017. Published July 28, 2017.}
\subjclass[2010]{35Q86, 35Q93, 35K58, 49J15, 49J20, 86-08}
\keywords{Nonlinear optimal control problems;  Galerkin approximations;
\hfill\break\indent Greenhouse gas emissions; Energy balance models;
Trotter-Kato approximations}

\begin{abstract}
 Nonlinear optimal control problems in Hilbert spaces are considered
 for which we derive approximation theorems for Galerkin approximations.
 Approximation theorems are available in the literature. The originality
 of our approach relies on the identification of a set of natural
 assumptions that allows us to deal with a broad class of nonlinear
 evolution equations and cost functionals for which we derive convergence
 of the value functions associated with the optimal control problem of
 the Galerkin approximations. This convergence result holds for a broad
 class of nonlinear control strategies as well. In particular, we show
 that the framework applies to the optimal control of semilinear heat
 equations posed on a general compact manifold without boundary.
 The framework is then shown to apply to geoengineering and mitigation of
 greenhouse gas emissions formulated here in terms of optimal control
 of energy balance climate models posed on the sphere $\mathbb{S}^2$.
\end{abstract}

\maketitle
\numberwithin{equation}{section}
\newtheorem{theorem}{Theorem}[section]
\newtheorem{lemma}[theorem]{Lemma}
\newtheorem{remark}[theorem]{Remark}
\newtheorem{definition}[theorem]{Definition}
\newtheorem{corollary}[theorem]{Corollary}
\allowdisplaybreaks

%\tableofcontents

\section{Introduction}

Optimal control problems of infinite dimensional systems play an important role
in a broad range of applications in engineering and various scientific disciplines
 \cite{bensoussan2007representation,Fattorini99,Fur00,HPUU09,Lions71,Tro10}.
 Various methods for solving numerically the related optimization problems
are available; see e.g.~\cite{HPUU09,medjo2008optimal}.
The case of linear evolution equations has benefited from a long tradition,
and an abundant literature exists about finite element techniques or
Galerkin methods for the design of approximate optimal controls;
see e.g.~\cite{Alt_al89,Banks_al84,Gibson79, knowles1982finite, lasiecka1980unified,
lasiecka1987regulator,malanowski1982convergence, Mcknight_al73}.
  The case of Galerkin approximations of optimal control problems for nonlinear
evolutions seems to have been much less addressed. Semidiscrete Ritz-Galerkin
approximations of nonlinear parabolic boundary control problems have been
considered for which convergence of the approximate controls have been obtained;
 see \cite{MR1297998,MR1264014}. We refer also to
\cite{meidner2007adaptive,Neitzel2012} for error estimates concerned with
space-time finite element approximations of the state and control to optimal
control problems governed by semilinear parabolic equations, and to
\cite{deckelnick2004semidiscretization} for finite element approximations
of optimal control problems associated with the Navier-Stokes equations.


In this article, we study Galerkin approximations for (possibly non-quadratic)
optimal control problems over a finite horizon $[0,T]$, of nonlinear evolution
equations in Hilbert space. Our framework covers not only a broad class of
semilinear parabolic equations but also includes systems of nonlinear delay
differential equations (DDEs)  \cite{CGLW15,CKL17_DDE} and allows in each case for a
broad class of nonlinear control strategies. The main contribution of this
article is to identify for such equations a set of easily checkable conditions
in practice, from which we prove the pointwise convergence of the value
functions associated with the optimal control problem of the Galerkin
approximations, and for a broad class of cost functionals; see
Theorem~\ref{Thm_cve_Galerkin_val}, our main result. This convergence at the
 level of value functions results essentially from a double uniform
convergence -- with respect to time and the set of admissible controllers --
of the controlled Galerkin states; see Theorem \ref{Lem:uniform_in_u_conv}
and Corollary \ref{Lem:uniform_conv_locally_Lip_t_v2}.

The treatment adopted here is based on the classical Trotter-Kato approximation
approach from the $C_0$-semigroup theory \cite{Pazy83,Goldstein85}, which
can be viewed as the functional analysis operator version of the Lax equivalence
principle, i.e., if ``consistency'' and ``stability'' are satisfied,
then ``convergence'' holds, and reciprocally.
 Within this approach, we generalize,
in particular, the convergence results about value functions obtained in the
earlier work \cite{Ferretti97} concerned with the Galerkin approximations
to optimal control problems governed by linear evolution equations in Hilbert
space.  Given a Hilbert state space $\mathcal{H}$, denoting by $\Pi_N$ the orthogonal
projector associated with the $N$-dimensional Galerkin subspace, and by
$y_N(\cdot; \Pi_N x, u)$  the controlled  Galerkin state (driven by $u$)
and emanating from $\Pi_N x$, a key property to ensure convergence of
the value functions for such optimal control problems is the following double
uniform convergence
\begin{equation} \label{uniform_in_u_conv_Intro}
\lim_{N\to \infty}  \sup_{u\in \mathcal{U}_{ad}} \sup_{t \in [0, T]}
\|y_N(t; \Pi_N x, u) - y(t; x,u)\|_{\mathcal{H}} = 0, \quad \forall  x \in \mathcal{H},
\end{equation}
where $\mathcal{U}_{ad}$ denotes a set of admissible controls;
see \cite[Theorem 4.2]{Ferretti97}.


When the evolution equation involves  state- or control-dependent nonlinear terms,
the conditions provided in \cite[Proposition 2.1]{Ferretti97} to ensure
\eqref{uniform_in_u_conv_Intro} needs to be amended. Whether the nonlinear
terms involve the controls or the system's state,  our working assumption
regarding the linear terms of the original equation and of its Galerkin
approximations, is (as in \cite{Ferretti97}) to satisfy respectively the
``stability'' and ``consistency'' conditions required in the Trotter-Kato
theorem; see Assumption (A1) and Assumption (A2) in
Sect.~\ref{Sec_Galerkin_prelim}.  In the case of a linear equation with nonlinear
 control terms, a simple compactness assumption about the set of admissible
controls (see Assumption (A5) in Sect.~\ref{Sect_uniform_convergence})
is sufficient to ensure \eqref{uniform_in_u_conv_Intro}; see Remark \ref{Rmk_F=0}.

In the case of an evolution equation depending nonlinearly on the system's state
and on the controls, a key assumption is introduced to ensure
\eqref{uniform_in_u_conv_Intro} that adds up to standard local
Lipschitz conditions on the state-dependent nonlinear terms
(Assumption~(A3)) and the nonlinear control operator $\mathfrak{C}:V\to \mathcal{H}$,
 where $V$ denotes an auxiliary Hilbert space in which the controls take values.
 Introducing $\Pi^\perp_N:=\operatorname{Id}_{\mathcal{H}} - \Pi_N$, this assumption concerns
a double uniform convergence about the residual energy
$\|\Pi^\perp_N y(t;x,w)\|_{\mathcal{H}}$ (see Assumption (A7) in
Sect.~\ref{Sect_uniform_convergence}), namely
\begin{equation} \label{Est_uniformity_highmodes_intro}
\lim_{N \to \infty}  \sup_{u\in \mathcal{U}_{ad}}
\sup_{t\in[0,T]} \|\Pi^\perp_N y(t;x,u)\|_{\mathcal{H}} =0.
\end{equation}

 With this assumption at hand, and the rest of our working assumptions,
standard {\it a priori} bounds -- uniform in $u$ in $\mathcal{U}_{ad}$
(Assumption~(A6)) -- allow us to ensure
\eqref{uniform_in_u_conv_Intro} for a broad class of nonlinear evolution
equations in Hilbert spaces.  The pointwise convergence of the value
functions associated with the optimal control problem of the corresponding
Galerkin approximations is then easily derived for a broad class of cost
functionals; see Theorem~\ref{Thm_cve_Galerkin_val}.


The relevance of assumption \eqref{Est_uniformity_highmodes_intro} for applications
is addressed through various angles. First, from the proof of
Corollary \ref{Lem:uniform_conv_locally_Lip_t_v2} (and thus
Theorem \ref{Lem:uniform_in_u_conv}) in which
Theorem~\ref{Thm_cve_Galerkin_val} relies.  In that respect, a sort of
pedagogical detour is made in Sect.~\ref{Sect_local_convergence} in which
we show essentially that a weaker (than \eqref{uniform_in_u_conv_Intro})
local-in-$u$ approximation  result (Lemma \ref{Lem_local_in_u_est})
 follows from the rest of our working assumptions (except Assumptions (A6)
 and (A7)\footnote{More precisely, by assuming a weaker version of
Assumption (A6), namely Assumption~(A4), and without assuming (A7).})
 and from a local-in-$u$ estimate about the residual energy
(Lemma~\ref{Lem:local_in_u_conv}); the latter resulting itself from the
continuity of the mapping $u\mapsto y(t;x,u)$. Condition
\eqref{Est_uniformity_highmodes_intro} constitutes thus a natural
strengthening of inherent properties to the approximation problem.

From a more applied perspective, sufficient conditions concerning the spectrum
of the linear part --such as self-adjointness and compact resolvent--
are pointed out in Sect.~\ref{Sect_examples} to ensure
\eqref{Est_uniformity_highmodes_intro}; see\footnote{See also
\cite[Sect.~2.3]{CKL17_DDE} for other spectral conditions which do not
rely on self-adjointness while ensuring  \eqref{Est_uniformity_highmodes_intro}.}
 Lemma \ref{Lem_examples} and  Remark \ref{Rmk_other_spectral_assumption}.
Finally,  Sect.~\ref{Sec_Err_estimates} provides error estimates concerning the
value function and the optimal control that complete the picture and emphasize
from another perspective the relevance of the residual energy in the analysis
of the approximation problem; see Theorem \ref{Thm_PM_val} and
Corollary \ref{Lem_controller_est}.

With this preamble in mind, we provide now the more formal organization of this
article. First, we present in Sect.~\ref{Sec_Galerkin_prelim} the type of state
equation and its corresponding Galerkin approximations that we will be working on.
A trajectory-wise convergence result for each fixed control $u$ is then derived
in Sect.~\ref{Sect_trajectory_convergence}. As mentioned earlier, it relies
essentially on the theory of $C_0$-semigroups and the Trotter-Kato theorem
\cite[Thm.~4.5, p.88]{Pazy83}; see Lemma~\ref{Lem:local_in_u_conv}.
In a second step, we derive a ``local-in-$u$'' approximation result in
Sect.~\ref{Sect_local_convergence} for controls that lie within a neighborhood
of a given control $u$; see Lemma \ref{Lem_local_in_u_est}.
As discussed above, a key approximation property about the residual energy
 of solutions (see \eqref{Est_local_uniformity_highmodes}) is then amended into
an assumption (see Assumption (A7))
to ensure a uniform-in-$u$ convergence result; see Theorem \ref{Lem:uniform_in_u_conv}
 of Sect.~\ref{Sect_uniform_convergence}. As shown in Sect.~\ref{Sec_cve}, this
uniform convergence result helps us derive --in the spirit of dynamic programming
(see Corollary \ref{Lem:uniform_conv_locally_Lip_t_v2})-- the convergence of
the value functions associated with optimal control problems based on Galerkin
approximations; see Theorem~\ref{Thm_cve_Galerkin_val}. For this purpose,
 some standard sufficient conditions for the existence of optimal controls
are also recalled in Appendix~\ref{Sec_existence_opt_contr}. Simple and useful
error estimates about the value function and the optimal control are then
provided in Sect.~\ref{Sec_Err_estimates}. In Sect.~\ref{Sect_examples} we point
out a broad class of evolution equations for which Assumption (A7) is satisfied.

As applications of the theoretical results derived in Sect.~\ref{Sect_Galerkin},
we show in Sect.~\ref{Sec_appl} that our framework allows to provide
rigorous Galerkin approximations to the optimal control of  a broad class of
semilinear heat problems, posed on a compact (smooth) manifold without boundary.
 As a concrete example, the framework is shown to apply to geoengineering and
the mitigation of greenhouse gas (GHG) emissions formulated for the first
time here in terms of optimal control of energy balance models (EBMs) arising
in climate modeling; see \cite{Budyko69,Sellers69,Ghil76,North_al81} for an
 introduction on EBMs, and \cite{Diaz98,bermejo2009mathematical} for a mathematical
 analysis.   After recalling some fundamentals of differential geometry in
 Sect.~\ref{Sect_diff_geo_prelim} to prepare the analysis, a general convergence
result of Galerkin approximations to controlled semilinear heat problems posed
on an $n$-dimensional sphere $\mathbb{S}^n$ is formulated in
Sect.~\ref{Sec_optctr_man}; see Corollary~\ref{Cor:heat_Galerkin_approx}.
The application to the optimal control of EBMs is then presented in
Sect.~\ref{Sec_EBM} in the context of geoengineering and GHG emissions
for which approximation of the value function and error estimates about
the optimal control are obtained. Finally,
Sect.~\ref{Sect_concluding_remarks} outlines several possible directions
for future research the framework introduced in this article opens up.

\section{Galerkin approximations for optimal control problems: Convergence results}  \label{Sect_Galerkin}

We present in this section, rigorous convergence results for semi-discretization
of optimal control problems based on Galerkin approximations.
In particular, we derive the pointwise convergence of the value functions
associated with optimal control problems based on Galerkin approximations
in Sect.~\ref{Sec_cve}.


\subsection{Preliminaries} \label{Sec_Galerkin_prelim}
We consider in this article finite-dimensional approximations of the following
initial-value problem (IVP):
\begin{equation} \label{ODE}
\begin{gathered}
\frac{\mathrm{d} y}{\mathrm{d} t} = L y + F(y) + \mathfrak{C} (u(t)),  \quad t \in (0, T],\\
y(0) = x,
\end{gathered}
\end{equation}
where $x$ lies in $\mathcal{H}$, and $\mathcal{H}$ denotes a separable Hilbert space.
 The time-dependent forcing $u$ lives in a separable Hilbert space $V$
(possibly different from $\mathcal{H}$); the (possibly nonlinear) mapping
$\mathfrak{C}: V \to \mathcal{H}$ is assumed to be such that $\mathfrak{C}(0)=0$.
Other assumptions regarding $\mathfrak{C}$ will be made precise when needed.

We assume that the linear operator $L: D(L) \subset \mathcal{H} \to \mathcal{H}$ is the
 infinitesimal  generator of a
$C_0$-semigroup of bounded linear operators $T(t)$ on $\mathcal{H}$.
Recall that in this case the domain $D(L)$ of $L$ is dense in $\mathcal{H}$
and that $L$ is a closed operator;  see \cite[Cor.~2.5, p.~5]{Pazy83}.

Under the above assumptions on the operator $L$, recall that there exists
$M\geq 1$ and $\omega \geq 0$  \cite[Thm.~2.2, p.~4]{Pazy83} such that
\begin{equation} \label{Eq_control_T_t}
\|T(t)\| \le M e^{\omega t},  \quad t \ge 0,
\end{equation}
where $\|\cdot \|$ denotes the operator norm subordinated to $\|\cdot\|_{\mathcal{H}}$.

For the moment, we take the set of admissible controls to be
\begin{equation} \label{Eq_admissible_set_LpV}
 \mathcal{U} := L^q(0, T; V),
\end{equation}
with $q\geq1$. In the later subsections, further assumptions on the
admissible controls will be specified when needed.


Let $u$ be in $\mathcal{U}$  given by \eqref{Eq_admissible_set_LpV}, a
 {\it mild solution} to \eqref{ODE} over $[0,T]$ is a function $y$ in
$C([0,T],\mathcal{H})$ such that
\begin{equation} \label{Eq_mild}
y(t)=T(t)x + \int_0^t T(t-s) F(y(s)) \mathrm{d} s + \int_0^t T(t-s)
\mathfrak{C}(u(s)) \mathrm{d} s, \quad t\in [0,T].
\end{equation}
In what follows we will often denote by $t\mapsto y(t;x,u)$ a mild solution
to \eqref{ODE}.


Let $\{\mathcal{H}_N: N \in \mathbb{Z}_+^\ast\}$ be a sequence of finite-dimensional
subspaces of $\mathcal{H}$ associated with {\it orthogonal  projectors}
\begin{equation}
\Pi_N: \mathcal{H} \to \mathcal{H}_N,
\end{equation}
such that
\begin{equation} \label{Eq_identity_approx}
\|(\Pi_N-\operatorname{Id}) x\| \underset{N \to \infty}\longrightarrow 0, \quad
\forall x \in \mathcal{H},
\end{equation}
and
\begin{equation} \label{Eq_XN_in_domain}
\mathcal{H}_N\subset D(L), \quad \forall  N\geq 1.
\end{equation}

The corresponding Galerkin approximation of \eqref{ODE} associated with $\mathcal{H}_N$
 is then given by:
\begin{equation} \label{ODE_Galerkin}
\begin{gathered}
\frac{\mathrm{d} y_N}{\mathrm{d} t} = L_N y_N + \Pi_N F(y_N) + \Pi_N \mathfrak{C} (u(t)), \quad
 t\in [0,T],\\
y_N(0) = \Pi_N x, \quad  x\in \mathcal{H},
\end{gathered}
\end{equation}
where
\begin{equation} \label{Def_LN}
L_N := \Pi_N L \Pi_N : \mathcal{H} \to \mathcal{H}_N.
\end{equation}
In particular, the domain
$D(L_N)$ of $L_N$ is $\mathcal{H}$, because of \eqref{Eq_XN_in_domain}.

Throughout this section,  we assume the following set of assumptions:
\begin{itemize}

\item[(A0)]  The linear operator $L: D(L) \subset \mathcal{H} \to \mathcal{H}$ is the
infinitesimal  generator of a
$C_0$-semigroup of bounded linear operators $T(t)$ on $\mathcal{H}$.

\item[(A1)]   For each positive integer $N$, the linear flow
$e^{L_N t}:\mathcal{H}_N \to \mathcal{H}_N$ extends to a $C_0$-semigroup $T_N(t)$ on
$\mathcal{H}$. Furthermore the following uniform bound is satisfied by the family
$\{T_N(t)\}_{N \geq 1, t\geq0}$
\begin{equation} \label{Eq_control_linearflow}
\|T_N(t)\| \le M e^{\omega t}, \quad N \geq 1,  \quad t \ge 0,
\end{equation}
where $\|T_N(t)\|:=\sup\{\|T_N(t)x\|_{\mathcal{H}}, \; \|x\|_{\mathcal{H}} \leq 1, x\in \mathcal{H}\}$
and the constants $M$ and $\omega$ are the same as given in
\eqref{Eq_control_T_t}.

\item[(A2)]
 The following convergence holds
\begin{equation} \label{Eq_L_Approx}
\lim_{N \to \infty} \|L_N  \phi - L \phi \|_{\mathcal{H}} = 0, \quad \forall \phi \in D(L).
\end{equation}

\item[(A3)]  The nonlinearity $F$ is locally Lipschitz in the sense given
in \eqref{Local_Lip_cond} below.

\end{itemize}


Following the presentation commonly  adopted for the Trotter-Kato approach,
the assumptions (A0)--(A2) are concerned with the linear parts of the original
system \eqref{ODE} and of its Galerkin approximation \eqref{ODE_Galerkin}.
Assumption (A3) is concerned with the nonlinearity in \eqref{ODE}.
Other assumptions regarding the latter will be made in the sequel.
Throughout this article, a mapping $f: \mathcal{W}_1 \to \mathcal{W}_2$
between two Banach spaces, $\mathcal{W}_1$ and $\mathcal{W}_2$, is said to
 be locally Lipschitz if for any ball $\mathfrak{B}_r \subset \mathcal{W}_1$
with radius $r>0$ centered at the origin,  there exists a constant
$\operatorname{Lip}(f\vert{_{\mathfrak{B}_r}})>0$ such that
\begin{equation} \label{Local_Lip_cond}
\|f(y_1) - f(y_2)\|_{\mathcal{W}_2}
\le \operatorname{Lip}(f\vert{_{\mathfrak{B}_r}})\|y_1 - y_2\|_{\mathcal{W}_1},
\quad \forall y_1, y_2 \in \mathfrak{B}_r.
\end{equation}


\subsection{Convergence of Galerkin approximations: Trajectory-wise result}
 \label{Sect_trajectory_convergence}

As a preparation for the main result given in Sect.~\ref{Sec_cve}, we derive
hereafter a trajectory-wise convergence result for the solutions to the
 Galerkin approximations \eqref{ODE_Galerkin}; see
Lemma~\ref{Lem:local_in_u_conv} below.

With this purpose in mind, besides (A0)--(A3), we will also make use of the
following assumption.
\begin{itemize}
\item[(A4)]  For each $T>0$, $x$ in $\mathcal{H}$ and each $u$ in $\mathcal{U}$ with
$\mathcal{U}$ defined in \eqref{Eq_admissible_set_LpV}, the problem
\eqref{ODE} admits a unique mild solution $y(\cdot; x, u)$ in $C([0,T],\mathcal{H})$,
and its Galerkin approximation \eqref{ODE_Galerkin} admits a unique solution
$y_N(\cdot; \Pi_N x, u)$ in  $C([0,T],\mathcal{H}_N)$ for each $N$ in $\mathbb{Z}_+^\ast$.
 Moreover, there exists a constant $C:=C(T,x,u)$ such that
\begin{equation} \label{Eq_y_local-in-u_bounds}
 \|y_N(t; \Pi_N x, u)\|_{\mathcal{H}} \le C, \quad \forall t\in[0,T],\;
 N \in \mathbb{Z}_+^\ast.
\end{equation}
\end{itemize}

Note that in applications, (A4) is typically satisfied via {\it a priori}
estimates; see Remark~\ref{Rmk:unif_bdd_on_soln}-(ii) below.

\begin{lemma} \label{Lem:local_in_u_conv}
Let $\mathcal{U}$ be the set of admissible controls given by
\eqref{Eq_admissible_set_LpV}, with $q$ defined therein.
Consider the IVP \eqref{ODE} and the associated Galerkin approximation
\eqref{ODE_Galerkin}.  Assume that the nonlinear operator $\mathfrak{C}:V\to \mathcal{H}$
satisfies, for  $1\leq p \leq q$, the following growth condition,
\begin{equation} \label{Eq_poly_growth_C}
\|\mathfrak{C} (w)\|_{\mathcal{H}} \le \gamma_1 \|w\|^p_V + \gamma_2, \quad \forall w \in V,
\end{equation}
where $\gamma_1 > 0$ and $\gamma_2 \ge 0$.

Assume also that {\rm (A0)--(A4)} hold. Then for each fixed $T > 0$, $x$
in ${\mathcal{H}}$ and $u$ in $\mathcal{U}$, the following convergence result
is satisfied:
\begin{equation} \label{local_in_u_conv_Goal}
\lim_{N\to \infty}  \sup_{t \in [0, T]} \|y_N(t; \Pi_N x, u) - y(t; x,u)\|_{\mathcal{H}} = 0.
\end{equation}
\end{lemma}


\begin{proof}
To simplify the notations, only the $x$-dependency that matters to the estimates
derived hereafter will be made explicit.
Let $u$ be given in $\mathcal{U}$ and $x$ in $\mathcal{H}$, then by the variation-of-constants
formula applied to \eqref{ODE_Galerkin} we have, for $0\leq t\leq T$ and $N$
in $\mathbb{Z}_+^\ast$, that
\begin{equation} \label{Eq_Galerkin_VCF}
\begin{aligned}
y_N(t; u) &= e^{L_N t} \Pi_N x  + \int_0^t e^{L_N (t -s )} \Pi_N F(y_N(s; u)) \mathrm{d} s \\
& \quad + \int_0^t e^{L_N (t -s )} \Pi_N \mathfrak{C} (u(s)) \mathrm{d} s.
\end{aligned}
\end{equation}


Then, it follows from \eqref{Eq_mild} and \eqref{Eq_Galerkin_VCF} that the
 difference
\[
w_N(t; u):=y(t; u)  - y_N(t; u),
\]
satisfies
\begin{equation}
\begin{aligned}
w_N(t; u)
&=  T(t) x - e^{L_N t} \Pi_N x  \\
&\quad + \int_0^t T(t-s)F(y(s; u)) \mathrm{d} s -
\int_0^t e^{L_N (t -s )} \Pi_N F(y_N(s; u)) \mathrm{d} s  \\
& \quad  +  \int_0^t T(t-s)\mathfrak{C} (u(s)) \mathrm{d} s
- \int_0^t e^{L_N (t -s )} \Pi_N \mathfrak{C} (u(s)) \mathrm{d} s
\end{aligned}
\end{equation}
and hence, we have
\begin{equation}
\begin{aligned}
w_N(t; u)
&=  T(t) x - e^{L_N t} \Pi_N x +
\int_0^t \big( T(t-s) -  e^{L_N (t -s )} \Pi_N  \big)  F(y(s; u)) \mathrm{d} s  \\
& \quad +  \int_0^t e^{L_N (t -s )} \Pi_N \big(F(y(s; u)) - F(y_N(s; u)) \big ) \mathrm{d} s \\
& \quad + \int_0^t \Big( T(t-s) - e^{L_N (t -s )} \Pi_N \Big)
 \mathfrak{C} (u(s)) \mathrm{d} s.
\end{aligned} \label{eq:residual}
\end{equation}

Let us introduce for every $s$ in $[0, T]$, $x$ in $\mathcal{H}$, and $u$ in $\mathcal{U}$,
\begin{subequations}\label{eq:symbols_residual}
\begin{gather}
 r_N(s; u)  := \|y(s; u)  - y_N(s; u) \|_{\mathcal{H}},   \label{totoa} \\
\zeta_N(x)  := \sup_{t\in[0, T]} \|T(t) x - e^{L_N t} \Pi_N x\|_{\mathcal{H}},   \label{totob}\\
 d_N(s; u)  := \sup_{t\in[s, T]} \| \big( T(t-s)
 -  e^{L_N (t -s )} \Pi_N \big) F(y(s; u)) \|_{\mathcal{H}}, \label{totoc}
\end{gather}
 \end{subequations}
and for almost every $s$ in $[0, T]$,
\begin{equation} \label{totod}
\widetilde{d}_N (s; u) := \sup_{t\in[s, T]} \| \big( T(t-s)
-  e^{L_N (t -s )} \Pi_N \big) \mathfrak{C}(u(s)) \|_{\mathcal{H}}.
\end{equation}

For $x$ is in $\mathcal{H}$ and $u$ in $\mathcal{U}$, let us denote by $\mathfrak{B}$
the closed ball in $\mathcal{H}$ with radius $C$ centered at the origin where $C$
is the upper bound in estimate \eqref{Eq_y_local-in-u_bounds} for the Galerkin
solutions (Assumption (A4)).

Since by assumption, $t\mapsto y(t; x, u)$ lies in $ C([0,T],\mathcal{H})$ for any
 $x$ in $\mathcal{H}$ and $u$ in $\mathcal{U}$ given by \eqref{Eq_admissible_set_LpV},
one can assume without loss of generality that $y(t; x, u)$ stays in
$\mathfrak{B}$ for all $t$ in $[0,T]$, by possibly redefining $C$.


We obtain  then  from \eqref{eq:residual} that
\begin{equation} \label{eq:residual2}
\begin{aligned}
 r_N(t; u)
& \le \zeta_N(x) + \int_0^t \|e^{L_N (t -s )} \Pi_N \big(F(y(s; u)) -F(y_N(s; u))
 \big )\|_{\mathcal{H}} \mathrm{d} s \\
& \quad +  \int_0^t d_N(s; u) \mathrm{d} s +\int_0^t  \widetilde{d}_N(s; u) \mathrm{d} s\\
& \le \zeta_N(x) + \int_0^t d_N(s; u) \mathrm{d} s + M \text{Lip}(F\vert{_\mathfrak{B}})
  \int_0^t e^{\omega (t -s )}  r_N(s; u) \mathrm{d} s \\
& \quad +   \int_0^t  \widetilde{d}_N(s; u) \mathrm{d} s\\
& \le \zeta_N(x) + \int_0^t d_N(s; u) \mathrm{d} s
 + M\text{Lip}(F\vert{_\mathfrak{B}})  \, e^{\omega T} \int_0^t  r_N(s; u) \mathrm{d} s  \\
 & \quad +   \int_0^t  \widetilde{d}_N(s; u) \mathrm{d} s,
\end{aligned}
\end{equation}
where we have used that $F$  is locally Lipschitz (Assumption (A3)) and the
uniform bound  \eqref{Eq_control_linearflow}  of  Assumption~(A1).

It follows then from Gronwall's inequality that for all $t$ in $[0,T]$,
\begin{equation} \label{eq_rn_gronwall}
\begin{aligned}
r_N(t; u) &\le \Big(\zeta_N(x)  +  \int_0^T   d_N(s; u) \mathrm{d} s
 +  \int_0^T   \widetilde{d}_N(s; u) \mathrm{d} s\Big) \\
&\quad\times \exp\big(M \text{Lip}(F\vert{_\mathfrak{B}}) e^{\omega T} T \big).
\end{aligned}
\end{equation}

We are thus left with the estimation of $\zeta_N(x)$,  $\int_0^T d_N(s; u) \mathrm{d} s$
and $\int_0^T  \widetilde{d}_N(s; u) \mathrm{d} s$ as $N \to \infty$. Note that the
assumptions (A1) and (A2) allow us to use a version of the Trotter-Kato
theorem \cite[Thm.~4.5, p.88]{Pazy83} which implies
together with \eqref{Eq_identity_approx} that
\begin{equation} \label{eq:linear_pointwise_convergence}
\lim_{N\to \infty} e^{L_N t} \Pi_N \phi  = T(t) \phi, \quad \forall \phi \in \mathcal{H},
\end{equation}
uniformly in $t$ lying in bounded intervals; see also \cite[footnote 6]{CGLW15}.

It follows that
\begin{equation} \label{eq:est_initial}
\lim_{N\to \infty} \zeta_N(x)=0,
\end{equation}
and that $d_N(\cdot; u)$ and $\widetilde{d}_N(\cdot; u)$ converge point-wisely
to zero on $[0,T]$, i.e.,
\begin{equation} \label{eq:dn_pointwise_convergence}
\lim_{N\to \infty} d_N(s; u)  = 0, \quad \forall s \in [0,T],
\end{equation}
and
\begin{equation} \label{eq:tilde_dn_pointwise_convergence}
\lim_{N\to \infty} \widetilde{d}_N(s; u)  = 0,  \textrm{ for a.e. } s \in [0,T].
\end{equation}

On the other hand, by using \eqref{Eq_control_T_t} and \eqref{Eq_control_linearflow}
and from the local Lipschitz assumption on $F$, we obtain for $0\le s \le t \le T$,
\begin{equation}
\begin{aligned}
&\| \big( T(t-s) -  e^{L_N (t -s )}  \Pi_N \big) F(y(s; u)) \|_{\mathcal{H}} \\
& \le 2Me^{\omega (t-s)}\|F(y(s; u)) \|_{\mathcal{H}} \\
& \le 2Me^{\omega (t-s)}\Big(\|F(y(s; u)) - F(0) \|_{\mathcal{H}} +\|F(0) \|_{\mathcal{H}} \Big) \\
& \le 2Me^{\omega (t-s)} \big(\text{Lip}(F\vert{_\mathfrak{B}})
 \, \|y(s; u) \|_{\mathcal{H}}  + \|F(0)\|_{\mathcal{H}}\big),
\end{aligned}
\end{equation}
which implies
\begin{equation} \label{eq:dn_dominated}
d_N(s,u) \le 2Me^{\omega T} \big(\text{Lip}(F\vert{_\mathfrak{B}})  \,
\|y(s; u) \|_{\mathcal{H}}  + \|F(0)\|_{\mathcal{H}}\big), \quad \forall s \in [0,T].
\end{equation}
Since $y(\cdot; u)$  lies in $C([0,T]; \mathcal{H})$, the mapping
$s\mapsto \|y(s,u)\|_{\mathcal{H}}$ is in particular integrable on $[0,T]$, and
the Lebesgue dominated convergence theorem allows us to conclude from
\eqref{eq:dn_pointwise_convergence} and \eqref{eq:dn_dominated} that
\begin{equation} \label{eq:est_dn_vf}
\lim_{N\to \infty} \int_0^T d_N(s; u) \mathrm{d} s  =0.
\end{equation}

Let us estimate  $\int_0^T \widetilde{d}_N(s; u) \mathrm{d} s$ as $N \to \infty$.
By using the growth condition \eqref{Eq_poly_growth_C}, we obtain for a.e.
$s \in [0, T]$ and all $t \in [s, T]$
\begin{equation} \label{eq:tilde_dn_dominated}
\| \big( T(t-s) -  e^{L_N (t -s )} \Pi_N \big) \mathfrak{C}(u(s)) \|_{\mathcal{H}}
\le 2 M e^{\omega T} \Big(\gamma_1 \|u(s)\|^p_V + \gamma_2\Big).
\end{equation}
Since $u$ lies in $L^q([0,T];V)$ with $q\geq p$, then $u$ lies in $L^p([0,T];V)$
and  the right hand side (RHS) of \eqref{eq:tilde_dn_dominated} is integrable
on $[0,T]$. The Lebesgue dominated  convergence theorem allows us then to
conclude from \eqref{eq:tilde_dn_pointwise_convergence} and
\eqref{eq:tilde_dn_dominated} that
\begin{equation} \label{eq:est_tilde_dn_vf}
\lim_{N\to \infty}  \int_0^T \widetilde{d}_N(s; u)  \mathrm{d} s  =0.
\end{equation}
The desired convergence result \eqref{local_in_u_conv_Goal} follows
now from \eqref{eq_rn_gronwall} by using \eqref{eq:est_initial},
\eqref{eq:est_dn_vf} and \eqref{eq:est_tilde_dn_vf}.
\end{proof}

\subsection{Local-in-$u$ approximation result} \label{Sect_local_convergence}

In this section, we consider for $q\geq 1$, $\mathcal{U}_{ad}$, to be the subset
of $L^q(0,T; V)$, constituted by measurable functions that
take values in  $U$, a bounded subset of the Hilbert space $V$.
In other words,
\begin{equation} \label{Eq_U_bounded}
\mathcal{U}_{ad}:=\{f\in L^q(0,T; V): f(s) \in U \text{ for a.e. } s \in [0,T]\},
\;q\geq 1.
\end{equation}
The set $\mathcal{U}_{ad}$ will be endowed with the induced topology from that
of $L^q(0,T; V)$.

We present hereafter a natural property that is derived from our working assumptions,
 namely that given an finite-dimensional approximation $\mathcal{H}_N$ of $\mathcal{H}$, the
residual energy of solutions to the IVP \eqref{ODE}, i.e.
\[
\|(\operatorname{Id}_{\mathcal{H}} - \Pi_N) y(t;x,w)\|_{\mathcal{H}},
\]
 can be made arbitrarily small as $N\to \infty$ and uniformly in $w$,
provided that $w$ lies within a sufficiently small open set of
$\mathcal{U}_{ad}$ given in \eqref{Eq_U_bounded}.


This is the purpose of Lemma \ref{Lem_A7_local_verion} which boils down
to proving the continuity of the mapping $u\mapsto y(t;x,u)$;
see \eqref{local_uniformity_highmodes_est1} below. As a consequence a
local-in-$u$ approximation result is naturally inferred; see
Lemma \ref{Lem_local_in_u_est}. However, as pointed out and amended in
 Sect.~\ref{Sect_uniform_convergence} below, this is insufficient to
guarantee convergence results for the value functions associated with
Galerkin approximations of optimal control problems subordinated to \eqref{ODE}.

The merit of Lemma \ref{Lem_A7_local_verion} below is nevertheless not only
to identify a symptom, but also to help us propose a cure.
Indeed, by requiring the residual energy of the solution to the IVP \eqref{ODE}
to vanish uniformly (in $u$) as $N\to \infty$, we are able to conclude about
 the desired convergence results for the value functions. The latter uniform
property (i.e.~the ``cure'') is shown below to hold for a broad class of
 IVPs; see Sect.~\ref{Sect_examples}.  For the moment, let us present the
``symptom,'' i.e.~the local-in-$u$ approximation results.  For that purpose,
we start with a local-in-$u$  estimate about the residual energy,
 \[
 \|(\operatorname{Id}_{\mathcal{H}} - \Pi_N) y(t;x,w)\|_{\mathcal{H}},
\]
where $w$ lives in some neighborhood of $u$.

\begin{lemma} \label{Lem_A7_local_verion}
Assume that {\rm (A0)--(A4)} hold. Assume furthermore that
$\mathfrak{C}:V\to \mathcal{H}$ is locally Lipschitz  and that the admissible controls
lie in $\mathcal{U}_{ad}$ given by \eqref{Eq_U_bounded} and endowed with the
induced $ L^q(0,T; V)$-topology, for $q > 1$.

Then, for any $(x,u)$ in $\mathcal{H} \times \mathcal{U}_{ad}$  and any $\epsilon>0$
there exists a neighborhood $\mathcal{O}_u \subset \mathcal{U}_{ad}$ of $u$
and $N_0\geq 1$ such that the mild solution $y(t;x,u)$ to \eqref{ODE}  satisfies
\begin{equation} \label{Est_local_uniformity_highmodes}
\sup_{w \in \mathcal{O}_u} \sup_{t\in[0,T]} \|(\operatorname{Id}_{\mathcal{H}} - \Pi_N)
y(t;x,w)\|_{\mathcal{H}} \le \epsilon, \quad \forall N \ge N_0.
\end{equation}
\end{lemma}

\begin{proof}

As we will see, we mainly need to show that the solution $y(t;x,u)$ to
\eqref{ODE} depends continuously on the control $u$ in $\mathcal{U}_{ad}$,
endowed with the $L^q(0,T; V)$-topology. The above estimate
\eqref{Est_local_uniformity_highmodes} follows then directly from this
continuous dependence as explained at the end of the proof.

Given $u$  in $\mathcal{U}_{ad}$ and $r > 0$, we denote by
$\mathfrak{B}_{\scriptscriptstyle\mathcal{U}_{ad}}(u,r)$ the closed ball
 centered at $u$ with radius $r$, for the induced $ L^q(0,T; V)$-topology
on $\mathcal{U}_{ad}$.   For any $w$ in
$\mathfrak{B}_{\scriptscriptstyle\mathcal{U}_{ad}}(u,r)$, $x$ in $\mathcal{H}$ and
$t$ in $[0,T]$, consider $\phi(t):=y(t;x, u)  - y(t;x,w)$ and note that $\phi(0)=0$.
It follows from \eqref{Eq_mild} that
\begin{equation}
\begin{aligned}
\phi(t) &=  \int_0^t T(t-s)\big(F(y(s;x,u)) - F(y(s;x,w)) \big)\mathrm{d} s \\
& \quad +  \int_0^t T(t-s) \big( \mathfrak{C} (u(s)) - \mathfrak{C} (w(s))\big) \mathrm{d} s.
\end{aligned}
\end{equation}
We have then
\begin{equation} \label{local_uniformity_highmodes_est0}
\begin{aligned}
\|\phi(t)\|_{\mathcal{H}}
& \leq \int_0^t M e^{\omega(t-s)} \|F(y(s;x,u)) - F(y(s;x,w))\|_{\mathcal{H}} \mathrm{d} s \\
& \quad + \int_0^t  M e^{\omega(t-s)} \|\mathfrak{C} (u(s))
- \mathfrak{C} (w(s))\|_{\mathcal{H}} \mathrm{d} s.
\end{aligned}
\end{equation}
Let $C>0$ be chosen such that $\|y(t;x,u)\|_{\mathcal{H}} \le C$ for all $t\in [0,T]$,
 and let  $w$ be in $\mathfrak{B}_{\mathcal{U}_{ad}}(u,r)$, we define then
\begin{equation} \label{Def_t*}
t^*:=\max\{t \in [0,T] : \|y(t;x,w)\|_{\mathcal{H}} < 2 C\}.
\end{equation}


First let us note that $t^\ast >0$. Indeed recalling that
$ \|y(t;x,u)\|_{\mathcal{H}} \le C$ by assumption, we have in particular that
$\|x\|_{\mathcal{H}} \le C$. Now due to the continuity for any $(x,w)$ in
$\mathcal{H} \times \mathcal{U}_{ad}$ of the mapping
$[0,T] \to \mathcal{H}$, $t\mapsto y(t;x,w)$,
(since $y(t;x,w)$ is a mild solution), we infer, since $\|x\|_{\mathcal{H}} \le C$,
for each $w$ in $\mathfrak{B}_{\scriptscriptstyle\mathcal{U}_{ad}}(u,r)$
the existence of $t'(w)>0$ such that
\[
\|y(t;x,w)\|_{\mathcal{H}} < 2 C,  \quad \forall t \in [0,t'(w)],
\]
and therefore $t^\ast >0$.

Denote also $\mathfrak{B}_{ \scriptscriptstyle\mathcal{H}} \subset \mathcal{H}$ the closed
 ball centered at the origin with radius $2C$.
Let $\mathfrak{B}_{\scriptscriptstyle V}$ be the smallest closed ball in $V$
containing the bounded set $U$.
By using the local Lipschitz property of $F$ and $\mathfrak{C}$, we obtain
from \eqref{local_uniformity_highmodes_est0} that
\begin{equation}
\begin{aligned}
\|\phi(t)\|_{\mathcal{H}}
& \le \int_0^t M e^{\omega(t-s)} \operatorname{Lip}
 (F\vert_{\mathfrak{B}_{\scriptscriptstyle \mathcal{H}}})\|\phi(s)\|_{\mathcal{H}} \mathrm{d} s \\
& \quad + \int_0^t  M e^{\omega(t-s)} \operatorname{Lip}(\mathfrak{C}
 \vert_{\mathfrak{B}_{\scriptscriptstyle V}}) \|u(s) - w(s)\|_{V} \mathrm{d} s \\
& \le M\operatorname{Lip}(F\vert_{\mathfrak{B}_\mathcal{H}}) \int_0^t e^{\omega(t-s)}
  \|\phi(s)\|_{\mathcal{H}} \mathrm{d} s \\
& \quad + e^{\omega t^*} M \operatorname{Lip}(\mathfrak{C}\vert_{\mathfrak{B}_V})
\int_0^t  \|u(s) - w(s)\|_{V} \mathrm{d} s,  \quad \forall t \in [0, t^*].
\end{aligned}
\end{equation}
By H\"older's inequality, we have
\begin{equation}
\int_0^t  \|u(s) - w(s)\|_{V} \mathrm{d} s
\le t^{\frac{p-1}{p}}\|u-w\|_{L^p(0,T;V)}
\le t^{\frac{p-1}{p}} r,
\end{equation}
which leads to
\begin{equation}
\begin{aligned}
\|\phi(t)\|_{\mathcal{H}}
& \le M\operatorname{Lip}(F\vert_{\mathfrak{B}_{\scriptscriptstyle \mathcal{H}}})
  \int_0^t e^{\omega(t-s)} \|\phi(s)\|_{\mathcal{H}} \mathrm{d} s\\
& \quad  + (t^*)^{\frac{p-1}{p}} r e^{\omega t^*} M\operatorname{Lip}(\mathfrak{C}
 \vert_{\mathfrak{B}_{\scriptscriptstyle V}}),  \quad \forall t \in [0, t^*].
\end{aligned}
\end{equation}

It follows then from Gronwall's inequality that
\begin{equation} \label{local_uniformity_highmodes_est0_b}
\begin{aligned}
\|\phi(t)\|_{\mathcal{H}}
& \le  (t^*)^{\frac{p-1}{p}} r M \operatorname{Lip}
 (\mathfrak{C}\vert_{\mathfrak{B}_V}) \exp{(2 \omega t^\ast
 + t^\ast M\operatorname{Lip}(F\vert_{\mathfrak{B}_\mathcal{H}}))}\\
& \le  T^{\frac{p-1}{p}} r M \operatorname{Lip}(\mathfrak{C}
 \vert_{\mathfrak{B}_V})\exp{(2 \omega T
 + T M\operatorname{Lip}(F\vert_{\mathfrak{B}_\mathcal{H}}))}\,, \quad \forall t \in  [0,t^*].
\end{aligned}
\end{equation}
Now, let $C_\ast:=T^{\frac{p-1}{p}}  M \operatorname{Lip}(\mathfrak{C}
\vert_{\mathfrak{B}_V})\exp{(2 \omega T
+ T M\operatorname{Lip}(F\vert_{\mathfrak{B}_\mathcal{H}}))}$ and
\[  %\label{local_uniformity_highmodes_est0_c}
r_1 := \frac{C}{2 C_\ast}.
\]
We claim that $t^* = T$ if $r \le r_1$. Otherwise, if $t^*< T$,
applying \eqref{local_uniformity_highmodes_est0_b} at $t=t^*$, we obtain
\begin{equation}
\|\phi(t^*)\|_{\mathcal{H}} \le \frac{C}{2},
\end{equation}
which leads then to
\begin{equation}
\|y(t^*;x,w)\|_{\mathcal{H}}  \le \|y(t^*;x,u)\|_{\mathcal{H}}
+ \|\phi(t^*)\|_{\mathcal{H}} \le \frac{3}{2}C.
\end{equation}
This last inequality contradicts with the definition of $t^*$ given by
\eqref{Def_t*}.

We obtain thus for each $r \in (0, r_1]$ that
\begin{equation} \label{local_uniformity_highmodes_est0_c}
\|\phi(t)\|_{\mathcal{H}} \le r C_\ast\; , \quad \forall t \in  [0,T].
\end{equation}
Now, it follows from \eqref{local_uniformity_highmodes_est0_c} that
for any fixed $\epsilon > 0$ there exists $r_\epsilon > 0$ sufficiently small
such that
\begin{equation}
\|\phi(t)\|_{\mathcal{H}} \le \frac{1}{2} \epsilon, \quad \forall t\in[0,T].
\end{equation}
Recalling the definition of $\phi$, we have thus proved that
\begin{equation} \label{local_uniformity_highmodes_est1}
\sup_{w\in \mathfrak{B}_{\scriptscriptstyle\mathcal{U}_{ad}}(u,r_\epsilon)}
 \sup_{t\in[0,T]}\|y(t;x,u) - y(t;x,w)\|_{\mathcal{H}} \le \frac{1}{2}\epsilon.
\end{equation}

We turn now to the last arguments needed to prove
 \eqref{Est_local_uniformity_highmodes}. It consists first to note that the
convergence property \eqref{Eq_identity_approx} and the continuity of
$t\mapsto y(t; x, u)$ imply, for the given $\epsilon > 0$, the existence of
a positive integer  $N_0$ for which
\begin{equation} \label{local_uniformity_highmodes_est2}
 \sup_{t\in[0,T]} \|(\operatorname{Id}_{\mathcal{H}} - \Pi_N) y(t;x,u)\|_{\mathcal{H}}
\le \frac{1}{2}\epsilon, \quad \forall N \ge N_0.
\end{equation}
Now by defining $\Pi_N^{\perp}:=\operatorname{Id}_{\mathcal{H}} - \Pi_N$, and noting that
\begin{equation}
\begin{aligned}
\|\Pi_N^{\perp} y(t;x,w)\|_{\mathcal{H}}
& \leq \|\Pi_N^{\perp} (y(t;x,w)-y(t;x,u))\|_{\mathcal{H}}
 +\|\Pi_N^{\perp} y(t;x,u)\|_{\mathcal{H}}\\
& \leq \|y(t;x,w)-y(t;x,u)\|_{\mathcal{H}} +\|\Pi_N^{\perp} y(t;x,u)\|_{\mathcal{H}},
\end{aligned}
\end{equation}
we conclude --from \eqref{local_uniformity_highmodes_est1}
and \eqref{local_uniformity_highmodes_est2}-- to the desired
estimate \eqref{Est_local_uniformity_highmodes} with $\mathcal{O}_u$ taken
 to be $\mathring{\mathfrak{B}}_{\mathcal{U}_{ad}}(u,r_{\epsilon})$, the open ball
in $\mathcal{U}_{ad}$ of radius $r_\epsilon$.
\end{proof}

We conclude this section with a local-in-$u$ approximation result.

\begin{lemma} \label{Lem_local_in_u_est}
Assume the assumptions of  Lemma~\ref{Lem_A7_local_verion} hold.
Then, for any $(x,u)$ in $\mathcal{H} \times \mathcal{U}_{ad}$  and any $\epsilon>0$
there exists a neighborhood $\mathcal{O}_u \subset \mathcal{U}_{ad}$ of $u$ and
$N_0\geq 1$ such that the mild solution $y(t;x,u)$ to \eqref{ODE}  satisfies
\begin{equation} \label{Eq_local_in_u_est_goal}
\sup_{w \in \mathcal{O}_u} \sup_{t\in[0,T]} \|y_N(t;\Pi_N x,w) - y(t;x,w)\|_{\mathcal{H}}
 \le \epsilon, \quad \forall N \ge N_0,
\end{equation}
where $y_N$ denotes the solution to the Galerkin approximation \eqref{ODE_Galerkin}.
\end{lemma}

\begin{proof}
First, let us remark that even if here $\mathfrak{C}$ does not satisfy the growth
condition \eqref{Eq_poly_growth_C}, one can still derive the trajectory-wise
convergence result \eqref{local_in_u_conv_Goal} by exploiting the fact that $u$
lies in $\mathcal{U}_{ad}$ and $\mathfrak{C}$ is locally Lipschitz.
The only change in the proof consists indeed of replacing (for a.e.
 $s \in [0, T]$ and all $t \in [s, T]$) the estimate
\eqref{eq:tilde_dn_dominated} by the following:
\begin{equation} \label{eq:tilde_dn_dominated_new}
\| \big( T(t-s) -  e^{L_N (t -s )} \Pi_N \big) \mathfrak{C}(u(s)) \|_{\mathcal{H}}
\le 2 M e^{\omega T} \operatorname{Lip}(\mathfrak{C}\vert_{\mathfrak{B}_V})
\|u(s)\|_V,
\end{equation}
where $\mathfrak{B}_{\scriptscriptstyle V}$ denotes the smallest closed ball
in $V$ containing the bounded set $U$. Since $u$ lies in $L^q([0,T];V)$,
then $u$ lies in $L^1([0,T];V)$ and  the RHS of \eqref{eq:tilde_dn_dominated_new}
is integrable on $[0,T]$. We can then, this time from
\eqref{eq:tilde_dn_dominated_new}, still use the Lebesgue dominated  convergence
theorem to have \eqref{eq:est_tilde_dn_vf} to hold, without thus assuming the
growth condition \eqref{Eq_poly_growth_C}.

We explain now how to derive \eqref{Eq_local_in_u_est_goal}  from
\eqref{local_in_u_conv_Goal}.
Recall that from \eqref{local_uniformity_highmodes_est1} derived  in the proof
of Lemma \ref{Lem_A7_local_verion}, the mild solutions to the IVP \eqref{ODE}
depend continuously on the control $u$ in $\mathcal{U}_{ad}$, endowed with
the $L^q([0,T];V)$-topology. An estimate similar to
\eqref{local_uniformity_highmodes_est1}  can be derived for the solutions to
 Galerkin approximation \eqref{ODE_Galerkin}, ensuring thus also their continuous
dependence on $u$.

As a consequence, for any given $\epsilon >0$ and $u$ in $\mathcal{U}_{ad}$,
there exists a neighborhood $\mathcal{O}_u \subset \mathcal{U}_{ad}$ containing
$u$ for which
\begin{equation}  \label{Eq_local_in_u_est1}
\begin{gathered}
 \sup_{w\in \mathcal{O}_u} \sup_{t\in[0,T]}\|y(t;x,u) - y(t;x,w)\|_{\mathcal{H}}
 \le \frac{1}{3}\epsilon, \\
 \sup_{w\in \mathcal{O}_u} \sup_{t\in[0,T]}\|y_N(t;\Pi_N x,u)
- y_N(t;\Pi_N x,w)\|_{\mathcal{H}}
\le \frac{1}{3}\epsilon, \quad \forall N \in \mathbb{Z}_+^\ast.
\end{gathered}
\end{equation}
On the other hand, the trajectory-wise convergence  \eqref{local_in_u_conv_Goal}
ensures the existence of a positive integer $N_0$, such that
\begin{equation} \label{Eq_local_in_u_est2}
\sup_{t \in [0, T]} \|y_N(t; \Pi_N x, u) - y(t; x,u)\|_{\mathcal{H}}
\le \frac{1}{3}\epsilon, \quad \forall N \ge N_0.
\end{equation}
Since
\begin{equation}
\begin{aligned}
&\|y_N(t;\Pi_N x,w) - y(t;x,w)\|_{\mathcal{H}} \\
& \le \|y_N(t;\Pi_N x,w) - y_N(t;\Pi_N x,u)\|_{\mathcal{H}}
 + \|y_N(t;\Pi_N x,u) - y(t; x,u)\|_{\mathcal{H}} \\
& \quad  + \|y(t;x,u) - y(t;x,w)\|_{\mathcal{H}},
\end{aligned}
\end{equation}
the desired estimate \eqref{Eq_local_in_u_est_goal} follows
from \eqref{Eq_local_in_u_est1} and \eqref{Eq_local_in_u_est2}.
\end{proof}

\subsection{Convergence of Galerkin approximations: Uniform-in-$u$ result}
\label{Sect_uniform_convergence}

In the previous section, the local-in-$u$ approximation result has been derived
under a boundedness assumption on $U$ arising
in the definition of $\mathcal{U}_{ad}$. Here, compactness  will substitute
the boundedness to derive  convergence results that are uniform in $u$.
More precisely, we will assume for that purpose
\begin{itemize}
\item[(A5)]  The set of admissible controls $\mathcal{U}_{ad}$ is given
by \eqref{Eq_U_bounded} with
$U$ being a compact subset of the Hilbert space~$V$.
\end{itemize}
We will make also use of the following assumptions.
\begin{itemize}
\item[(A6)]  Let $\mathcal{U}_{ad}$ be given by  \eqref{Eq_U_bounded}.
 For each $T>0$, $(x,u)$ in $\mathcal{H} \times \mathcal{U}_{ad}$, the
problem \eqref{ODE} admits a unique mild solution $y(\cdot; x, u)$
in $C([0,T],\mathcal{H})$, and for each $N\geq 1$, its Galerkin approximation
\eqref{ODE_Galerkin} admits a unique solution $y_N(\cdot; \Pi_N x, u)$
in $C([0,T],\mathcal{H})$. Moreover, there exists a constant $\mathcal{C}:=\mathcal{C}(T,x)$
 such that
\begin{equation} \label{Eq_y_uniform-in-u_bounds}
\begin{gathered}
 \|y(t; x, u)\|_{\mathcal{H}} \le \mathcal{C}, \quad \forall t\in[0,T],
\; u \in  \mathcal{U}_{ad}, \\
 \|y_N(t; \Pi_N x, u)\|_{\mathcal{H}} \le \mathcal{C}, \quad \forall t\in[0,T],\;
N \in \mathbb{Z}_+^\ast, \; u \in  \mathcal{U}_{ad}.
\end{gathered}
\end{equation}

\item[(A7)]   Let $\mathcal{U}_{ad}$ be given by  \eqref{Eq_U_bounded}.
For each fixed $T > 0$, and any mild solution $y(\cdot;x,u)$ to \eqref{ODE}
with  $(x,u)$ in $\mathcal{H} \times \mathcal{U}_{ad}$, it holds that
\begin{equation} \label{Est_uniformity_highmodes}
\lim_{N \to \infty}  \sup_{u\in \mathcal{U}_{ad}} \sup_{t\in[0,T]}
\|(\operatorname{Id}_{\mathcal{H}} - \Pi_N) y(t;x,u)\|_{\mathcal{H}} =0.
\end{equation}
\end{itemize}



\begin{remark} \label{Rmk:unif_bdd_on_soln} \rm
\begin{itemize}
\item[(i)]  Note that (A6) differs from (A4) by the inequality
$\|y(t; x, u)\|_{\mathcal{H}}\leq \mathcal{C}$, and that
  the constant in \eqref{Eq_y_uniform-in-u_bounds}  is independent of the control $u$.
\item[(ii)]  Let $u$ be in $\mathcal{U}_{ad}$  given by  \eqref{Eq_U_bounded}.
Then uniform bounds such as in \eqref{Eq_y_uniform-in-u_bounds} are guaranteed
if e.g.~an {\it a priori} estimate of the following type holds for IVPs \eqref{ODE}
and \eqref{ODE_Galerkin}:
\begin{equation}
\sup_{t \in [0,T]} \| y(t;x,u)\|_{\mathcal{H}}
\leq \alpha ( \| x\|_{\mathcal{H}}+ \|u\|_{L^{q}(0,T;V)}) +\beta,\quad \alpha >0, \;
 \beta\geq 0.
\end{equation}
See e.g.~\cite{Cazenave_al98,Tem97} for such a priori bounds for nonlinear partial
 differential equations.
Such bounds can also be derived for nonlinear systems of delay differential
equations (DDEs); see in that respect the proofs of
\cite[Estimates (4.75)]{CGLW15} and \cite[Corollary 4.3]{CGLW15} which can be
adapted to the case of controlled DDEs.


\item[(iii)] We refer to Sect.~\ref{Sect_examples} below for a broad class
of IVPs for which Assumption (A7) holds.
\end{itemize}
\end{remark}


As a preparatory lemma to Theorem \ref{Lem:uniform_in_u_conv}, we first prove
that given $x$ in $\mathcal{H}$,
\[
(\operatorname{Id}_{\mathcal{H}} - \Pi_N) F(y(t;x,u)) \underset{N\to \infty}
\longrightarrow 0,
\]
 uniformly in $u$ lying in $\mathcal{U}_{ad}$ and $t$ in $[0,T]$. For that
only assumptions (A3), (A6) and (A7) are used, and $U$ involved in the
definition \eqref{Eq_U_bounded} of $\mathcal{U}_{ad}$ is assumed to be bounded
(not necessarily compact).


\begin{lemma} \label{Lem:highmode_F_est}
Assume that {\rm (A3), (A6)} and {\rm (A7)} hold. Then
\begin{equation} \label{Eq_highmode_F_est}
\lim_{N\to \infty} \sup_{u\in \mathcal{U}_{ad}}
\sup_{t\in[0,T]} \|(\operatorname{Id}_{\mathcal{H}} - \Pi_N) F(y(t;x,u))\|_{\mathcal{H}} =0.
\end{equation}
\end{lemma}

\begin{proof}
For any given $\epsilon > 0$, by (A7), there exists $N_0$ in $\mathbb{Z}_+^\ast$
such that
\begin{equation} \label{Eq_unif_est_ys}
\sup_{u\in \mathcal{U}_{ad}} \sup_{t\in[0,T]} \|(\operatorname{Id}_{\mathcal{H}}
- \Pi_{N}) y(t;x,u)\|_{\mathcal{H}} \le \epsilon, \quad \forall N \ge N_0.
\end{equation}
Note also that for all $x$ in $\mathcal{H}$, and $u$ in $\mathcal{U}_{ad}$ given by
 \eqref{Eq_U_bounded},
 \begin{equation} \label{Eq_unif_est_F}
\begin{aligned}
&\|(\operatorname{Id}_{\mathcal{H}}   -  \Pi_N) F(y(t;x,u))\|_{\mathcal{H}}  \\
&  \le   \| (\operatorname{Id}_{\mathcal{H}}  -  \Pi_N) F(\Pi_{N_0}  y(t; x, u)) \|_{\mathcal{H}} \\
& \quad  +  \| (\operatorname{Id}_{\mathcal{H}}  -  \Pi_N) \big(F(y(t; x, u))
 -  F(\Pi_{N_0} y(t; x, u))\big) \|_{\mathcal{H}}.
\end{aligned}
\end{equation}
For the second term on the RHS, we have
\begin{align*}
& \| (\operatorname{Id}_{\mathcal{H}} - \Pi_N) \big(F(y(t; x, u))
 - F(\Pi_{N_0} y(t; x, u))\big) \|_{\mathcal{H}} \\
& \le \|F(y(t; x, u)) - F(\Pi_{N_0} y(t; x, u))\|_{\mathcal{H}} \\
& \le  \operatorname{Lip}(F\vert_{\mathfrak{B}})\| (\operatorname{Id}_{\mathcal{H}}
- \Pi_{N_0} ) y(t; x, u) \|_{\mathcal{H}}, \quad  \forall t\in [0,T], \;
u \in \mathcal{U}_{ad},
\end{align*}
where $\mathfrak{B}$ denotes the ball in $\mathcal{H}$ centered at the origin with
radius $ \mathcal{C}$ given by \eqref{Eq_y_uniform-in-u_bounds}.

It follows then from \eqref{Eq_unif_est_ys} that
\begin{equation} \label{Eq_unif_est_Fs}
\sup_{u\in \mathcal{U}_{ad}} \sup_{t\in[0,T]} \| (\operatorname{Id}_{\mathcal{H}}
- \Pi_N) \big(F(y(t; x, u)) - F(\Pi_{N_0} y(t; x, u))\big) \|_{\mathcal{H}}
\le \operatorname{Lip}(F\vert_{\mathfrak{B}}) \; \epsilon.
\end{equation}


Because of (A6), for each $x$ in $\mathcal{H}$,  $\Pi_{N_0} y(s; x, u)$ lies in a
uniformly (in $s$ and $u$) bounded subset  of $\mathcal{H}_{N_0} $. The finite
dimensionality of $\mathcal{H}_{N_0}$ (as a Galerkin subspace) ensures the compactness
of the set
\[
\mathcal{E}_x:=\overline{\{\Pi_{N_0} y(s; x, u), \; u \in \mathcal{U}_{ad}, \;
s\in [0, T]\}}^{\mathcal{H}}.
\]

For each $z$ in $\mathcal{E}_x$ and $\epsilon>0$, due to  \eqref{Eq_identity_approx}
 there exists an integer $N_1(z)$ such that
\[
\|  (\operatorname{Id}_{\mathcal{H}} - \Pi_N) F(z)\| \leq \frac{\epsilon}{2}, \quad
 \forall N \ge N_1(z).
\]
Since $F$ is continuous, there exists a neighborhood $\mathcal{N}_z$ of $z$
in $\mathcal{H}_{N_0}$ such that
\begin{equation} \label{eq_control_F}
\|  (\operatorname{Id}_{\mathcal{H}} - \Pi_N) F(w)\| \leq \epsilon, \quad
 \forall N \ge N_1(z), \; w \in \mathcal{N}_z.
\end{equation}
From the compactness of $\mathcal{E}_x$ we can extract a finite cover of
$\mathcal{E}_x$ by such neighborhoods $ \mathcal{N}_z$ for which
\eqref{eq_control_F} holds, and thus one can ensure the existence of an
integer $N_1$ for which
\begin{equation}
\sup_{z \in \mathcal{E}_x} \|  (\operatorname{Id}_{\mathcal{H}} - \Pi_N)   F(z) \|_{\mathcal{H}}
\le \epsilon, \quad \forall N \ge N_1.
\end{equation}
This last inequality ensures for each $x$ in $\mathcal{H}$, the existence of an integer
$N_1$ for which
\begin{equation} \label{Eq_unif_est_Fn}
\sup_{u \in  \mathcal{U}_{ad}} \sup_{t\in[0, T]} \|  (\operatorname{Id}_{\mathcal{H}}
- \Pi_N)   F(\Pi_{N_0} y(t;x, u)) \|_{\mathcal{H}} \le \epsilon, \quad \forall N \ge N_1.
\end{equation}
Then, \eqref{Eq_highmode_F_est} follows
from \eqref{Eq_unif_est_F}, \eqref{Eq_unif_est_Fs} and \eqref{Eq_unif_est_Fn}.
\end{proof}

We are now in a  position to formulate a uniform (in $u$) version of
Lemma~\ref{Lem:local_in_u_conv} in which the growth condition
\eqref{Eq_poly_growth_C} is no longer required.

\begin{theorem} \label{Lem:uniform_in_u_conv}
Assume that {\rm (A0)--(A3)} and {\rm (A5)--(A7)} hold. Assume also that
 $\mathfrak{C}:V\to \mathcal{H}$ is continuous.  Then, for any $(x,u)$ in
$\mathcal{H} \times \mathcal{U}_{ad}$, the mild solution $y(t;x,u)$ to \eqref{ODE}
satisfies the following uniform convergence result
\begin{equation} \label{uniform_in_u_conv_Goal}
\lim_{N\to \infty}  \sup_{u\in \mathcal{U}_{ad}} \sup_{t \in [0, T]}
\|y_N(t; \Pi_N x, u) - y(t; x,u)\|_{\mathcal{H}} = 0,
\end{equation}
where $y_N$ denotes the solution to the Galerkin approximation \eqref{ODE_Galerkin}.
\end{theorem}

\begin{proof}
Compared to Lemma~\ref{Lem:local_in_u_conv}, we have replaced (A4)
by the stronger assumption (A6) and the set of admissible controls
$\mathcal{U}_{ad}$ is as given in (A5). By following the proof of
Lemma~\ref{Lem:local_in_u_conv}, in order to obtain the uniform convergence
result \eqref{uniform_in_u_conv_Goal}, it suffices to show that the two
terms $\int_0^T d_N(s; u) \mathrm{d} s$ and $\int_0^T  \widetilde{d}_N(s; u) \mathrm{d} s$
involved in the RHS of \eqref{eq_rn_gronwall} converge to zero as
$N \to \infty$ uniformly with respect to $u$  in $\mathcal{U}_{ad}$.

Recall from \eqref{totoc} that
\begin{equation}
d_N(s; u) = \sup_{t\in[s, T]} \| \big( T(t-s) -  e^{L_N (t -s )} \Pi_N \big)
F(y(s; x, u)) \|_{\mathcal{H}},
\end{equation}
 which is defined for every $s$ in $[0, T]$ and $u$ in $\mathcal{U}_{ad}$.
 Thanks to Lemma~\ref{Lem:highmode_F_est}, for any fixed $\epsilon > 0$,
there exists $N_0$  in  $\mathbb{Z}_+^\ast$, such that
\begin{equation} \label{eq:uniform_est_dn_1}
\|(\operatorname{Id}_{\mathcal{H}} - \Pi_{N_0}) F(y(s;x, u))\|_{\mathcal{H}} < \epsilon,
\quad  \; s\in [0,T], \; u \in \mathcal{U}_{ad}.
\end{equation}
Now, for $N_0$ chosen above, we have
\begin{equation}  \label{eq:uniform_est_dn_2}
\begin{aligned}
&\| \big( T(t-s) -  e^{L_N (t -s )} \Pi_N \big) F(y(s; x, u)) \|_{\mathcal{H}} \\
& \le  \| \big( T(t-s) -  e^{L_N (t -s )} \Pi_N \big)
 \Pi_{N_0} F(y(s; x, u)) \|_{\mathcal{H}} \\
& \quad  + \| \big( T(t-s) -  e^{L_N (t -s )} \Pi_N \big)
 (\operatorname{Id}_{\mathcal{H}} - \Pi_{N_0} ) F(y(s; x, u)) \|_{\mathcal{H}}.
\end{aligned}
\end{equation}
By using \eqref{Eq_control_T_t} and Assumption (A1), we obtain:
\begin{equation} \label{eq:uniform_est_dn_3}
\begin{aligned}
 & \sup_{t\in[s, T]} \| \big( T(t-s) -  e^{L_N (t -s )} \Pi_N \big)
 (\operatorname{Id}_{\mathcal{H}} - \Pi_{N_0}) F(y(s; x, u)) \|_{\mathcal{H}} \\
& \le  2 Me^{\omega T}\|(\operatorname{Id}_{\mathcal{H}} - \Pi_{N_0})
 F(y(s; x, u)) \|_{\mathcal{H}} \\
 & \le 2 Me^{\omega T}\epsilon,  \quad  \forall s\in [0,T], \;
u \in \mathcal{U}_{ad},
\end{aligned}
\end{equation}
where the last inequality follows from \eqref{eq:uniform_est_dn_1}.

By (A6), for each $x$ in $\mathcal{H}$,  $y(s; x, u)$ lies in a uniformly (in $s$ and $u$)
bounded subset  of $\mathcal{H}$. This  together with the locally Lipschitz property
of $F$ implies that $\Pi_{N_0} F(y(s; x, u))$ lies in a bounded subset  of
 $\mathcal{H}_{N_0} $ for all $u$  in $\mathcal{U}_{ad}$ and for all $s$ in $[0, T]$.
The finite dimensionality of $\mathcal{H}_{N_0}$ ensures then the compactness of the set
\[
\mathcal{E}'_x=\overline{\{\Pi_{N_0} F(y(s; x, u)), \; u \in \mathcal{U}_{ad},
\; s\in [0, T]\}}^{\mathcal{H}}.
\]

Now, for each $z$ in $\mathcal{E}'_x$ and $\epsilon>0$, the convergence property
\eqref{eq:linear_pointwise_convergence} valid uniformly over bounded time-intervals
allows us to ensure the existence of an integer $N_1(z)$, for which
\[
\sup_{t\in[0, T]} \| \big( T(t) -  e^{L_N t} \Pi_N \big)  z \|_{\mathcal{H}}
\le \frac{\epsilon}{2}, \quad \forall  N \ge N_1(z).
\]
Then, by using \eqref{Eq_control_T_t} and Assumption (A1), there exists a
neighborhood $\mathcal{N}_z$ of $z$ in $\mathcal{H}_{N_0}$ such that
\begin{equation} \label{eq_control_F_v2}
\sup_{t\in[0, T]} \| \big( T(t) -  e^{L_N t} \Pi_N \big)  w \|_{\mathcal{H}} \le \epsilon,
\quad \forall  N \ge N_1(z), \; w \in \mathcal{N}_z.
\end{equation}
From the compactness of $\mathcal{E}'_x$ we can extract a finite cover of
$\mathcal{E}'_x$ by such neighborhoods in which
\eqref{eq_control_F_v2} holds, and thus one can ensure the existence of an
integer $N_1$ for which
\begin{equation} \label{eq_control_F_v2b}
\sup_{t\in[0, T]} \| \big( T(t) -  e^{L_N (t)} \Pi_N \big) w \|_{\mathcal{H}} \le \epsilon,
\quad \forall  N \ge N_1, \; w \in \mathcal{E}'_x.
\end{equation}
Now, for each fixed $s$ in $[0, T]$ and $u$ in $\mathcal{U}_{ad}$, by taking
$w = \Pi_{N_0} F(y(s; x, u))$, we obtain from
\eqref{eq_control_F_v2b} that
\[
\sup_{t\in[0, T]} \| \big( T(t) -  e^{L_N (t)} \Pi_N \big)
\Pi_{N_0} F(y(s; x, u)) \|_{\mathcal{H}} \le \epsilon, \quad \forall  N \ge N_1.
\]
It follows then for  all $u$  in $\mathcal{U}_{ad}$,
\begin{equation} \label{eq:uniform_est_dn_4}
\sup_{t\in[s, T]} \| \big( T(t-s) -  e^{L_N (t -s )} \Pi_N \big)
\Pi_{N_0} F(y(s;x, u)) \|_{\mathcal{H}} \le \epsilon, \;\forall N \ge N_1, \;  s\in [0,T].
\end{equation}


By using \eqref{eq:uniform_est_dn_3} and \eqref{eq:uniform_est_dn_4}
in \eqref{eq:uniform_est_dn_2}, we obtain
\[
d_N(s; u) \le (1 + 2 Me^{\omega T})\epsilon, \quad
\forall N \ge N_1, \; s\in [0,T], \; u \in \mathcal{U}_{ad},
\]
which leads to
\begin{equation} \label{eq:uniform_est_dn_vf}
 \sup_{u \in \mathcal{U}_{ad}} \int_0^T d_N(s; u) \mathrm{d} s
\le (1 + 2 Me^{\omega T}) T \epsilon, \quad  \forall N \ge N_1.
\end{equation}

We consider now the term $\sup_{u \in \mathcal{U}_{ad}}
\int_0^T  \widetilde{d}_N(s; u) \mathrm{d} s$ with
\[
\widetilde{d}_N (s; u) = \sup_{t\in[s, T]} \| \big( T(t-s) -  e^{L_N (t -s )}
\Pi_N \big) \mathfrak{C}(u(s)) \|_{\mathcal{H}}
\]
as defined in \eqref{totod} for almost every $s$ in $[0,T]$ and every $u$ in
$\mathcal{U}_{ad}$ here.

Since the set $U \subset V$ is compact (cf.~Assumption (A5)) and
$\mathfrak{C}: V \to \mathcal{H}$ is continuous, then  $\mathfrak{C}(U)$ is a compact
set of $\mathcal{H}$. Following a compactness argument similar to that used to
derive \eqref{eq_control_F_v2b}, we can ensure the existence of an integer $N_2$
such that
\begin{equation} \label{eq_control_C}
\sup_{t\in[0, T]} \|\big( T(t) -  e^{L_N (t)} \Pi_N \big) \mathfrak{C}(w)\|_{\mathcal{H}}
\le \epsilon, \quad \forall N \ge N_2, \; w \in U.
\end{equation}
Now, for each $u$ in $\mathcal{U}_{ad}$, since $u(s)$ takes value in $U$ for almost every $s$ in $[0,T]$, we obtain from \eqref{eq_control_C} that
\begin{equation}
\sup_{t\in[s, T]} \|\big( T(t-s) -  e^{L_N (t -s )} \Pi_N \big)
 \mathfrak{C}(u(s))\|_{\mathcal{H}} \le \epsilon, \quad \text{for all }  N \ge N_2
\text{ and a.e. } s \in [0,T].
\end{equation}
It follows then that for all $N \geq N_2$, and $u$ in $\mathcal{U}_{ad}$,
\begin{equation} \label{eq:uniform_u_est}
\int_0^T  \widetilde{d}_N(s; u) \mathrm{d} s
=  \int_0^T \sup_{t\in[s, T]} \| \big( T(t-s)
 -  e^{L_N (t -s )} \Pi_N \big) \mathfrak{C}(u(s)) \|_{\mathcal{H}} \mathrm{d} s \le T \epsilon,
\end{equation}
and thus,
\begin{equation} \label{eq:uniform_est_tilde_dn_vf}
\sup_{u \in \mathcal{U}_{ad}} \int_0^T  \widetilde{d}_N(s; u) \mathrm{d} s
\le T \epsilon,  \quad \forall  N \ge N_2.
\end{equation}

The desired uniform convergence of $\int_0^T d_N(s; u) \mathrm{d} s$ and
 $\int_0^T  \widetilde{d}_N(s; u) \mathrm{d} s$ follows from \eqref{eq:uniform_est_dn_vf}
and \eqref{eq:uniform_est_tilde_dn_vf}. The proof is now complete.
\end{proof}

\begin{remark} \label{Rmk_F=0} \rm
From the proof given above, it is clear that Assumption (A5) is made to
ensure the uniform convergence of $\int_0^T  \widetilde{d}_N(s; u) \mathrm{d} s$,
while  Assumptions (A6) and (A7) are made to ensure the uniform convergence
of $\int_0^T d_N(s; u) \mathrm{d} s$. The last two assumptions are thus not needed if
the nonlinear term $F$ is identically zero.
\end{remark}

Note that one can readily check that the convergence result stated in
Theorem~\ref{Lem:uniform_in_u_conv} also holds when \eqref{ODE} is initialized
at any other time instance $t$ in $[0,T)$. This will be needed in the next
subsection to derive approximation results for value functions associated
with optimal control problems for the IVP \eqref{ODE}.

More precisely, for each $(t,x)$  in $[0,T) \times \mathcal{H}$, we consider the
following evolution problem
\begin{equation} \label{ODE_t_sec3}
\begin{gathered}
\frac{\mathrm{d} y}{\mathrm{d} s} = L y + F(y) + \mathfrak{C} (u(s)),  \quad
s \in (t, T], \; u\in \mathcal{U}_{ad}[t,T],\\
y(t) =x  \in \mathcal{H},
\end{gathered}
\end{equation}
with
\begin{equation} \label{U_ad_toto}
\mathcal{U}_{ad}[t,T]:=\{u\vert_{[t,T]} : u \in \mathcal{U}_{ad}\},
\end{equation}
and the corresponding Galerkin approximation:
\begin{equation} \label{ODE_Galerkin_t}
\begin{gathered}
\frac{\mathrm{d} y_N}{\mathrm{d} s} = L_N y_N + \Pi_N F(y_N) + \Pi_N \mathfrak{C} (u(s)),
\quad s \in (t, T], \; u\in \mathcal{U}_{ad}[t,T],\\
y_N(t) = x_N, \quad x_N := \Pi_N x \in \mathcal{H}_N.
\end{gathered}
\end{equation}


Hereafter, we denote by $y_{t,x}(\cdot;u)$ the solution to \eqref{ODE_t_sec3}
emanating from $x$ at time $t$, and by $y^N_{t,x_N}(\cdot;u)$ the solution
to \eqref{ODE_Galerkin_t} emanating from $x_N:=\Pi_N x$ at time $t$.
We have then the following corollary of Theorem~\ref{Lem:uniform_in_u_conv}:

\begin{corollary}\label{Lem:uniform_conv_locally_Lip_t_v2}
Assume that the conditions of Theorem~\ref{Lem:uniform_in_u_conv} hold.
Then, for any  mild solution $y_{t,x}(\cdot;u)$ to \eqref{ODE_t_sec3}
over $[t,T]$, with $x$  in $\mathcal{H}$ and $u$ in $\mathcal{U}_{ad}[t,T]$ given
in \eqref{U_ad_toto},  the following convergence result is satisfied:
\begin{equation} \label{uniform_conv_Goal_t_v2}
\lim_{N\to \infty} \sup_{t\in[0,T]} \sup_{u\in\mathcal{U}_{ad}[t,T]}
\sup_{s \in [t, T]} \| y^N_{t,x_N}(s; u) - y_{t,x}(s;u)\|_{\mathcal{H}} = 0,
\end{equation}
where $ y^N_{t,x_N}$ denotes the solution to the Galerkin approximation
\eqref{ODE_Galerkin_t}.
\end{corollary}

\begin{proof}
Since both the linear operator $L$ and the nonlinearity $F$ in \eqref{ODE_t_sec3}
are time independent, then the supremum of
$\sup_{u\in\mathcal{U}_{ad}[t,T]} \sup_{s \in [t, T]} \| y^N_{t,x_N}(s; u)
- y_{t,x}(s;u)\|_{\mathcal{H}}$ as $t$  varies in $[0,T]$, is achieved at $t=0$, i.e.,
\begin{align*}
& \sup_{u\in\mathcal{U}_{ad}[t,T]}
\underset{\substack{t\in[0,T]\\{ s \in [t, T]}}}
\sup \| y^N_{t,x_N}(s; u) - y_{t,x}(s;u)\|_{\mathcal{H}} \\
&= \sup_{u\in\mathcal{U}_{ad}[0,T]} \sup_{s \in [0, T]} \| y^N_{0,x_N}(s; u)
 - y_{0,x}(s;u)\|_{\mathcal{H}} \\
& =  \sup_{u\in\mathcal{U}_{ad}[0,T]} \sup_{s \in [0, T]}
\| y_N(s;x_N, u) - y(s;x,u)\|_{\mathcal{H}}.
\end{align*}
The desired estimate \eqref{uniform_conv_Goal_t_v2} follows then
from \eqref{uniform_in_u_conv_Goal}, noting that
$\mathcal{U}_{ad}[0,T]=\mathcal{U}_{ad}$.
\end{proof}

\subsection{Galerkin approximations of optimal control and value functions:
Convergence results}\label{Sec_cve}

We assume in this section  that $U$ is a compact and convex subset of
the Hilbert space $V$. In particular this ensures that $\mathcal{U}_{ad}$
defined in \eqref{Eq_U_bounded} is a bounded, closed and convex set.
For such an admissible set of controls, conditions of existence to optimal
control problems associated with the IVPs \eqref{ODE} and \eqref{ODE_Galerkin}
are recalled in the appendix.

We introduce next the cost functional,
$J\colon \mathcal{H} \times \mathcal{U}_{ad}  \to \mathbb{R}^+$, associated with
the IVP \eqref{ODE}:
\begin{equation} \label{J_sec3}
J(x,u) := \int_0^T [\mathcal{G}(y(s; x, u)) + \mathcal{E}(u(s)) ] \, \mathrm{d} s,  \quad
 x \in \mathcal{H},
\end{equation}
where $\mathcal{G}: \mathcal{H} \to \mathbb{R}^+$ and $\mathcal{E}: V \to \mathbb{R}^+$
are assumed to be {\it continuous}, and $\mathcal{G}$ is assumed to satisfy
furthermore the condition:
\begin{equation} \label{C1} %\tag{{\bf C1}}
\mathcal{G}  \text{ is  locally Lipschitz in the sense of } \eqref{Local_Lip_cond}.
\end{equation}


The associated optimal control problem then writes
\begin{equation} \label{P_sec3}  %\tag {$\mathcal{P}$}
\begin{aligned}
\min  J(x,u)  \quad \text{s.t.}\quad
  (y, u) \in L^2(0,T; \mathcal{H}) \times  \mathcal{U}_{ad}
\text{ solves \eqref{ODE} with }   y(0)  = x \in \mathcal{H}.
\end{aligned}
\end{equation}

The cost functional, $J_N\colon \mathcal{H}_N \times \mathcal{U}_{ad}  \to \mathbb{R}^+$,
 associated with the Galerkin approximation  \eqref{ODE_Galerkin} is given by
\begin{equation} \label{J_Galerkin}
J_N(\Pi_N x,u) := \int_0^T [\mathcal{G}(y_N(s; \Pi_N x, u))
+ \mathcal{E}(u(s)) ] \, \mathrm{d} s,  \; x \in \mathcal{H},
\end{equation}
and the corresponding optimal control problem reads:
\begin{equation} \label{P_Galerkin} % \tag {$\mathcal{P}_N$}
\begin{aligned}
 \min  J_N(\Pi_N x,u)  \quad \text{s.t.} \quad
&(y_N, u) \in L^2(0,T; \mathcal{H}_N) \times  \mathcal{U}_{ad}
\text{ solves \eqref{ODE_Galerkin}}\\
& \text{with }   y_N(0)  = \Pi_N x \in \mathcal{H}_N.
\end{aligned}
\end{equation}

We assume hereafter that both problems, \eqref{P_sec3} and  \eqref{P_Galerkin},
possess each a solution. We analyze the convergence of the corresponding value
functions by adopting a dynamic programming approach.
For that purpose, we consider for each $(t,x)$  in $[0,T) \times \mathcal{H}$ a
family of optimal control problems associated with \eqref{ODE_t_sec3} and the
following cost functional $J_{t,x}$:
\begin{equation} \label{J_tx}
J_{t,x}(u) := \int_t^T [\mathcal{G}(y_{t,x}(s;u)) + \mathcal{E}(u(s)) ] \mathrm{d} s, \quad
t \in [0,T), \; u \in \mathcal{U}_{ad}[t,T].
\end{equation}

The cost functional associated with the corresponding Galerkin approximation
\eqref{ODE_Galerkin_t} is given by
\begin{equation} \label{JN_tx}
J^N_{t,x_N}(u) := \int_t^T [\mathcal{G}(y^N_{t,x_N}(s; u))
+ \mathcal{E}(u(s)) ] \mathrm{d} s,  \quad t \in [0,T), \; u \in \mathcal{U}_{ad}[t,T],
\end{equation}
in which we have denoted $\Pi_N x$ by $x_N$.

The value functions corresponding to the optimal control problems associated
respectively with \eqref{ODE_t_sec3} and with \eqref{ODE_Galerkin_t}, are
then defined as follows:
\begin{subequations}\label{Eq_val_fcts_sec3}
\begin{gather}
 v(t, x) := \inf_{u \in \mathcal{U}_{ad}[t,T]} J_{t,x}(u),  \quad
 \forall  (t,x) \in [0,T) \times \mathcal{H}   \text{ and }   v(T, x) = 0, \label{subEq1}\\
v_N(t, x_N) := \inf_{u \in \mathcal{U}_{ad}[t,T]} J^N_{t,x_N}(u),  \quad
  \forall  (t,x_N) \in [0,T)\times \mathcal{H}_N    \text{ and }    v_N(T, x_N) = 0.
\label{subEq2}
\end{gather}
\end{subequations}

We have then the following result.

\begin{theorem} \label{Thm_cve_Galerkin_val}
Assume that the conditions in Theorem~\ref{Lem:uniform_in_u_conv} together
with \eqref{C1} hold. Furthermore, let there exists for each pair $(t,x)$
a  minimizer $u_{t,x}^*$ (resp.~$u_{t,x}^{N,*}$) in $\mathcal{U}_{ad}[t,T]$
of the minimization problem in \eqref{subEq1} (resp.~in \eqref{subEq2}).

 Then for any $x$ in $\mathcal{H}$, it holds that
\begin{equation} \label{value_est_goal}
\lim_{N \to \infty} \sup_{t \in [0, T]} |v_N(t,\Pi_N x) - v(t,x)| = 0.
\end{equation}
\end{theorem}

\begin{proof}
By the definition of the value functions in \eqref{Eq_val_fcts_sec3}, we have
\begin{gather} \label{value_est_1}
v(t, x) = J_{t,x}(u_{t,x}^*) \le  J_{t,x}(u_{t,x}^{N,*}), \\
v_N(t, x_N) = J^N_{t,x_N}(u_{t,x}^{N,*}),
\end{gather}
with $x_N :=\Pi_N x$.

The inequality \eqref{value_est_1} and the definition of $J$ give then
\begin{equation}
v(t, x) \le \int_t^T [\mathcal{G}(y_{t,x}(s;u_{t,x}^{N,*}))
+ \mathcal{E}(u_{t,x}^{N,*}(s)) ] \mathrm{d} s.
\end{equation}

By subtracting $J^N_{t,x_N}(u_{t,x}^{N,*})$ on both sides of the above inequality,
we obtain
\begin{equation} \label{value_est_3}
\begin{aligned}
v(t, x) -  v_N(t, x_N)
& \le \int_t^T  [\mathcal{G}(y_{t,x}(s;u_{t,x}^{N,*}))
 + \mathcal{E}(u_{t,x}^{N,*}(s)) ] \mathrm{d} s \\
&\quad  -  \int_t^T  [\mathcal{G}(y^N_{t,x_N}(s; u_{t,x}^{N,*}))
 + \mathcal{E}(u_{t,x}^{N,*}(s)) ] \mathrm{d} s \\
& = \int_t^T  [\mathcal{G}(y_{t,x}(s;u_{t,x}^{N,*}))
 - \mathcal{G}(y^N_{t,x_N}(s; u_{t,x}^{N,*}))] \mathrm{d} s.
\end{aligned}
\end{equation}
Besides, since both $L$ and $F$ are time-independent, it follows from (A6)
that there exists a positive constant $\mathcal{C}$ such that
\begin{equation}
\begin{gathered}
 \|y_{t,x}(s; u_{t,x}^{N,*})\| \le \mathcal{C},  \quad
  \forall t \in [0, T),\; s \in [t, T], \; n \in \mathbb{Z}_+^\ast,\\
 \|y^N_{t,x_N}(s; u_{t,x}^{N,*})\| \le \mathcal{C}, \quad
 \forall t \in [0, T), \; s \in [t, T], \; n \in \mathbb{Z}_+^\ast.
\end{gathered}
\end{equation}
Now by denoting by $\mathfrak{B}$ the ball in $\mathcal{H}$ with radius $\mathcal{C}$
centered at the origin, we have
\begin{equation} \label{value_est_4}
\begin{aligned}
&\int_t^T [\mathcal{G}(y_{t,x}(s;u_{t,x}^{N,*}))
 - \mathcal{G}(y^N_{t,x_N}(s; u_{t,x}^{N,*}))] \mathrm{d} s \\
&\le   \operatorname{Lip}(\mathcal{G}\vert_{\mathfrak{B}})
 \int_t^T \|y_{t,x}(s;u_{t,x}^{N,*}) - y^N_{t,x_N}(s; u_{t,x}^{N,*})\|_{\mathcal{H}} \mathrm{d} s \\
& \le   T \operatorname{Lip}(\mathcal{G}\vert_{\mathfrak{B}})
 \sup_{s\in[t, T]}\|y_{t,x}(s;u_{t,x}^{N,*}) - y^N_{t,x_N}(s;u_{t,x}^{N,*})\|_{\mathcal{H}},
\end{aligned}
\end{equation}
which together with \eqref{value_est_3} leads to
\begin{equation} \label{value_est_5}
v(t, x) - v_N(t, x_N)  \le T \operatorname{Lip}(\mathcal{G}\vert_{\mathfrak{B}})
\sup_{s\in[t, T]}\|y_{t,x}(s; u_{t,x}^{N,*}) - y^N_{t,x_N}(s; u_{t,x}^{N,*})\|_{\mathcal{H}}.
\end{equation}
Similarly, we have
\begin{equation} \label{value_est_6}
v_N(t, x_N)  - v(t, x)  \le T  \operatorname{Lip}(\mathcal{G}\vert_{\mathfrak{B}})
\sup_{s\in[t, T]} \|y_{t,x}(s;u_{t,x}^*) - y^N_{t,x_N}(s; u_{t,x}^*)\|_{\mathcal{H}}.
\end{equation}
The convergence result \eqref{value_est_goal} follows then from
\eqref{value_est_5}, \eqref{value_est_6}, and
Corollary~\ref{Lem:uniform_conv_locally_Lip_t_v2}.
\end{proof}


\begin{remark} \label{Rmk:time-dependent-F} \rm
If the nonlinearity $F$ in  \eqref{ODE} depends also on time, by modifying
Assumption (A3) accordingly, all the results of Section~\ref{Sect_Galerkin}
still hold literally except that of Lemma~\ref{Lem:highmode_F_est}
that needs to be amended. For instance, by replacing (A3) by the following
assumption
\begin{itemize}
\item[(A3')] The nonlinearity $F: [0,T] \times \mathcal{H} \to \mathcal{H}$ satisfies
 $F(\cdot,y) \in L^\infty(0,T; \mathcal{H})$ for every $y$ in $\mathcal{H}$,  $F(t,\cdot)$
is locally Lipschitz for almost every $t$ in $[0, T]$, and for any given
bounded set $\mathfrak{B} \subset \mathcal{H}$, the mapping
$t \mapsto \operatorname{Lip}(F(t, \cdot)\vert_\mathfrak{B})$ is in
$L^\infty(0,T)$, where $\operatorname{Lip}(F(t, \cdot)\vert_\mathfrak{B})$
denotes the Lipschitz constant of $F(t,\cdot)$ on the set $\mathfrak{B}$.
\end{itemize}
Under this new assumption, by replacing in Lemma~\ref{Lem:highmode_F_est}
the supremum for $t$ over $[0,T]$ in \eqref{Eq_highmode_F_est} with the essential
supremum,  we have
\begin{equation}
\lim_{N\to \infty} \sup_{u\in \mathcal{U}_{ad}}
\operatorname{ess\,sup}_{t\in[0,T]} \|(\operatorname{Id}_{\mathcal{H}}
- \Pi_N) F(t, y(t;x,u))\|_{\mathcal{H}} =0.
\end{equation}
\end{remark}

\subsection{Galerkin approximations of optimal control and value functions:
Error estimates}\label{Sec_Err_estimates}

We provide in this section some simple and useful error estimates in terms
 of their interpretations.

For that purpose, we assume throughout this subsection the following set of
assumptions collected as follows
\begin{itemize}
\item[(A8)]
\begin{itemize}
\item The linear operator $L: D(L) \subset \mathcal{H} \to \mathcal{H}$ is self-adjoint.
\item The Galerkin approximations \eqref{ODE_Galerkin} are constructed based
on the eigen-subspaces $\mathcal{H}_{N}
:= \operatorname{span}\{e_k : k = 1, \dots, N\}, \; N\in \mathbb{Z}_+^\ast$,
where the $e_k$'s are the eigenfunctions of $L$.

\item Assumption (A6).
\item  Assumption \eqref{C1}.
\end{itemize}
\end{itemize}
We take the set of admissible controls, $\mathcal{U}_{ad}$, to be given
 by \eqref{Eq_U_bounded}. But in contrast to Sect.~\ref{Sec_cve}, the set $U$
in the definition of $\mathcal{U}_{ad}$ is not assumed to be compact in $V$.

Hereafter within this subsection, $\mathfrak{B}$ denotes the ball in $\mathcal{H}$
centered at the origin with radius $\mathcal{C}$, where  $\mathcal{C}$ is
the same as given in Assumption (A6). We start with a basic pointwise estimate
 between  the cost functional $J_{t, x}$  given by \eqref{J_tx}  and its
approximation $J_{t,x_{N}}^N$ given by \eqref{JN_tx}.


\begin{lemma} \label{lem:J_estimates}
Under the set of assumptions given by {\rm (A8)}, for any
$(t,x) \in [0,T)\times \mathcal{H}$, and $u\in \mathcal{U}_{ad}[t,T]$,
there exists $\gamma >0$, independent of $N$, such that for all $u$ in
$ \mathcal{U}_{ad}[t,T]$,
\begin{equation} \label{Eq_J_est}
\begin{aligned}
&|J_{t, x}(u) -  J_{t,x_{N}}^N(u)| \\
& \le \operatorname{Lip}(\mathcal{G}
\vert_{\mathfrak{B}}) \left[\sqrt{T-t}
 + \gamma (T-t) \right] \| \Pi_N^\perp y_{t,x}(\cdot;u)\|_{L^2(t,T; \mathcal{H})}.
\end{aligned}
\end{equation}
\end{lemma}

\begin{proof}

Note that by the definitions of $J_{t, x}$ and $J_{t,x_{N}}^N$ and the
locally Lipschitz condition \eqref{C1} on $\mathcal{G}$, we have
\begin{equation}
|J_{t, x}(u) -  J_{t,x_{N}}^N(u)|
\le \operatorname{Lip}(\mathcal{G}\vert_{\mathfrak{B}})
\int_{t}^T \|y_{t,x}(s;u) - y^N_{t,x_N}(s;u)\|_{\mathcal{H}} \mathrm{d} s,
\end{equation}
where $\mathfrak{B} \subset \mathcal{H}$ denotes a ball centered at the origin that
contains $y_{t,x}(s;u)$ and $y^N_{t,x_N}(s;u)$ for all $s$ in $[t,T]$.
By rewriting $y_{t,x}(s;u)$ as $\Pi_{N}y_{t,x}(s;u) + \Pi_{N}^\perp y_{t,x}(s;u)$,
we have thus
\begin{equation} \label{J_est1}
\begin{aligned}
&|J_{t, x}(u) -  J_{t,x_{N}}^N(u)| \\
&\le \operatorname{Lip}(\mathcal{G}\vert_{\mathfrak{B}}) \int_{t}^T
  \Big( \| \Pi_{N}y_{t,x}(s;u) - y^N_{t,x_N}(s;u)\|_{\mathcal{H}}
+  \| \Pi_{N}^\perp y_{t,x}(s;u) \|_{\mathcal{H}}  \Big) \mathrm{d} s.
\end{aligned}
\end{equation}

Estimate \eqref{Eq_J_est} follows then immediately if one proves that
 there exists $\gamma^2 > 0$ independent of $N$ such that for any
$(t,x) \in [0,T)\times \mathcal{H}$, and $u\in \mathcal{U}_{ad}[t,T]$,
\begin{equation} \label{low_mode_est}
\|\Pi_{N}y_{t,x}(s;u) -y^N_{t,x_{N}}(s;u) \|^2_{\mathcal{H}}
\le  \gamma^2 \int_t^s \| \Pi_N^\perp y_{t,x}(s';u) \|^2_{\mathcal{H}} \, \mathrm{d} s', \quad
 s \in [t, T].
\end{equation}


Indeed, in such a case we obtain
\begin{equation}
\begin{aligned}
&\int_{t}^T   \| \Pi_{N}y_{t,x}(s;u) - y^N_{t,x_N}(s;u)\|_{\mathcal{H}}  \mathrm{d} s\\
& \le \gamma  \int_{t}^T   \Big(\int_t^s \| \Pi_N^\perp y_{t,x}(s';u)
\|^2_{\mathcal{H}} \, \mathrm{d} s' \Big)^{1/2}\mathrm{d} s \\
& \le \gamma  (T-t) \| \Pi_N^\perp y_{t,x}(\cdot;u)\|_{L^2(t,T; \mathcal{H})},
\end{aligned}
\end{equation}
and by noting from  H\"older's inequality that
\[
 \int_{t}^T   \| \Pi_{N}^\perp y_{t,x}(s;u) \|_{\mathcal{H}}  \mathrm{d} s
\le \sqrt{T-t}  \| \Pi_N^\perp y_{t,x}(\cdot;u)\|_{L^2(t,T; \mathcal{H})},
\]
we arrive at \eqref{Eq_J_est}.


We are thus left with the proof of  \eqref{low_mode_est} which is easily
derived as follows. Let us introduce
\begin{equation} \label{defw}
w(s):= \Pi_{N}y_{t,x}(s;u) -y^N_{t,x_{N}}(s;u).
\end{equation}
By applying $\Pi_N$ to both sides of \eqref{ODE_t_sec3}, we obtain that
 $\Pi_{N}y_{t,x}(\cdot; u)$ satisfies the IVP
\begin{gather*}
\frac{\mathrm{d} \Pi_{N}y}{\mathrm{d} s} = L_N \Pi_N y + \Pi_{N}F
 (\Pi_N y + \Pi_{N}^\perp y_{t,x}(s;u)) +  \Pi_{N}\mathfrak{C} (u(s)),
  \quad s \in (t,T], \\
\Pi_N y(t)  = \Pi_{N} x \in \mathcal{H}_N.
\end{gather*}
This together with \eqref{ODE_Galerkin_t} implies that $w$ satisfies the
 problem
\begin{equation} \label{eq:w}
\begin{gathered}
\frac{\mathrm{d} w}{\mathrm{d} s} = L_{N} w + \Pi_{N}  F(\Pi_N y + \Pi_{N}^\perp y_{t,x}(s;u))
-  \Pi_{N}F(y_N),  \quad s \in (t,T], \\
w(t)  = 0.
\end{gathered}
\end{equation}
By taking the $\mathcal{H}$-inner product on both sides of \eqref{eq:w} with $w$,
we obtain
\begin{equation} \label{energy est:1}
\frac{1}{2}\frac{\mathrm{d} \|w\|^2_{\mathcal{H}}}{\mathrm{d} s}
= \langle L_{N} w, w \rangle + \langle \Pi_{N}
\bigl( F(\Pi_N y + \Pi_{N}^\perp y_{t,x}(s;u)) -  F(y_N)\bigr), w \rangle.
\end{equation}

The local Lipschitz property of $F$ implies then that
\begin{equation}  \label{RHS_control}
\begin{aligned}
&\langle \Pi_{N} \bigl( F(\Pi_N y + \Pi_{N}^\perp y_{t,x}(s;u))
-  F(y_N)\bigr), w \rangle\\
& \le  \operatorname{Lip}(F|_{\mathfrak{B}})
  \| \Pi_N y + \Pi_{N}^\perp y_{t,x}(s;u) - y_N \|_{\mathcal{H}} \, \|w\|_{\mathcal{H}} \\
&\le  \operatorname{Lip}(F|_{\mathfrak{B}})
 (\| w\| + \| \Pi_{N}^\perp y \|_{\mathcal{H}}) \, \|w\|_{\mathcal{H}} \\
&\le  \operatorname{Lip}(F|_{\mathfrak{B}}) \Big(\frac{3}{2} \| w\|_{\mathcal{H}}^2
 + \frac{1}{2} \| \Pi_{N}^\perp y  \|_{\mathcal{H}}^2\Big).\end{aligned}
\end{equation}
Since $L$ is self-adjoint, we have
\begin{equation} \label{RHS_control:3}
\langle L_{N} w(s), w(s) \rangle
= \sum_{i=1}^N  \beta_i \|w_i(s)\|_{\mathcal{H}}^2\le \beta_1 \|w(s)\|_{\mathcal{H}}^2,
\end{equation}
where $\beta_i$ is the eigenvalue associated with its  $i^{\mathrm{th}}$
eigenmode $e_i$.

Using \eqref{RHS_control} and \eqref{RHS_control:3} in \eqref{energy est:1},
we finally arrive at
\begin{equation} \label{Eq_interm1}
\frac{1}{2}\frac{\mathrm{d} \|w(s)\|_{\mathcal{H}}^2}{\mathrm{d} s}
\le \Big(\beta_1 + \frac{3}{2} \operatorname{Lip}(F|_{\mathfrak{B}})   \Big)
 \|w(s)\|_{\mathcal{H}}^2 + \frac{1}{2} \operatorname{Lip}(F|_{\mathfrak{B}})
\| \Pi_N^\perp y_{t,x}(s;u)\|_{\mathcal{H}}^2,
\end{equation}
which for all $s$ in $[t, T]$, by a standard application of Gronwall's inequality,
leads to
\begin{equation} \label{y-z est}
\begin{aligned}
& \|\Pi_{N}y_{t,x}(s;u) -y^N_{t,x_{N}}(s;u)\|_{\mathcal{H}}^2  \\
&= \|w(s)\|_{\mathcal{H}}^2   \\
&  \le \operatorname{Lip}(F|_{\mathfrak{B}}) \int_t^s
 e^{2[\beta_1 + \frac{3}{2}\operatorname{Lip}(F|_{\mathfrak{B}})](s-s')}
\| \Pi_N^\perp y_{t,x}(s';u)\|_{\mathcal{H}}^2 \mathrm{d} s' \\
&  \le e^{2[\beta_1 + \frac{3}{2}\operatorname{Lip}(F|_{\mathfrak{B}})]T}
\operatorname{Lip}(F|_{\mathfrak{B}})
\int_t^s \| \Pi_N^\perp y_{t,x}(s';u)\|_{\mathcal{H}}^2 \mathrm{d} s',
\end{aligned}
\end{equation}
taking into account that $w(t)= 0$ due to \eqref{defw}.
The estimate \eqref{low_mode_est} is thus verified, and the proof is complete.
\end{proof}

We have then
\begin{theorem} \label{Thm_PM_val}
Assume the set of assumptions {\rm (A8)}. Assume also that for each
$(t,x) \in [0,T)\times \mathcal{H}$, there exists a minimizer $u^*_{t,x}$
(resp.~$u^{N,\ast}_{t,x_{N}}$) for the value function $v$ (resp.~$v_N$)
defined in \eqref{Eq_val_fcts_sec3}.

Then for any $(t,x) \in [0,T)\times \mathcal{H}$ it holds that
\begin{equation} \label{PM_value_est_goal}
\begin{aligned}
&|v(t,x) - v_N(t,x_{N})|\\
 & \le \operatorname{Lip}(\mathcal{G}\vert_{\mathfrak{B}})
[\sqrt{T-t} + \gamma (T-t) ]
\Bigl( \|\Pi_N^\perp y_{t,x}(\cdot; u^\ast_{t,x})\|_{L^2(t,T; \mathcal{H})} \\
&\quad  + \| \Pi_N^\perp y_{t,x}(\cdot; u^{N,\ast}_{t,x_{N}})\|_{L^2(t,T; \mathcal{H})}
 \Bigr),
\end{aligned}
\end{equation}
where the constant $\gamma$ is the same as in Lemma~\ref{lem:J_estimates}.
\end{theorem}

\begin{proof}
The result is a direct consequence of Lemma~\ref{lem:J_estimates}. Indeed, since
\[
v(t,x)  = J_{t,x}(u^*_{t,x}) \le J_{t,x}(u^{N,\ast}_{t,x_{N}}) \quad \text{and}
\quad  v_N(t,x_{N}) = J^N_{t,x_{N}}(u^{N,\ast}_{t,x_{N}}),
\]
we obtain
\[
 v(t,x) - v_N(t,x_{N})  \le J_{t,x}(u^{N,\ast}_{t,x_{N}})
- J^N_{t,x_{N}}(u^{N,\ast}_{t,x_{N}}).
 \]
It follows then from \eqref{Eq_J_est} that
\begin{equation} \label{PM_val_est1}
\begin{aligned}
& v(t,x) - v_N(t,x_{N}) \\
& \le  \operatorname{Lip}(\mathcal{G} \vert_{\mathfrak{B}})
\left[{\sqrt{T-t}}+ \gamma (T-t) \right]
 \| \Pi_N^\perp y_{t,x}(\cdot;u^{N,\ast}_{t,x_{N}})\|_{L^2(t,T; \mathcal{H})}
\end{aligned}
\end{equation}
Similarly,
\begin{equation} \label{PM_val_est2}
\begin{aligned}
& v_N(t,x_{N})  -  v(t,x)\\
& \le  \operatorname{Lip}(\mathcal{G}\vert_{\mathfrak{B}})
\left[{\sqrt{T-t}}+ \gamma (T-t) \right]
 \|\Pi_N^\perp y_{t,x}(\cdot; u^\ast_{t,x})\|_{L^2(t,T; \mathcal{H})}
\end{aligned}
\end{equation}
The estimate \eqref{PM_value_est_goal} results then from \eqref{PM_val_est1}
 and \eqref{PM_val_est2}.
\end{proof}

\begin{remark} \label{Rmk_motivation_A7} \rm
Note that in the RHS of \eqref{PM_value_est_goal},  it is not clear a priori that
\begin{equation} \label{unif_vanishing}
\lim_{N\to \infty} \|\Pi_N^\perp y_{t,x}(\cdot; u^{N,\ast}_{t,x_{N}})
\|_{L^2(t,T; \mathcal{H})} = 0.
\end{equation}
The reason relies on the dependence on $u^{N,\ast}_{t,x_{N}}$ of
$\| \Pi_N^\perp y_{t,x}(\cdot; u^{N,\ast}_{t,x_{N}})\|_{L^2(t,T; \mathcal{H})}$,
where $u^{N,\ast}_{t,x_{N}}$ denotes the control synthesized from the
 $N$-dimensional Galerkin approximation.

Estimate  \eqref{PM_value_est_goal} provides thus another perspective regarding
the usage of Assumption (A7) to ensure the convergence of the value functions
associated with the Galerkin approximations presented in Sect.~\ref{Sec_cve}.
Note that Assumption (A7) is just a slightly strengthened form of
\eqref{unif_vanishing}. See Sect.~\ref{Sect_examples} for a broad class of
IVPs for which Assumption (A7) is satisfied.
\end{remark}

\begin{corollary} \label{Lem_controller_est}
Assume that the conditions given in Theorem~\ref{Thm_PM_val} hold.
Let us also denote $u^* := u^*_{0,x}$ and $u^{*}_{N}:= u^{N,*}_{0,x_N}$.
Assume furthermore that there exists $\sigma >0$ such that the following
local growth condition is satisfied  for the cost functional $J$ defined
in \eqref{J_sec3}:
\begin{equation} \label{Eq_growth_onJ}
\sigma \|u^*  - v\|_{L^q(0,T; V)}^q \le J(x, v) - J(x, u^*),
\end{equation}
for all $v$ in some neighborhood $\mathcal{W} \subset \mathcal{U}_{ad}$
of $u^*$, with $\mathcal{U}_{ad}$ given by \eqref{Eq_U_bounded}.
Assume finally that $u^*_N$  lies in  $\mathcal{W}$.
Then
\begin{equation}\label{Est_contr_diff}
\begin{aligned}
&\|u^\ast - u^\ast_{N}\|_{L^q(0,T; V)}^q \\
& \le \frac{1}{\sigma}\operatorname{Lip}(\mathcal{G}\vert_{\mathfrak{B}})
[\sqrt{T} + \gamma T ]
\Bigl( \| \Pi_N^\perp y(\cdot;u^*)\|_{L^2(0,T; \mathcal{H})}\\
&\quad +  2 \|  \Pi_N^\perp y (\cdot; u^{*}_{N})\|_{L^2(0,T; \mathcal{H})} \Bigr),
\end{aligned}
\end{equation}
where the constant $\gamma$ is the same as in Lemma~\ref{lem:J_estimates}.
\end{corollary}

\begin{proof}
By the assumptions, we have
\begin{equation}
\|u^*  - u^*_N\|_{L^q(0,T; V)}^q \le \frac{1}{\sigma} \left(J(x, u^*_N) - J(x, u^*)\right).
\end{equation}
Note also that
\begin{align*}
J(x, u^*_N) - J(x, u^*)
&= J(x, u^*_N) - J_N(x_{N},u^*_N) + J_N(x_{N}, u^*_N) - J(x, u^*) \\
& =  J_{0,x}(u^*_N) - J^N_{0,x_{N}}(u^*_N)+ v_N(0,x_{N}) - v(0,x),
\end{align*}
where we used the fact that
\begin{gather*}
 J(x, u^*_N) = J_{0,x}(u^*_N),  \quad J_N(x_{N},u^*_N) = J^N_{0,x_{N}}(u^*_N),\\
J_N(x_{N},u^*_N)  = v_N(0,x_{N}),   \quad J(x, u^*) = v(0,x).
\end{gather*}
The result follows by applying the estimate \eqref{Eq_J_est} to
$J_{0,x}(u^*_N) - J^N_{0,x_{N}}(u^*_N)$ and the estimate \eqref{PM_value_est_goal}
to $v_N(0,x_{N}) - v(0,x)$.
\end{proof}

\begin{remark} \rm
Note that \eqref{Eq_growth_onJ} ensures uniqueness of the local minimizer
$u^\ast$ in $\mathcal{W}$.
\end{remark}

\subsection{Examples that satisfy Assumption (A7)} \label{Sect_examples}
We consider in this subsection a special but important case of Galerkin
approximations \eqref{ODE_Galerkin} built from the
eigenfunctions\footnote{i.e.~with
$\mathcal{H}_N:=\text{span}\{e_1, \dots,e_{N}\}$ and $L_N:= \Pi_N L \Pi_N$,
for which Assumptions (A0)-(A2) are satisfied.} $\{e_k\}_{k\geq 1}$ of $L$,
and for which we assume the following properties:
\begin{itemize}

\item[(i)]  The set of admissible controls $\mathcal{U}_{ad}$ is given as
in \eqref{Eq_U_bounded} with $q>1$.

\item[(ii)]  The linear operator $L: D(L) \subset \mathcal{H} \to \mathcal{H}$  is self-adjoint
with compact resolvent and satisfies Assumption (A0).


\item[(iii)] The mapping $F: \mathcal{H} \to \mathcal{H}$ and  $\mathfrak{C}: V \to \mathcal{H}$ are
locally Lipschitz, and $\mathfrak{C}(0) = 0$.


\item[(iv)]  Assumption (A6) is satisfied.

\end{itemize}
We have then the following useful Lemma for applications; see Sect.~\ref{Sec_appl}.

\begin{lemma} \label{Lem_examples}
The convergence property \eqref{Est_uniformity_highmodes} in  {\rm (A7)}
 holds under assumptions {\rm (i)--(iv)} above.
\end{lemma}

\begin{proof}
Since $L$ is assumed to be self-adjoint with compact resolvent,
it follows from spectral theory of self-adjoint compact operator
\cite[Thm.~6.8, Prop.~6.9, and Thm.~6.11]{Brezis10} that the eigenfunctions
of $L$ form an orthonormal basis of $\mathcal{H}$, and the eigenvalues
$\{\beta_k\}_{k\geq 1}$ of $L$ approach either $\infty$ or $-\infty$ as
$k$ approaches $\infty$. Since $L$ is also assumed to be the infinitesimal
generator of a $C_0$-semigroup (Assumption (A0)), $\beta_k$ is bounded
above \cite[Thm.~5.3]{Pazy83}. It follows then that
\begin{equation}
\beta_N \to -\infty \quad \text{as }   N \to \infty.
\end{equation}

As before $\Pi_N: \mathcal{H} \to \mathcal{H}_N$ denotes the orthogonal projector associated
with $\mathcal{H}_N$ spanned by the first $N$ eigenfunctions. Let us recall also
that $\Pi_N^\perp$ denotes the orthogonal projector associated with the orthogonal
complement of $\mathcal{H}_N$ in $\mathcal{H}$, namely
\[
\Pi_N^\perp := \operatorname{Id} - \Pi_N.
\]
Now, by applying $\Pi_N^\perp$ to both sides of \eqref{Eq_mild} and
introducing the notation
\[
y_{N>} := \Pi_N^\perp y,
\]
we obtain, for all $t$ in   $[0, T]$,
\begin{equation}
y_{N>}(t) = T(t) y_{N>}(0) + \int_{0}^t T(t-s) \Pi_N^\perp \big( F(y(s;x,u))
+   \mathfrak{C} (u(s)) \big) \mathrm{d} s,
\end{equation}
where we also used the fact that $\Pi_N^\perp$ commutes with the semigroup
$\{T(t)\}_{t \ge 0}$.

Let $\mathcal{C}$ be the constant arising in the upper bounds of
\eqref{Eq_y_uniform-in-u_bounds} in Assumption (A6), and denote by
$\mathfrak{B}_{\mathcal{H}}$ the closed ball in $\mathcal{H}$ centered at the origin with
radius $\mathcal{C}$. Let also $\mathfrak{B}_{\scriptscriptstyle V}$ be the
smallest closed ball in $V$ containing the compact set $U$ given in
\eqref{Eq_U_bounded}. We get then for $t\in [0, T]$:
\begin{equation} \label{wN_bound}
\begin{aligned}
|y_{N>}(t)|
&\le e^{\beta_{N+1} t} |y_{N>}(0)|
+ \operatorname{Lip}(F\vert_{\mathfrak{B}_{\mathcal{H}}}) (\mathcal{C}
 + \|F(0)\|_{\mathcal{H}}) \int_{0}^t e^{\beta_{N+1} (t-s)}  \mathrm{d} s\\
&\quad + \operatorname{Lip}(\mathfrak{C}\vert_{\mathfrak{B}_V})
\int_{0}^t e^{\beta_{N+1} (t-s)} \|u(s)\|_V  \mathrm{d} s \\
& \le e^{\beta_{N+1} t} |y_{N>}(0)| +  \frac{1}{|\beta_{N+1}|}
\operatorname{Lip}(F\vert_{\mathfrak{B}_{\mathcal{H}}}) (\mathcal{C} + \|F(0)\|_{\mathcal{H}}) \\
& \quad + \frac{1}{(|\beta_{N+1} |q')^{\frac{1}{q'}}}
\operatorname{Lip}(\mathfrak{C}\vert_{\mathfrak{B}_V})  \|u\|_{L^{q}([0,T; V])},
\end{aligned}
\end{equation}
where we have used the H\"older inequality with $q' = q/(q-1)$ to estimate
the term $\int_{0}^t e^{\beta_{N+1} (t-s)} \|u(s)\|_V  \mathrm{d} s$.

Now, let $C_U:= \sup_{w \in U} \|w\|_V$.  We have
\begin{equation}
\|u\|_{L^{q}(0,T; V)} \le C_U T^{1/q}, \quad \forall u \in \mathcal{U}_{ad}.
\end{equation}
Using the above bound in \eqref{wN_bound}, we obtain
\begin{equation} \label{wN_bound2}
\begin{aligned}
|y_{N>}(t)|
&\le e^{\beta_{N+1} t} |y_{N>}(0)|  + \frac{1}{|\beta_{N+1}|}
\operatorname{Lip}(F\vert_{\mathfrak{B}_{\mathcal{H}}}) (\mathcal{C} + \|F(0)\|_{\mathcal{H}}) \\
& \quad + \frac{1}{(|\beta_{N+1} |q')^{\frac{1}{q'}}} C_U T^{1/q}
\operatorname{Lip}(\mathfrak{C}\vert_{\mathfrak{B}_V}), \quad
 \forall t \in [0, T], \; u \in \mathcal{U}_{ad}.
\end{aligned}
\end{equation}



Since $\beta_N$ approaches $-\infty$ as $N$ approaches $\infty$ by assumption,
we obtain that for each $\epsilon >0$, $T>0$ and $x$ in $\mathcal{H}$, there exists a
positive integer $N_0$  such that
\begin{equation} \label{Eq_unif_est_ys_ex}
\sup_{u\in \mathcal{U}_{ad}} \; \sup_{0\leq t\leq T} \|(\operatorname{Id}_{\mathcal{H}}
- \Pi_{N}) y(t;x,u)\|_{\mathcal{H}} \le \epsilon, \quad \forall N \ge N_0.
\end{equation}
Thus Assumption (A7) is satisfied.
\end{proof}

\begin{remark} \label{Rmk_other_spectral_assumption} \rm
From the proof given above, it is clear that Assumption (ii) in
Lemma~\ref{Lem_examples} can be relaxed to e.g.
\begin{itemize}
\item[(ii')] The eigenfunctions of the linear operator
$L: D(L) \subset \mathcal{H} \to \mathcal{H}$ forms an orthonormal basis of $\mathcal{H}$ and
the eigenvalues of $L$ approaches $-\infty$.
\end{itemize}

Note also that Lemma~\ref{Lem_examples} still holds if $L$ has complex eigenvalues.
 We just need to work with a complexification of the operator $L$ and the
underlying state space $\mathcal{H}$ (cf.~e.g.~\cite[footnote 17 on p.~55]{CLW15_vol2}),
and make the corresponding changes in Assumption (ii') above.
\end{remark}

\section{Application to optimal control of energy balance climate models}
\label{Sec_appl}
We show in this section that our framework allows us to provide rigorous
 Galerkin approximations to the optimal control of  broad class of semilinear
heat problems, posed on a compact (smooth) manifold without boundary.
As an application, we show in Sect.~\ref{Sec_EBM} that the optimal control
of energy balance models (EBMs) arising in the context of geoengineering
 and climate change, can be thus approximated by optimal control problems
of ODEs, more tractable numerically.  We first recall some fundamentals
of differential geometry to prepare the analysis.


\subsection{Preliminary from differential geometry} \label{Sect_diff_geo_prelim}
To properly write an EBM on the sphere, we recall how differential operators
are defined on an abstract compact smooth manifold $\mathfrak{M}$ without
boundary, of dimension $n$ and endowed with a Riemannian metric $\mathfrak{g}$.
Recall that a Riemannian metric $\mathfrak{g}$ is a smooth family of inner
products on the tangent spaces $T_p \mathfrak{M}$. Namely, $\mathfrak{g}$
associates (smoothly) to each $p$ in  $\mathfrak{M}$ a positive definite symmetric
bilinear form $\varphi_p$ on $T_p \mathfrak{M}\times T_p \mathfrak{M}$.
In local coordinates,
\[
\mathfrak{g}_{ij}(p)=\varphi_p(\partial_i,\partial_j),
\]
and thus $\det  \mathfrak{g}(p) >0$.

 Given a smooth function $u$ on $\mathfrak{M}$,  the gradient
$\nabla_{\mathfrak{g}} u$ is a vector field on $\mathfrak{M}$,
that takes in local coordinates the form
\begin{equation} \label{Eq_grad}
\nabla_{\mathfrak{g}} u:= \sum_{i=1}^n\Big(\sum_{j=1}^n \mathfrak{g}^{ij}\partial_j
u \Big)\; \partial_i.
\end{equation}
The divergence of a vector field $X=\sum_{j=1}^n X^j \partial_j$ takes the
following form in local coordinates
\begin{equation} \label{Eq_div}
\operatorname{div}_{\mathfrak{g}}  X= \frac{1}{\sqrt{\det
 \mathfrak{g}}} \sum_{i=1}^n \partial_i \Big( X^i \sqrt{\det  \mathfrak{g}}\Big).
\end{equation}
The Laplacian on $(\mathfrak{M},\mathfrak{g})$ takes then the form
\begin{equation}
\Delta_{\mathfrak{g}}
:= \operatorname{div}_{\mathfrak{g}} \circ \nabla_{\mathfrak{g}}
= \frac{1}{\sqrt{\det  \mathfrak{g}}}
\sum_{i=1}^n \partial_i\Big(\sum_{j=1}^n\mathfrak{g}^{ij}\sqrt{\det  \mathfrak{g}}
  \partial_j\Big).
\end{equation}
Set
\begin{equation}
\mathbb{S}^n:=\{x\in \mathbb{R}^{n+1}:|x|=1\}.
\end{equation}
Let $y = (y_1,\dots,y_{n+1})$ be any point of $\mathbb{S}^n$ and
$(x_1,\dots,x_n)$ be its image under the
stereographic projection from the ``north pole'' $N = (0, \dots, 0, 1)$ onto
the space
\begin{equation}
\mathbb{R}^n \equiv \{(\xi_1,\dots,\xi_{n+1}) \in \mathbb{R}^{n+1} : \xi_{n+1}=0\}.
\end{equation}

The canonical Riemannian metric on $\mathbb{S}^n$ takes then the form
\begin{equation} \label{Def_gij}
\mathfrak{g}_{ij}=\frac{4}{(1+|x|^2)^2} \delta_{ij}, \quad 1\leq i,j \leq n.
\end{equation}
Note that $\mathfrak{g}^{ij}$ introduced above has here the explicit expression:
\begin{equation}
\mathfrak{g}^{ij}=(\mathfrak{g}_{ii})^{-1}\delta_{ij}, \quad 1\leq i,j \leq n.
\end{equation}
In what follows we denote by $\langle \cdot , \cdot \rangle_{\mathfrak{g}}$
the inner Riemannian product on $(\mathbb{S}^n,\mathfrak{g})$ and
 by $L^2(\mathbb{S}^n)$ the space of square-integrable real-valued functions
for the norm induced by this inner product. The space $\vec{L}^2(\mathbb{S}^n)$
is then defined as
\[
\vec{L}^2(\mathbb{S}^n):=\underbrace{L^2(\mathbb{S}^n)\times \cdots
\times L^2(\mathbb{S}^n)}_n.
\]

Introduce now the polar coordinates on $\mathbb{S}^n$. Consider the
``south pole'' $S = (0, \dots , 0,-1)$. For any
$y\in \mathbb{S}^n \backslash \{N, S\}$, define $\rho \in (0,\pi)$
and $\theta \in \mathbb{S}^{n-1}$ by
\begin{equation}
\cos \rho =y^{n+1}, \quad \theta=\frac{y'}{|y'|},
\end{equation}
where $y'=(y_1,y_2,\dots,y_n,0)$.

These variables have the following interpretation: the polar radius
$\rho$ represents the angle between the position vectors of $y$ and $N$;
it can be also regarded as the latitude of the point $y$ measured from $N$.
The polar angle $\theta$ can be regarded as the longitude of the point $y$.

The canonical spherical Riemannian metric has the following expression
in the polar coordinates:
\begin{equation}
\mathrm{d} s^2 =\sum_{i,j=1}^n \mathfrak{g}_{ij}\; \mathrm{d} x_i \mathrm{d} x_j
=\mathrm{d} \rho^2  + (\sin \rho)^2 \mathrm{d} \theta^2.
\end{equation}
The operator $\Delta_{\mathfrak{g}}$ then takes the form
\begin{equation}
\Delta_{\mathfrak{g}}=\frac{\partial}{\partial \rho^2}
+(n-1) \cot \rho  \frac{\partial}{\partial \rho}
+\frac{1}{(\sin \rho)^2 } \Delta_{\theta},
\end{equation}
where $ \Delta_{\theta}$ denotes the Laplace-Beltrami operator on
$\mathbb{S}^{n-1}$.

Let us introduce the linear operator
\[
\mathcal{L}_\mathfrak{g}:= -\Delta_\mathfrak{g},
\]
 with domain
\begin{equation} \label{dom_L}
\mathcal{D}(\mathcal{L}_\mathfrak{g})
:=\{u \in L^2(\mathbb{S}^n) : \nabla_\mathfrak{g} u \in  \vec{L}^2(\mathbb{S}^n),
\; \Delta_\mathfrak{g} u \in L^2(\mathbb{S}^n) \}.
\end{equation}
It is known that $\mathcal{L}_\mathfrak{g}$ is self-adjoint
 \cite[Sect.~4.2]{Grigoryan09}. Moreover, the following results hold:

\begin{theorem} \label{Thm_deltag}
The spectrum of $\mathcal{L}_\mathfrak{g}$ with domain
 $\mathcal{D}(\mathcal{L}_\mathfrak{g})$ defined in \eqref{dom_L}  is
discrete and consists of an increasing sequence
$\{\lambda_{k}\}_{k=1}^\infty$ of non-negative eigenvalues (counted according to
multiplicity) such that
\[
\lim_{k\to \infty} \lambda_{k}  = +\infty.
\]
There is an orthonormal
basis $\{e_{k}\}_{k=1}^\infty$ in $L^2(\mathbb{S}^n)$ such that each function
$e_{k}$ is an eigenfunction
of $\mathcal{L}_\mathfrak{g}$ with the eigenvalue $\lambda_k$.
\end{theorem}

Let $\{E_\lambda \}_{\lambda \ge 0}$ denote the spectral resolution of
$\mathcal{L}_\mathfrak{g}$. We can define then for each $t \geq 0$,
\begin{equation} \label{Def_Pt}
P(t) :=\int_{0}^\infty e^{-t \lambda} \mathrm{d} E_\lambda, \; \;
\end{equation}
that constitutes a bounded linear operator acting on $L^2(\mathbb{S}^n)$
satisfying the  properties summarized below.


\begin{theorem} \label{Thm_heat_semigroup}
Let $P(t)$ be the operator defined by \eqref{Def_Pt}, then
\begin{itemize}
\item[(i)] For any $t \ge 0$, $P(t)$ is a bounded self-adjoint operator on
$L^2(\mathbb{S}^n)$, and
\begin{equation}
\|P(t)\|\le 1.
\end{equation}
\item[(ii)] The family $\{P(t)\}_{t\ge 0}$ satisfies the semigroup identity:
\begin{equation}
P(t) P(s) = P(t+s),
\end{equation}
for all $t,s \ge 0$.

\item[(iii)] The mapping $t \mapsto P(t)$ is strongly continuous on
$[0, \infty)$. That is, for any $t\ge 0$ and $f \in L^2(\mathbb{S}^n)$,
\begin{equation}
\lim_{s \to t} P(s) f = P(t) f,
\end{equation}
where the limit is understood in the norm of $L^2(\mathbb{S}^n)$.
In particular, for any $f \in L^2(\mathbb{S}^n)$,
\begin{equation}
\lim_{t \to 0^+} P(t) f = f.
\end{equation}

\item[(iv)] For all $f \in L^2(\mathbb{S}^n)$ and $t > 0$, we have that
 $P(t) f$  lies in $\mathcal{D}(\mathcal{L}_\mathfrak{g})$ and
\begin{equation}
\frac{\mathrm{d}}{\mathrm{d} t} (P(t) f)  = - \mathcal{L}_\mathfrak{g}(P(t) f).
\end{equation}
\end{itemize}
\end{theorem}

The above theorems are particular cases of results presented in
 \cite{Grigoryan09} for the Laplace operator defined on general
 weighted smooth manifolds \cite[Def.~3.17]{Grigoryan09}.
See \cite[Thm.~10.13]{Grigoryan09} for Theorem~\ref{Thm_deltag}
and \cite[Thm.~4.9]{Grigoryan09} for Theorem \ref{Thm_heat_semigroup}.

\subsection{Galerkin approximations of controlled semilinear heat equations on
$\mathbb{S}^n$}\label{Sec_optctr_man}

Given $\mathcal{L}_\mathfrak{g}=-\Delta_\mathfrak{g} $ with domain
$\mathcal{D}(\mathcal{L}_\mathfrak{g})$ given in \eqref{dom_L}, we consider
the following abstract controlled semilinear heat problem of the
form  \eqref{ODE} posed in $L^2(\mathbb{S}^n)$:
\begin{equation} \label{heat_eq}
\begin{gathered}
\frac{\mathrm{d} y}{\mathrm{d} t} = - \mathcal{L}_\mathfrak{g} \, y + F(y)
+ \mathfrak{C} (u(t)),  \quad t \in (0, T], \\
y(0) = x \; \in L^2(\mathbb{S}^n).
\end{gathered}
\end{equation}


In what follows we denote by $\mathcal{H}$ the space $L^2(\mathbb{S}^n)$.
Based on Theorem~\ref{Lem:uniform_in_u_conv} of Section~\ref{Sect_Galerkin},
we show the uniform convergence of Galerkin approximations  to \eqref{heat_eq}
associated with the reduced state space $\mathcal{H}_{N} \subset L^2(\mathbb{S}^n)$
defined by
\begin{equation} \label{Eq_Hn_heat}
\mathcal{H}_{N}  := \operatorname{span}\{e_k : k = 1, \dots, N\}, \; N\in \mathbb{Z}_+^\ast,
\end{equation}
in which the $e_k$'s denote the eigenfunctions of $-\mathcal{L}_\mathfrak{g}$
lying in $\mathcal{D}(\mathcal{L}_{\mathfrak{g}})$; see Theorem~\ref{Thm_deltag}.

The linear approximations $L_N$ of the operator $-\mathcal{L}_\mathfrak{g}$
are then naturally defined as
\begin{equation}
L_N:= \Pi_N \Delta_\mathfrak{g} \Pi_N: \mathcal{H} \to \mathcal{H}_N,
\end{equation}
where $\Pi_N$ denotes the orthogonal projector associated with $\mathcal{H}_N$.

Theorem~\ref{Lem:uniform_in_u_conv} leads then to the following corollary
about uniform convergence of Galerkin approximations of \eqref{heat_eq}.

\begin{corollary}\label{Cor:heat_Galerkin_approx}
Let $V$ be a Hilbert space. Assume that $F: L^2(\mathbb{S}^n) \to L^2(\mathbb{S}^n)$
and  $\mathfrak{C}: V \to L^2(\mathbb{S}^n)$ are both globally Lipschitz, and
$\mathfrak{C}(0) = 0$.  Assume the set of admissible controls $\mathcal{U}_{ad}$
is given by \eqref{Eq_U_bounded} with
$U$ therein being a compact subset of the Hilbert space~$V$ and with $q > 1$.

Then, for any $T > 0$ and any $(x,u)$ in $L^2(\mathbb{S}^n) \times \mathcal{U}_{ad}$,
the problem \eqref{heat_eq} admits a unique mild solution $y(\cdot; x, u)$
in $C([0,T],\mathcal{H})$, and its Galerkin approximation \eqref{ODE_Galerkin}
associated with the eigen-subspaces \eqref{Eq_Hn_heat} admits a unique solution
$y_N(\cdot; \Pi_N x, u)$ in  $C([0,T],\mathcal{H}_N)$ for each $N$ in $\mathbb{Z}_+^\ast$.
 Moreover,  the following uniform convergence result holds:
\begin{equation} \label{heat_eqn_uniform_in_u_conv}
\lim_{N\to \infty}  \sup_{u\in \mathcal{U}_{ad}}
\sup_{t \in [0, T]} \|y_N(t; \Pi_N x, u) - y(t; x,u)\|_{\mathcal{H}} = 0.
\end{equation}
\end{corollary}

\begin{proof}
We only need to check the conditions  (A0)--(A2),  (A6), and (A7) assumed
in Theorem~\ref{Lem:uniform_in_u_conv}. This is done below in four steps.
\medskip

\noindent\textbf{Step 1:} Checking (A0)--(A1). From Theorem~\ref{Thm_heat_semigroup},
we know that $-\mathcal{L}_\mathfrak{g}$ is the infinitesimal generator of the
$C_0$-semigroup of contractions, $\{P(t)\}_{t\ge 0}$, on $L^2(\mathbb{S}^n)$.

Since $-\mathcal{L}_\mathfrak{g}$ is self-adjoint, the operator $L_N$ is a
finite-rank diagonal operator acting on $\mathcal{H}$ and
we have for each $\phi$ in $\mathcal{H}$,
\begin{equation}
e^{t L_N} \phi := \sum_{k=1}^N e^{-t \lambda_k} \langle \phi,e_k\rangle_{\mathfrak{g}} \; e_k.
\end{equation}
It follows that each operator $L_N$ generates a $C_0$-semigroup of contractions
on $\mathcal{H}$, which will be denoted by $\{P_N(t)\}_{t\ge 0}$.
We have thus checked Assumptions (A0)--(A1) given in Section~\ref{Sect_Galerkin}
with $M=1$ and $\omega =0$, namely
\begin{equation} \label{Eq_control_linearflow_heat}
 \|P(t)\| \le 1 \quad \text{and} \quad \|P_N(t)\| \le 1, \quad N \geq 0, \;  \ge 0.
\end{equation}
\medskip

\noindent\textbf{Step 2:} Checking (A2). This condition results from the
self-adjointness of $-\mathcal{L}_\mathfrak{g}$. Indeed, for any given $\phi$
in $\mathcal{D}(\mathcal{L}_\mathfrak{g})$, since both $\phi$ and
$\Delta_\mathfrak{g}\phi$ belong to $L^2(\mathbb{S}^n)$, the following
expansions against the eigenbasis hold:
\begin{equation}
\phi = \sum_{i=1}^\infty a_i e_i, \quad
\Delta_\mathfrak{g} \phi  = \sum_{i=1}^\infty b_i e_i,
\end{equation}
where
\begin{equation}
a_i = \langle \phi, e_i \rangle_{\mathfrak{g}} ,  \quad
b_i = \langle \Delta_\mathfrak{g} \phi , e_i \rangle_{\mathfrak{g}}, \quad
i \in \mathbb{Z}_+^\ast.
\end{equation}
Note that
\begin{equation}
b_i = \langle \Delta_\mathfrak{g} \phi, e_i \rangle_{\mathfrak{g}}
=  \langle \phi, \Delta_\mathfrak{g} e_i \rangle_{\mathfrak{g}}
=  \lambda_i \langle \phi, e_i \rangle_{\mathfrak{g}}  = \lambda_i a_i.
\end{equation}
We get then that
\begin{equation}
\begin{aligned}
\|L_N \phi - \Delta_\mathfrak{g}\phi \|_{L^2(\mathbb{S}^n)}
&= \big\| \Pi_N \Delta_\mathfrak{g} \Big(\sum_{i=1}^N a_i e_i \Big)
 - \Delta_\mathfrak{g} \phi \big \|_{L^2(\mathbb{S}^n)} \\
&= \big\|  \sum_{i=1}^N \lambda_i a_i e_i
 - \sum_{i=1}^\infty b_i e_i \big \|_{L^2(\mathbb{S}^n)}
=  \big \|\sum_{i=N+1}^\infty b_i e_i \big \|_{L^2(\mathbb{S}^n)}
\end{aligned}
\end{equation}
and Assumption (A2) follows.
\medskip

\noindent\textbf{Step 3:} Checking (A6). Since $F$ and $\mathfrak{C}$
are globally Lipschitz, the existence of a unique mild solution to
\eqref{heat_eq} and to its Galerkin approximation \eqref{ODE_Galerkin}
follows directly from a classical fixed point argument and
standard Gronwall's estimates; see
e.g.~\cite[Prop.~4.3.3 and Thm.~4.3.4]{Cazenave_al98}.
In particular, by \eqref{Eq_control_linearflow_heat}, we obtain the following
a priori estimates  for all $t$ in $[0, T]$ and $N$ in $\mathbb{Z}_+^\ast$:
\begin{equation} \label{solution_bounds_heat_eq}
\begin{gathered}
\begin{aligned}
&\|y(t; x, u)\|_{L^2(\mathbb{S}^n)}  \\
&\le e^{\operatorname{Lip}(F)t}\|x\|_{L^2(\mathbb{S}^n)} + \int_0^t g(s) \mathrm{d} s
+ \operatorname{Lip}(F) \int_0^t g(s) e^{\operatorname{Lip}(F)(t-s)} \mathrm{d} s,
\end{aligned}\\
\begin{aligned}
& \|y_N(t; \Pi_N x, u)\|_{L^2(\mathbb{S}^n)}\\
& \le e^{\operatorname{Lip}(F)t}\|x\|_{L^2(\mathbb{S}^n)} + \int_0^t g(s) \mathrm{d} s
 +  \operatorname{Lip}(F) \int_0^t g(s) e^{\operatorname{Lip}(F)(t-s)} \mathrm{d} s,
\end{aligned}
\end{gathered}
\end{equation}
where
\[
g(s) =  \|F(0)\|_{L^2(\mathbb{S}^n)}
+ \operatorname{Lip}(\mathfrak{C}) \|u(s)\|_{L^2(\mathbb{S}^n)},
 \quad \text{for a.e. } s \in [0, T].
\]
Moreover, since by assumption $u(t)$ takes value in a compact thus bounded set
 $U$ for each $u \in \mathcal{U}_{ad}$, the a priori estimates
\eqref{solution_bounds_heat_eq} also ensure the required uniform boundedness
estimates \eqref{Eq_y_uniform-in-u_bounds} stated in Assumption (A6).
\medskip

\noindent\textbf{Step 4:} Checking (A7). Due to our assumptions and from what
precedes, the conditions of Lemma~\ref{Lem_examples} are satisfied and thus
Assumption (A7) is satisfied. The proof is complete.
\end{proof}

\begin{remark} \label{local_lipman} \rm
Corollary \ref{Cor:heat_Galerkin_approx} has been formulated in the case where
$F$ and $\mathfrak{C}$ are globally Lipschitz, but actually the conclusions
of this corollary still hold if these conditions are relaxed to be
locally Lipschitz  as long as Assumption (A6) is satisfied with the relevant
a priori estimates as a consequence of Theorem \ref{Lem:uniform_in_u_conv}.
\end{remark}


\begin{remark} \label{Rmk_heat_F} \rm
Similar to Remark~\ref{Rmk:time-dependent-F}, we note that
Corollary~\ref{Cor:heat_Galerkin_approx} still holds when the nonlinearity
$F$ depends also on time, i.e.,
$F: [0,T] \times L^2(\mathbb{S}^n) \to L^2(\mathbb{S}^n)$, and satisfies for
instance that $F(\cdot,y)
\in L^\infty(0,T; L^2(\mathbb{S}^n))$ for each $y\in L^2(\mathbb{S}^n)$,
$F(t,\cdot)$ is globally Lipschitz for almost every $t \in [0, T]$ and the
mapping $t\mapsto \operatorname{Lip}(F(t, \cdot))$ is in $L^\infty(0,T)$.
\end{remark}

\begin{remark} \label{Rmk_heat_general_metric} \rm
Note also that Corollary~\ref{Cor:heat_Galerkin_approx} still holds when
the semilinear heat problem \eqref{heat_eq} is posed on a general
$n$-dimensional Riemannian smooth and compact manifold $(\mathfrak{M}, \mathbf{g})$
without boundary, with the Riemannian metric $\mathbf{g}$ not limited thus
to $\mathfrak{g}$ defined in \eqref{Def_gij}. Similarly the case of semilinear
heat problem  posed on a non-empty relatively compact subset $\Omega$
of $(\mathfrak{M}, \mathbf{g})$ with homogenous Dirichlet boundary conditions
can also be dealt with.  This is because Theorems~\ref{Thm_deltag}
and \ref{Thm_heat_semigroup} still hold for such cases;
see again \cite[Thm.~4.9 and Thm.~10.13]{Grigoryan09}. In particular,
Corollary~\ref{Cor:heat_Galerkin_approx} holds when the Riemannian metric
 $\mathfrak{g}$ on $\mathbb{S}^n$ is replaced by another Riemannian metric
$\widetilde{\mathfrak{g}}$ and the Laplacian $\Delta_\mathfrak{g}$
in \eqref{heat_eq} is replaced by $\Delta_{\widetilde{\mathfrak{g}}}$ accordingly.
This is remark about the change of Riemannian metric is used in Sect.~\ref{Sec_EBM}
that follows.
\end{remark}

\subsection{Energy balance models} \label{Sec_EBM}

Energy balance models (EBMs) are among the simplest climate models that can
be used for the study of climate sensitivity.  They are formulated based on
the energy balance on the Earth surface \cite{North_al81,stephens2012update}
and have the Earth surface temperature as the only dependent variable.
 First made popular by the works \cite{Budyko69,Sellers69}, these models have
 been extensively studied since both analytically and numerically;
see e.g.~\cite{bermejo2009mathematical,North_al81,Roques_al14} and references
therein.

With suitable tuning of their parameters, EBMs that resolve the Earth's
land-sea geography and are forced by the seasonal insolation cycle have been
shown to mimic, to a certain extent, the observed zonal temperatures for the
observed present climate \cite{North_al83,crowley2000causes}.
Once EBMs are fitted to observations \cite{Sellers69,Ghil76,graves1993new}
or to simulations from general circulation models
(GCMs)\cite{hyde1989comparison,crowley2000causes}, they can be used to estimate
the temporal response patterns to various forcing scenarios; such a methodology
is of particular interest in the detection and attribution of climate
change \cite{stone2007detection}.

Depending on whether zonal or meridional averages are used, the modeled surface
temperature can either depend on the latitude only, or depend on both  the
latitude and the longitude, resulting respectively in  1D, or 2D models.
In the 2D case, the model is posed on the two-dimensional unit sphere
$\mathbb{S}^2$, and takes typically the following form \cite{North_al83}:
\begin{equation} \label{Eq_EBM}
\frac{\partial T(\xi,t)}{\partial t}
= \operatorname{div}_\mathfrak{g}( D(x) \nabla_{\mathfrak{g}} T(\xi, t) )
+ f(t, x, T(\xi,t)) - g(T(\xi,t)) + E(\xi,t),
\end{equation}
for $\xi \in \mathbb{S}^2$ and $t > 0$.
Here the gradient $\nabla_{\mathfrak{g}}$ and the divergence
$\operatorname{div}_\mathfrak{g}$ on the Riemannian manifold
$(\mathbb{S}^2, \mathfrak{g})$ are given respectively by \eqref{Eq_grad}
and \eqref{Eq_div}, and the Riemannian metric $\mathfrak{g}$ is given
by \eqref{Def_gij}.  The diffusion term
$\operatorname{div}_\mathfrak{g} ( D(x) \nabla_{\mathfrak{g}} T(\xi, t) )$
describes the redistribution of heat on the surface of the Earth by conduction
and convection, the reaction terms $f(t, x, T(\xi,t)) - g(T(\xi,t))$
express the balance between incoming and outgoing radiations, and $E(\xi,t)$
denotes an anthropogenic forcing. See Table~\ref{tab_EBM} for the precise
meaning of the symbols involved in  \eqref{Eq_EBM}.  We refer to
\cite{bermejo2009mathematical} for the rigorous approximation of
\eqref{Eq_EBM} via finite elements on manifolds.


\begin{table}[htb]
\caption{Glossary of model's parameters \& variables}
\label{tab_EBM}  
\begin{center}
\begin{tabular}{|cl|} 
\hline
Symbol & Interpretation \\ \hline
$\xi := (\rho, \theta)$ & $\rho \in (0, \pi)$ is the latitude and $\theta \in (-\pi, \pi)$, the longitude \\
%
$T(\xi,t)$ & sea surface temperature at $\xi,t$ \\
%
$x$ &  sine of the latitude, i.e. $x = \sin (\rho)$ \\
%
$D(x)$ &  diffusion coefficient for heat transport, zonally averaged \\
& and hence does not dependent on the longitude $\theta$ \\
%
$f(t, x, T(\xi,t))$ & incoming solar radiation \\
%
$g(T(\xi,t))$ &  outgoing infrared radiation \\
%
$E(\xi,t)$ &  forcing representing greenhouse gas emissions   \\
\hline
\end{tabular}
\end{center}
\end{table}


The functions $f(t, x, T(\xi,t))$ and $g(T(\xi,t))$ are typically of
 the  form \cite{Budyko69}
\begin{equation} \label{Eq_radiation}
\begin{gathered}
 f(t, x, T(\xi,t)) = Q S(x,t) (1 - \alpha(x,T)), \\
 g(T(\xi,t)) = a + b T(\xi,t).
\end{gathered}
\end{equation}
Here $Q$ is the so-called solar constant, $S(x,t)$ denotes a solar insolation
distribution function, $\alpha(x,T)$ denotes the albedo, and $a$ and $b$
are empirical constants typically estimated from satellite observations;
see e.g.~\cite{graves1993new}. We refer to \cite{alexeev2005polar} for the
calibration of other parameters including $Q$, or coefficients such as $S(x,t)$
or contained in $\alpha(x,T)$; see also \cite{Roques_al14}.

We also note that the LHS of \eqref{Eq_EBM} should be multiplied by a factor 
$\kappa(\xi)$, which measures the effective heat capacity per unit area. 
Here, we have assumed that $\kappa(\xi)$ is a constant which is taken to be 
$1$ after a scaling in the time variable.

As a preparation to cast a controlled version of \eqref{Eq_EBM} into the form 
of \eqref{heat_eq}, we will make use of a new Riemannian metric so that the 
diffusion term in \eqref{Eq_EBM} becomes simply the Laplician under this new metric.
 For this purpose, we assume that
\begin{itemize}

\item[(A9)] the diffusion coefficient $D(x)$ is $C^1$-smooth and is 
strictly positive.
\end{itemize}

 By introducing the new Riemannian metric
\begin{equation}
\widetilde{\mathfrak{g}} = \frac{1}{D(x)} \mathfrak{g},
\end{equation}
it is known that the Laplace operator under this new Riemannian metric is given by
\begin{equation}
\Delta_{\widetilde{\mathfrak{g}}} = \operatorname{div}_\mathfrak{g}
( D(x) \nabla_{\mathfrak{g}}).
\end{equation}
Therefore, \eqref{Eq_EBM} can be rewritten into the following form on
$(\mathbb{S}^2, \widetilde{\mathfrak{g}})$:
\begin{equation} \label{Eq_EBM_v2a}
\frac{\partial T(\xi,t)}{\partial t} = \Delta_{\widetilde{\mathfrak{g}}} T(\xi,t) + f(t, x, T(\xi,t)) - g(T(\xi,t)) + E(\xi,t).
\end{equation}

With this rewriting, we consider the operator 
$\mathcal{L}_{\widetilde{\mathfrak{g}}}=-\Delta_{\widetilde{\mathfrak{g}}}$ 
with domain $\mathcal{D}(\mathcal{L}_{\widetilde{\mathfrak{g}}})$ given by 
\eqref{dom_L} in which $\widetilde{\mathfrak{g}}$ replaces $\mathfrak{g}$.
We are now in position to apply the general results of Sect.~\ref{Sec_optctr_man} 
in particular Corollary \ref{Cor:heat_Galerkin_approx} to a contemporary problem 
related to geoengineering that we address here in the framework of optimal control 
of EBMs such as \eqref{Eq_EBM_v2a}.

\subsection{Optimal control of climate?}

In 1955, John von Neumann envisioned  that ``probably intervention in atmospheric
 and climate matters will come in a few decades, and will unfold on a scale 
difficult to imagine at present;'' see \cite{Neumann55}. As our planet enters 
a period of changing climate never before experienced in recorded human history,
 primarily caused by the rapid buildup of carbon dioxide in the atmosphere from 
the burning of fossil fuels, interest is growing in the potential for deliberate 
large-scale intervention in the climate system to counter climate change; 
see e.g.~\cite{NAP15b, NAP15a, Shepherd09}. Although we are still far away 
from large-scale implementation of what John von Neumann envisioned decades ago, 
the consideration of climate engineering --also known as geoengineering 
--is raising in the scientific community with
a literature that became more abundant on the topic over the recent years; 
see e.g.\ \cite{NAP15b,NAP15a, Lenton09,Shepherd09, Vaughan_al11}.

At the simplest level, the surface temperature of the Earth results from the 
net balance of incoming solar (shortwave) radiation
and outgoing terrestrial (longwave) radiation \cite{Kiehl97}. 
Proposed geoengineering methods attempt to rectify the current and potential 
future radiative imbalance and they are usually divided into two basic 
categories: (i) carbon dioxide removal techniques which remove CO$_2$ from the 
atmosphere to increase the  amount of longwave radiation emitted by the Earth; 
and (ii) solar radiation management techniques that reduce the amount of solar 
(shortwave) radiation absorbed by the Earth by reflecting a small percentage 
of the sun's light and heat back into space.

While a lot of efforts have been devoted to describing different geoengineering 
options in detail and discussing their advantages, effectiveness, potential 
side effects and drawbacks, still more understanding is required before any 
method could even be seriously considered for deployment on the requisite 
international scale \cite{Shepherd09}.  On the other hand, policies to reduce 
global greenhouse gas (GHG) emissions is a pressing topic on any political agenda, 
and uncertainties to climate change 
\cite{meinshausen2009greenhouse,murphy2004quantification} add to the difficulty 
in quantifying unambiguously the effects of forcing variations on the climate system.


From a mathematical perspective, since any geoengineering methods or GHG 
mitigation policies can be expressed as controls acting on the climate system, 
it is natural and important to investigate whether a given type of controls, 
corresponding e.g.~to one or a combination of several geoengineering methods, 
can drive the climate system from a given ``current'' state to a desired state 
over a targeted finite time horizon. This controllability aspect has indeed 
been investigated within the context of climatology based on some types 
of EBMs; see e.g.~\cite{Diaz94b, Diaz94}.

Given that any large-scale decision for addressing climate change have 
economic \cite{hallegatte2009strategies}, societal or physical constraints, 
it also seems natural to frame the problem as an optimal control of the climate 
system to seek for controls within a chosen set of geoengineering strategies 
that lead to the minimization of a relevant cost functional.  
To our knowledge, this optimal control perspective has not yet been investigated 
much from a fundamental viewpoint. In the following, we aim to provide a 
sufficiently general formulation for this purpose, based on the class of EBMs 
encompassed by \eqref{Eq_EBM}. The latter equation will serve as our 
underlying state equation in what follows.

Since EBMs are known to provide reliable models of the mean annual global 
temperature distribution around the globe 
\cite{hyde1989comparison,crowley2000causes,stone2007detection},
they constitute a natural laboratory for such an investigation before one 
moves onto more sophisticated and detailed climate models such as GCMs \cite{GCS08}. 
In that respect, it is also worth mentioning that EBMs can actually be derived 
from the thermodynamics equation of the atmosphere primitive equations via an 
averaging procedure \cite{Kiehl92}.  See also \cite{Brock13} for the design 
of optimal economic mitigation policies based on EBMs coupled with an economic 
growth model.

\subsection{Optimal control of EBMs: Convergence results of value functions}
\label{Sec_OC_EBM}

We formulate the optimal control of EBMs within the general setting of 
Sect.~\ref{Sect_Galerkin}, by relying on the properties of the heat semigroup 
on the sphere recalled in Sect.~\ref{Sec_optctr_man}, here generated by 
$-\mathcal{L}_{\widetilde{\mathfrak{g}}}$.

First, in order to allow for geoengineering strategies of different 
nature in different geographic regions, we consider a collection of open subsets
\[
\{\Omega_i \subset \mathbb{S}^2 : i = 1,\dots, M\},
\]
 where $M$ denotes the number of such strategies, one for each region $\Omega_i$,
with possible overlapping.


The set of admissible controls is defined as follows.  For region $\Omega_i$ 
we define the Hilbert space of functions
\begin{equation}
V_i=L^2(\Omega_i, \mathbb{R}^{n_i}),
\end{equation}
with $n_i$ some positive integer, and introduce
\begin{equation}
V := V_1 \times  \dots \times V_M.
\end{equation}
Consider for each $i$, $U_i$ to be a compact subset of $V_i$ and let us
introduce the set
\begin{equation}
U := \{v = (v_1, \dots, v_M) \in V :  v_i \in U_i, \; i = 1, \dots, M\}.
\end{equation}

Let the set of admissible controls be 
\begin{equation} \label{Eq_U_bounded2}
\mathcal{U}_{ad}:=\{u\in L^q(0,t_f; V): u(s) \in U \text{ a.e.}\}.
\end{equation}
where $q >  1$ is fixed.
Note that since each $V_i$ is a space of functions defined over a region
$\Omega_i$, an admissible control $u$ in $\mathcal{U}_{ad}$ is actually a
locally distributed control.  Note that given $u$ in $\mathcal{U}_{ad}$ and
$t$ in $(0,t_f)$, its $i^{{\rm th}}$-component $u_i(t)$ is a spatial function
that lies in $V_i$. We will denote hereafter by $u_i(t)[\xi]$ its value taken
at $\xi \in \mathbb{S}^2$.

Finally, we assume that the combined effects of the geoengineering strategies
 on the global temperature field $T(\xi,t)$, is represented via a nonlinear function
\begin{equation}
\begin{gathered}
G: \mathbb{R}^{n_1} \times \dots \times\mathbb{R}^{n_M} \to \mathbb{R}\\
 (\zeta_1,\dots,\zeta_M)\longmapsto G(\zeta_1,\dots,\zeta_M),
\end{gathered}
\end{equation}
that forces \eqref{Eq_EBM_v2a}. In practice, the modeler has to specify
the function $G$ (and $V$), depending on the geoengineering strategy or the
GHG mitigation policy adopted as well as the EBM retained. As explained below,
our framework ensures that a global Lipschitz  assumption
 on $G$ allows for convergence of
Galerkin approximations and thus provide a rigorous basis for a numerical
investigation of various control scenarios.
This can be relaxed to a local Lipschitz  assumption as long
as a priori error estimates are available to ensure Assumption (A6);
see Remark \ref{local_lipman}.

We consider thus, for each $u$ in  $\mathcal{U}_{ad}$, the following controlled
 version of the EBM \eqref{Eq_EBM_v2a} which writes for each 
$\xi \in \mathbb{S}^2$ and $t \in [0, t_f]$ as,
\begin{equation} \label{Eq_EBM_v2}
\begin{aligned}
\frac{\partial T(\xi,t)}{\partial t}
&= \Delta_{\widetilde{\mathfrak{g}}} T(\xi,t) + f(t, x, T(\xi,t)) - g(T(\xi,t))
 + E(\xi,t)\\
&\quad + G(\widetilde{u}_1(t,\xi),\dots, \widetilde{u}_M(t,\xi)),
\end{aligned}
\end{equation}
supplemented with an initial condition $T_0$ in $L^2(\mathbb{S}^2).$  Here
\begin{equation}
\widetilde{u}_i(t,\xi)=
\begin{cases}
u_i(t)[\xi], & \text{if } \xi  \in \Omega_i,\\
0, & \text{otherwise}.
\end{cases}
\end{equation}
To recast the IVP associated with \eqref{Eq_EBM_v2} into the abstract
form \eqref{heat_eq}, we introduce the following function spaces
\begin{equation}
\mathcal{H}:= L^2(\mathbb{S}^2), \quad
\mathcal{H}_1 := \mathcal{D}(\mathcal{L}_{\widetilde{\mathfrak{g}}}),
\end{equation}
where $\mathcal{D}(\mathcal{L}_{\widetilde{\mathfrak{g}}})$ is defined in \eqref{dom_L}.

We make the following assumption.
\begin{itemize}

\item[(A10)]  The functions $f$ and $g$ take the forms given by
 \eqref{Eq_radiation}, where the solar insolation distribution function $S$ 
therein lives in the space $L^\infty((0, \infty), L^\infty(\mathbb{S}^2))$ 
and the albedo $\alpha(x,T)$ is a continuous, piecewise-linear ramp function 
such as given in \cite[Eq.~(2a)]{Ghil76} or \cite[Eq.~(2.2)]{Roques_al14}.  
The GHG emission term $E$ belongs to 
$L^1_{\mathrm{loc}}((0, \infty), L^2(\mathbb{S}^2))$.

\end{itemize}
We define now the nonlinearity $F:  [0,t_f] \times \mathcal{H}  \to \mathcal{H}$ to be:
\begin{equation} \label{Eq_EBM_F}
F(t, v)[\xi] :=  f(t, x, v(\xi)) - g(v(\xi)) + E(\xi,t),
\end{equation}
for all   $v$ in $\mathcal{H}$, and a.e.~$\xi$  in $\mathbb{S}^2$, $t \in [0, t_f]$.

Under Assumption  (A10), for each $v$ in $\mathcal{H}$ and almost every 
$t\in [0, t_f]$, $F(t,v)$ belongs to $\mathcal{H}$.

Finally, we define the nonlinear operator $\mathfrak{C}: V \to \mathcal{H}$ 
associated with the control to be:
\begin{equation} \label{Eq_EBM_C}
\mathfrak{C} (v)[\xi] :=  G(\widetilde{v}_1(\xi),\dots,\widetilde{v}_M(\xi)),  \quad  \text{ for all } v \in V, \text{ and a.e.} \; \xi \in \mathbb{S}^2,
\end{equation}
with
\begin{equation}
\widetilde{v}_i(\xi)=
\begin{cases}
v_i(\xi), & \text{if } \xi  \in \Omega_i,\\
0, &\text{otherwise}.
\end{cases}
\end{equation}


Then, \eqref{Eq_EBM_v2} can be rewritten as \eqref{heat_eq} of 
Sect.~\ref{Sec_optctr_man}, with the (nonlinear) operators $F$ and 
$\mathfrak{C}$ defined above. Having the purpose in mind of driving the 
temperature field $T(\xi,t)$ to a state sufficiently close to a specified 
profile at the final time $t_f$, while keeping the control cost ``low'',
we consider the cost functional:
\begin{equation} \label{Eq_EBM_J}
J(T_0, u) = \int_{0}^{t_f} \Big( \frac{1}{2} \|T(\cdot, t; T_0, u)
- T_d\|_{\mathcal{H}}^2 + \frac{\mu}{2} \|u(\cdot, t)\|_{V}^2 \Big) \mathrm{d} t,   \quad
 T_0 \in \mathcal{H}, \; \mu \geq 0.
\end{equation}
Here $T_d$  denotes the targeted temperature field over the globe
(that lies in $\mathcal{H}$) and $T(\cdot, t; T_0, u)$ denotes the mild solution
to \eqref{Eq_EBM_v2} that emanates from $T_0$.


The associated optimal control problem reads then:
\begin{equation} \label{P_EBM}
\begin{gathered}
\min  J(T_0,u)  \quad \text{s.t.}  \quad (T, u) \in L^2(0,T; \mathcal{H})
\times  \mathcal{U}_{ad} \text{ solves  Eq.~\eqref{Eq_EBM_v2}}  \\
 \text{subject to the initial condition }  T(\cdot, 0)  = T_0 \in \mathcal{H}.
\end{gathered}
\end{equation}


\subsection*{Approximation of the value function and error estimates about 
the optimal control}  
Note that thanks to Assumption  (A10), the nonlinearity $F$ defined in 
\eqref{Eq_EBM_F} satisfies the conditions required in Remark~\ref{Rmk_heat_F}. 
If we assume furthermore that the nonlinear operator $\mathfrak{C}$ defined by 
\eqref{Eq_EBM_C} to be globally Lipschitz as a mapping from $V$ to $\mathcal{H}$ 
(and $\mathfrak{C}(0) = 0$) then by Corollary \ref{Cor:heat_Galerkin_approx} 
and Remarks~\ref{Rmk_heat_F}--\ref{Rmk_heat_general_metric}, 
the uniform convergence result given by \eqref{heat_eqn_uniform_in_u_conv} 
in Corollary~\ref{Cor:heat_Galerkin_approx} holds for the IVP associated with 
\eqref{Eq_EBM_v2}. Namely,
\begin{equation} \label{Cve_y}
\lim_{N\to \infty}  \sup_{u\in \mathcal{U}_{ad}}
\sup_{t \in [0, T]} \|y_N(t; \Pi_N x, u) - y(t; x,u)\|_{\mathcal{H}} = 0,
\end{equation}
where $y_N(\cdot; \Pi_N x, u)$ denotes the solution to the Galerkin
approximation of ~\eqref{Eq_EBM_v2} associated with the eigen-subspace
spanned by the first $N$ eigenfunctions of the Laplacian
$\Delta_{\widetilde{\mathfrak{g}}}$.

Note also that Condition \eqref{C1} on the cost functional $J$ defined 
in \eqref{Eq_EBM_J} is clearly satisfied. Then, Theorem~\ref{Thm_cve_Galerkin_val} 
applies if we assume furthermore that there exists for each pair $(t,x)$ a  
minimizer $u_{t,x}^*$ (resp.~$u_{t,x}^{N,*}$) in $\mathcal{U}_{ad}[t,T]$ of 
the minimization problem in \eqref{subEq1} (resp.~in \eqref{subEq2}) 
associated here with the optimal control problem\eqref{P_EBM}. 
Thus, for any $x$ in $\mathcal{H}$, it holds that
\begin{equation} \label{Cve_v}
\lim_{N \to \infty} \sup_{t \in [0, T]} |v_N(t,\Pi_N x) - v(t,x)| = 0.
\end{equation}
Observe that since  $\mathfrak{C}$ is globally Lipschitz, Assumption (A10)
 leads to simple a priori error estimates such as \eqref{solution_bounds_heat_eq},
showing thus that Assumption (A6) is satisfied; see also Remark \ref{Rmk_heat_F}.
The other conditions in Assumption {\rm (A8)} of Sect.~\ref{Sec_Err_estimates}
are trivially satisfied here and thus the error estimates of
Sect.~\ref{Sec_Err_estimates} hold. In particular Corollary \ref{Lem_controller_est}
applies with $q=2$ and $\sigma=\mu/2$ which, using the notations of this corollary,
leads to
\begin{equation} \label{Err_estu}
\begin{aligned}
&\|u^\ast - u^\ast_{N}\|_{L^2(0,T; V)}^2 \\
& \le \frac{4\mathcal{C}+4\|T_d\|_{\mathcal{H}}}{\mu}
[\sqrt{T} + \gamma T ] \Bigl( \| \Pi_N^\perp y(\cdot;u^*)\|_{L^2(0,T; \mathcal{H})}
+ 2 \|  \Pi_N^\perp y (\cdot; u^{*}_{N})\|_{L^2(0,T; \mathcal{H})} \Bigr),
\end{aligned}
\end{equation}
after a simple estimate  of $\operatorname{Lip}(\mathcal{G}\vert_{\mathfrak{B}})$
 where $\mathcal{G}(y)=\|y-T_d\|_{\mathcal{H}}^2$, $y \in \mathcal{H}$.

With the rigorous convergence results \eqref{Cve_y} and \eqref{Cve_v}  
and error estimate  \eqref{Err_estu}, the numerical approximation of solutions 
to \eqref{P_EBM} becomes affordable via e.g.~a Pontryagin-Maximum-Principle 
approach applied to Galerkin approximations \cite{CL15} of Eq.~\eqref{Eq_EBM} 
built here from spherical harmonics.
Indeed, a relatively realistic EBM such as given by \eqref{Eq_EBM} is known 
to be simulated accurately out of few spherical harmonics (typically 
$20 \leq N \leq 30$); see e.g.~\cite{North_al83,hyde1989comparison}.


\section{Concluding remarks} \label{Sect_concluding_remarks}

Thus, by means of rigorous Galerkin approximations of nonlinear evolution equations 
in Hilbert spaces, this article provides a natural framework for the synthesis of 
approximate optimal controls, along with approximations of the value functions.
 The framework opens up several possible directions for future research. 
We outline some of these issues below.

1. The usage of spectral methods for solving more complex climate models 
than EBMs considered in Sect.~\ref{Sec_appl} is standard.
By its natural assumptions to verify in practice, the framework presented above 
makes possible to address  the problem of geoengineering strategies or GHG 
mitigation policies in terms of optimal control of Galerkin approximations of 
such models, enabling thus, at least theoretically, to reduce the dimension of 
the problem.
However, very often these models include e.g.~nonlinear advection terms that 
require to deal with a loss of regularity. Our framework needs thus to be amended 
to deal with such a situation.  The use of interpolated spaces to deal with 
the loss of regularity and formulations of the Trotter-Kato theorem exploiting
 Gelfand triple are natural tools to cope with this difficulty. Analogues of 
Theorems \ref{Lem:uniform_in_u_conv} and  \ref{Thm_cve_Galerkin_val}, as well 
as Corollary \ref{Lem_controller_est}, seem thus to be reasonably accessible 
within this approach.  This way, more realistic models, including e.g.~the 
coupling of an EBM with a deep ocean such as dealt with in \cite{diaz2014multiple}, 
could be considered. Similarly, the inclusion of more realistic dynamic boundary 
conditions for such systems could benefit from the approximate controllability 
study of \cite{bejenaru2001abstract}.

2. Another promising direction  is the synthesis of (approximate) optimal controls 
in a feedback form from the Hamilton-Jacobi-Bellman (HJB)  equation associated 
with Galerkin approximations \cite{KroenerKunischZidani2015,GarckeKroener2016}.  
This is particularly relevant for the optimal control of systems near the 
first criticality in which only very few 
modes\footnote{Such as a pair of modes in the case of a Hopf bifurcation 
\cite{ma2005bifurcation}.} 
have lost their stability and where Galerkin approximations are very often useful 
to approximate the dynamics near the bifurcated states \cite{dijkstra_al16} 
although center manifold reduction techniques lead often to further reducing the 
number of resolved modes needed to approximate accurately the dynamics 
\cite{ma2005bifurcation,PTD-MW,CLW15_vol1}.
We refer to \cite{CKL17_DDE} for a first study along this direction, 
in the context of a Hopf bifurcation arising in a nonlinear delay differential 
equation (DDE).

3. However, far from the first criticality or when the nonlinear effects get 
amplified  a larger number of modes is required to dispose of good Galerkin 
approximations of, already,  the uncontrolled dynamics; see \cite{CL15,CLW15_vol2}.  
The numerical burden of the synthesis of controls at a nearly optimal cost
--by solving the HJB equation corresponding to the Galerkin approximation-- 
becomes then quickly prohibitive, especially for the case of locally distributed 
controls; see \cite[Sect.~7]{CL15}.  One avenue to deal with reduced state space 
of further reduced dimension, is to search for high-mode parameterizations that 
help reduce the residual energy contained in the unresolved modes, i.e.~to 
reduce the RHS of \eqref{Est_contr_diff} involving the terms 
$\| \Pi_N^\perp y(\cdot;u^*)\|_{L^2(0,T; \mathcal{H})}$ and 
$\|  \Pi_N^\perp y (\cdot; u^{*}_{N})\|_{L^2(0,T; \mathcal{H})}$ 
in Corollary \ref{Lem_controller_est}. The theory of parameterizing manifolds 
(PM) \cite{CL15,CL16post,CLMcW2016} allows for such a reduction leading typically 
to approximate controls  coming with error estimates that introduce multiplying 
factors $0\leq Q <1$
in the ``RHS-like'' of \eqref{Est_contr_diff}; 
see \cite[Theorem 1 \& Corollary 2]{CL15}. The combination of the Galerkin 
framework introduced here with the PM reduction techniques of \cite{CL15} 
constitutes thus an idea that is worth pursuing.

4. Finally,  we emphasize that the framework introduced here is not limited 
to Galerkin approximations built from eigenfunctions of the linear part. 
This is particularly useful for evolution equations for which such eigenfunctions 
are not the best choice to build Galerkin approximations. 
As explained in \cite{CGLW15}, systems of nonlinear DDEs constitute such a 
type of evolution systems. The optimal control of systems of nonlinear DDEs 
may thus benefit from the framework introduced here and will be pursued elsewhere. 
The work \cite{CKL17_DDE} illustrates promising results exploiting this idea.
Such an approach may be also relevant to study the possible impact of 
geoengineering strategies or GHG mitigation policies on large-scale 
climatic phenomena such as the El Ni\~no--Southern Oscillation (ENSO) and 
for which DDEs are known to provide good models able to capture some of the 
essential features of ENSO's irregularity;  see 
\cite{Chek_al14_RP,CGN17, neelin1998enso,Tzip_al94}.


\section{Appendix: Existence of optimal controls}\label{Sec_existence_opt_contr}

We recall hereafter some standard sufficient conditions for the existence of
 optimal controls. Our approach follows
\cite{HPUU09} that we adapt to our framework.
Let $\mathcal U:=L^q(0,T;U)$ with $q\geq 1$, with here $U$ denoting a bounded,
 closed and convex subset of a separable Hilbert space $V$.
In particular,  $\mathcal U$ is also bounded, closed and convex.

Let $Y$ denote a separable Hilbert space. Let us assume that we can write 
the state equation in the form
\begin{align}\label{state-equation}
 \mathcal{M}(y,u)=0,
\end{align}
with $ \mathcal{M}\colon Y \times  \mathcal{U} \to Z$ a continuous mapping 
taking values in a Hilbert space $Z$. In practice, the mapping $\mathcal{M}$ 
characterizes the model equation and involves, typically, differential operators.

The optimal control problem reads as follows.
\begin{align}\label{problem}
 \min_{(y,u) \in Y \times \mathcal U} J(y,u),\quad \text{subject to } 
  \mathcal{M}(y,u) =0.
\end{align}

Existence to this optimal control problem can be ensured under conditions 
grouped into the following assumption.
\begin{itemize}
\item[(A11)]
 \begin{itemize}
  \item[(i)] The state equation \eqref{state-equation} has a bounded
 solution operator
 \begin{equation}
\begin{gathered}
 \mathcal{U} \to Y, \\
 u\mapsto y(u).
 \end{gathered}
\end{equation}
  \item[(ii)] The mapping
  \begin{equation}
\begin{gathered}
\mathcal{M}:  Y \times \mathcal{U} \to Z,\\
(y,u) \longmapsto \mathcal{M}(y,u),
\end{gathered}
\end{equation}
 is continuous for the weak topology.
  \item[(iii)] The cost function $J\colon Y\times  \mathcal{U} \to \mathbb{R}^+$
is weakly lower semicontinuous.
 \end{itemize}
\end{itemize}

Note that Assumption (A11)(iii) is satisfied if $J$ is convex and continuous.

We introduce the feasible set
\begin{equation}
F_{\text{ad}}:=\{ (y,u) \in Y \times \mathcal U  : \mathcal{M}(y,u)=0 \}.
\end{equation}

\begin{definition} \rm 
 The pair $(\bar y,\bar u) \in Y \times \mathcal U$ is called a solution
 of \eqref{problem} if
 \begin{align}
 J(\bar u , \bar y) \le J(y,u) \quad \text{for all } (y,u) \in F_{\text{ad}}.
 \end{align}
\end{definition}

\begin{theorem}
 Under Assumption {\rm (A11)}, problem \eqref{problem} has a non-empty 
set of solutions.
\end{theorem}

\begin{proof}
 The proof is classical. We present only a brief sketch; e.g.\ 
\cite[Sect.~1.5.2]{HPUU09}.
 Since $J\ge 0$ and $F_{\text{ad}}$ is nonempty, the infimum
 exists  and there is a minimizing sequence $(y_k,u_k) \subset F_{\text{ad}}$ with 
$  J^*:=\lim_{k\to \infty} J(y_k,u_k)$.
 Furthermore, $(u_k)$ is bounded as a sequence in $\mathcal{U}$, and by 
Assumption (A11)(i) the sequence $(y_k)$ is bounded. Thus, by reflexivity 
of $L^2(0,T;\mathcal{H})\times Y$ we can select a subsequence that converges weakly 
to some limit $(\bar u,\bar y)$.
 Since $\mathcal U$ is convex and closed, we have that $\bar u$  lies in 
$\mathcal U$, and together with Assumption (A11)(ii) we have that the set 
$F_{\text{ad}}$ is sequentially weakly closed; hence, we have 
$(\bar y, \bar u) \in F_{\text{ad}}$. With Assumption (A11)(iii) we obtain 
the assertion by a classical argument.
\end{proof}

\subsection*{Acknowledgments}
The authors are grateful to the referees for their comments and for having
 pointed out relevant references for Sect.~\ref{Sec_appl}.
This work has been partially supported by the Office of Naval Research (ONR) 
Multidisciplinary University Research Initiative (MURI) grant 
N00014-12-1-0911 and N00014-16-1-2073 (MDC), and by the National Science 
Foundation grants DMS-1616981 (MDC) and DMS-1616450 (HL). 
MDC and AK were supported by the project ``Optimal control of partial 
differential equations using parameterizing manifolds, model reduction, 
and dynamic programming'' funded by the  Foundation Hadamard/Gaspard Monge 
Program for Optimization and Operations Research (PGMO).


\begin{thebibliography}{10}

\bibitem{alexeev2005polar}
V.  A. Alexeev, P.L. Langen,  J. R. Bates;
\newblock Polar amplification of surface warming on an aquaplanet in ``ghost
  forcing`` experiments without sea ice feedbacks.
\newblock {\em Climate Dynamics}, 24(7-8):655--666, 2005.

\bibitem{Alt_al89}
W.~Alt, U.~Mackenroth;
\newblock Convergence of finite element approximations to state constrained
  convex parabolic boundary control problems.
\newblock {\em SIAM J. Control Optim.}, 27:718--736, 1989.

\bibitem{Banks_al84}
H.~T. Banks, K.~Kunisch;
\newblock The linear regulator problem for parabolic systems.
\newblock {\em SIAM J. Control Optim.}, 22:684--698, 1984.

\bibitem{bejenaru2001abstract}
I.~Bejenaru, J.~I. D{\'\i}az, I.~I. Vrabie;
\newblock An abstract approximate controllability result and applications to
  elliptic and parabolic systems with dynamic boundary conditions.
\newblock {\em Electron.~J.~Diff.~Eqns.}, 2001(50):1--19, 2001.

\bibitem{bensoussan2007representation}
A.~Bensoussan, G.~Da~Prato, M. C. Delfour, S.~Mitter;
\newblock {\em Representation and Control of Infinite Dimensional Systems}.
\newblock Springer Science \& Business Media, 2007.

\bibitem{bermejo2009mathematical}
R.~Bermejo, J.~Carpio, J. I. D{\'\i}az, L.~Tello;
\newblock Mathematical and numerical analysis of a nonlinear diffusive climate
  energy balance model.
\newblock {\em Mathematical and Computer Modelling}, 49(5):1180--1210, 2009.

\bibitem{Brezis10}
H.~Br{\'e}zis;
\newblock {\em {Functional Analysis, Sobolev Spaces and Partial Differential
  Equations}}.
\newblock Springer, 2010.

\bibitem{Brock13}
W.~A. Brock, G.~Engstr{\"o}m, D.~Grass, A.~Xepapadeas;
\newblock Energy balance climate models and general equilibrium optimal
  mitigation policies.
\newblock {\em J. Economic Dynamics and Control}, 37:2371--2396, 2013.

\bibitem{Budyko69}
M.~I. Budyko;
\newblock The effect of solar radiation variations on the climate of the
  {E}arth.
\newblock {\em Tellus}, 21:611--619, 1969.

\bibitem{Cazenave_al98}
T.~Cazenave, A.~Haraux;
\newblock {\em {An Introduction to Semilinear Evolution Equations}}, volume~13
  of {\em Oxford Lecture Series in Mathematics and its Applications}.
\newblock The Clarendon Press, Oxford, 1998.

\bibitem{CGLW15}
M.~D. Chekroun, M.~Ghil, H.~Liu, S.~Wang;
\newblock Low-dimensional {G}alerkin approximations of nonlinear delay
  differential equations.
\newblock {\em Disc. Cont. Dyn. Sys.~A}, 36(8):4133--4177, 2016.

\bibitem{CKL17_DDE}
M.~D. Chekroun, A.~Kr\"oner, H.~Liu;
\newblock Galerkin approximations for the optimal control of nonlinear delay
  differential equations.
\newblock {\em submitted}, 2017.
\newblock https://arxiv.org/abs/1706.02360 {arXiv:1706.02360}.

\bibitem{CL15}
M.~D. Chekroun, H.~Liu;
\newblock {F}inite-horizon parameterizing manifolds, and applications to
  suboptimal control of nonlinear parabolic {PDEs}.
\newblock {\em Acta Applicandae Mathematicae}, 135(1):81--144, 2015.

\bibitem{CL16post}
M.~D. Chekroun, H.~Liu;
\newblock {Post-processing finite-horizon parameterizing manifolds for optimal
  control of nonlinear parabolic PDEs}.
\newblock In {\em 2016 IEEE 55th Conference on Decision and Control (CDC)},
  pages 1411--1416. IEEE, 2016.

\bibitem{CLW15_vol1}
M.~D. Chekroun, H.~Liu, S.~Wang;
\newblock {\em {Approximation of Stochastic Invariant Manifolds: Stochastic
  Manifolds for Nonlinear SPDEs I}}.
\newblock Springer Briefs in Mathematics, Springer, New York, 2015.

\bibitem{CLW15_vol2}
M.~D. Chekroun, H.~Liu, S.~Wang;
\newblock {\em {Stochastic Parameterizing Manifolds and Non-Markovian Reduced
  Equations: Stochastic Manifolds for Nonlinear SPDEs II}}.
\newblock Springer Briefs in Mathematics, Springer, New York, 2015.

\bibitem{Chek_al14_RP}
M.~D. Chekroun, J.~D. Neelin, D.~Kondrashov, J.~C. McWilliams, M.~Ghil;
\newblock {Rough parameter dependence in climate models: The role of
  Ruelle-Pollicott resonances}.
\newblock {\em Proc. Natl. Acad. Sci. USA}, 111(5):1684--1690, 2014.

\bibitem{CGN17}
M. D. Chekroun, M.~Ghil, J.~D. Neelin;
\newblock {Pullback attractor crisis in a delay differential ENSO model}.
\newblock In A.~Tsonis, editor, {\em {Advances in Nonlinear Geosciences, to
  appear}}. Springer, 2017.

\bibitem{CLMcW2016}
M. D. Chekroun, H.~Liu, J. C. McWilliams;
\newblock The emergence of fast oscillations in a reduced primitive equation
  model and its implications for closure theories.
\newblock {\em Computers \& Fluids}, 151:3--22, 2017.

\bibitem{NAP15b}
National~Research Council;
\newblock {\em Climate Intervention: Carbon Dioxide Removal and Reliable
  Sequestration}.
\newblock National Academies Press, 2015.

\bibitem{NAP15a}
National~Research Council;
\newblock {\em Climate Intervention: Reflecting Sunlight to Cool Earth}.
\newblock National Academies Press, 2015.

\bibitem{crowley2000causes}
T. J. Crowley.
\newblock Causes of climate change over the past 1000 years.
\newblock {\em Science}, 289(5477):270--277, 2000.

\bibitem{deckelnick2004semidiscretization}
K.~Deckelnick, M.~Hinze.
\newblock {Semidiscretization and error estimates for distributed control of
  the instationary Navier-Stokes equations}.
\newblock {\em Numerische Mathematik}, 97(2):297--320, 2004.

\bibitem{Diaz94b}
J.~I. D{\'\i}az.
\newblock Approximate controlability for some simple climate models;
\newblock In {\em Environment, economic and their mathematical models (J. I.
  D{\'\i}az and J. L. Lions, eds)}, Research Notes in Applied Mathematics, no.
  35, pages 29--43. Masson, Paris, France, 1994.

\bibitem{Diaz94}
J.~I. D{\'\i}az.
\newblock Controllability and obstruction for some non linear parabolic
  problems in climatology;
\newblock {\em Modelado de Sistemas en Oceanograf{\'\i}a, Climatolog{\'\i}a y
  Ciencias Medio Ambientales (C. Pares and A. Valle, eds), Universidad de
  M{\'a}laga}, pages 43--58, 1994.

\bibitem{diaz2014multiple}
J.~I. D{\'\i}az, A.~Hidalgo, L.~Tello;
\newblock Multiple solutions and numerical analysis to the dynamic and
  stationary models coupling a delayed energy balance model involving latent
  heat and discontinuous albedo with a deep ocean.
\newblock {\em Proc. R. Soc. A}, 470(2170), 2014.

\bibitem{Diaz98}
J.I. D{\'\i}az, G.~Hetzer;
\newblock A quasilinear functional reaction-diffusion equation arising in
  climatology.
\newblock In {\em {E}quations aux d{\'{e}}riv{\'{e}}es partielles et
  applications (Articles d{\'{e}}di{\'{e}}s {\`{a}} J.-L. Lions)}, pages
  461--480. Gauthier-Villars ({\'E}ditions Scientifique et M{\'{e}}dicales
  Elsevier), 1998.

\bibitem{dijkstra_al16}
H. A. Dijkstra, A.~Tantet, J.~Viebahn, E.~Mulder, M.~Hebbink, D.~Castellana,
  H.~van~den Pol, J.~Frank, S.~Baars, F.~Wubs, M. D. Chekroun, and Ch. Kuehn;
\newblock A numerical framework to understand transitions in high-dimensional
  stochastic dynamical systems.
\newblock {\em Dynamics and Statistics of the Climate System}, 1(1):dzw003,
  2016.

\bibitem{Fattorini99}
H.~O. Fattorini;
\newblock {\em {Infinite Dimensional Optimization and Control Theory}},
  volume~62 of {\em Encyclopedia of Mathematics and its Applications}.
\newblock Cambridge University Press, 1999.

\bibitem{Ferretti97}
R.~Ferretti.
\newblock {Internal approximation schemes for optimal control problems in
  Hilbert spaces}.
\newblock {\em J. Mathematical Systems Estimation and Control}, 7:1--25, 1997.

\bibitem{Fur00}
A.~V. Fursikov;
\newblock {\em {Optimal Control of Distributed Systems: Theory and
  Applications}}, volume 187 of {\em Translations of Mathematical Monographs}.
\newblock American Mathematical Society, 2000.

\bibitem{GarckeKroener2016}
J.~Garcke, A.~Kr{\"o}ner;
\newblock {Suboptimal feedback control of PDEs by solving HJB equations on
  adaptive sparse grids}.
\newblock {\em Journal of Scientific Computing}, pages 1--28, 2016.

\bibitem{Ghil76}
M.~Ghil;
\newblock {Climate stability for a Sellers-type model}.
\newblock {\em J. Atmos. Sci.}, 33:3--20, 1976.

\bibitem{GCS08}
M.~Ghil, M.~D. Chekroun, E.~Simonnet;
\newblock Climate dynamics and fluid mechanics: Natural variability and related
  uncertainties.
\newblock {\em Physica D: Nonlinear Phenomena}, 237(14):2111--2126, 2008.

\bibitem{Gibson79}
J.~S. Gibson;
\newblock {The Riccati integral equations for optimal control problems on
  Hilbert spaces}.
\newblock {\em SIAM J. Control Optim.}, 17:537--565, 1979.

\bibitem{Goldstein85}
J.~A. Goldstein;
\newblock {\em {Semigroups of Linear Operators and Applications}}.
\newblock Oxford University Press, 1985.

\bibitem{graves1993new}
C.E. Graves, W.-H. Lee, G.R. North;
\newblock New parameterizations and sensitivities for simple climate models.
\newblock {\em Journal of geophysical research}, 98(D3):5025--5036, 1993.

\bibitem{Grigoryan09}
A.~Grigor'yan;
\newblock {\em {Heat Kernel and Analysis on Manifolds}}.
\newblock American Mathematical Soc., 2009.

\bibitem{hallegatte2009strategies}
S.~Hallegatte;
\newblock Strategies to adapt to an uncertain climate change.
\newblock {\em Global environmental change}, 19(2):240--247, 2009.

\bibitem{HPUU09}
M.~Hinze, R.~Pinnau, M.~Ulbrich, S.~Ulbrich;
\newblock {\em {Optimization with PDE Constraints}}, volume~23 of {\em
  Mathematical Modeling: Theory and Applications}.
\newblock Springer, 2009.

\bibitem{hyde1989comparison}
W. T. Hyde, T. J. Crowley, K.-Y. Kim, G. R. North;
\newblock {Comparison of GCM and energy balance model simulations of seasonal
  temperature changes over the past 18 000 years}.
\newblock {\em Journal of Climate}, 2(8):864--887, 1989.

\bibitem{Kiehl92}
J.~T. Kiehl;
\newblock Atmospheric general circulation modeling.
\newblock In {\em Climate system modeling (K. E. Trenberth, ed.)}, pages
  317--370. Cambridge University Press, 1992.

\bibitem{Kiehl97}
J.~T. Kiehl, K.~E. Trenberth;
\newblock Earth's annual global mean energy budget.
\newblock {\em Bull. Am. Meteorol. Soc.}, 78:197--208, 1997.

\bibitem{knowles1982finite}
G.~Knowles;
\newblock Finite element approximation of parabolic time optimal control
  problems.
\newblock {\em SIAM Journal on Control and Optimization}, 20(3):414--427, 1982.

\bibitem{KroenerKunischZidani2015}
A.~Kr{\"o}ner, K.~Kunisch, H.~Zidani;
\newblock Optimal feedback control for undamped wave equations by solving a
  {HJB} equation.
\newblock {\em ESAIM Control Optim. Calc. Var.}, 21(2):442--464, 2015.

\bibitem{lasiecka1980unified}
I.~Lasiecka;
\newblock Unified theory for abstract parabolic boundary problems-a semigroup
  approach.
\newblock {\em Applied mathematics \& optimization}, 6(1):287--333, 1980.

\bibitem{lasiecka1987regulator}
I.~Lasiecka, R.~Triggiani;
\newblock {The regulator problem for parabolic equations with {D}irichlet
  boundary control}.
\newblock {\em Applied Mathematics and Optimization}, 16(1):147--168, 1987.

\bibitem{Lasiecka_al00}
I.~Lasiecka, R.~Triggiani;
\newblock {\em {Control Theory for Partial Differential Equations: Continuous
  and Approximation Theories. {I}}}, volume~74 of {\em Encyclopedia of
  Mathematics and its Applications}.
\newblock Cambridge University Press, Cambridge, 2000.

\bibitem{Lenton09}
T.~M. Lenton, N.~E. Vaughan;
\newblock The radiative forcing potential of different climate geoengineering
  options.
\newblock {\em Atmos. Chem. Phys.}, 9:5539--5561, 2009.

\bibitem{Lions71}
J.-L. Lions;
\newblock {\em {Optimal Control of Systems Governed by Partial Differential
  Equations}}.
\newblock Translated from the French by S. K. Mitter. Die Grundlehren der
  mathematischen Wissenschaften, Band 170. Springer-Verlag, New York-Berlin,
  1971.

\bibitem{ma2005bifurcation}
T.~Ma, S.~Wang;
\newblock {\em {Bifurcation Theory and Applications}}, volume~53.
\newblock World Scientific, 2005.

\bibitem{PTD-MW}
T.~Ma and S.~Wang.
\newblock {\em {Phase Transition Dynamics}}.
\newblock Springer, New York, 2014.

\bibitem{malanowski1982convergence}
K.~Malanowski;
\newblock {Convergence of approximations vs regularity of solutions for convex,
  control-constrained optimal-control problems}.
\newblock {\em Applied Mathematics \& Optimization}, 8(1):69--95, 1982.

\bibitem{Mcknight_al73}
R.~S. McKnight, W.~E. Bosarge~JR;
\newblock {The Ritz-Galerkin procedure for parabolic control problems}.
\newblock {\em SIAM J. Control Optim.}, 11:510--524, 1973.

\bibitem{medjo2008optimal}
T. T. Medjo, R.~Temam,  M.~Ziane;
\newblock Optimal and robust control of fluid flows: some theoretical and
  computational aspects.
\newblock {\em Applied Mechanics Reviews}, 61(1):010802, 2008.

\bibitem{meidner2007adaptive}
D.~Meidner, B.~Vexler;
\newblock Adaptive space-time finite element methods for parabolic optimization
  problems.
\newblock {\em SIAM Journal on Control and Optimization}, 46(1):116--142, 2007.

\bibitem{meinshausen2009greenhouse}
M.~Meinshausen, N.~Meinshausen, W.~Hare, S.C.B. Raper, K.~Frieler, R.~Knutti,
  D. J. Frame, M. R. Allen;
\newblock {Greenhouse-gas emission targets for limiting global warming to 2$^o$ C}.
\newblock {\em Nature}, 458(7242):1158--1162, 2009.

\bibitem{murphy2004quantification}
J. M. Murphy, D. M. H. Sexton, D. N. Barnett, G. S. Jones, M. J. Webb, M.~Collins,
D. A. Stainforth;
\newblock Quantification of modeling uncertainties in a large ensemble of
  climate change simulations.
\newblock {\em Nature}, 430(7001):768--772, 2004.

\bibitem{neelin1998enso}
J.~D. Neelin, D.~S. Battisti, A.~C. Hirst, F.-F. Jin, Y.~Wakata, T.~Yamagata,
S.~E. Zebiak;
\newblock {ENSO} theory.
\newblock {\em Journal of Geophysical Research: Oceans (1978--2012)},
  103(C7):14261--14290, 1998.

\bibitem{Neitzel2012}
I.~Neitzel, B.~Vexler.
\newblock A priori error estimates for space--time finite element
  discretization of semilinear parabolic optimal control problems.
\newblock {\em Numerische Mathematik}, 120(2):345--386, 2012.

\bibitem{North_al81}
G.~R. North, R.~F. Cahalan, J.~A. Coakley;
\newblock Energy balance climate models.
\newblock {\em Reviews of Geophysics}, 19:91--121, 1981.

\bibitem{North_al83}
G.~R. North, D.~A. Short, J.~G. Mengel;
\newblock Simple energy balance model resolving the seasons and the continents:
  application to the astronomical theory of the ice ages.
\newblock {\em J. Geophys. Res.}, 88:6576--6586, 1983.

\bibitem{Pazy83}
A.~Pazy;
\newblock {\em {Semigroups of Linear Operators and Applications to Partial
  Differential Equations}}, volume~44 of {\em Applied Mathematical Sciences}.
\newblock Springer-Verlag, New York, 1983.

\bibitem{Roques_al14}
L.~Roques, M.~Chekroun, M.~Cristofol, S.~Soubeyrand, M.~Ghil;
\newblock Parameter estimation for energy balance models with memory.
\newblock {\em Proc. R. Soc. A}, 470:20140349, 2014.

\bibitem{Sellers69}
W.~D. Sellers;
\newblock A global climatic model based on the energy balance of the
  {E}arth-{A}tmosphere system.
\newblock {\em J. Appl. Meteorol.}, 8:392--400, 1969.

\bibitem{Shepherd09}
J.~G. Shepherd;
\newblock {\em Geoengineering the climate: {S}cience, governance and
  uncertainty}.
\newblock Royal Society, 2009.

\bibitem{stephens2012update}
G. L. Stephens, J.~Li, M.~Wild, C.~A. Clayson, N.~Loeb, S.~Kato, T.~Lecuyer,
  P. W. Stackhouse~Jr., M.~Lebsock, T.~Andrews;
\newblock An update on {E}arth's energy balance in light of the
  latest global observations.
\newblock {\em Nature Geoscience}, 5(10):691--696, 2012.

\bibitem{stone2007detection}
D.~Stone, M.~R. Allen, F.~Selten, M.~Kliphuis, P.A. Stott;
\newblock The detection and attribution of climate change using an ensemble of
  opportunity.
\newblock {\em Journal of Climate}, 20(3):504--516, 2007.

\bibitem{Tem97}
R.~Temam;
\newblock {\em {I}nfinite-{D}imensional {D}ynamical {S}ystems in {M}echanics
  and {P}hysics}, volume~68 of {\em Applied Mathematical Sciences}.
\newblock Springer-Verlag, New York, 2nd edition, 1997.

\bibitem{MR1297998}
F.~Tr{\"o}ltzsch;
\newblock Semidiscrete {R}itz-{G}alerkin approximation of nonlinear parabolic
  boundary control problems.
\newblock In {\em Optimal control ({F}reiburg, 1991)}, volume 111 of {\em
  Internat. Ser. Numer. Math.}, pages 57--68. Birkh\"auser, Basel, 1993.

\bibitem{MR1264014}
F.~Tr{\"o}ltzsch;
\newblock Semidiscrete {R}itz-{G}alerkin approximation of nonlinear parabolic
  boundary control problems--strong convergence of optimal controls.
\newblock {\em Appl. Math. Optim.}, 29(3):309--329, 1994.

\bibitem{Tro10}
F.~Tr{\"o}ltzsch;
\newblock {\em {Optimal Control of Partial Differential Equations: Theory,
  Methods and Applications}}, volume 112 of {\em Graduate Studies in
  Mathematics}.
\newblock American Mathematical Society, 2010.

\bibitem{Tzip_al94}
E.~Tziperman, L.~Stone, M.A. Cane, H.~Jarosh;
\newblock El {N}i{\~n}o chaos: {O}verlapping of resonances between the seasonal
  cycle and the {P}acific ocean-atmosphere oscillator.
\newblock {\em Science}, 264(5155):72--74, 1994.

\bibitem{Vaughan_al11}
N.~E. Vaughan, T.~M. Lenton;
\newblock A review of climate geoengineering proposals.
\newblock {\em Climatic change}, 109:745--790, 2011.

\bibitem{Neumann55}
J.~Von~Neumann;
\newblock Can we survive technology?
\newblock {\em Fortune}, June, 1955.

\end{thebibliography}

\end{document}
