\documentclass[reqno]{amsart}
\usepackage{hyperref}

\AtBeginDocument{{\noindent\small
\emph{Electronic Journal of Differential Equations},
Vol. 2015 (2015), No. 309, pp. 1--13.\newline
ISSN: 1072-6691. URL: http://ejde.math.txstate.edu or http://ejde.math.unt.edu
\newline ftp ejde.math.txstate.edu}
\thanks{\copyright 2015 Texas State University.}
\vspace{9mm}}

\begin{document}
\title[\hfilneg EJDE-2015/309\hfil Differential inclusions]
{Differential inclusions and exact penalties}

\author[A. V. Fominyh, V. V. Karelin, L. N. Polyakova \hfil EJDE-2015/309\hfilneg]
{Alexander V. Fominyh, Vladimir V. Karelin, Lyudmila N. Polyakova}

\address{Alexander V. Fominyh \newline
Saint Petersburg State University,
7-9, University emb., 199034 St. Petersburg, Russia}
\email{alexfomster@mail.ru}

\address{Vladimir V. Karelin \newline
Saint Petersburg State University,
7-9, University emb., 199034 St. Petersburg, Russia}
\email{vlkarelin@mail.ru}

\address{Lyudmila N. Polyakova \newline
Saint Petersburg State University,
7-9, University emb., 199034 St. Petersburg, Russia}
\email{lnpol07@mail.ru}

\thanks{Submitted July 23, 2015. Published December 21, 2015.}
\subjclass[2010]{34A60, 49J52}
\keywords{Nonsmooth functional; differential inclusion;
support function; \hfill\break\indent 
exact penalty function; maximum principle}

\begin{abstract}
 The article considers differential inclusion with a given set-valued mapping
 and initial point. It is required to find a solution of this differential
 inclusion that minimizes an integral functional. Some classical results
 about the maximum principle for differential inclusions are obtained using
 the support and exact penalty functions. This is done for differentiable
 and for non-differentiable set-valued mappings in phase variables.
\end{abstract}

\maketitle
\numberwithin{equation}{section}
\newtheorem{theorem}{Theorem}[section]
\newtheorem{lemma}[theorem]{Lemma}
\newtheorem{remark}[theorem]{Remark}
\newtheorem{definition}[theorem]{Definition}
\allowdisplaybreaks

\section{Introduction}

Nowadays, differential inclusions (or differential
 equations with a multivalued right-hand side) are almost indispensable in
 mathematical modeling of systems with incomplete description \cite{blag_fil}
 and analyzing behavior of discontinuous systems \cite{filip}.
Applications of differential inclusions to the problem of constructing
Lyapunov functions and optimization are known. The problem of finding
solutions for a differential inclusion is important for applications
\cite{clnl,chg,gmsm}, \cite{tng}--\cite{zlv}.
 As a rule, it is possible to obtain an analytical solution
of a differential inclusion only in special cases but in the other cases
we have to use numerical methods for this purpose.

It should be noted that the known conditions for the existence of solutions
 \cite{aben,blag_fil} usually contain either a continuity requirement,
or both the semi-continuities and the convexity of the corresponding
multivalued mapping.


\begin{definition} \label{def1} \rm
 A differential inclusion is a relation of the form
 \begin{equation}\label{eq:0}
 \dot{x}(t) \in F(x(t), t)
 \end{equation}
with respect to the unknown function $x: I \to \mathbb{R}^n$,
where $I \subset \mathbb{R}$ is an interval,
$F: \mathbb{R}^n \times \mathbb{R} \to 2^{\mathbb{R}^n}$ ($2^{M}$ hereinafter means
 the set of all subsets of $M$).
\end{definition}

\begin{definition} \label{def2}\rm
 A function $x: I \to \mathbb{R}^n$ is
called a solution of differential inclusion \eqref{eq:0} on the interval
$I$ ($I \subset \mathbb{R}$) if it is absolutely continuous in $I$ and
almost everywhere in $I$ satisfies relation \eqref{eq:0}.
If the derivative $\dot{x}$ has only discontinuities
of the first kind, such a solution is called a proper one.
\end{definition}


\begin{definition} \label{def3} \rm
 A multivalued mapping $F: X \to 2^{Y}$ is called lower
 semicontinuous at $x_0$ if for every $y_0 \in F(x_0)$ and for every neighborhood
 $U(y_0)$ of the point $y_0$ there exists a neighborhood $U(x_0)$ of the
 point $x_0$ such that $F(x) \cap U(y_0) \neq \emptyset$ for every
$x \in U(x_0)$.
\end{definition}

\begin{definition} \label{def4} \rm
 A support function of multivalued mapping $F$ from $X$ to $Y$
 is the function
\begin{equation*}
 c(F(x), p) : = \sup_{y \in F(x)} (y, p) \quad\forall x \in X,\;
 \forall p \in Y^{*},
\end{equation*}
where $Y^{*}$ is the dual space of $Y$ and $(\cdot,\cdot)$ is the scalar product of vectors.
It describes all closed half-spaces which contain $F(x)$.
\end{definition}

\begin{definition} \label{def5} \rm
 A subdifferential of the lower semicontinuous
 convex function $V$ on Hilbert space $X$ with the values in
$\mathbb{R} \cup \{+\infty\}$
 is the set
\begin{equation*}
 \partial V(x) = \{p \in X^{*} : (p,x) - V(x) = \max_{y \in X}[(p,y) - V(y)]\}.
\end{equation*}
 It is a closed convex subset of $X^{*}$. If $V$ has the gradient
$\nabla V(x) \in X^{*}$ at the point $x$, then
$\partial V(x)=\{\nabla V(x)\}$.

 If the function $U(x)$ is a concave one, then the set
\begin{gather*}
\bar{\partial}U(x)=\{u : U(y) - U(x) \leq (u, y-x)\; \forall y \in X \}
 \end{gather*}
is called a superdifferential of the function $U$ at the point $x$.
\end{definition}

 Differential inequalities, implicit differential equations,
 differential equations with restrictions on the phase coordinates may
 be represented in the form of the differential inclusion $\dot{x} \in F(x, t)$.
 So a differential inclusion is a generalization of ordinary differential equations
 and since it has a whole family of trajectories which come out from the initial
 point $x_0$, then it is natural to state the problem of picking out the
solutions with definite properties, for example, those which minimize a
certain functional.

In \cite{blag_fil}, \cite{filip} some classical results are given which extend
 the known Pontryagin's maximum principle for differential inclusions.
 The maximum principle is obtained under sufficiently stringent assumptions,
 in particular, provided that the support function $c(F(x,t),\psi)$ of the
 multivalued mapping $F(x,t)$ is continuously differentiable in the
vector of phase coordinates.
 This article studies the problem in this case using the apparatus of
 support functions \cite{rockaf} and exact penalty functions \cite{karelin}.
 With the help of this apparatus it is comparatively easy to obtain the
known Blagodatskih's maximum principle. The case is additionally
investigated when differentiability in $x$ of the support function
$c(F(x,t),\psi)$ is not assumed.

\section{Statement of the problem}

Consider the differential inclusion
\begin{equation} \label{eq:1}
\dot{x} \in F(x, t)
\end{equation}
with the initial condition
\begin{equation} \label{eq:2}
x(0) = x_0.
\end{equation}
Here $F(x, t)$, $t \in [0, T]$, is a given multivalued mapping,
which is supposed to be upper semicontinuous, $x(t)$ is an $n$-dimensional
vector-function of the phase coordinates, which is supposed to be continuous
 with a piecewise continuous derivative on $[0, T]$, $T > 0$ is a given
moment of time.
 We assume that the function $F(x, t)$ puts in correspondence a certain
convex compact set from $\mathbb{R}^n$ for every moment of time
$t \in [0, T]$ and for every phase point $x \in \mathbb{R}^n$.
It is required to find such a vector-function $x^{*}(t) \in C_{n}[0, T]$,
which is the solution of inclusion \eqref{eq:1}, satisfies initial
condition \eqref{eq:2} and minimizes the functional
\begin{equation} \label{eq:3}
I(x) = \int ^{T}_0 f_0(x,t) dt,
\end{equation}
where $f_0$ is a given real scalar function which is supposed to be
continuous in both arguments and continuously differentiable in $x$.

\section{Equivalent statement of the Problem}

Further, for brevity, we sometimes write $F$ instead of $F(x,t)$.
Since for all $t \in [0, T]$ and all $x \in \mathbb{R}^n$
the multivalued mapping $F(x, t)$ is a convex, closed and bounded set,
inclusion \eqref{eq:1} may be rewritten as follows \cite{blag}
$$
(\dot{x}, \psi) \leq c(F, \psi) \quad \forall t \in [0, T],
 $$
where $\psi \in \mathbb{R}^n$, $\| \psi \| = 1$.
 Denote $z(t) = \dot{x}(t)$,
then from \eqref{eq:2} we have
$$
x(t) = x_0 + \int_0^{t} z(\tau) d\tau.
$$
We introduce the functions
\begin{gather}\label{eq:4}
l(\psi,z,t) = (z, \psi) - c(F, \psi), \\
\label{eq:5}
h(\psi,z,t) = \max\{0, l(\psi,z,t)\}
 \end{gather}
and construct the functional
\begin{equation} \label{eq:6}
\varphi(\psi,z) = \Big( \int ^{T}_0 h^2(\psi,z,t) dt \Big)^{1/2}.
 \end{equation}
We consider the sets
\[
\Omega = [z \in P_{n} [0, T] : \varphi(\psi,z) = 0],\quad
\Omega_{\delta} = [z \in P_{n} [0, T] \ | \ \varphi(\psi,z) <\delta].
\]
 Then
 $$
\Omega_{\delta}/ \Omega = [z \in P_{n} [0, T] : 0<\varphi(\psi,z) <\delta].
$$
One may easily check that for functional \eqref{eq:6} the following relation holds
\[
z \begin{cases}
  \in \Omega, & \text{if } (\dot{x}, \psi) \leq
c(F, \psi) \; \forall t \in [0, T], \\
  \notin \Omega, & \text{if not}.
\end{cases}
\]
Let us write the functional
\begin{equation} \label{eq:7}
\Phi(\psi,z) = I(z) + \lambda \varphi(\psi,z),
 \end{equation}
in which
$$
I(z) = I\Big(x_0 + \int_0^t z(\tau) d\tau\Big),
$$
where $\lambda$ is a sufficiently large positive number which is called
a penalty parameter.
It will be shown that under some additional assumptions functional \eqref{eq:7}
is an exact penalty function.
 Then the problem of minimization of functional \eqref{eq:3}
 under constraints \eqref{eq:1}, \eqref{eq:2} may be reduced to
 unconstrained minimization of functional \eqref{eq:7}.

\section{Differential properties of $\varphi(z)$ and $I(z)$}

Further we assume that the vector-function $f(x, t)$ is continuous
 in both of its arguments and continuously differentiable in $x$ and that for
 all $t \in [0,T]$ and for all $x \in \mathbb{R}^n$ the inclusion
$f(x,t) \in F(x, t)$ takes place.
 In the paper we sometimes write $f$ instead of $f(x,t)$. Further we consider
 the functions $l(\psi, z, t)$, $h(\psi, z, t)$, $\varphi(\psi, z)$ and
$\Phi(\psi, z)$ for a fixed value $\psi$, so we write $l(z, t)$, $h(z, t)$,
$\varphi(z)$ and $\Phi(z)$ respectively instead of them.

 Consider the functional $\varphi(z)$. Let $v \in P_{n} [0, T]$.
 Put
$$
 z_{\alpha}(t) = z(t) + \alpha v(t).
$$
We calculate
$$
l(z_{\alpha}, t) = l(z,t) + \alpha H_{1}(z_{\alpha},t) + o(\alpha, t),
$$
where
\begin{gather*}
\frac{o(\alpha, t)}{\alpha} \to 0 \quad \text {as } \alpha \downarrow 0, \\
H_{1}(z_{\alpha},t)
= (\psi, v(t)) - \max_{f \in F}
 \Big( \frac{\partial f}{\partial x} \int_0^{t} v(\tau) d\tau, \psi \Big).
\end{gather*}
Here the definition of a support function and the property of additivity
 of a support function in the first argument are used \cite{blag_fil}.
 Using \eqref{eq:4} and \eqref{eq:5}, we find
$$
h(z_{\alpha}, t) = h(z,t) + \alpha H(z_{\alpha},t) + o(\alpha, t),
$$
where
\begin{gather*}
\frac{o(\alpha, t)}{\alpha} \to 0 \quad \text {as } \alpha \downarrow 0,\\
H(z_{\alpha},t) = H_1(z_{\alpha},t), \quad l(z,t) > 0, \\
H(z_{\alpha},t) = 0, \quad l(z,t) < 0, \\
H(z_{\alpha},t) = \max \{0, H_1(z_{\alpha},t)\}, \quad l(z,t) = 0.
\end{gather*}
We introduce the sets
\begin{gather*}
T_+(z) = [t \in [0, T] : l(z,t) > 0],\\
T_-(z) = [t \in [0, T] : l(z,t) < 0],\\
T_0(z) = [t \in [0, T] : l(z,t) = 0].
\end{gather*}
At first, consider the case $z \notin \Omega$.

\begin{lemma}\label{l:1}
 If $z \notin \Omega$, then the functional $\varphi(z)$ is superdifferentiable
 \cite{dem_vas} and its superdifferential at a point $z$ is expressed as follows
$$
\overline{\partial} {\varphi}(z) = \frac{h(z,t)}{\varphi(z)}\psi +
\int_{t}^{T} -\Big(\frac{\partial f}{\partial x}\Big)'
\frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau, \quad f \in F,
$$
where $'$ means the transpose operation.
\end{lemma}

\begin{proof}
 From \eqref{eq:6} we have
$$
\varphi(z_{\alpha}) = \varphi(z) + \alpha \int_0^{T}
 \frac{h(z,t)}{\varphi(z)} H(z_{\alpha},t) dt + o(\alpha),
 $$
 where
 $$
 \frac{o(\alpha)}{\alpha} \to 0 \quad \text {as } \alpha \downarrow 0.
 $$
Since $z \notin \Omega$, we have $H = H_1$. Then, using the expression for $H_{1}$,
 the theorem of the integral of a support function and positive homogeneity
 of a support function in the second argument \cite{blag}, one obtains
\begin{align*}
\varphi'(z,v)
&= \lim_{\alpha \downarrow 0} \frac{\varphi(z + \alpha v) - \varphi(z)}{\alpha}\\
&= \int_0^{T} \Big(\frac{h(z,t)}{\varphi(z)}\psi, v(t) \Big) dt
 -\max_{f \in F} \int_0^{T} \Big(\frac{\partial f}{\partial x}
\int_0^{t} v(\tau) d\tau, \frac{h(z,t)}{\varphi(z)} \psi\Big) dt.
\end{align*}
Integrating by parts in the last summand, we obtain
\begin{equation} \label{eq:8}
\begin{aligned}
&\varphi'(z,v)\\
&= \int_0^{T} \Big(\frac{h(z,t)}{\varphi(z)}\psi, v(t)\Big) dt
- \max_{f \in F} \int_0^{T} \Big(v(t),
 \int_{t}^{T} \big(\frac{\partial f}{\partial x}\big)'
 \frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau\Big) dt \\
& = \int_0^{T} \Big(\frac{h(z,t)}{\varphi(z)}\psi, v(t)\Big) dt
+ \min_{f \in F} \int_0^{T} \Big(v(t), \int_{t}^{T} -
\big(\frac{\partial f}{\partial x}\big)'
\frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau\Big) dt\\
& = \min_{V \in \overline{\partial} {\varphi}(z)} (V, v),
\end{aligned}
\end{equation}
where
$$
 \overline{\partial} {\varphi}(z)
 = \big\{ V \in P_{n} [0, T] :
 V(t) = \frac{h(z,t)}{\varphi(z)}\psi + \int_{t}^{T} -
 \big(\frac{\partial f}{\partial x}\big)' \frac{h(z,\tau)}{\varphi(z)}
 \psi \,d\tau, \, f \in F \big\}.
$$
We denote
$$
\kappa(z,t) = \frac{h(z,t)}{\varphi(z)}, \quad \kappa(z) \in P [0, T]\,.
$$
Then
$\kappa(z,t) \geq 0$ for all $t \in [0, T]$, $\|\kappa (z)\| = 1$,
where $\|\cdot \|$ is the norm in $L_2[0, T]$. From \eqref{eq:8}
it is clear that the functional $\varphi(z)$ is superdifferentiable and
its superdifferential is of the form
\begin{equation} \label{eq:9}
\overline{\partial} {\varphi}(z) =
 \kappa (z,t)\psi + \int_{t}^{T} -\big(\frac{\partial f}{\partial x}\big)'
 \kappa (z,\tau) \psi \,d\tau, \quad f \in F.
 \end{equation}
The proof is complete.
\end{proof}

Now consider the case $z \in \Omega$.

\begin{lemma}\label{l:2}
 If $z \in \Omega$, then the functional $\varphi(z)$ is Dini differentiable
in any direction $v \in P_n [0, T]$ and its $D$-derivative in the direction
$v$ at a point $z$ is expressed as follows
$$
\varphi'(z,v) = \max_{\|w\| \leq 1} \Big[ \int_0^{T} \big(w(t)\psi, v(t)\big) dt
 + \min_{f \in F} \int_0^{T} \Big(\int_{t}^{T}
-\big(\frac{\partial f}{\partial x}\big)'
 w(\tau)\psi \,d\tau, v(t)\Big) dt \Big],
$$
where $w \in P [0, T]$, $\|w\| \leq 1$.
\end{lemma}

\begin{proof}
 Since $z \in \Omega$, we have $\varphi(z) = 0$. Then from expression \eqref{eq:6}
we obtain
$$
\varphi'(z,v) = \lim_{\alpha \downarrow 0} \frac{\varphi(z + \alpha v)
- \varphi(z)}{\alpha} = \|H(z_{\alpha})\|
= \max_{\|w\| \leq 1} \int_0^{T} H(z_{\alpha},t)w(t) dt.
$$
Under the assumptions of this lemma we have $T_{+}(z) = \emptyset$, so
\begin{align*}
\varphi'(z,v)
& = \max_{\|w\| \leq 1} \int_{T_0 \cup T_{-}} w(t)
\max_{\overline{w}(t) \in [0,1]} (\overline{w}(t) H_1(z_{\alpha},t)) dt \\
&= \max_{w \in W_1} \int_0^{T} H_1(z_{\alpha},t) w(t) dt,
\end{align*}
where
\begin{equation} \label{eq:10}
 W_1 = \{w \in P [0, T] : \|w\| \leq 1, \ w(t) \geq 0 \,
 \forall t \in T_0, \, w(t) = 0 \, \forall t \in T_- \}.
 \end{equation}
From the expression for $H_1$ we obtain
\begin{equation} \label{eq:11}
\begin{aligned}
&\varphi'(z,v) \\
&= \max_{w \in W_1} \Big[ \int_0^{T} (w(t)\psi, v(t)) dt +
\min_{f \in F} \int_0^{T} \Big(\int_{t}^{T} -
\big(\frac{\partial f}{\partial x}\big)' w(\tau)\psi \,d\tau, v(t)\Big) dt \Big].
\end{aligned}
\end{equation}
The proof is complete.
\end{proof}

Finding the derivative of the functional $I(z)$ in the direction
$v \in P_{n} [0, T]$,
 we show that $I$ is Gateaux differentiable
$$
I'(z, v) = \int ^{T}_0\Big(\int ^{T}_{t} \frac{\partial f_0}{\partial x} d\tau,
 v(t)\Big) dt,
$$
and its gradient on the set $P_{n} [0, T]$ is expressed by the formula
\begin{equation} \label{eq:12}
\nabla I(z) = \int ^{T}_{t} \frac{\partial f_0}{\partial x} d\tau.
\end{equation}

\begin{lemma}\label{l:3}
If the support function $c(F, \psi)$ of the multivalued mapping $F(x, t)$
 is continuously differentiable in the phase variable $x$, then:
\begin{itemize}
 \item if $z \notin \Omega$, then the functional $\varphi(z)$ is
Gateaux differentiable and its gradient on the set $P_{n} [0, T]$
 may be found by the formula
$$
\nabla \varphi(z) = \frac{h(z,t)}{\varphi(z)} \psi
 + \int_{t}^{T} -\frac{h(z,\tau)}
{\varphi(z)} \frac{\partial c(F(x,\tau), \psi)}{\partial x} d\tau;
$$

 \item if $z \in \Omega$, then the functional $\varphi(z)$ is
subdifferentiable \cite{dem_vas}
 and its subdifferential at a point $z$ may be found by the formula
$$
\partial \varphi(z) = \big\{W \in P_{n} [0, T] \ |
 \ W(t) = w(t)\psi + \int_{t}^{T} -w(\tau) \frac{\partial c(F(x,\tau), \psi)}
 {\partial x} d\tau, \ w \in W_1 \big\},
$$
where the set $W_1$ is defined by the formula \eqref{eq:10}.
\end{itemize}
\end{lemma}

\begin{proof}
 By the definition of the support function
 $$
c(F, \psi) = \max_{f \in F} (f, \psi).
$$
 It is clear that this function is subdifferentiable, and its subdifferential is
 expressed by the formula
$$
\partial {c} (F, \psi) = \operatorname{co} \big\{ 
\big(\frac{\partial f}{\partial x}\big)' \psi \big\},
 \quad  f \in R = \{f \in F : c(F, \psi) = (f, \psi) \}.
 $$
Hence $c(F, \psi)$ is differentiable in $x$ if and only if the set
 $R$ consists of a single element. Let us denote it by $f^{*}$.
 Thus, in this case we can assume that
$$
c(F, \psi) = (f^{*}, \psi),
$$
and the following relations hold
\begin{equation} \label{eq:13}
\big(\frac{\partial f^{*}}{\partial x}\big)' \psi 
= \frac{\partial (f^{*}, \psi)}{\partial x} 
= \frac{\partial c(F, \psi)}{\partial x}.
 \end{equation}

Let $z \notin \Omega$. From expression \eqref{eq:9} we conclude that the
 superdifferential of the functional ${\varphi}(z)$ consists of a single element,
 therefore $\varphi(z)$ is Gateaux differentiable.
 Its gradient on the set $P_{n} [0, T]$ is as follows
\begin{equation} \label{eq:14}
 \nabla \varphi(z) = \frac{h(z,t)}{\varphi(z)} \psi + \int_{t}^{T}
 - \frac{h(z,\tau)}{\varphi(z)} \big(\frac{\partial f^{*}}{\partial x}\big)'
 \psi \,d\tau. 
\end{equation}
Using \eqref{eq:13}, from \eqref{eq:14} we finally get the expression
$$
\nabla \varphi(z) = \frac{h(z,t)}{\varphi(z)} \psi + \int_{t}^{T} -\frac{h(z,\tau)}
{\varphi(z)} \frac{\partial c(F(x,\tau), \psi)}{\partial x} d\tau,
$$
which proves the first part of the lemma.

Let $z \in \Omega$. From expression \eqref{eq:11} we
 conclude that the derivative of the functional $\varphi(z)$ in the direction $v$
 may be expressed as 
\begin{equation} \label{eq:15}
\begin{aligned}
\varphi'(z,v)
&= \max_{w \in W_1} \Big[ \int_0^{T} (w(t)\psi, v(t)) dt +
\int_0^{T} \Big( \int_{t}^{T} -\big(\frac{\partial f^{*}}{\partial x}\big)'
w(\tau)\psi \,d\tau, v(t) \Big) dt \Big]\\
&= \max_{W \in \partial \varphi(z) }(W, v),
\end{aligned}
\end{equation}
where
$$
 \partial \varphi(z) 
=\big\{W \in P_{n} [0, T] \ \bigm |
 \ W(t) = w(t)\psi + \int_{t}^{T} -w(\tau)
 \big(\frac{\partial f^{*}}{\partial x}\big)' \psi \,d\tau, \ w \in W_1\big\},
$$
and $W_1$ is defined in \eqref{eq:10}.
Using \eqref{eq:13}, from \eqref{eq:15} we finally get the expression
\begin{equation} \label{eq:16}
\begin{aligned}
\partial \varphi(z) 
&= \Big\{W \in P_{n} [0, T] :  W(t) = w(t)\psi \\
&\quad + \int_{t}^{T} -w(\tau) \frac{\partial c(F(x,\tau), \psi)}
{\partial x} d\tau, \ w \in W_1 \Big\},
\end{aligned}
\end{equation}
which proves the second part of the lemma.
Note that in this case the following equality also holds
\begin{equation} \label{eq:17}
\gamma w(t) \frac{\partial c(F(x,t), \psi)}{\partial x} =
\frac{\partial c(F(x,t), \gamma w(t) \psi)}{\partial x} \quad \forall t \in [0, T],
\; \forall \gamma > 0.
\end{equation}
\end{proof}

\section{Necessary minimum conditions}

\begin{theorem}\label{t:1}
 Let $\inf _{z \in \Omega} I(z) = I(z^{*}) > -\infty$
 and there exists such a positive number
 $\lambda_0 < \infty$ that $\forall \lambda > \lambda_0$
 there exists $z(\lambda) \in P_{n}[0, T]$, for which
 $$
\Phi_{\lambda}(z(\lambda)) = \inf _{z \in P_{n}[0, T]} \Phi_{\lambda}(z).
$$
 Let the functional $I(z)$ be locally Lipschitz on the set
 $\Omega_{\delta} / \Omega$.
 Then functional \eqref{eq:7} will be an exact penalty function.
 \end{theorem}

\begin{proof}
It is sufficient \cite{dem} to show  that there exist
such numbers $a > 0$, $\delta > 0$ that
\begin{equation} \label{eq:18}
 \varphi^{\downarrow}(z) = \liminf _{y \to z}
 \frac{\varphi(y)-\varphi(z)}{\rho(z,y)} < -a < 0 \quad
 \forall z \in \Omega_{\delta}/ \Omega.
 \end{equation}
Here
$y \in P_{n} [0, T]$, $\rho(z, y)$ is the following metric on the set $P_{n} [0, T]$
$$
\rho(z,y) = \max_{t\in[0,T]} \Big| \int_0^{t} \big(z(\tau)-y(\tau)\big)\,d\tau \Big|.
$$
Put
$$
y(t) = z(t) + \alpha v^{*}(t), \ v^{*}(t) =
 -\Big(\frac{h(z,t)}{\varphi(z)} \psi + \int_{t}^{T} -
 \big(\frac{\partial f}{\partial x}\big)' \frac{h(z,\tau)}{\varphi(z)} \psi 
\,d\tau\Big).
 $$
Then using Lemma \ref{l:1}, one gets
\begin{gather*}
\varphi'(z, v^{*}) 
= \min_{f \in F} \int ^{T}_0 - \Big ( \frac{h(z,t)}{\varphi(z)} \psi 
+ \int_{t}^{T} - \big(\frac{\partial f}{\partial x}\big)' 
 \frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau,\\
 \frac{h(z,t)}{\varphi(z)} \psi + \int_{t}^{T} 
-\big(\frac{\partial f}{\partial x}\big)'
 \frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau \Big) dt.
\end{gather*}
Let us show that
$$
 \frac{h(z,t)}{\varphi(z)} \psi + \int_{t}^{T} 
-\big(\frac{\partial f}{\partial x}\big)'
 \frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau \neq \mathbf{0}, \quad f \in F,
 $$
identically on the interval $[0,T]$.
Assume the contrary.
Then $\frac{h(z,t)}{\varphi(z)} \psi = \mathbf{0}$ for all $t\in [0, T]$
which contradicts the constraints on $\psi$ and $\frac{h(z,t)}{\varphi(z)}$.
Let $\varphi(y) \to \varphi(z)$ if $y \to z$, i.e.,
 there exists a sequence $\{z_{k}\} \subset \Omega_{\delta} / \Omega$
 such that $\varphi'(z_{k}, v^{*}) \to 0$ as $k \to \infty$, where
\begin{gather*}
\frac{\partial f}{\partial x} = \frac{\partial f(x_{k}, t)}{\partial x}, \quad
 f \in F, \\
x_k(t) = x_0 + \int_0^{t} z_k(\tau) d\tau.
\end{gather*}
Therefore,
$$
\|\frac{h(z_k,t)}{\varphi(z_k)} \psi +
\int_{t}^{T} -\Big(\frac{\partial f}{\partial x}\Big)' 
\frac{h(z_k,\tau)}{\varphi(z_k)}
 \psi \,d\tau \| \to 0, \quad \text{as } k \to \infty,\; f \in F,
 $$
hence
 $$
\|\frac{h(z_k,t)}{\varphi(z_k)} \psi \| \to 0
 \quad  \text{as } k \to \infty,
 $$ 
that also contradicts the assumptions
 $$
\|\psi\| = 1, \quad \| \frac{h(z)}{\varphi(z)} \| = 1.
$$
Then we conclude that
$$
\varphi(y) - \varphi(z) = \alpha \varphi'(z, v^{*}) + o(\alpha) < 0 \quad
\forall z \in \Omega_{\delta}/ \Omega.
$$
Now find that
$$
\rho(z,y) = \alpha \max_{t\in[0,T]} \Big| \int_0^{t} v^{*}(\tau)\,d\tau \Big| > 0.
$$
From the last two inequalities follows \eqref{eq:18}.
The proof is complete.
\end{proof}


\begin{theorem}\label{t:2}
 Let the conditions of Theorem \ref{t:1} be satisfied. 
Let the support function of  the multivalued mapping $F(x,t)$ from \eqref{eq:1} 
be continuously  differentiable in $x$.
 For the point
 $$
x^{*} = x_0 + \int_0^{t} z^{*}(\tau) d\tau
$$
 to satisfy inclusion \eqref{eq:1} and condition \eqref{eq:2} and
 to minimize functional \eqref{eq:3}, the existence of such a
 vector-function $\Psi(t)$ that for all $t \in [0, T]$ the following relations hold
\begin{equation} \label{eq:19}
\dot{\Psi}(t) = -\frac {\partial c(F(x^{*}, t), \Psi(t))}{\partial x} +
\frac{\partial f_0(x^{*},t)} {\partial{x}},
\end{equation}
\begin{equation} \label{eq:20}
 (\dot{x}^{*}, \Psi(t)) - c(F(x^{*}, t), \Psi(t)) = 0,
 \end{equation}
\begin{equation} \label{eq:21} \Psi(T) = \mathbf{0}\end{equation}
is necessary.
 \end{theorem}

\begin{proof}
In Theorem \ref{t:1} it has been shown that the functional \eqref{eq:7}
is an exact penalty function,
 hence there exists such a number $\lambda^{*} > 0$ that
 for all $\lambda > \lambda^{*}$ functional \eqref{eq:3}
 minimization problem under constraints \eqref{eq:1}, \eqref{eq:2}
 is equivalent to the unconstrained optimization problem of functional \eqref{eq:7}
 minimization.

Let us put $\Psi(t) = \lambda w(t) \psi$, where the vector-function $w(t)$
 is an element of the set $W_1$. Since by Lemma \ref{l:3} if $z \in \Omega$,
 the functional $\varphi(z)$ is subdifferentiable and its subdifferential
 is represented in \eqref{eq:16}, and the functional $I(z)$ is Gateaux
 differentiable and its gradient is represented in \eqref{eq:12},
 then from the necessary minimum condition \cite{dem} we have
$$
0_n \in \partial \Phi(z^*).
$$
Considering \eqref{eq:17} we have that at the minimum point for all
$t \in [0, T]$,
 \begin{equation} \label{eq:22} 
\int ^{T}_{t} \frac{\partial f_0(x^{*},\tau)}{\partial x} d\tau
 + \Psi(t) + \int_{t}^{T} -\frac{\partial c(F(x^{*},\tau), \Psi(\tau))}{\partial x} d\tau 
= 0_n,
 \end{equation}
 where $0_n$ is a zero element of the space $P_n [0, T]$.
 Differentiating \eqref{eq:22} on the interval $[0, T]$, one obtains a system of
 differential equations
 $$ 
\dot{\Psi}(t) = -\frac {\partial c(F(x^{*}, t), \Psi(t))}{\partial x} +
 \frac{\partial f_0(x^{*},t)} {\partial{x}} 
$$
 with the terminal condition $\Psi(T) = \mathbf{0}$, hence we obtain the relations
 \eqref{eq:19}, \eqref{eq:21}.

 If $t \in T_0$, then from the definition of $l(z,t)$ one gets
$(z, \Psi) = c(F, \Psi)$; if $t \in T_-$, then $w(t) = 0$, hence
$\Psi(t) = \mathbf{0}$ and relation \eqref{eq:20} still holds. Thus \eqref{eq:20}
holds for all $t \in [0, T]$.
The proof is complete.
\end{proof}

\begin{remark} \label{rmk5.3} \rm
Theorem \ref{t:2} has been formulated for the problem with the free right end.
It is not difficult to show that relations \eqref{eq:19}, \eqref{eq:20}
will also hold for the problem with the fixed right end, but the terminal
 value $\Psi(T)$ for this problem will not be equal to zero in the general 
case, i. e.  relation \eqref{eq:21} will not hold in this case.
\end{remark}

Using the known minimum conditions in terms of directional derivatives,
from Lemma \ref{l:2} one gets the following lemma.

\begin{lemma}\label{l:4}
 Let the conditions of Theorem \ref{t:1} be satisfied. For the point $x^{*}$ 
to satisfy inclusion \eqref{eq:1} and condition \eqref{eq:2} and to minimize 
functional \eqref{eq:3}, it is necessary to have
\begin{equation} \label{eq:23}
\begin{aligned}
& \max_{\|w\| \leq 1} \Big[ \int_0^{T}
\Big( \int_{t}^{T} \frac{\partial f_0(x^{*},\tau)} {\partial{x}} d\tau 
+ \lambda w(t)\psi,  v(t) \Big) dt \\
& + \min_{f \in F} \int_0^{T} \Big(\int_{t}^{T} -
\Big(\frac{\partial f(x^{*}, \tau)}{\partial x}\Big)'
\lambda w(\tau)\psi \,d\tau, v(t)\Big) dt \Big] \geq 0 \quad
\forall v\in P_{n}[0,T].
\end{aligned}
 \end{equation}
\end{lemma}

Let $\overline{F} \subset F$ be a set of such $f \in F$ that \eqref{eq:23} holds.
It can be shown that the following lemma holds.

\begin{lemma}\label{l:5}
 Relation \eqref{eq:23} is equivalent to the condition: for every fixed
 $\overline{f} \in \overline{F}$ there exists such a vector-function 
$\overline{w} \in W_1$ that the following relation holds
\begin{equation} \label{eq:24}
\int_{t}^{T} \frac{\partial f_0(x^{*},\tau)} {\partial{x}} d\tau +
\lambda \overline{w}(t) \psi + \int_{t}^{T} -
\Big(\frac{\partial \overline{f}(x^{*}, \tau)} {\partial x}\Big)' 
\lambda \overline{w}(\tau) \psi \,d\tau = 0_n 
 \end{equation}
for all $t \in [0,T]$.
\end{lemma}



\begin{theorem}\label{t:3}
 Let the conditions of Theorem \ref{t:1} be satisfied.
 For the point $x^{*}$ to satisfy inclusion \eqref{eq:1}
 and condition \eqref{eq:2} and to minimize functional \eqref{eq:3},
 the existence of such a vector-function $\overline{f} \in F$
 and such a vector-function $\overline{\Psi}(t)$, for which for
 all $t \in [0, T]$ the following relations hold
\begin{gather} \label{eq:25}
\dot{\overline{\Psi}}(t) 
= -\Big(\frac{\partial \overline{f}(x^{*}, t)}{\partial x}\Big)'
 \overline{\Psi}(t) + \frac{\partial f_0(x^{*},t)} {\partial{x}}, \\
\label{eq:32}
 \big(\dot{x}^{*}, \overline{\Psi}(t)\big) - c\big(F(x^{*}, t), \overline{\Psi}(t)\big) = 0,\\
 \label{eq:26}
\overline{\Psi}(T) = \mathbf{0}, 
\end{gather}
is necessary.
\end{theorem}

\begin{proof}
In view of Lemma \ref{l:4} it is sufficient to show that \eqref{eq:23}
 is equivalent to \eqref{eq:25}, \eqref{eq:26} for some
 $\overline{f} \in F$ and $\overline{\Psi}(t)$.

In view of Lemma \ref{l:5} relation \eqref{eq:23} is equivalent to
 \eqref{eq:24} for every fixed $\overline{f} \in \overline{F}$.
 Differentiating \eqref{eq:24} on the interval $[0, T]$ and denoting
 $$
\overline{\Psi}(t) = \lambda \overline{w}(t)\psi,
$$ 
one gets a system of differential equations \eqref{eq:25} with
 terminal condition \eqref{eq:26}.
Relation \eqref{eq:32} can be proved in the same way as in Theorem \ref{t:2}.
\end{proof}


\begin{remark}\label{r:2}\rm
Theorem \ref{t:3} has been formulated for the problem with the free right end.
 It is not difficult to show that relations \eqref{eq:25}, \eqref{eq:32} 
will also hold for the problem with the fixed right end, but the terminal 
value $\overline{\Psi}(T)$ for this problem will not be equal to zero in the general 
case, i.e., relation \eqref{eq:26} will not hold in this case.
\end{remark}

\section{Example}

Consider the system of differential equations
$$ 
\dot{x}_1 = u_1, \quad \dot{x}_2 = x_1, 
$$
where the restriction on control is given by the set
$$
U = \{ u \in R^2 : |u_1| \leq 1, \, u_2 = 0 \}.
$$
Let the initial condition $x_0 = (0, 0)$ and the terminal state
 $x(1) = (-1/2, -1/3)$ of the system be given.
It is required to find such control $u^* \in U$, which minimizes the functional
$$ 
I(x) = \int_0^1 x_2(t) dt. 
$$
This system can be rewritten in the form of the inclusion
$\dot{x} \in F(x)$,
where
$$
F(x) = \begin{pmatrix}
[-1, 1] \\
x_1
\end{pmatrix}.
$$
Since the support function $c(A, b)$ of the segment
$ A = \{ a \in R : a \in [-1, 1] \}$ is $|b|$,
then in this case the support function of the multivalued
mapping $F(x)$ is expressed by the formula
$$
c(F, \psi) = |\psi_1| + x_1\psi_2.
$$
One can see that the function $c(F, \psi)$ is
continuously differentiable in the phase variables and its gradient 
may be written as follows
$$
\frac{\partial{c}}{\partial{x}} = (\psi_2, 0).
$$
Further, we have
$$
\frac{\partial{f_0}}{\partial{x}} = (0, 1).
$$
From Theorem \ref{t:2} and Remark \ref{rmk5.3} it
follows that the vector-function $\psi(t)$ must satisfy the system 
of differential equations
\begin{equation} \label{eq:28}
\dot{\psi}_1 = -\psi_2, \quad \dot{\psi}_2 = 1.
\end{equation}

From Theorem \ref{t:2} and Remark \ref{rmk5.3} one also gets that
 for $\psi(t)$ and for all $t$ the following relations hold
$$
(\dot{x}, \psi(t)) = u_1 \psi_1 + x_1 \psi_2 = c(F,\psi)
 = |\psi_1| + x_1\psi_2,
$$
therefore for all $t$,
\begin{equation} \label{eq:29} 
u_1(t) \psi_1(t) = |\psi_1(t)|. 
\end{equation}

From \eqref{eq:28}, \eqref{eq:29} it is not difficult to obtain the optimal control
\begin{equation} \label{eq:30} 
\begin{gathered}
u_1^*(t) = -1, \quad t \in [0, \tau_1), \\
u_1^*(t) = 1, \quad t \in [\tau_1, \tau_2), \\
 u_1^*(t) = -1, \quad t \in [\tau_2, 1], 
\end{gathered}
\end{equation}
and the corresponding optimal trajectory
\begin{equation} \label{eq:31}
\begin{gathered}
x_1(t) = -t, \quad x_2(t) = -t^2/2, \quad t \in [0, \tau_1), \\
 x_1(t) = t + S_1, \quad  x_2(t) = t^2/2 + S_1t + S_2,
 \quad  t \in [\tau_1, \tau_2), \\
 x_1(t) = -t + 1/2, \quad x_2(t) = -t^2/2 + t/2 - 1/3, \quad t \in [\tau_2, 1],
\end{gathered}
\end{equation}
where
$$
\tau_1 = 13/24, \quad \tau_2 = 19/24, \quad S_1 = -13/12, \quad S_2 = 169/576.
$$
The values $\tau_1$, $\tau_2$, $S_1$, $S_2$ in \eqref{eq:30}, \eqref{eq:31}
are found using the boundary conditions and the condition of trajectory continuity.

One can easily check that conditions \eqref{eq:28}, \eqref{eq:29} may be obtained
directly from Pontryagin's maximum principle. Here a different approach has
 been demonstrated, in which we pass from the original system to the corresponding
 differential inclusion, for which we apply the conditions of optimality 
(Theorem \ref{t:2})  to find the optimal process $(x^*(t), u^*(t))$.

\subsection*{Conclusion}
Thus, in this paper an application of the theory of exact penalty functions to
the problem of optimal control of a differential inclusion is demonstrated.
 The apparatus of support functions makes it possible to reduce the original problem
 to a constrained optimization problem. With the help of exact penalties 
this problem is reduced to minimization of the nonsmooth functional $\Phi(z)$ 
on the whole space.
 Provided that the support function $c(F(x,t), \psi)$ is continuously 
differentiable in the vector of the phase coordinates, this functional turns out 
to be subdifferentiable, which allows one to write out the necessary minimum 
conditions in terms of a subdifferential;
 these conditions coincide with some classical results for this problem.
In the case of nondifferentiability
 of $c(F(x,t), \psi)$ in the phase variables, the $D$-derivative in directions 
of the functional $\Phi(z)$ is found, which allows one to formulate necessary
minimum conditions. An example applying the theoretical results is given.


\subsection*{Acknowledgments}
The work is supported by the Saint Petersburg State
University (project no. 9.38.205.2014).


\begin{thebibliography}{00}


\bibitem{aben} Aubin, J.- P.; Ekeland, I.;
 \emph{ Applied nonlinear analysis.} Wiley-Interscience, 1984. 518 p.

\bibitem{blag} Blagodatskih, V. I.;
\emph{ The maximum principle for differential inclusions},
 Proceedings of the Steklov Institute of Mathematics. 1984. Vol. 166. P. 23--43. 
(in Russ.)

\bibitem{blag_upr} Blagodatskih, V. I.;
\emph{ Introduction to optimal control.}
 Moscow, Vysshaya shkola, 2001. 239 p. (in Russ.)

\bibitem{blag_fil} Blagodatskih, V. I.; Filippov, A. F.;
 \emph{ Differential inclusions and optimal control}, Proceedings of the
 Steklov Institute of Mathematics. 1985. Vol. 169. P. 194--252. (in Russ.)

\bibitem{clnl} Cellina, A.; Ornelas A.;
 \emph{Existence of solutions to differential inclusions and to time optimal
 control problems in the autonomous case.}
 SIAM J. Control Optim. 2003. Vol. 42, no. 1. P. 260--265.


\bibitem{chg} Chengi, Yi;
 \emph{ Existence of Solutions for a Class of Nonlinear Evolution Inclusions
 with Nonlocal Conditions.}
 Journal of Optimization Theory and Applications. 2014. Vol. 162, no. 1. P. 13--33.

\bibitem{dem} Demyanov, V. F.;
 \emph{ Extremum conditions and variation calculus.}
Moscow, Vysshaya shkola, 2005. 335 p. (in Russ.)

\bibitem{dem_vas} Demyanov, V. F.; Vasilyev, L. V.;
 \emph{ Nondifferentiable optimization.}
 Moscow, Nauka, 1981. 384 p. (in Russ.)

\bibitem{filip} Filippov, A. F.;
\emph{Differential equations with discontinuous right-hand side.}
 Moscow, Nauka, 1985. 226 p. (in Russ.)

\bibitem{gmsm}  Gama, R.; Smirnov, G.; Watbled,  F.;
 \emph{Stability and optimality of solutions to differential inclusions via 
averaging method.}
Set-Valued and Variational Analysis. 2014. Vol. 22, no. 2. P. 349--374.

\bibitem{ioffe} Ioffe, A.;
 \emph{ Euler--Lagrange and Hamiltonian formalisms in dynamic optimization},
 Transactions of the American Mathematical Society. 1997. Vol. 349, 
no. 7. P. 2871--2900.

\bibitem{karelin} Karelin, V. V.;
 \emph{Penalty functions in a control problem},
Automation and Remote Control. 2004. no. 3. P. 483--492. (in Russ.)

\bibitem{rockaf} Rockafellar, R.;
\emph{Convex analysis.} Princeton, Princeton University Press,
1970. 470 p.

\bibitem{tng} Taniguchi, T.;
\emph{Global existence of solutions of differential inclusions.}
 Journal of Mathematical Analysis and Applications. 2004. 
Vol. 166, no. 1. P. 41--51.

\bibitem{wtbl} Watbled,  F.;
\emph{On singular perturbations for differential inclusions on the infinite interval.}
 Journal of Mathematical Analysis and Applications. 2005. Vol. 310, no. 2.
 P. 362--378.

\bibitem{zlv} Zaslavski, A.;
 \emph{A Sufficient Condition for Exact Penalty in Constrained Optimization.}
SIAM Journal on Optimization. 2005. Vol. 16 , no. 1. P. 250--262.

\end{thebibliography}

\end{document}