\documentclass[reqno]{amsart} \usepackage{hyperref} \AtBeginDocument{{\noindent\small \emph{Electronic Journal of Differential Equations}, Vol. 2015 (2015), No. 309, pp. 1--13.\newline ISSN: 1072-6691. URL: http://ejde.math.txstate.edu or http://ejde.math.unt.edu \newline ftp ejde.math.txstate.edu} \thanks{\copyright 2015 Texas State University.} \vspace{9mm}} \begin{document} \title[\hfilneg EJDE-2015/309\hfil Differential inclusions] {Differential inclusions and exact penalties} \author[A. V. Fominyh, V. V. Karelin, L. N. Polyakova \hfil EJDE-2015/309\hfilneg] {Alexander V. Fominyh, Vladimir V. Karelin, Lyudmila N. Polyakova} \address{Alexander V. Fominyh \newline Saint Petersburg State University, 7-9, University emb., 199034 St. Petersburg, Russia} \email{alexfomster@mail.ru} \address{Vladimir V. Karelin \newline Saint Petersburg State University, 7-9, University emb., 199034 St. Petersburg, Russia} \email{vlkarelin@mail.ru} \address{Lyudmila N. Polyakova \newline Saint Petersburg State University, 7-9, University emb., 199034 St. Petersburg, Russia} \email{lnpol07@mail.ru} \thanks{Submitted July 23, 2015. Published December 21, 2015.} \subjclass[2010]{34A60, 49J52} \keywords{Nonsmooth functional; differential inclusion; support function; \hfill\break\indent exact penalty function; maximum principle} \begin{abstract} The article considers differential inclusion with a given set-valued mapping and initial point. It is required to find a solution of this differential inclusion that minimizes an integral functional. Some classical results about the maximum principle for differential inclusions are obtained using the support and exact penalty functions. This is done for differentiable and for non-differentiable set-valued mappings in phase variables. \end{abstract} \maketitle \numberwithin{equation}{section} \newtheorem{theorem}{Theorem}[section] \newtheorem{lemma}[theorem]{Lemma} \newtheorem{remark}[theorem]{Remark} \newtheorem{definition}[theorem]{Definition} \allowdisplaybreaks \section{Introduction} Nowadays, differential inclusions (or differential equations with a multivalued right-hand side) are almost indispensable in mathematical modeling of systems with incomplete description \cite{blag_fil} and analyzing behavior of discontinuous systems \cite{filip}. Applications of differential inclusions to the problem of constructing Lyapunov functions and optimization are known. The problem of finding solutions for a differential inclusion is important for applications \cite{clnl,chg,gmsm}, \cite{tng}--\cite{zlv}. As a rule, it is possible to obtain an analytical solution of a differential inclusion only in special cases but in the other cases we have to use numerical methods for this purpose. It should be noted that the conditions known of the existence of solutions \cite{aben,blag_fil} usually contain either a continuity requirement, or both the semi-continuities and the convexity of the corresponding multivalued mapping. \begin{definition} \label{def1} \rm A differential inclusion is a relation of the form \begin{equation}\label{eq:0} \dot{x}(t) \in F(x(t), t) \end{equation} with respect to the unknown function $x: I \to \mathbb{R}^n$, where $I \subset \mathbb{R}$ is an interval, $F: R \times \mathbb{R}^n \subset 2^{\mathbb{R}^n}$ ($2^{M}$ hereinafter means the set of all subsets of $M$). \end{definition} \begin{definition} \label{def2}\rm A function $x: I \to \mathbb{R}^n$ is called a solution of differential inclusion \eqref{eq:0} on the interval $I$ ($I \subset \mathbb{R}$) if it is absolutely continuous in $I$ and almost everywhere in $I$ satisfies relation \eqref{eq:0}. If the gradient of $x$ has only discontinuities of the first kind, such a solution is called the proper one. \end{definition} \begin{definition} \label{def3} \rm A multivalued mapping $F: X \to 2^{Y}$ is called lower semicontinuous in $x_0$ if for every $y_0 \in F(x_0)$ and for every neighborhood $U(y_0)$ of the point $y_0$ there exists such a neighborhood $U(x_0)$ of the point $x_0$ that $F(x) \cap U(ó_0) \neq 0$ for every $x \in U(x_0)$. \end{definition} \begin{definition} \label{def4} \rm A support function of multivalued mapping $F$ from $X$ to $Y$ is the function \begin{equation*} c(F(x), p) : = \sup_{y \in F(x)} (y, p) \quad\forall x \in X,\; \forall p \in Y^{*}, \end{equation*} where $Y^{*}$ is a dual space, $(\cdot,\cdot)$ is a scalar product of vectors. It describes all closed semispaces which contain $F(x)$. \end{definition} \begin{definition} \label{def5} \rm A subdifferential of the lower semicontinuous convex function $V$ on Hilbert space $X$ with the values in $\mathbb{R} \cup \{+\infty\}$ is the set \begin{equation*} \partial V(x) = \{p \in X^{*} : (p,x) - V(x) = \max_{y \in X}[(p,y) - V(y)]\}. \end{equation*} It is a closed convex subset of $X^{*}$. If $V$ has the gradient $\nabla V(x) \in X^{*}$ at the point $x$, then $\partial V(x)=\{\nabla V(x)\}$. If the function $U(x)$ is a concave one, then the set \begin{gather*} \bar{\partial}U(x)=\{u : U(y) - U(x) \leq (u, y-x)\; \forall y \in X \} \end{gather*} is called a superdifferential of the function $U$ at the point $x$. \end{definition} Differential inequalities, implicit differential equations, differential equations with restrictions on the phase coordinates may be represented in the form of the differential inclusion $\dot{x} \in F(x, t)$. So a differential inclusion is generalization of ordinary differential equations and since it has a whole family of trajectories which come out from the initial point $x_0$, then it is natural to state the problem of picking out the solutions with definite properties, for example, those which minimize a certain functional. In \cite{blag_fil}, \cite{filip} some classical results are given which extend the known Pontryagin's maximum principle for differential inclusions. The maximum principle is obtained under sufficiently stringent assumptions, in particular, provided that the support function $c(F(t,x),\psi)$ of the multivalued mapping $F(t,x)$ is continuously differentiable in the vector of phase coordinates. This article studies the problem in this case using the apparatus of support functions \cite{rockaf} and exact penalty functions \cite{karelin}. With the help of this apparatus it is comparatively easy to obtain the known Blagodatskih's maximum principle. The case is additionally investigated when differentiability in $x$ of the support function $c(F(t,x),\psi)$ is not assumed. \section{Statement of the problem} Consider the differential inclusion \begin{equation} \label{eq:1} \dot{x} \in F(x, t) \end{equation} with the initial condition \begin{equation} \label{eq:2} x(0) = x_0. \end{equation} Here $F(x, t)$, $t \in [0, T]$, is a given multivalued mapping, which is supposed to be upper semicontinuous, $x(t)$ is a $n$-dimensional vector-function of the phase coordinates, which is supposed to be continuous with partially continuous in $[0, T]$ gradient, $T > 0$ is a given moment of time. We assume that the function $F(x, t)$ puts in correspondence a certain convex compact set from $\mathbb{R}^n$ for every moment of time $t \in [0, T]$ and for every phase point $x \in \mathbb{R}^n$. It is required to find such a vector-function $x^{*}(t) \in C_{n}[0, T]$, which is the solution of inclusion \eqref{eq:1}, satisfies initial condition \eqref{eq:2} and minimizes the functional \begin{equation} \label{eq:3} I(x) = \int ^{T}_0 f_0(x,t) dt, \end{equation} where $f_0$ is a given real scalar function which is supposed to be continuous in both arguments and continuously differentiable in $x$. \section{Equivalent statement of the Problem} Further, for brevity, we sometimes write $F$ instead of $F(x,t)$. Since for all $t \in [0, T]$ and all $x \in \mathbb{R}^n$ the multivalued mapping $F(x, t)$ is a convex, closed and bounded set, inclusion \eqref{eq:1} may be rewritten as follows \cite{blag} $$ (\dot{x}, \psi) \leq c(F, \psi) \quad \forall t \in [0, T], $$ where $\psi \in \mathbb{R}^n$, $\| \psi \| = 1$. Denote $z(t) = \dot{x}(t)$, then from \eqref{eq:2} we have $$ x(t) = x_0 + \int_0^{t} z(\tau) d\tau. $$ We introduce the functions \begin{gather}\label{eq:4} l(\psi,z,t) = (z, \psi) - c(F, \psi), \\ \label{eq:5} h(\psi,z,t) = \max\{0, l(\psi,z,t)\} \end{gather} and construct the functional \begin{equation} \label{eq:6} \varphi(\psi,z) = \Big( \int ^{T}_0 h^2(\psi,z,t) dt \Big)^{1/2}. \end{equation} We consider the sets \[ \Omega = [z \in P_{n} [0, T] : \varphi(\psi,z) = 0],\quad \Omega_{\delta} = [z \in P_{n} [0, T] \ | \ \varphi(\psi,z) <\delta]. \] Then $$ \Omega_{\delta}/ \Omega = [z \in P_{n} [0, T] : 0<\varphi(\psi,z) <\delta]. $$ One may easily check that for functional \eqref{eq:6} the following relation holds \[ z \begin{cases} \in \Omega, & \text{if } (\dot{x}, \psi) \leq c(F, \psi) \; \forall t \in [0, T], \\ \notin \Omega, & \text{if not}. \end{cases} \] Let us write the functional \begin{equation} \label{eq:7} \Phi(\psi,z) = I(z) + \lambda \varphi(\psi,z), \end{equation} in which $$ I(z) = I\Big(x_0 + \int_0^t z(\tau) d\tau\Big), $$ where $\lambda$ is a sufficiently big positive number which is called a penalty parameter. It will be shown that under some additional assumptions it is an exact penalty function. Then the problem of minimization of functional \eqref{eq:3} under constraints \eqref{eq:1}, \eqref{eq:2} may be reduced to unconstrained minimization of functional \eqref{eq:7}. \section{Differential properties of $\varphi(z)$ and $I(z)$} Further we assume that the vector-function $f(x, t)$ is continuous in both of its arguments and continuously differentiable in $x$ and that for all $t \in [0,T]$ and for all $x \in \mathbb{R}^n$ the inclusion $f(x,t) \in F(x, t)$ takes place. In the paper we sometimes write $f$ instead of $f(x,t)$. Further we consider the functions $l(\psi, z, t)$, $h(\psi, z, t)$, $\varphi(\psi, z)$ and $\Phi(\psi, z)$ for a fixed value $\psi$, so we write $l(z, t)$, $h(z, t)$, $\varphi(z)$ and $\Phi(z)$ respectively instead of them. Consider the functional $\varphi(z)$. Let $v \in P_{n} [0, T]$. Put $$ z_{\alpha}(t) = z(t) + \alpha v(t). $$ We calculate $$ l(z_{\alpha}, t) = l(z,t) + \alpha H_{1}(z_{\alpha},t) + o(\alpha, t), $$ where \begin{gather*} \frac{o(\alpha, t)}{\alpha} \to 0 \quad \text {as } \alpha \downarrow 0, \\ H_{1}(z_{\alpha},t) = (\psi, v(t)) - \max_{f \in F} \Big( \frac{\partial f}{\partial x} \int_0^{t} v(\tau) d\tau, \psi \Big). \end{gather*} Here the definition of a support function and the property of additivity of a support function in the first argument are used \cite{blag_fil}. Using \eqref{eq:4} and \eqref{eq:5}, we find $$ h(z_{\alpha}, v) = h(z,t) + \alpha H(z_{\alpha},t) + o(\alpha, t), $$ where \begin{gather*} \frac{o(\alpha, t)}{\alpha} \to 0 \quad \text {as } \alpha \downarrow 0,\\ H(z_{\alpha},t) = H_1(z_{\alpha},t), \quad l(z,t) > 0, \\ H(z_{\alpha},t) = 0, \quad l(z,t) < 0, \\ H(z_{\alpha},t) = \max \{0, H_1(z_{\alpha},t)\}, \quad l(z,t) = 0. \end{gather*} We introduce the sets \begin{gather*} T_+(z) = [t \in [0, T] : l(z,t) > 0],\\ T_-(z) = [t \in [0, T] : l(z,t) < 0],\\ T_0(z) = [t \in [0, T] : l(z,t) = 0]. \end{gather*} At first, consider the case $z \notin \Omega$. \begin{lemma}\label{l:1} If $z \notin \Omega$, then the functional $\varphi(z)$ is superdifferentiable \cite{dem_vas} and its superdifferential at a point $z$ is expressed as follows $$ \overline{\partial} {\varphi}(z) = \frac{h(z,t)}{\varphi(z)}\psi + \int_{t}^{T} -\Big(\frac{\partial f}{\partial x}\Big)' \frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau, \quad f \in F, $$ where $'$ means the transpose operation. \end{lemma} \begin{proof} From \eqref{eq:6} we have $$ \varphi(z_{\alpha}) = \varphi(z) + \alpha \int_0^{T} \frac{h(z,t)}{\varphi(z)} H(z_{\alpha},t) dt + o(\alpha), $$ where $$ \frac{o(\alpha)}{\alpha} \to 0 \quad \text {as } \alpha \downarrow 0. $$ Since $z \notin \Omega$, we have $H = H_1$. Then, using the expression for $H_{1}$, the theorem of the integral of a support function and positive homogeneity of a support function in the second argument \cite{blag}, one obtains \begin{align*} \varphi'(z,v) &= \lim_{\alpha \downarrow 0} \frac{\varphi(z + \alpha v) - \varphi(z)}{\alpha}\\ &= \int_0^{T} \Big(\frac{h(z,t)}{\varphi(z)}\psi, v(t) \Big) dt -\max_{f \in F} \int_0^{T} \Big(\frac{\partial f}{\partial x} \int_0^{t} v(\tau) d\tau, \frac{h(z,t)}{\varphi(z)} \psi\Big) dt. \end{align*} Integrating by parts in the last summand, we obtain \begin{equation} \label{eq:8} \begin{aligned} &\varphi'(z,v)\\ &= \int_0^{T} \Big(\frac{h(z,t)}{\varphi(z)}\psi, v(t)\Big) dt - \max_{f \in F} \int_0^{T} \Big(v(t), \int_{t}^{T} \big(\frac{\partial f}{\partial x}\big)' \frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau\Big) dt \\ & = \int_0^{T} \Big(\frac{h(z,t)}{\varphi(z)}\psi, v(t)\Big) dt + \min_{f \in F} \int_0^{T} \Big(v(t), \int_{t}^{T} - \big(\frac{\partial f}{\partial x}\big)' \frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau\Big) dt\\ & = \min_{V \in \overline{\partial} {\varphi}(z)} (V, v), \end{aligned} \end{equation} where $$ \overline{\partial} {\varphi}(z) = \big\{ V \in P_{n} [0, T] : V(t) = \frac{h(z,t)}{\varphi(z)}\psi + \int_{t}^{T} - \big(\frac{\partial f}{\partial x}\big)' \frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau, \, f \in F \big\}. $$ We denote $$ \kappa(z,t) = \frac{h(z,t)}{\varphi(z)}, \quad \kappa(z) \in P [0, T]\,. $$ Then $\kappa(z,t) \geq 0$ for all $t \in [0, T]$, $\|\kappa (z)\| = 1$, where $\|\cdot \|$ is the norm in $L_2[0, T]$. From \eqref{eq:8} it is clear that the functional $\varphi(z)$ is superdifferentiable and its subdifferential is of the form \begin{equation} \label{eq:9} \overline{\partial} {\varphi}(z) = \kappa (z,t)\psi + \int_{t}^{T} -\big(\frac{\partial f}{\partial x}\big)' \kappa (z,\tau) \psi \,d\tau, \quad f \in F. \end{equation} The proof is complete. \end{proof} Now consider the case $z \in \Omega$. \begin{lemma}\label{l:2} If $z \in \Omega$, then the functional $\varphi(z)$ is Dini differentiable in any direction $v \in P_n [0, T]$ and its $D$-derivative in the direction $v$ at a point $z$ is expressed as follows $$ \varphi'(z,v) = \max_{\|w\| \leq 1} \Big[ \int_0^{T} \big(w(t)\psi, v(t)\big) dt + \min_{f \in F} \int_0^{T} \Big(\int_{t}^{T} -\big(\frac{\partial f}{\partial x}\big)' w(\tau)\psi \,d\tau, v(t)\Big) dt \Big], $$ where $w \in P [0, T]$, $\|w\| \leq 1$. \end{lemma} \begin{proof} Since $z \in \Omega$, we have $\varphi(z) = 0$. Then from expression \eqref{eq:6} we obtain $$ \varphi'(z,v) = \lim_{\alpha \downarrow 0} \frac{\varphi(z + \alpha v) - \varphi(z)}{\alpha} = \|H(z_{\alpha})\| = \max_{\|w\| \leq 1} \int_0^{T} H(z_{\alpha},t)w(t) dt. $$ Under the assumptions of this theorem we have $T_{+}(z) = \emptyset$, so \begin{align*} \varphi'(z,v) & = \max_{\|w\| \leq 1} \int_{T_0 \cup T_{-}} w(t) \max_{\overline{w}(t) \in [0,1]} (\overline{w}(t) H_1(z_{\alpha},t)) dt \\ &= \max_{w \in W_1} \int_0^{T} H_1(z_{\alpha},t) w(t) dt, \end{align*} where \begin{equation} \label{eq:10} W_1 = \{w \in P [0, T] : \|w\| \leq 1, \ w(t) \geq 0 \, \forall t \in T_0, \, w(t) = 0 \, \forall t \in T_- \}. \end{equation} From the expression for $H_1$ we obtain \begin{equation} \label{eq:11} \begin{aligned} &\varphi'(z,v) \\ &= \max_{w \in W_1} \Big[ \int_0^{T} (w(t)\psi, v(t)) dt + \min_{f \in F} \int_0^{T} \Big(\int_{t}^{T} - \big(\frac{\partial f}{\partial x}\big)' w(\tau)\psi \,d\tau, v(t)\Big) dt \Big]. \end{aligned} \end{equation} The proof is complete. \end{proof} Finding the derivative of the functional $I(z)$ in the direction $v \in P_{n} [0, T]$, we show that $I$ is Gateaux differentiable $$ I'(z, v) = \int ^{T}_0\Big(\int ^{T}_{t} \frac{\partial f_0}{\partial x} d\tau, v(t)\Big) dt, $$ and its gradient on the set $P_{n} [0, T]$ is expressed by the formula \begin{equation} \label{eq:12} \nabla I(z) = \int ^{T}_{t} \frac{\partial f_0}{\partial x} d\tau. \end{equation} \begin{lemma}\label{l:3} If the support function $c(F, \psi)$ of the multivalued mapping $F(x, t)$ is continuously differentiable in the phase variable $x$, then: \begin{itemize} \item if $z \notin \Omega$, then the functional $\varphi(z)$ is Gateaux differentiable and its gradient on the set $P_{n} [0, T]$ may be found by the formula $$ \nabla \varphi(z) = \frac{h(z,t)}{\varphi(z)} \psi + \int_{t}^{T} -\frac{h(z,\tau)} {\varphi(z)} \frac{\partial c(F(x,\tau), \psi)}{\partial x} d\tau; $$ \item if $z \in \Omega$, then the functional $\varphi(z)$ is subdifferentiable \cite{dem_vas} and its subdifferential at a point $z$ may be found by the formula $$ \partial \varphi(z) = \big\{W \in P_{n} [0, T] \ | \ W(t) = w(t)\psi + \int_{t}^{T} -w(\tau) \frac{\partial c(F(x,\tau), \psi)} {\partial x} d\tau, \ w \in W_1 \big\}, $$ where the set $W_1$ is defined by the formula \eqref{eq:10}. \end{itemize} \end{lemma} \begin{proof} By the definition of the support function $$ c(F, \psi) = \max_{f \in F} (f, \psi). $$ It is clear that this function is subdifferentiable, and its subdifferential is expressed by the formula $$ \partial {c} (F, \psi) = \operatorname{co} \big\{ \big(\frac{\partial f}{\partial x}\big)' \psi \big\}, \quad f \in R = \{f \in F : c(F, \psi) = (f, \psi) \}. $$ Hence $c(F, \psi)$ is differentiable in $x$ if and only if the set $R$ consists of the only element. Let us denote it $f^{*}$. Thus, in this case we can assume that $$ c(F, \psi) = (f^{*}, \psi), $$ and the following relations hold \begin{equation} \label{eq:13} \big(\frac{\partial f^{*}}{\partial x}\big)' \psi = \frac{\partial (f^{*}, \psi)}{\partial x} = \frac{\partial c(F, \psi)}{\partial x}. \end{equation} Let $z \notin \Omega$. From expression \eqref{eq:9} we conclude that the superdifferential of the functional ${\varphi}(z)$ consists of the only element, therefore $\varphi(z)$ is Gateaux differentiable. Its gradient on the set $P_{n} [0, T]$ is as follows \begin{equation} \label{eq:14} \nabla \varphi(z) = \frac{h(z,t)}{\varphi(z)} \psi + \int_{t}^{T} - \frac{h(z,\tau)}{\varphi(z)} \big(\frac{\partial f^{*}}{\partial x}\big)' \psi \,d\tau. \end{equation} Using \eqref{eq:13}, from \eqref{eq:14} we finally get the expression $$ \nabla \varphi(z) = \frac{h(z,t)}{\varphi(z)} \psi + \int_{t}^{T} -\frac{h(z,\tau)} {\varphi(z)} \frac{\partial c(F(x,\tau), \psi)}{\partial x} d\tau, $$ which proves the first part of the lemma. Let $z \in \Omega$. From expression \eqref{eq:11} we conclude that the derivative of the functional $\varphi(z)$ in the direction $v$ may be expressed as \begin{equation} \label{eq:15} \begin{aligned} \varphi'(z,v) &= \max_{\|w\| \leq 1} \Big[ \int_0^{T} (w(t)\psi, v(t)) dt + \Big( \int_{t}^{T} -\big(\frac{\partial f^{*}}{\partial x}\big)' w(\tau)\psi \,d\tau, v(t) \Big) dt \Big]\\ &= \max_{W \in \partial \varphi(z) }(W, v), \end{aligned} \end{equation} where $$ \partial \varphi(z) =\big\{W \in P_{n} [0, T] \ \bigm | \ W(t) = w(t)\psi + \int_{t}^{T} -w(\tau) \big(\frac{\partial f^{*}}{\partial x}\big)' \psi \,d\tau, \ w \in W_1\big\}, $$ and $W_1$ is defined in \eqref{eq:10}. Using \eqref{eq:13}, from \eqref{eq:15} we finally get the expression \begin{equation} \label{eq:16} \begin{aligned} \partial \varphi(z) &= \Big\{W \in P_{n} [0, T] : W(t) = w(t)\psi \\ &\quad + \int_{t}^{T} -w(\tau) \frac{\partial c(F(x,\tau), \psi)} {\partial x} d\tau, \ w \in W_1 \Big\}, \end{aligned} \end{equation} which proves the second part of the lemma. Note that in this case the following equality also holds \begin{equation} \label{eq:17} \gamma w(t) \frac{\partial c(F(x,t), \psi)}{\partial x} = \frac{\partial c(F(x,t), \gamma w(t) \psi)}{\partial x} \quad \forall t \in [0, T], \; \forall \gamma > 0. \end{equation} \end{proof} \section{Necessary minimum conditions} \begin{theorem}\label{t:1} Let $\inf _{z \in \Omega} I(z) = I(z^{*}) > -\infty$ and there exists such a positive number $\lambda_0 < \infty$ that $\forall \lambda > \lambda_0$ there exists $z(\lambda) \in P_{n}[0, T]$, for which $$ \Phi_{\lambda}(z(\lambda)) = \inf _{z \in P_{n}[0, T]} \Phi_{\lambda}(z). $$ Let the functional $I(z)$ be locally Lipschitz on the set $\Omega_{\delta} / \Omega$. Then functional \eqref{eq:7} will be an exact penalty function. \end{theorem} \begin{proof} It is sufficient \cite{dem} to show that there exist such numbers $a > 0$, $\delta > 0$ that \begin{equation} \label{eq:18} \varphi^{\downarrow}(z) = \liminf _{y \to z} \frac{\varphi(y)-\varphi(z)}{\rho(z,y)} < -a < 0 \quad \forall z \in \Omega_{\delta}/ \Omega. \end{equation} Here $y \in P_{n} [0, T]$, $\rho(z, y)$ is the following metric on the set $P_{n} [0, T]$ $$ \rho(z,y) = \max_{t\in[0,T]} \Big| \int ^{t}_0z(t)-y(t)dt \Big|. $$ Put $$ y(t) = z(t) + \alpha v^{*}(t), \ v^{*}(t) = -\Big(\frac{h(z,t)}{\varphi(z)} \psi + \int_{t}^{T} - \big(\frac{\partial f}{\partial x}\big)' \frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau\Big). $$ Then using Lemma \ref{l:1}, one gets \begin{gather*} \varphi'(z, v^{*}) = \min_{f \in F} \int ^{T}_0 - \Big ( \frac{h(z,t)}{\varphi(z)} \psi + \int_{t}^{T} - \big(\frac{\partial f}{\partial x}\big)' \frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau,\\ \frac{h(z,t)}{\varphi(z)} \psi + \int_{t}^{T} -\big(\frac{\partial f}{\partial x}\big)' \frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau \Big) dt. \end{gather*} Let us show that $$ \frac{h(z,t)}{\varphi(z)} \psi + \int_{t}^{T} -\big(\frac{\partial f}{\partial x}\big)' \frac{h(z,\tau)}{\varphi(z)} \psi \,d\tau \neq \mathbf{0}, \quad f \in F, $$ identically on the interval $[0,T]$. Assume the contrary. Then $\frac{h(z,t)}{\varphi(z)} \psi = \mathbf{0}$ for all $t\in [0, T]$ which contradicts the constraints on $\psi$ and $\frac{h(z,t)}{\varphi(z)}$. Let $\varphi(y) \to \varphi(z)$ if $y \to z$, i. e. there exists sequence $\{z_{k}\} \in \Omega_{\delta} / \Omega$ such that $\varphi'(z_{k}, v^{*}) \to 0$ if $k \to \infty$, where \begin{gather*} \frac{\partial f}{\partial x} = \frac{\partial f(x_{k}, t)}{\partial x}, \quad f \in F, \\ x_k(t) = x_0 + \int_0^{t} z_k(\tau) d\tau. \end{gather*} Therefore, $$ \|\frac{h(z_k,t)}{\varphi(z_k)} \psi + \int_{t}^{T} -\Big(\frac{\partial f}{\partial x}\Big)' \frac{h(z_k,\tau)}{\varphi(z_k)} \psi \,d\tau \| \to 0, \quad \text{as } k \to \infty,\; f \in F, $$ hence $$ \|\frac{h(z_k,t)}{\varphi(z_k)} \psi \| \to 0 \quad \text{as } k \to \infty, $$ that also contradicts the assumptions $$ \|\psi\| = 1, \quad \| \frac{h(z)}{\varphi(z)} \| = 1. $$ Then we conclude that $$ \varphi(y) - \varphi(z) = \alpha \varphi'(z, v^{*}) + o(\alpha) < 0 \quad \forall z \in \Omega_{\delta}/ \Omega. $$ Now find that $$ \rho(z,y) = \alpha \max_{t\in[0,T]} \Big| \int ^{t}_0v^{*}(t)dt \Big| > 0. $$ From the last two inequalities follows \eqref{eq:18}. The proof is complete. \end{proof} \begin{theorem}\label{t:2} Let the conditions of Theorem \ref{t:1} be satisfied. Let the support function of the multivalued mapping $F(x,t)$ from \eqref{eq:1} be continuously differentiable in $x$. For the point $$ x^{*} = x_0 + \int_0^{t} z^{*}(\tau) d\tau $$ to satisfy inclusion \eqref{eq:1} and condition \eqref{eq:2} and to minimize functional \eqref{eq:3}, the existence of such a vector-function $\Psi(t)$ that for all $t \in [0, T]$ the following relations hold \begin{equation} \label{eq:19} \dot{\Psi}(t) = -\frac {\partial c(F(x^{*}, t), \Psi(t))}{\partial x} + \frac{\partial f_0(x^{*},t)} {\partial{x}}, \end{equation} \begin{equation} \label{eq:20} (\dot{x}^{*}, \Psi(t)) - c(F(x^{*}, t), \Psi(t)) = 0, \end{equation} \begin{equation} \label{eq:21} \Psi(T) = \mathbf{0}\end{equation} is necessary. \end{theorem} \begin{proof} In Theorem \ref{t:1} it has been shown that the functional \eqref{eq:7} is an exact penalty function, hence there exists such a number $\lambda^{*} > 0$ that for all $\lambda > \lambda^{*}$ functional \eqref{eq:3} minimization problem under constraints \eqref{eq:1}, \eqref{eq:2} is equivalent to the unconstrained optimization problem of functional \eqref{eq:7} minimization. Let us put $\Psi(t) = \lambda w(t) \psi$, where the vector-function $w(t)$ is an element of the set $W_1$. Since by Lemma \ref{l:3} if $z \in \Omega$, the functional $\varphi(z)$ is subdifferentiable and its subdifferential is represented in \eqref{eq:16}, and the functional $I(z)$ is Gateaux differentiable and its gradient is represented in \eqref{eq:12}, then from necessary minimum condition \cite{dem} $$ 0_n \in \partial \Phi(z^*). $$ Considering \eqref{eq:17} we have that at the minimum point for all $t \in [0, T]$, \begin{equation} \label{eq:22} \int ^{T}_{t} \frac{\partial f_0(x^{*},t)}{\partial x} d\tau + \Psi(t) + \int_{t}^{T} -\frac{\partial c(F(x^{*},t), \Psi(t))}{\partial x} d\tau = 0_n, \end{equation} where $0_n$ is a zero element of the space $P_n [0, T]$. Differentiating \eqref{eq:22} on the interval $[0, T]$, one obtains a system of differential equations $$ \dot{\Psi}(t) = -\frac {\partial c(F(x^{*}, t), \Psi(t))}{\partial x} + \frac{\partial f_0(x^{*},t)} {\partial{x}} $$ with the terminal condition $\Psi(T) = \mathbf{0}$, hence we obtain the relations \eqref{eq:19}, \eqref{eq:21}. If $t \in T_0$, from the formula of the functional $l(z,t)$ one gets $(z, \Psi) = c(F, \Psi)$, if $t \in T_-$, then $w(t) = 0$ and relation \eqref{eq:20} still takes place. Thus \eqref{eq:20} holds for all $t \in [0, T]$. The proof is complete. \end{proof} \begin{remark} \label{rmk5.3} \rm Theorem \ref{t:2} has been formulated for the problem with the free right end. It is not difficult to show that relations \eqref{eq:19}, \eqref{eq:20} will also hold for the problem with the fixed right end, but the terminal value $\Psi(T)$ for this problem will not be equal to zero in the general case, i. e. relation \eqref{eq:21} will not hold in this case. \end{remark} Using the known minimum conditions in terms of the derivative in directions from Lemma \ref{l:2} one gets the following lemma. \begin{lemma}\label{l:4} Let the conditions of Theorem \ref{t:1} be satisfied. For the point $x^{*}$ to satisfy inclusion \eqref{eq:1} and condition \eqref{eq:2} and to minimize functional \eqref{eq:3}, it is necessary to have \begin{equation} \label{eq:23} \begin{aligned} & \max_{\|w\| \leq 1} \Big[ \int_0^{T} \Big( \int_{t}^{T} \frac{\partial f_0(x^{*},\tau)} {\partial{x}} d\tau + \lambda w(t)\psi, v(t) \Big) dt \\ & + \min_{f \in F} \int_0^{T} \Big(\int_{t}^{T} - \Big(\frac{\partial f(x^{*}, \tau)}{\partial x}\Big)' \lambda w(\tau)\psi \,d\tau, v(t)\Big) dt \Big] \geq 0 \quad \forall v\in P_{n}[0,T]. \end{aligned} \end{equation} \end{lemma} Let $\overline{F} \subset F$ be a set of such $f \in F$ that \eqref{eq:23} holds. It can be shown that the following lemma holds. \begin{lemma}\label{l:5} Relation \eqref{eq:23} is equivalent to the condition: for every fixed $\overline{f} \in \overline{F}$ there exists such a vector-function $\overline{w} \in W_1$ that the following relation holds \begin{equation} \label{eq:24} \int_{t}^{T} \frac{\partial f_0(x^{*},\tau)} {\partial{x}} d\tau + \lambda \overline{w}(t) \psi + \int_{t}^{T} - \Big(\frac{\partial \overline{f}(x^{*}, \tau)} {\partial x}\Big)' \lambda \overline{w}(\tau) \psi \,d\tau = 0_n \end{equation} for all $t \in [0,T]$. \end{lemma} \begin{theorem}\label{t:3} Let the conditions of Theorem \ref{t:1} be satisfied. For the point $x^{*}$ to satisfy inclusion \eqref{eq:1} and condition \eqref{eq:2} and to minimize functional \eqref{eq:3}, the existence of such a vector-function $\overline{f} \in F$ and such a vector-function $\overline{\Psi}(t)$, for which for all $t \in [0, T]$ the following relations hold \begin{gather} \label{eq:25} \dot{\overline{\Psi}}(t) = -\Big(\frac{\partial \overline{f}(x^{*}, t)}{\partial x}\Big)' \overline{\Psi}(t) + \frac{\partial f_0(x^{*},t)} {\partial{x}}, \\ \label{eq:32} \big(\dot{x}^{*}, \overline{\Psi}(t)) - c(F(x^{*}, t), \overline{\Psi}(t)\big) = 0,\\ \label{eq:26} \overline{\Psi}(T) = \mathbf{0}, \end{gather} is necessary. \end{theorem} \begin{proof} In view of Lemma \ref{l:4} it is sufficient to show that \eqref{eq:23} is equivalent to \eqref{eq:25}, \eqref{eq:26} for some $\overline{f} \in F$ and $\overline{\Psi}(t)$. In view of Lemma \ref{l:5} relation \eqref{eq:23} is equivalent to \eqref{eq:24} for every fixed $\overline{f} \in \overline{F}$. Differentiating \eqref{eq:24} on the interval $[0, T]$ and denoting $$ \overline{\Psi}(t) = \lambda \overline{w}(t)\psi, $$ one gets a system of differential equations \eqref{eq:25} with terminal condition \eqref{eq:26}. Relation \eqref{eq:32} can be proved in the same way as in Theorem \ref{t:2}. \end{proof} \begin{remark}\label{r:2}\rm Theorem \ref{t:3} has been formulated for the problem with the free right end. It is not difficult to show that relations \eqref{eq:25}, \eqref{eq:32} will also hold for the problem with the fixed right end, but the terminal value $\Psi(T)$ for this problem will not be equal to zero in the general case, i. e. relation \eqref{eq:26} will not hold in this case. \end{remark} \section{Example} Consider the system of differential equations $$ \dot{x}_1 = u_1, \quad \dot{x}_2 = x_1, $$ where the restriction on control is given by the set $$ U = \{ u \in R^2 : |u_1| \leq 1, \, u_2 = 0 \}. $$ Let the initial condition $x_0 = (0, 0)$ and the terminal state $x(1) = (-1/2, -1/3)$ of the system be given. It is required to find such control $u^* \in U$, which minimizes the functional $$ I(x) = \int_0^1 x_2(t) dt. $$ This system can be rewritten in the form of the inclusion $\dot{x} \in F(x)$, where $$ F(x) = \begin{pmatrix} [-1, 1] \\ x_1 \end{pmatrix}. $$ Since the support function $c(A, b)$ of the segment $ A = \{ a \in R : a \in [-1, 1] \}$ is $|b|$, then in this case the support function of the multivalued mapping $F(x)$ is expressed by the formula $$ c(F, \psi) = |\psi_1| + x_1\psi_2. $$ One can see that the function $c(F, \psi)$ is continuously differentiable in the phase variables and its gradient may be written as follows $$ \frac{\partial{c}}{\partial{x}} = (\psi_2, 0). $$ Further, we have $$ \frac{\partial{f_0}}{\partial{x}} = (0, 1). $$ From Theorem \ref{t:2} and Remark \ref{r:2} it follows that the vector-function $\psi(t)$ must satisfy the system of differential equations \begin{equation} \label{eq:28} \dot{\psi}_1 = -\psi_2, \quad \dot{\psi}_2 = 1. \end{equation} From Theorem \ref{t:2} and Remark \ref{r:2} one also gets that for $\psi(t)$ and for all $t$ the following relations hold $$ (\dot{x}, \psi(t)) = u_1 \psi_1 + x_1 \psi_2 = c(F,\psi) = |\psi_1| + x_1\psi_2, $$ therefore for all $t$, \begin{equation} \label{eq:29} u_1(t) \psi_1(t) = |\psi_1(t)|. \end{equation} From \eqref{eq:28}, \eqref{eq:29} it is not difficult to obtain the optimal control \begin{equation} \label{eq:30} \begin{gathered} u_1^*(t) = -1, \quad t \in [0, \tau_1), \\ u_1^*(t) = 1, \quad t \in [\tau_1, \tau_2), \\ u_1^*(t) = -1, \quad t \in [\tau_2, 1], \end{gathered} \end{equation} and the corresponding optimal trajectory \begin{equation} \label{eq:31} \begin{gathered} x_1(t) = -t, \quad x_2(t) = -t^2/2, \quad t \in [0, \tau_1), \\ x_1(t) = t + S_1, \quad x_2(t) = t^2/2 + S_1t + S_2, \quad t \in [\tau_1, \tau_2), \\ x_1(t) = -t + 1/2, \quad x_2(t) = -t^2/2 + 1/2t -1/2, \quad t \in [\tau_2, 1], \end{gathered} \end{equation} where $$ \tau_1 = 13/24, \quad \tau_2 = 19/24, \quad S_1 = -13/12, S_2 = 169/576. $$ The values $\tau_1$, $\tau_2$, $S_1$, $S_2$ in \eqref{eq:30}, \eqref{eq:31} are found using the boundary conditions and the condition of trajectory continuity. One can easily check that conditions \eqref{eq:28}, \eqref{eq:29} may be obtained directly from the Pontryagin's maximum principle. Here a different approach has been demonstrated, when we transit from the original system to the corresponding differential inclusion, for which we apply the conditions of optimality (Theorem \ref{t:2}) to find the optimal process $(x^*(t), u^*(t))$. \subsection*{Conclusion} Thus, in this paper application of the theory of exacts penalty functions to the problem of optimal control of differential inclusion is demonstrated. The apparatus of support functions gives opportunity to reduce the original problem to the optimization problem under constraints. With the help of exact penalties this problem is reduced to minimization of the nonsmooth functional $\Phi(z)$ on the whole space. Provided that the support function $c(F(x,t), \psi)$ is continuously differentiable in the vector of the phase coordinates, this functional appears to be subdifferentiable, which allows to write out the necessary minimum conditions in terms of a subdifferential, which coincide with some classical results for this problem. In the case of nondifferentiability of $c(F(x,t), \psi)$ in the phase variable $D$-derivative in directions of the functional $\Phi(z)$ is found, which allows to formulate necessary minimum conditions. The example of theoretical results application is given. \subsection*{Acknowledgments} The work is supported by the Saint Petersburg State University (project no. 9.38.205.2014). \begin{thebibliography}{00} \bibitem{aben} Aubin, J.- P.; Ekeland, I.; \emph{ Applied nonlinear analysis.} Wiley-Interscience, 1984. 518 p. \bibitem{blag} Blagodatskih, V. I.; \emph{ The maximum principle for differential inclusions}, Proceedings of the Steklov Institute of Mathematics. 1984. Vol. 166. P. 23--43. (in Russ.) \bibitem{blag_upr} Blagodatskih, V. I.; \emph{ Introdution to optimal control.} Moscow, Vysshaya shkola, 2001. 239 p. (in Russ.) \bibitem{blag_fil} Blagodatskih, V. I.; Filippov, A. F.; \emph{ Differential inclusions and optimal control}, Proceedings of the Steklov Institute of Mathematics. 1985. Vol. 169. P. 194--252. (in Russ.) \bibitem{clnl} Cellina, A.; Ornelas A.; \emph{A Sufficient Condition for Exact Penalty in Constrained Optimization.} SIAM J. Control Optim.. 2003. Vol. 42 , no. 1. P. 250--265. \bibitem{chg} Chengi, Yi; \emph{ Existence of Solutions for a Class of Nonlinear Evolution Inclusions with Nonlocal Conditions.} Journal of Optimization Theory and Applications. 2014. Vol. 162, no. 1. P. 13--33. \bibitem{dem} Demyanov, V. F.; \emph{ Extremum conditions and variation calculus.} Moscow, Vysshaya shkola, 2005. 335 p. (in Russ.) \bibitem{dem_vas} Demyanov, V. F.; Vasilyev, L. V.; \emph{ Nondifferentiable optimization.} Moscow, Nauka, 1981. 384 p. (in Russ.) \bibitem{filip} Filippov, A. F.; \emph{Differential equations with discontinuous right-hand side.} Moscow, Nauka, 1985. 226 p. (in Russ.) \bibitem{gmsm} Gama, R.; Smirnov, G.; Watbled, F.; \emph{Stability and optimality of solutions to differential inclusions via averaging method.} Set-Valued and Variational Analysis. 2014. Vol. 22, no. 2. P. 349--374. \bibitem{ioffe} Ioffe, A.; \emph{ Euler-lagrange and hamiltonian formalisms in dynamic optimization}, Transactions of the american mathematical society. 1997. Vol. 349, no. 7. P. 2871--2900. \bibitem{karelin} Karelin, V. V.; \emph{Penalty functions in a control problem}, Automation and Remote Control. 2004. no. 3. P. 483--492. (in Russ.) \bibitem{rockaf} Rockafellar, R.; \emph{Convex analysis.} Princeton, Princeton University Press, 1970. 470 p. \bibitem{tng} Taniguchi, T.; \emph{Global existence of solutions of differential inclusions.} Journal of Mathematical Analysis and Applications. 2004. Vol. 166, no. 1. P. 41--51. \bibitem{wtbl} Watbled, F.; \emph{On singular perturbations for differential inclusions on the infinite interval.} Journal of Mathematical Analysis and Applications. 2005. Vol. 310, no. 2. P. 362--378. \bibitem{zlv} Zaslavski, A.; \emph{A Sufficient Condition for Exact Penalty in Constrained Optimization.} SIAM Journal on Optimization. 2005. Vol. 16 , no. 1. P. 250--262. \end{thebibliography} \end{document}