From 7fd51f8babe0b5bc1431b377bd3e2eb2c7230b04 Mon Sep 17 00:00:00 2001
From: =?utf8?q?J=C3=A9r=C3=B4me=20Benoit?= <jerome.benoit@piment-noir.org>
Date: Sun, 4 Nov 2018 18:55:35 +0100
Subject: [PATCH] Add the maths for the SQP method.
MIME-Version: 1.0
Content-Type: text/plain; charset=utf8
Content-Transfer-Encoding: 8bit

Signed-off-by: Jérôme Benoit <jerome.benoit@piment-noir.org>
---
 rapport/ProjetOptimRO.tex | 87 +++++++++++++++++++++++++++++++++++----
 1 file changed, 78 insertions(+), 9 deletions(-)

diff --git a/rapport/ProjetOptimRO.tex b/rapport/ProjetOptimRO.tex
index 5fc4678..809d31f 100644
--- a/rapport/ProjetOptimRO.tex
+++ b/rapport/ProjetOptimRO.tex
@@ -20,6 +20,7 @@
 \usepackage{fancyhdr}
 \usepackage{tocbibind}
 \usepackage{lmodern}
+\usepackage{enumitem}
 
 
 %%%%%Marges & en-t\^etes
@@ -78,7 +79,7 @@
  \begin{tabular}{c}
   \hline
   ~                                                             \\
-  \LARGE\textbf {Programmation SÃ©quentielle Quadratique ou PQS} \\
+  \LARGE\textbf {Programmation Quadratique Séquentielle ou PQS} \\
   \LARGE\textbf {en}                                            \\
   \LARGE\textbf {Optimisation non linÃ©raire sous contraintes}   \\
   ~                                                             \\
@@ -181,7 +182,7 @@ DÃ©finissons le problÃ¨me central $ \mathcal{P} $ que se propose de rÃ©soudre la
  La problÃ¨matique $ \mathcal{P} $ se dÃ©finit par :
  $$
   \mathcal{P} \left \{
-  \begin{array}{r}
+  \begin{array}{l}
    \displaystyle\min_{x \in \mathbb{R}^n} J(x) \\
    g(x) \leq 0                                 \\
    h(x) = 0
@@ -210,7 +211,7 @@ DÃ©finissons quelques notions supplÃ©mentaires de base nÃ©cessaires Ã  la suite
  On dÃ©finit le Lagrangien associÃ© Ã  $ \mathcal{P} $ par :
  $$ \begin{array}{r c l}
    L : \mathbb{R}^n \times \mathbb{R}^q \times \mathbb{R}_+^p & \longrightarrow & \mathbb{R}                                                                                                      \\
-   (x,\lambda,\mu)                                            & \longmapsto     & L(x,\lambda,\mu) = J(x) + \sum\limits_{i=0}^{q} \lambda_i h_i(x) + \sum\limits_{j=0}^{p} \mu_j g_j(x)           \\
+   (x,\lambda,\mu)                                            & \longmapsto     & L(x,\lambda,\mu) = J(x) + \sum\limits_{i=1}^{q} \lambda_i h_i(x) + \sum\limits_{j=1}^{p} \mu_j g_j(x)           \\
                                                               &                 & L(x,\lambda,\mu) = J(x) + \langle \lambda,h(x) \rangle_{\mathbb{R}^q} + \langle \mu,g(x) \rangle_{\mathbb{R}^p}
   \end{array} $$
  oÃ¹ lâon note $ \lambda $  et $ \mu $ les vecteurs de coordonnÃ©es respectives $ (\lambda_1,\ldots,\lambda_q) $ et $ (\mu_1,\ldots,\mu_p) $.
@@ -508,7 +509,9 @@ $$ \underset{d \in \mathbb{R}^n}{\mathrm{argmin}} \ J(x_k) + \langle \nabla J(x_
 Autrement dit, $ d_k $ est le point de minimum global de lâapproximation de second ordre de
 $ J $ au voisinage du point courant $ x_k $.
 A condition que la matrice $ H[J](x_k) $ soit dÃ©finie positive Ã  chaque itÃ©ration, la mÃ©thode
-de Newton est bien une mÃ©thode de descente Ã  pas fixe Ã©gal Ã  $ 1 $ . Les propriÃ©tÃ©s remarquables de cet algorithme sont :
+de Newton est bien une méthode de descente à pas fixe égal à $ 1 $.
+\newline
+Les propriétés remarquables de cet algorithme sont :
 
 \begin{tabular}{|p{20em}|p{20em}|}
  \hline
@@ -539,7 +542,7 @@ Plusieurs questions se posent alors :
  \item Comment dÃ©terminer une matrice $ H_k $ qui soit une âbonneâ approximation de la hessienne Ã  lâitÃ©ration $ k $ sans utiliser les informations de second ordre et garantir que $ H_k^{-1} \nabla J(x_k) $ soit bien une direction de descente de $ J $ en $ x_k $, sachant que la direction de Newton, si elle existe, nâen est pas nÃ©cessairement une ?
  \item Comment conserver les bonnes propriÃ©tÃ©s de lâalgorithme de Newton ?
 \end{itemize}
-Nous ne rÃ©pondrons pas Ã  ces questions qui sont hors du cadre de ce projet. Cette section permet de rendre compte de la filiation entre la mÃ©thode PQS et celle Newtonienne.
+Nous ne répondrons pas à ces questions qui sont hors du cadre de ce projet. Cette section permet d'introduire certains prérequis pour l'étude de la méthode PQS et de rendre compte de sa filiation avec la méthode de Newton.
 
 \section{MÃ©thode PQS (ou SQP)}
 
@@ -549,7 +552,7 @@ Trouver une solution dâun problÃ¨me dâoptimisation sous contraintes fonction
 
 \subsection{Algorithmes newtoniens}
 
-Les algorithmes newtoniens sont basÃ©s sur la linÃ©arisation dâÃ©quations caractÃ©risant les solutions que lâon cherche, fournies par les conditions dâoptimalitÃ© dâordre $ 1 $. Ces algorithmes sont \textit{primaux-duaux} dans le sens oÃ¹ ils gÃ©nÃ¨rent Ã  la fois une suite primale $ (x_k )_{k \in \mathbb{N}} $ convergeant vers une solution $ \overline{x} $ du problÃ¨me considÃ©rÃ©, et une suite gÃ©omÃ©trique duale $ (\lambda^k)_{k \in \mathbb{N}} $ de multiplicateurs convergeant vers un multiplicateur optimal $ \overline{\lambda} $ associÃ© Ã  $ \overline{x} $.
+Les algorithmes newtoniens sont basÃ©s sur la linÃ©arisation dâÃ©quations caractÃ©risant les solutions que lâon cherche, fournies par les conditions dâoptimalitÃ© dâordre $ 1 $. Ces algorithmes sont \textit{primaux-duaux} dans le sens oÃ¹ ils gÃ©nÃ¨rent Ã  la fois une suite primale $ (x_k )_{k \in \mathbb{N}} $ convergeant vers une solution $ \overline{x} $ du problÃ¨me considÃ©rÃ©, et une suite duale $ (\lambda_k)_{k \in \mathbb{N}} $ de multiplicateurs convergeant vers un multiplicateur optimal $ \overline{\lambda} $ associÃ© Ã  $ \overline{x} $.
 
 \subsection{Algorithme PQS}
 
@@ -558,7 +561,7 @@ Les algorithmes newtoniens sont basÃ©s sur la linÃ©arisation dâÃ©quations cara
 ConsidÃ©rons un problÃ¨me dâoptimisation diffÃ©rentiable $ \mathcal{P} $ avec contraintes dâÃ©galitÃ© :
 $$
  \mathcal{P} \left \{
- \begin{array}{r}
+ \begin{array}{l}
   \displaystyle\min_{x \in \mathbb{R}^n} J(x) \\
   h(x) = 0
  \end{array}
@@ -567,13 +570,79 @@ $$
 oÃ¹ $ J: \mathbb{R}^n \longrightarrow \mathbb{R} $ et $h: \mathbb{R}^n \longrightarrow \mathbb{R}^q$ sont supposÃ©es au moins diffÃ©rentiables.
 \newline
 Les conditions dâoptimalitÃ© de Lagrange (ou \textit{KKT}) sâÃ©crivent :
-$$ \nabla L(x,\lambda) = 0 \iff \nabla J(x) + \sum\limits_{i=0}^{q} \lambda_i \nabla h_i(x) = 0 $$
+$$ \nabla J(x) + \sum\limits_{i=1}^{q} \lambda_i \nabla h_i(x) = 0 \iff \nabla_x L(x,\lambda) = 0 $$
 donc $ \mathcal{P} $ devient :
 $$ \begin{pmatrix}
- \nabla J(x) + \sum\limits_{i=0}^{q} \lambda_i \nabla h_i(x) \\
+ \nabla J(x) + \sum\limits_{i=1}^{q} \lambda_i \nabla h_i(x) \\
  h(x)
  \end {pmatrix} = 0 $$
 Pour rÃ©soudre ce systÃ¨me dâÃ©quations, utilisons la mÃ©thode de Newton dont une itÃ©ration sâÃ©crit ici :
+$$ H[L](x_k,\lambda_k)\begin{pmatrix}
+  x_{k+1} - x_k \\
+  \lambda_{k+1} - \lambda_k
+ \end{pmatrix} = -\nabla L(x_k,\lambda_k) $$
+soit :
+$$ \begin{pmatrix}
+  H_x[L](x_k,\lambda_k) & D_h(x_k)^\top \\
+  D_h(x_k)              & 0
+ \end{pmatrix} \begin{pmatrix}
+  x_{k+1} - x_k \\
+  \lambda_{k+1} - \lambda_k
+ \end{pmatrix} = -\begin{pmatrix}
+  \nabla_x L(x_k,\lambda_k) \\
+  h(x_k)
+ \end{pmatrix}  $$
+où $ D_h(x) $ désigne la matrice jacobienne de l’application $ h : \mathbb{R}^n \longrightarrow \mathbb{R}^q $ définie par :
+$$ D_h(x)^\top = [\nabla h_1(x)\ldots\nabla h_q(x)] $$
+Posons : $ H_k = H_x[L](x_k,\lambda_k), \ d = x_{k+1} - x_k $ et $ \mu = \lambda_{k+1} $. L'itération s'écrit donc :
+$$ \begin{pmatrix}
+  H_k      & D_h(x_k)^\top \\
+  D_h(x_k) & 0
+ \end{pmatrix} \begin{pmatrix}
+  d \\
+  \mu - \lambda_k
+ \end{pmatrix} = -\begin{pmatrix}
+  \nabla_x L(x_k,\lambda_k) \\
+  h(x_k)
+ \end{pmatrix} $$
+et est bien définie à condition que la matrice $ H[L](x_k,\lambda_k) $ soit inversible. Ce sera le cas si :
+\begin{enumerate}[label=(\roman*)]
+ \item Les colonnes $ \nabla h_1(x_k),\ldots,\nabla h_q(x_k) $ de $ D_h(x_k)^\top $ sont linéairement indépendantes : c’est l’hypothèse de qualification des contraintes.
+ \item Quel que soit $ d \neq 0 $ tel que $ D_h(x_k)d = 0 $, on a $ d^\top H_k d > 0 $ : c’est la condition suffisante d’optimalité du second ordre dans le cas de contraintes d’égalité.
+\end{enumerate}
+Revenons à l’itération. Elle s’écrit encore :
+$$
+ \left \{
+ \begin{array}{r c l}
+  H_kd + \sum\limits_{i=1}^q(\mu_i - \lambda_{k,i})\nabla h_i(x_k) & = & -\nabla_x L(x_k,\lambda_k)        \\
+  \nabla h_i(x_k)^\top d + h_i(x_k)                                & = & 0, \ \forall i \in \{1,\ldots,q\}
+ \end{array}
+ \right .
+$$
+Or $ \nabla_x L(x_k,\lambda_k) =  \nabla J(x_k) + \sum\limits_{i=1}^{q} \lambda_{k,i} \nabla h_i(x_k) $, d'où :
+$$
+ \left \{
+ \begin{array}{r c l}
+  H_kd + \sum\limits_{i=1}^q\mu_i\nabla h_i(x_k) & = & -\nabla J(x_k)                    \\
+  \nabla h_i(x_k)^\top d + h_i(x_k)              & = & 0, \ \forall i \in \{1,\ldots,q\}
+ \end{array}
+ \right .
+$$
+On reconnaît dans le système ci-dessus les conditions d’optimalité de Lagrange du
+problème quadratique suivant :
+$$
+ \mathcal{PQ}_k \left \{
+ \begin{array}{l}
+  \displaystyle\min_{d \in \mathbb{R}^n} \nabla J(x_k)^\top d + \frac{1}{2}d^\top H_k d \\
+  h_i(x_k) + \nabla h_i(x_k)^\top d = 0, \ \forall i \in \{1,\ldots,q\}
+ \end{array}
+ \right .
+$$
+Le problème $ \mathcal{PQ}_k $ peut être vu comme la minimisation d’une approximation quadratique du Lagrangien de $ \mathcal{P} $ avec une approximation linéaire des contraintes.
+\newline
+Comme son nom l’indique, la méthode PQS consiste à remplacer le problème initial par une suite de problèmes quadratiques sous contraintes linéaires plus faciles à résoudre. L’algorithme est le suivant :
+
+\subsubsection{Contraintes d’inégalité}
 
 \bibliographystyle{plain}
 \bibliography{stdlib_sbphilo}
-- 
2.34.1