% Require LaTeX2e: LaTeX 2.09 (or a non-LaTeX format) cannot be used.
% The optional argument asks for a kernel dated December 1994 or later;
% it used to sit inside a comment, so the date was never checked.
\NeedsTeXFormat{LaTeX2e}[1994/12/01]
4:
5: %%%%%%%%%%%%%%% Macros and Definitions %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
6: %\newcommand{\revision}{kryolit}
7: %\newcommand{\pending}[1]{ \par\medskip{\sc #1}
8: %\marginpar{\sc {\Writinghand} } \par\medskip }
9: %\newcommand{\pig}{{\Writinghand}\marginpar{{\Writinghand}}}
10:
% Hand-rolled PDF switch: \ifpdf becomes true whenever the engine defines
% \pdfoutput; in that branch \pdfoutput is additionally set to 1.
% NOTE(review): an engine that defines \pdfoutput but was started in DVI
% mode is thereby switched to PDF output -- confirm that this is intended.
\newif\ifpdf \ifx\pdfoutput\undefined \pdffalse \else \pdfoutput=1
\pdftrue \fi
13:
% fig: figure float whose label and caption are given up front and are
% emitted automatically when the environment closes.
%   #1  label key, passed to \label at the end of the float
%   #2  caption text, passed to \caption at the end of the float
% The contents are centred with \centering inside the float.  A center
% environment wrapped around the float itself does not centre the float
% body and leaves an empty centred paragraph where the float is declared.
\newenvironment{fig}[2]{%
  \begin{figure}%
  \centering
  \def\myfigcaptionlar{#1}%
  \def\myfigcaptionvar{{#2}}%
}{%
  \caption{\myfigcaptionvar}\label{\myfigcaptionlar}%
  \end{figure}%
}
19:
% \psfig{<label>}{<caption>}{<file>}: float with a centred graphic.
%   #1  label key (forwarded to the fig environment)
%   #2  caption text (forwarded to the fig environment)
%   #3  file name for \includegraphics; the single character 0 means
%       "no graphic" and yields a caption-only float
% The sentinel is compared as a whole string.  The former test \if 0#3
% looked at the first character only, so a file name beginning with the
% digit 0 was not included and the rest of its name was typeset as text.
\newcommand{\psfig}[3]{%
  \begin{fig}{#1}{#2}%
    \def\psfigfile{#3}\def\psfignone{0}%
    \ifx\psfigfile\psfignone\else
      {\centering\includegraphics{#3}\par}%
    \fi
  \end{fig}%
}
23:
% \texfig{<label>}{<caption>}{<file>}: float whose body is read with \input.
%   #1  label key (forwarded to the fig environment)
%   #2  caption text (forwarded to the fig environment)
%   #3  file to \input; the single character 0 means "no body"
% The sentinel is compared as a whole string (the former \if 0#3 inspected
% the first character only).  The second, empty conditional that used to
% follow \end{fig} did nothing useful and could leak the remainder of a
% file name starting with 0 into the text, so it has been removed.
\newcommand{\texfig}[3]{%
  \begin{fig}{#1}{#2}%
    \def\texfigfile{#3}\def\texfignone{0}%
    \ifx\texfigfile\texfignone\else
      \begin{center}
        \input{#3}
      \end{center}
    \fi
  \end{fig}%
}
31:
% \citez{<keys>}: thin alias for \cite.
\newcommand{\citez}[1]{\cite{#1}}
% \In{<n>}: typesets In[<n>] in typewriter type; the brackets are still
% taken from math mode.  \texttt replaces the obsolete {\tt ...}.
% NOTE(review): presumably the label of a Mathematica input cell -- confirm.
\newcommand{\In}[1]{\texttt{In$[$#1$]$}}
34:
35: %%%%%%%%%%%%%%% Document Openings %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% article has no chapters, so the book/report option openany is dropped;
% it only produced an "Unused global option(s)" warning.
\documentclass[oneside,fleqn,11pt]{article}
\usepackage{amsmath,amssymb,amscd,amsthm}
% \usepackage{marvosym}
% \usepackage{makeidx}
\usepackage{url}
\usepackage{xspace}
\usepackage[numbers]{natbib}
% \usepackage[small,compact,sc]{titlesec}
\usepackage{float}
% graphicx selects the driver that matches the running engine by itself,
% so a single unconditional load replaces the \ifpdf switch and the
% explicit pdftex option.
\usepackage{graphicx}
% \usepackage{pandora}
49: %\usepackage[mathcal]{euscript}
50: %\usepackage{showkeys}
51: \usepackage[bookmarks=true]{hyperref} %this one must be the last one
52: %\usepackage[a4paper, left=15mm, right=15mm]{geometry}
% \hyref{<url>}: hyperlink whose visible text is the URL itself.
% \hyreff{<url>}{<text>}: hyperlink to <url> displayed as <text>.
% Both print the link text in typewriter type.  \texttt replaces \tt, which
% is a declaration and does not take an argument.
\newcommand{\hyref}[1]{\href{#1}{\texttt{#1}}}
\newcommand{\hyreff}[2]{\href{#1}{\texttt{#2}}}
55:
56: \begin{document}
%\DeclareGraphicsExtensions{.pdf}
% Restrict the extensions tried for \includegraphics{<name>} (name given
% without extension) to .mps only.
\DeclareGraphicsExtensions{.mps}
59:
60:
61: %%%%%%%%%%%%%%% Textual Macros %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Proper names used in running text.  \xspace (package xspace) inserts the
% following inter-word space only when the next token is not punctuation,
% so "\Mathematica." and "\Ito-" no longer get a blank in front of the
% mark, while "\Ito systems" keeps its space.
\newcommand{\Ito}{It\^o\xspace}

\newcommand{\Mathematica}{\textit{Mathematica}\xspace}
\newcommand{\MathReader}{\textit{MathReader}\xspace}
68:
% \abbrev{<text>}: <text> followed by a period.  \@ stops the period from
% being spaced like the end of a sentence; \xspace adds the following space
% unless punctuation or a tie (~) comes next, so "\ie~$x$" no longer yields
% a space plus a tie.
\newcommand{\abbrev}[1]{#1.\@\xspace}
\newcommand{\ie}{\abbrev{i.e}}
\newcommand{\pg}{\abbrev{p}}
% Prints "e.g."; the argument used to be "eg", which dropped the inner period.
\newcommand{\eg}{\abbrev{e.g}}
\newcommand{\etc}{\abbrev{etc}}
\newcommand{\vs}{\abbrev{vs}}
\newcommand{\propan}{\abbrev{Propos}}
\newcommand{\theopan}{Theorem}
77:
78: %%%%%%%%%%%%%%% Propositions %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Theorem-like environments; lemma, theo and coroll share the counter of prop.
% amsthm provides the styles plain, definition and remark.  The unknown
% name "theorem" only raised a warning and fell back to plain, which is now
% requested explicitly.
\theoremstyle{plain}
\newtheorem{prop}{Proposition}
\newtheorem{lemma}[prop]{Lemma}
\newtheorem{theo}[prop]{Theorem}
\newtheorem{coroll}[prop]{Corollary}
% Cross-reference helpers: <name>~<number>, for the last three followed by
% the page abbreviation \pg and the page number.
\newcommand{\refprop}[1]{Proposition~\ref{#1}}
\newcommand{\refppropag}[1]{\propan~\ref{#1} \pg~\pageref{#1}}
\newcommand{\reftpropag}[1]{\theopan~\ref{#1} \pg~\pageref{#1}}
\newcommand{\refcorol}[1]{Corollary~\ref{#1} \pg~\pageref{#1}}
% Definition-style and remark-style environments on the counter of prop.
% The user-level wrappers defn, rem and example push an end mark to the
% right margin before closing the underlying theorem environment.
\theoremstyle{definition}
\newtheorem{adefn}[prop]{Definition}
\newenvironment{defn}{\begin{adefn}}{\hfill$\blacksquare$\end{adefn}}
\theoremstyle{remark}
\newtheorem{arem}[prop]{Remark}
\newtheorem{aexample}[prop]{Example}
% \defbf{<term>}: a term being defined, in upright bold.  \normalfont\bfseries
% is what the obsolete \bf expands to in text, without relying on the class
% to provide the old two-letter font commands.
\newcommand{\defbf}[1]{{\normalfont\bfseries #1}}
% solution: a proof environment headed "Solution".
\newenvironment{solution}{\begin{proof}[Solution]}{\end{proof}}
\newenvironment{rem}{\begin{arem}}{\hfill$\triangledown$\end{arem}}
\newenvironment{example}{\begin{aexample}}{\hfill$\vartriangle$\end{aexample}}
98:
% \algitem{<text>}: one entry of an algorithm listing (a plain \item).
\newcommand{\algitem}[1]{\item #1}

% Boxed float type Algorithm with default placement H; its captions are
% written to an auxiliary list file with extension .lop.
% alg: algorithm box with an input/output header and an itemize body.
%   #1  tag printed in brackets after the title in the caption
%   #2  title, printed bold in the caption
%   #3  text following "input:"
%   #4  text following "output:"
%   #5  note printed after the list; when its first character is 0 the
%       note is replaced by \relax
\floatstyle{boxed} \newfloat{Algorithm}{H}{lop}
\newenvironment{alg}[5]{ \def\myalgcaptionvar{{\bf #2}$\quad[$#1$]$}
\if 0#5 \def\myalgcaptionvarl{\relax} \else
\def\myalgcaptionvarl{\noindent{#5}} \fi
\begin{Algorithm}
\noindent{\bf input: }#3
\noindent{\bf output: }#4
\begin{itemize}
} {
\end{itemize}
\myalgcaptionvarl
% \hrule
\caption{\myalgcaptionvar}
\end{Algorithm}
}
116:
% romanenu: enumerate list whose first-level labels are (i), (ii), (iii), ...
\newenvironment{romanenu}{%
  \begin{enumerate}%
  \renewcommand{\labelenumi}{(\roman{enumi})}%
}{%
  \end{enumerate}%
}
120:
121:
122:
123: %%%%%%%%%%%%%%% Notation %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
124: % common ==========================
% Side conditions of displayed formulas.  \rfor{<cond>} appends
% "for <cond>"; \firstfor and \nextfor contain alignment tabs (&&) and can
% therefore only be used inside aligned displays.
\newcommand{\rfor}[1]{\quad\text{for}\quad#1}
\newcommand{\firstfor}{\qquad&&\text{for}\quad}
\newcommand{\nextfor}{&&\text{for}\quad}

% \alterbar: currently an alias for \vec.
\newcommand{\alterbar}{\vec}

% \origi{<x>}: <x> with subscript 0.  \define, \definer: the relations :=
% and =:.  \compose: the composition sign.  \frahalf: the fraction 1/2.
\newcommand{\origi}[1]{{#1}_0} \newcommand{\define}{:=}
\newcommand{\definer}{=:} \newcommand{\compose}{\circ}
\newcommand{\frahalf}{{\frac{1}{2}}}

% iteration =======================
% \iva{<n>}, \jva{<n>}: the index ranges 0 <= i <= <n> and 0 <= j <= <n>.
\newcommand{\iva}[1]{0 \le i \le #1} \newcommand{\jva}[1]{0 \le j \le
#1}
%\newcommand{\ssum}[3]{{\sum_{#2 \le #1 \le #3}}}
% \ssum{<index>}{<from>}{<to>}: sum over <index> running from <from> to <to>.
% \ssumi{<n>}: the same with index i running from 1 to <n>.
\newcommand{\ssum}[3]{{\sum_{#1 = #2}^{#3}}}
\newcommand{\ssumi}[1]{{\ssum{i}{1}{#1}}}
141:
142: % sets and spaces =================
% Blackboard-bold letters for the standard number sets.
\newcommand{\RR}{{\mathbb{R}}}
\newcommand{\NN}{{\mathbb{N}}}
\newcommand{\ZZ}{{\mathbb{Z}}}
\newcommand{\CC}{{\mathbb{C}}}

% Mapping signatures, written directly after the name of the map,
% e.g. f\RntoRn for "f: R^n -> R^n".
\newcommand{\RntoRn}{{\colon\RR^n \to \RR^n}}
\newcommand{\RntoR}{{\colon\RR^n \to \RR}}
\newcommand{\RtoRn}{{\colon\RR \to \RR^n}}
\newcommand{\RtoR}{{\colon\RR \to \RR}}
150:
151: % systems =========================
% Tuples describing dynamical systems.  The letter U and the subscript-0
% point produced by \origi are fixed components of every tuple:
%   \dsys{f}{g}{x}     -> (f, g, U, x_0)
%   \ssys{f}{g}{s}{x}  -> (f, g, s, U, x_0)
%   \osys{f}{g}{h}{x}  -> same expansion as \ssys
\newcommand{\dsys}[3]{\left(#1,#2,U,\origi{#3}\right)}
\newcommand{\ssys}[4]{\left(#1,#2,#3,U,\origi{#4}\right)}
\newcommand{\osys}[4]{\left(#1,#2,#3,U,\origi{#4}\right)}
% \newcommand{\dsys}[3]{\left(#1(#3),#2(#3),U,\origi{#3}\right)}
% \newcommand{\ssys}[4]{\left(#1(#4),#2(#4),#3(#4),U,\origi{#4}\right)}
% \newcommand{\osys}[4]{\left(#1(#4),#2(#4),#3(#4),U,\origi{#4}\right)}
% Ready-made tuples with the default letters f, g, h, sigma and x.
\newcommand{\dsysfgx}{\dsys{f}{g}{x}}
\newcommand{\dosysfghx}{\osys{f}{g}{h}{x}}
\newcommand{\ssysfgx}{\ssys{f}{g}{\sigma}{x}}

% \bigdsys, \bigssys: the same tuples as \dsys and \ssys with thin spaces
% around the commas.
\newcommand{\bigdsys}[3]{\left(#1\, , \, #2\, , \, U\, , \,
\origi{#3}\right)} \newcommand{\bigssys}[4]{\left(#1\, , \, #2\, ,
\, #3\, , \, U\, , \, \origi{#4}\right)}

% Symbols for classes of systems: blackboard-bold X with subscript D, I or S.
\newcommand{\clssys}{{\mathbb X}} \newcommand{\clssysdet}{\clssys_D}
\newcommand{\clssysito}{\clssys_I}
\newcommand{\clssysstrat}{\clssys_S}

% The classes with the arguments (n,1) or (n,1,1) appended.
\newcommand{\clsys}{\clssys(n,1,1)}
\newcommand{\clsysdet}{\clssysdet(n,1)}
\newcommand{\clsysito}{\clssysito(n,1,1)}
\newcommand{\clsysstrat}{\clssysstrat(n,1,1)}

% The classes with the arguments (n,m) or (n,m,k) appended.
\newcommand{\clmisys}{\clssys(n,m,k)}
\newcommand{\clmisysdet}{\clssysdet(n,m)}
\newcommand{\clmisysito}{\clssysito(n,m,k)}
\newcommand{\clmisysstrat}{\clssysstrat(n,m,k)}

% Complete inline formulas "Theta = (...) in <class>".  Each one opens and
% closes math mode itself and ends with a space inside the macro.
\newcommand{\dsdef}{$\Theta_D = \dsysfgx \in \clsysdet$ }
\newcommand{\isdef}{$\Theta_I = \ssysfgx \in \clsysito$ }
\newcommand{\ssdef}{$\Theta_S = \ssysfgx \in \clsysstrat$ }

\newcommand{\dsdefmiuu}{$\Theta = \ssysfgx \in \clmisys$ }
\newcommand{\dsdefmi}{$\Theta_D = \dsysfgx \in \clmisysdet$ }
\newcommand{\isdefmi}{$\Theta_I = \ssysfgx \in \clmisysito$ }
\newcommand{\ssdefmi}{$\Theta_S = \ssysfgx \in \clmisysstrat$ }

% Differentiability classes.
% NOTE(review): \analytic prints C^{\omega(x)}; the usual symbol for
% analytic functions is C^{\omega} -- confirm which one is intended.
\newcommand{\smooth}{C^{\infty}} \newcommand{\analytic}{C^{\omega(x)}}
\newcommand{\kdifferentiable}{C^{k}}
191:
192: % operations
193:
194: % differentiation ============
% First-order partial derivative of #1 with respect to #2, and the two
% shorthands for differentiation with respect to x and z.
\newcommand{\parby}[2]{\frac{\partial #1}{\partial #2}}
\newcommand{\parbyx}[1]{\parby{#1}{x}}
\newcommand{\parbyz}[1]{\parby{#1}{z}}

% Second derivative of #1 with respect to the single variable #2.
\newcommand{\parbysec}[2]{\frac{\partial^2 #1}{\partial #2^2}}

% Mixed derivatives of order two, three and four: #1 is the function, the
% remaining arguments are the variables in the order in which they are printed.
\newcommand{\parbyxx}[3]{%
  \frac{\partial^2 #1}{\partial #2 \partial #3}}
\newcommand{\parbyxxx}[4]{%
  \frac{\partial^3 #1}{\partial #2 \partial #3 \partial #4}}
\newcommand{\parbyxxxx}[5]{%
  \frac{\partial^4 #1}{\partial #2 \partial #3 \partial #4 \partial #5 }}
206:
% \lie{<f>}{<h>}: calligraphic L with subscript <f>, applied to <h>.
% \multilie{<f>}{<k>}{<h>}: the same with superscript <k>.
% \biglie{<f>}{<h>}: the bracket <d<h>, <f>> in angle-bracket notation.
\newcommand{\lie}[2]{{\mathcal L}_{#1} {#2}}
\newcommand{\multilie}[3]{{\mathcal L}_{#1}^{#2} {#3}}
\newcommand{\biglie}[2]{\langle d{#2},{#1}\rangle}
%\newcommand{\biglie}[2]{\lie{#1}{#2}}

% \ad{<f>}{<k>}{<g>}: operator "ad" with subscript <f> and superscript <k>,
% applied to <g>; \adfg{<k>} fixes the letters f and g.
% \lighk{<k>}: \lie with subscript g applied to \multilie{f}{<k>}{h}.
% \distrofg{<n>}, \distroabafg{<n>}: the set of \ad{f}{i}{g} (respectively
% with \alterbar f) over the index range \iva{<n>}.
\newcommand{\ad}[3]{\operatorname{ad}_{{#1}}^{{#2}} {{#3}}}
\newcommand{\adfg}[1]{\ad{f}{{#1}}{g}}
\newcommand{\lighk}[1]{\lie{g}{\multilie{f}{#1}{h}}}
\newcommand{\distrofg}[1]{\left\{\ad{f}{i}{g},\,\iva{{#1}}\right\}}
\newcommand{\distroabafg}[1]{\left\{\ad{{\alterbar
f}}{i}{g},\,\iva{{#1}}\right\}}

% \compoit: composition with T^{-1}(z).
% \trav{<f>}: the derivative \parbyx{T} followed by <f>; \travf{<f>}: the
% same followed by \compoit.
\newcommand{\compoit}{\compose T^{-1} (z)}
\newcommand{\travf}[1]{\parbyx{T} #1 \compoit}
\newcommand{\trav}[1]{\parbyx{T} #1}
222:
223: % operators ==================
% \flow{<t>}: the letters Fl with superscript <t>.
\newcommand{\flow}[1]{Fl^{#1}}
% Upright operator names.
\newcommand{\trace}{{\operatorname{trace}}}
\newcommand{\grad}{{\operatorname{grad}}}
\newcommand{\kernel}{{\operatorname{kernel}}}
\newcommand{\annihilator}{{\operatorname{annihilator}}}
\newcommand{\rank}{{\operatorname{rank}}}
\newcommand{\abs}{{\operatorname{abs}}}
\newcommand{\sgn}{{\operatorname{sgn}}}
\newcommand{\sspan}{{\operatorname{span}}}
% \ito{<s>}{<T>}:  P with subscript <s>, followed by <T>.
% \corr{<s>}{<x>}: corr with subscript <s>, followed by (<x>).
% \Corr{<s>}{<x>}: Corr with subscript <s>, followed by <x>.
% The subscript is braced so that an argument of more than one token
% (e.g. \tilde\sigma) ends up in the subscript as a whole; the unbraced
% form P_#1 took only the first token of such an argument.
\newcommand{\ito}[2]{P_{#1} #2}
\newcommand{\corr}[2]{\operatorname{corr}_{#1}(#2)}
\newcommand{\Corr}[2]{\operatorname{Corr}_{#1} #2}

% \corrxx{<s>}{<x>}: one half times the derivative of <s> with respect to
% <x>, times <s>; \corrx fixes the letters sigma and x.
\newcommand{\corrxx}[2]{{\frahalf \parby{#1}{#2} #1}}
\newcommand{\corrx}{\corrxx{\sigma}{x}}

% \itoxs: one half sigma^2 times the second derivative of T with respect
% to x; \itox: the same composed with T^{-1}(z).
\newcommand{\itox}{{\frahalf \sigma^2 \parbysec{T}{x} \compose T^{-1} (z)}}
\newcommand{\itoxs}{{\frahalf \sigma^2 \parbysec{T}{x} }}
241:
242:
243: % coordinate transformation ======
% \tantra{<T>}: <T> with a lower asterisk; \cotantra{<T>}: <T> with an
% upper asterisk.
\newcommand{\tantra}[1]{#1_\ast}
\newcommand{\cotantra}[1]{#1^\ast}

% \sct{<T>}: calligraphic T with subscript <T>; \sctt is \sct{T}.
% \scti and \scts add the superscripts I and S.
\newcommand{\sct}[1]{\mathcal{T}_{#1}}
\newcommand{\sctt}{\sct{T}}

\newcommand{\scti}[1]{\sct{#1}^{I}}
\newcommand{\scts}[1]{\sct{#1}^{S}}

% \feedback{<a>}{<b>}: calligraphic F with subscript <a>,<b>; \feedbackab
% uses alpha and beta.
\newcommand{\feedback}[2]{\mathcal{F}_{#1,#2}}
\newcommand{\feedbackab}{\feedback{{\alpha}}{{\beta}}}

% \combinedz: calligraphic J; \combined adds a three-part subscript and
% \combinedtab fixes it to T, alpha, beta.
\newcommand{\combinedz}{{\mathcal{J}}}
\newcommand{\combined}[3]{\combinedz_{#1,#2,#3}}
\newcommand{\combinedtab}{\combined{T}{{\alpha}}{{\beta}}}
257:
258:
259: % stochastic
% \expected{<X>}: calligraphic E applied to <X> in auto-sized braces.
% \mathcal{E} replaces the obsolete font switch {\cal E}.
\newcommand{\expected}[1]{{\mathcal{E}}\left\{#1\right\}}
% \var{<X>}, \cov{<X>}: upright operator names applied to <X> in braces.
\newcommand{\var}[1]{\operatorname{var}\left\{#1\right\}}
\newcommand{\cov}[1]{\operatorname{cov}\left\{#1\right\}}

% \wrong: a superscript # sign.
\newcommand{\wrong}{^\#}
265:
266: %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Data printed on the title page: date, author and postal address.
\newcommand{\tpDate}{2002/10/09}
\newcommand{\tpAuthor}{Ladislav Sl\'ade\v cek}
\newcommand{\tpeAddress}{\v R\'\i{}kovice 18, CZ 751 18, Czech Republic}

% E-mail address as a mailto: link, and the title of the paper.
\newcommand{\tpEmail}{\hyreff{mailto:lsla@post.cz}{lsla@post.cz}}
\newcommand{\tpeTitle}{Exact Feedback Linearization of Stochastic
Control Systems}
% #3
% Heading printed in front of the abstract (argument #3 of \tp).
\newcommand{\tpeAbstractN}{Abstract}
276: % #4
277: \newcommand{\tpeAbstract}{This paper studies exact linearization
278: methods for stochastic SISO affine controlled dynamical systems. The
279: systems are defined as vectorfield triplets in Euclidean space. The
280: goal is to find, for a given nonlinear stochastic system, a
281: combination of invertible transformations which transform the system
into a controllable linear form. Of course, for most nonlinear
systems such a transformation does not exist.
284:
285: We are focused on linearization by state coordinate transformation
286: combined with feedback. The difference between \Ito and Stratonovich
287: systems is emphasized. Moreover, we define three types of linearity
288: of stochastic systems --- $g$-linearity, $\sigma$-linearity, and
289: $g\sigma$-linearity.
290:
291: Six variants of the stochastic exact linearization problem are
studied. The most useful problem --- the \Ito $g\sigma$-linearization
--- is solved using the correcting term, which proved to be
a very useful tool for \Ito systems. The results are illustrated on
a numerical example solved with the help of symbolic algebra. }
296: % #5
297: \newcommand{\tpeKeywordsN}{Keywords}
298: % #6
\newcommand{\tpeKeywords}{ exact linearization, feedback
linearization, nonlinear dynamical system, \Ito integral,
Stratonovich integral, correcting term.
{\bf MSC classification:} 93B18, 93E03}
303:
304:
305:
306: % ============================================================
\title{\tpeTitle} \author{\tpAuthor}

% \tp: custom title page.
%   #1  title                     #2  address
%   #3  heading of the abstract   #4  abstract text
%   #5  heading of the keywords   #6  keywords
% Author, e-mail and date are taken from \tpAuthor, \tpEmail and \tpDate.
% The headings used to be set with {\sc\bf ...}.  \bf resets the font
% before switching to bold, so \sc never had any effect; \textbf says
% directly what is printed.
\newcommand{\tp}[6]{ \vfill
\begin{titlepage}
\begin{center}
  {~\\} \vspace{25mm}
  {\Large #1}\\
  \vspace{1cm}
  {\large \tpAuthor}\\
  {\tpEmail}\\
  {#2}\\

  \vspace{0.5cm}
  {\large \tpDate}\\
\end{center}
\begin{quote}\small
  \vspace{15mm}
  \textbf{#3:} #4\\
  \textbf{#5:} #6\\
\end{quote}
\end{titlepage}
}

% \tpe: the title page filled with the \tpe... texts defined for this paper.
\newcommand{\tpe}{ \tp {\tpeTitle} {\tpeAddress} {\tpeAbstractN}
  {\tpeAbstract} {\tpeKeywordsN} {\tpeKeywords} }
332:
333:
334: %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Front matter: the custom title page followed by the table of contents.
\tpe

\tableofcontents
338: %%%%%%%%%%%%%%% Section %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
339:
340:
341: \section{Introduction}
342: \pagenumbering{arabic}\count1=0
343: \label{sec:intro}
344:
The theory of exact linearization of deterministic dynamical systems
has been thoroughly studied since the seventies. This paper attempts to
347: apply some of the results to the stochastic area. We emphasize the
348: exact linearization by state coordinate transformation combined with
349: feedback (further abbreviated as SFB linearization). Our main goal is
350: to identify the main difficulties of this approach and to consider
351: applicability of the methods known from the deterministic systems.
352:
The task of SFB linearization is the following: given a dynamical
system~$\Theta$, we are looking for a combination of coordinate
355: transformation~$\sctt$ and feedback~$\feedbackab$ which will make the
356: resulting system~$\feedbackab \compose \sctt (\Theta)$ linear and
357: controllable. One can also define the feedback-less linearization by
358: coordinate transformation only (here abbreviated as SCT) or several
359: variants of the input-output linearization. These variants are not
360: considered here.
361: \begin{rem}
362: The notation for composition of mappings sometimes differs;
363: right-to-left convention is used here:~$f \compose g(x) \define
364: f(g(x))$.
365: \end{rem}
366:
367:
368: The subject of exact linearization of stochastic controlled dynamical
369: systems lies on the intersection of three branches of science:
370: differential geometry, control theory, and the theory of stochastic
371: processes. Each of them is very broad and it is virtually impossible
372: to cover all details of their combination. Hence it is necessary to
373: choose a minimalistic simplified model for our problem and to refrain
374: from most technical details. {\em We decided to represent dynamical
375: systems under investigation by triplets of smooth vectorfields and to
376: concentrate on transformation rules for these triplets\/}. The detailed
377: interpretation of the vectorfield systems (\ie solvability of
378: underlying differential equations, properties of flows and
379: trajectories) will be considered only on an informal, motivational level.
380:
For simplicity, we shall confine all the definitions of geometrical
objects to the Euclidean space; we will work in a fixed coordinate
383: system using explicit local coordinates, which may be considered to be
384: local coordinates of some manifold. This is mainly because we are
385: unable to capture all consequences of the modern,
386: coordinate-free differential geometry to the stochastic calculus (see
387: \eg~\citet{kendall86},~\citet{malliavin},~\citet{emery89}). We believe
388: that this approach is quite satisfactory for the majority of practical
389: applications.
390:
391:
392: \subsection{Dynamical systems}
393:
394: \begin{defn}
395: In this paper, a stochastic dynamical system~$\Theta \define
396: \ssysfgx$ is defined to be a triplet of smooth and bounded
397: vectorfields~$f$,~$g$, and~$\sigma$ defined on an open
neighborhood~$U$ of a point~$\origi{x} \in \RR^n$. We usually
call~$U\subset \RR^n$ the \defbf{state space},~$f$ the \defbf{drift
vectorfield},~$g$ the \defbf{control vectorfield}, and~$\sigma$ the
\defbf{dispersion vectorfield}.
402: \end{defn}
403:
404: From now on, let's assume that all functions, vectorfields, forms, and
405: distributions are smooth and bounded on~$U$.
406:
In this paper, we will study almost exclusively SISO systems, but in the case
of stochastic MIMO systems with~$m$ control inputs and~$k$-dimensional noise the
symbols~$g$ and~$\sigma$ stand for an~$n\times m$ (respectively~$n \times k$)
matrix of smooth vectorfields having its rank equal
to~$m$ (respectively~$k$). The class of all
412: deterministic~$n$-dimensional dynamical systems with~$m$ inputs will
413: be called~$\clmisysdet$ and the class of stochastic systems
414: with~$k$-dimensional noise will be denoted with~$\clmisys$.
415:
Similarly, an autonomous deterministic dynamical system
417: corresponds to a single vectorfield and a controlled
418: deterministic dynamical system corresponds to a vectorfield pair. It
419: is obvious that this approach is limited to time invariant, affine
420: systems.
421:
422:
423: \begin{rem}
The acronyms SISO and MIMO are used in the usual meaning even for
systems without outputs, where the wording ``scalar-input'' and
``vector-input'' would be more appropriate. Stochastic systems with~$m =1$
427: and~$k=1$ will be considered SISO.
428: \end{rem}
429:
430: The definition may be interpreted as follows: there is a stochastic
431: process~$x_t$ defined on~$\RR^n$ which is a strong solution of the
432: stochastic differential equation $dx_t = f(x_t)\,dt + g(x_t) u(t)\,dt
433: + \sigma(x_t)\,dw_t$, with initial condition~$\origi{x}$,
434: where~$u(t)$ is a smooth function with bounded derivatives and~$w_t$
435: is a one-dimensional Brownian motion. The differential $dw_t$ is just
436: a notational shortcut for the stochastic integral.
437:
438: Details of the theory of stochastic processes are beyond the scope of
439: this article. The reader is referred to \citet{wong84},
440: \citet{oksendal}, \citet{sagemelsa}, \citet{malliavin},
441: \citet{kendall86}, \citet{karatzas}; the text of \citet{kohlman} is
442: freely available on the Internet.
443:
444: Theory of stochastic processes offers several alternative definitions
445: of the stochastic integral, among them the \Ito integral and the
446: Stratonovich integral; each of them is used to model different
447: physical problems. Consequently there are two classes of differential
448: equations and two alternative definitions of a stochastic dynamical
449: system --- \Ito dynamical systems defined by \Ito integrals and
450: Stratonovich systems defined by Stratonovich integrals.
451:
Serious differences between these integrals exist, but from our point
of view there is a single important one: {\em the rules for
454: coordinate transformations of dynamical systems defined by \Ito
455: stochastic integral are quite different from the transformation rules
456: which are valid for Stratonovich systems\/}.
457:
458: The definition of the \Ito dynamical system used by us is formally
459: equivalent to the definition of the Stratonovich system; the only
460: difference will be in the corresponding coordinate transformation.
461:
462: If necessary, \Ito and Stratonovich dynamical
463: systems will be distinguished by a subscript: $\Theta_I \in
464: \clmisysito$ and~$\Theta_S \in \clmisysstrat$.
465:
466: \begin{rem}
In this paper we will use the adjectives {\em \Ito\/} and {\em
Stratonovich\/} rather freely. For example we will speak of
`Stratonovich linearization' instead of `exact linearization of
a stochastic dynamical system defined by the Stratonovich integral'.
471: \end{rem}
472:
473:
474:
475: \subsection{Transformations}
476:
477: Furthermore, we will study two transformations of dynamical systems:
478: the coordinate transformation~$\sctt$ and the
feedback~$\feedbackab$. The definition of these transformations should
be in accord with their common interpretation. This can be illustrated
on the definition of the \defbf{coordinate transformation of a
deterministic dynamical system} $\sctt\colon \clmisysdet \to \clmisysdet$
483: which is induced by a diffeomorphism~$T \colon U \to \RR^n$ between two
484: coordinate systems on an open set~$U \subset \RR^n$.
485: The mapping~$\sctt$ is defined by:
486: \begin{align}
487: \label{eq:83}
488: \sctt \dsys{f}{g}{x} \define \left(
489: \tantra{T} f , \tantra{T} g ,T(U),T(\origi{x})
490: \right)
491: .\end{align}
492:
Recall that the symbol~$\tantra{T}$ stands for the contravariant
transformation~$(\tantra{T} f)_i = \ssum{j}{1}{n} f_j
\parby{T_i}{x_j}$. Moreover, we will require
496: that the coordinate transformation~$T$ preserves the equilibrium state
497: of the system \ie~$T(\origi{x}) = 0$.
498:
499: The definition captures the contravariant transformation
500: rules for differential equations known from the basic calculus.
501:
502: Note that the words ``coordinate transformation'' are used in two
503: different meanings: first as the
504: diffeomorphism~$T\colon U\to \RR^n$ between coordinates;
second as the mapping between systems~$\sctt\colon \clmisysdet \to
506: \clmisysdet$.
507:
Coordinate transformations of stochastic systems distinguish between
509: \Ito and Stratonovich systems. One of the major complications of the
510: linearization problems for \Ito systems is the second-order term in
511: the transformation rules for \Ito systems:
512: \begin{defn} \label{def:ctito}
Let~$U\subset \RR^n$ be an open set and let~$T\colon U\to \RR^n$ be a
514: diffeomorphism from~$U$ to~$\RR^n$ with bounded
515: first derivative on $U$ such that~$T(\origi{x})=0$. The mapping
516: $\sctt\colon \clmisysito \to \clmisysito$ will be called a
517: \defbf{coordinate transformation of an \Ito dynamical system} induced by
diffeomorphism~$T$ if the systems $\Theta_1
\define \ssys{f}{g}{\sigma}{x}$ and $\Theta_2 \define
\left(\tilde f,\tilde g,\tilde \sigma,T(U),T(\origi{x})\right)$, $\Theta_2
= \sctt\left(\Theta_1\right)$, are related by:
522: \begin{align}
523: \label{eq:86}
524: \tilde f &= \tantra{T}f + \ito{\sigma}{T} \\
525: \label{eq:87}
526: \tilde g_i &= \tantra{T}g_i \firstfor 1 \le i \le m\\
527: \label{eq:89}
528: \tilde \sigma_i &= \tantra{T}\sigma_i \firstfor 1 \le i \le
529: k
530: .\end{align}
531: \end{defn}
532:
533: The symbol~$\ito{\sigma}{T}$ stands for the \defbf{\Ito term} which is
534: a second order linear operator defined by the following relation for
535: the~$m$-th component of~$\ito{\sigma}{T}$, $1\le m\le n$
536: \begin{equation}
537: \label{eq:16}
\ito{\sigma} T_m \define \frahalf \ssum{{i,j}}{1}{n}
\frac{\partial^2 T_m}{\partial x_i \partial x_j} \ssum{l}{1}{k} \sigma_{il}
\sigma_{jl}
541: .\end{equation}
542:
543: The transformation rules for Stratonovich
544: systems~$\sctt\colon \clmisysstrat \to \clmisysstrat$,
545: $(f,g,\sigma,U,\origi{x}) \mapsto (\tantra{T}f, \tantra{T}g, \tantra{T}\sigma,
546: T(U), T(\origi{x}))$ are
equivalent to rules valid for the deterministic systems; only the
rule~\eqref{eq:89} for the dispersion vectorfield must be added.
549:
550: The difference between the coordinate transformation of \Ito and
551: Stratonovich systems should be emphasized: in the Stratonovich case
552: all the vectorfields transform contravariantly; on the other hand, in
553: the \Ito case, the \Ito term~$\ito{\sigma}{T}$ is added to the drift
554: vectorfield of the resulting system.
555:
556: \psfig{fig:introsfee}{Regular State Feedback}{introsfee} Another
557: important transformation of dynamical systems is the regular feedback
558: transformation. A feedback transformation is determined by two smooth
nonlinear functions $\alpha \colon \RR^n \to \RR^m$
and~$\beta \colon \RR^n \to \RR^{m \times m}$ defined on~$U$
561: with~$\beta $ nonsingular for every~$x \in U$ (see
562: Figure~\ref{fig:introsfee}). Usually, $\alpha $ is written as a column~$m \times
563: 1$ matrix; $\beta $ as a square $m \times m$ matrix.
564:
565: \begin{defn} \label{def:feedback}
566: Let~\dsdefmiuu be a stochastic dynamical system. A \defbf{regular
state feedback} is the transformation $\feedbackab \colon \clmisys
\to \clmisys$, $ (f,g,\sigma,U,\origi{x}) \mapsto \ssys{f + g\alpha
}{g\beta }{\sigma}{x} $.
570: \end{defn}
571:
572: A new input variable~$v$ is introduced by the
573: relation~$u=\alpha +\beta v$. Given the feedback~$\feedbackab$
574: with nonsingular~$\beta $, we can always construct an inverse
575: relation~$\feedback{a}{b} \define \feedbackab^{-1}$ such
576: that~$\feedbackab \compose \feedback{a}{b} = \feedback{a}{b} \compose
577: \feedbackab$ is the identity. The coefficients are related as
578: follows:~$\beta = b^{-1}$, $\alpha = - b^{-1}a$, and~$a = -\beta ^{-1}
579: \alpha $.
580:
This definition of feedback transformation can be used also for
deterministic systems provided that the dispersion vectorfield~$\sigma$ is
assumed to be zero.
584:
The symbol~$\combinedtab$ is used to indicate the combination of
coordinate transformation with feedback,~$\combinedtab \define
\feedbackab\compose\sctt$; the order of the two transformations can be
interchanged (see Remark~\ref{rem:orderinv}).
588:
589: \begin{rem}
590: \label{rem:orderinv}
Observe that the order of feedback and
coordinate transformation in the
composed transformation~$\combinedtab \define \feedbackab \compose
\sctt$ can be interchanged:
595: \begin{multline}
596: \combinedtab = \sctt \compose \feedbackab \bigdsys{f}{g}{x} =
597: \sctt \bigdsys{f+g\alpha }{g\beta }{x}\\
598: = \bigdsys{\tantra{T} f + \tantra{T} g\alpha }{\tantra{T} g\beta }{z}
599: = \bigdsys{\tantra{T} f + (\tantra{T} g) \alpha }{ (\tantra{T} g)
600: \beta }{z} \\
601: = \feedback{\alpha '}{\beta '} \compose \sctt
602: .\end{multline}
The functions~$\alpha'(z)$, $\beta'(z)$ are equal to~$\alpha(x)$
and~$\beta(x)$ written in the $z$~coordinates: $\alpha' = \alpha
\compose T^{-1}$, $\beta' = \beta \compose T^{-1}$.
606: \end{rem}
607:
608:
609: %======== Subsection ================================================
610: \subsection{Linearity}
611:
612: \label{sub:linearity}
613:
614: The definition of linearity is straightforward in the deterministic
615: case. In contrast, the stochastic case is more complex, because there
616: are two ``input'' vectorfields and thereby several degrees of
617: linearity can be specified.
618:
619: \begin{defn} \label{def:linear} The deterministic dynamical
620: system~$\Theta_D = (f,g,U,0) \in \clmisysdet$ is \defbf{linear} if
the vectorfield~$f$ is a linear mapping without constant term and
the vectorfields~$g_i$ are constant; that is, they can be written as
$f(x)= Ax$, $g(x)= B$ with~$A$ a square~$n \times n$ matrix and~$B$
an~$n \times m$ matrix. The matrices must be constant on the whole of~$U$.
625: \end{defn}
626: \begin{defn} \label{def:linearsto}
627: The stochastic dynamical system~$\Theta=(f,g,\sigma,U,0)$ is:
628: \begin{itemize}
629: \item \defbf{$g$-linear} if the mapping~$f(x) = Ax$ is linear without
630: constant term and~$g(x) = B$ is constant on~$U$.
631: \item \defbf{$\sigma$-linear} if the mapping~$f(x) = Ax$ is linear
632: without constant term and~$\sigma(x) = S$ is constant on~$U$.
633: \item \defbf{$g\sigma$-linear} if it is both~$g$-linear and
634: $\sigma$-linear.
635: \end{itemize}
636: The matrices~$A$ and~$B$ have the same dimensions as in
637: Definition~\ref{def:linear}; $S$ is an~$n \times k$ matrix.
638: \end{defn}
639:
640:
641: \begin{rem}
642: The vectorfield~$g$ is \defbf{constant} on~$U$ if the value
643: of~$g(x)$ is the same for every~$x \in U$. The vectorfield~$f$
644: on~$U$ is \defbf{linear without constant term} if~$f(\origi{x})=0$
645: and the superposition principle~$f(x_1+x_2)=f(x_1)+f(x_2)$
646: holds for every~$x_1$, $x_2 \in U$.
647: \end{rem}
648:
649: We study systems at equilibrium \ie we require that~$f(\origi{x})=0$
650: and that all transformations preserve the equilibrium:~$T(\origi{x})
651: =0$,~$\alpha (\origi{x})=0$, and~$\beta(\origi{x})$ is nonsingular.
652: The \Ito systems require an additional
653: condition~$f(\origi{x})+\corr{\sigma}{\origi{x}}=0$. The non-equilibrium case can
654: be easily handled by extending the linear model with a constant term.
655:
656: Moreover we require that the resulting linear systems are
657: controllable. A controlled deterministic dynamical linear
658: system~$\Theta_D = (Ax,B,\RR^n,0) \in \clmisysdet$ is
659: \defbf{controllable} if its first $n$ repeated brackets form an
660: $n$-dimensional space
661: \begin{equation}
662: \label{eq:68}
663: \dim \left\{A^kB, 0\le k\le n-1 \right\} = n
664: .\end{equation}
665: Other definitions of controllability of linear
systems exist. For example, Theorem~3.1 of~\citet{zhou} gives six
667: definitions with proofs of equivalence.
668:
669: The controllability property deserves some attention in the stochastic
670: case. The linear stochastic dynamical system is characterized by two input
671: vectorfields $g(x)=B$ and $\sigma(x)=S$.
672: \begin{enumerate}
673: \item The definition of the controllability for the control
674: vectorfield~$g$ is identical to the deterministic case;
675: \ie~\eqref{eq:68} must be satisfied. This property will be called
676: \defbf{$g$-controllability}.
677: \item We will also define \defbf{$\sigma$-controllability} as the
678: requirement that the repeated brackets $S,AS,A^2S,\dots,A^{n-1}S$
679: form an $n$-dimensional space.
680: \item Finally, the linear system is \defbf{$g\sigma$-controllable} if
681: \begin{equation}
682: \label{eq:3}
\dim \left( \left\{A^kB, 0\le k\le n-1 \right\} \cup \left\{A^kS, 0\le
684: k\le n-1 \right\} \right)= n
685: .\end{equation}
686: \end{enumerate}
687: In this paper, we do not deal with the reachability, controllability,
688: accessibility, observability, and similar properties of nonlinear
689: systems.
690:
691:
692: \begin{defn} \label{def:itogssisosfb}
693: Let~\dsdefmiuu be a dynamical system such that~$f(\origi{x}) =0$. We
694: call the combination of a coordinate transformation~$\sctt$ and a
695: regular feedback~$\feedbackab$ such that $T(\origi{x})=0$,
696: $\alpha (\origi{x})=0$, and $\beta (\origi{x})$ is nonsingular the
\defbf{linearizing transformation} of $\Theta$ if the
698: transformation~$\feedbackab \compose \sctt $ converts~$\Theta$ into
699: a~{\em controllable\/} linear system.
700:
For stochastic systems we distinguish:
702: \begin{romanenu}
703: \item \defbf{$g$-linearizing transformation} which transforms~$\Theta$ into
704: a~$g$-linear and~$g$-controllable system
705: \item \defbf{$\sigma$-linearizing transformation} which transforms~$\Theta$ into
706: a~$\sigma$-linear and~$\sigma$-controllable system
707: \item \defbf{$g\sigma$-linearizing
708: transformation} which transforms~$\Theta$ into
709: a~$g\sigma$-linear and~$g$-controllable system
710:
Note that for $g\sigma$-linearization we
require~$g$-controllability. This is a slightly stricter requirement
than~$g\sigma$-controllability but it should be naturally fulfilled by
714: the majority of practical control systems. This requirement cancels
715: many ``uncomfortable'' linear forms. Consider for example the system
716: with prefilter of Figure~\ref{fig:prefilter} which
717: is~$g\sigma$-controllable but~$g$-uncontrollable.
718: \end{romanenu}\psfig{fig:prefilter}{Dynamical System with
719: a Prefilter.}{prefilter}
The system~$\Theta$ is \defbf{linearizable} if there exists a
linearizing transformation of~$\Theta$.
722: \end{defn}
723:
724:
725:
726: \subsection{Computational Issues}
727:
728: In most practical circumstances, computational issues are the limiting
729: factor of any application of differential geometric methods in
730: control.
731:
The equations of exact linearization algorithms must be dealt with in a
symbolic form. Even the simplest exact linearization problems are
734: extremely complex from the computational point of view. Therefore,
735: the computer algebra tools are often employed. The results presented
736: in this paper were tested by the author on few simulations of
737: control systems in the symbolic system \Mathematica.
738:
739: Of course, the computer algebra has apparently serious limitations and
740: drawbacks. Viability of the symbolic computational approach to the
741: problems of the nonlinear control is studied by \citet{jager95}. Some
742: very useful theoretical notes about the symbolic computation can be
743: found in~\citet{winkler}. Unfortunately, the limited scope
744: of this article does not allow deeper discussion of these subjects.
745:
746: \subsection{Applications}
747:
748: We propose, very briefly, two applications of the theory presented here:
749: \begin{romanenu}
750: \item \defbf{Control ---}
751: a dynamical system~$\Theta$ obtained by exact
752: linearization will be controlled using the linear
753: feedback law:
754: \begin{equation}
755: \label{eq:141}
756: v = Kz + \kappa \nu
757: ,\end{equation}
758: where~$K$ is a row matrix of feedback gains,~$\kappa$ is an input
759: gain, $z$~is the state vector, $v$~is the original control input,
760: and~$\nu$ is a new control input.
761:
762: Two approaches can be studied --- classical linear control methods and
763: the more sophisticated stochastic optimal control approach studied
764: for example by \citet{oksendal}.
765:
766: The~$g\sigma$-linear systems are natural candidates for such
767: approach because the other linear forms leave certain
768: part of the resulting system nonlinear.
769:
770: \item \defbf{Filtering} --- the filtering problem is probably the most useful
771: application of the theory of stochastic processes. We want
772: to give the best estimate to the state of a dynamical system defined
773: by the stochastic differential equation:
774: \begin{align}
775: \label{eq:118} dx_t = f(x_t)\,dt + \sigma_f(x_t)\,dw_tf;
776: \end{align} based on observations of the form:
777: \begin{align}
778: \label{eq:119}y_t = h(x_t) +
779: \sigma_h(x_t)\,dw_th .\end{align} $x_t$ is an $n$-dimensional stochastic process, $f$, $\sigma_f$,
780: $\sigma_h$ are smooth vectorfields and $h$ is a
781: smooth function.
782:
783: It would be interesting to use exact linearization of the nonlinear
784: system to design an exact linear filter. Unfortunately, this idea has
785: no direct association with the linearization results presented below,
786: because it requires {\em output\/} exact linearization or
787: linearization of an autonomous system. Therefore, it would be helpful
788: to extend our results to these cases in the future.
789:
790:
791: \end{romanenu}
792:
793:
794: \subsection{Previous Work}
795: \label{ssub:laal}
796:
797: The problem of SFB~$g$-linearization of SISO dynamical system defined in the
798: \Ito formalism has been
799: studied by~\citet{lahdhiri}. The authors derive
800: equations corresponding to~\eqref{eq:50},~\eqref{eq:51} (eq 14, 15, 16
801: in~\citez{lahdhiri}). These equations are combined and then
802: reduced to a set of PDEs of a single
803: unknown function~$T_1$. Because there is no commuting relation
804: similar to~\eqref{eq:103} the equations contain partial derivatives
805: of~$T_1$ up to the~$2n$-th order (eq 23 in~\citez{lahdhiri}).
806: Next, the authors propose a lemma (Lemma 1) that identifies the
807: linearity conditions with non-singularity and involutivity
808: of~$\distrofg{n-2}$. Unfortunately, we disagree with this result.
809:
810: First, it can be easily verified that for~$\sigma=0$ this
811: statement does not correspond to the deterministic conditions
812: (Proposition~\ref{prop:d1sfb2}), because the deterministic case
813: requires non-singularity up to the~$(n-1)$-th bracket, not only up to
814: the~$(n-2)$-th one. Second, although the method of finding~$T_1$
815: was given (solving PDE), we do not think
816: that the existence of~$T_1$ was proved.
817:
818: After this paper was finished, we discovered recent works
819: of~\citet{pan02} and~\citez{pan01}. In the article~\citez{pan01}
820: Pan defines and solves the problem of {\em feedback complete
821: linearization of stochastic nonlinear systems}. In our terminology,
822: this problem is equivalent to SFB MIMO input--output \Ito $g\sigma$
823: linearization which was not studied by us.
824:
825: In~\citez{pan02} Pan declares and proves so called \index{invariance
826: under transformation rule}{\em invariance under transformation rule}
827: which is exactly equivalent to our Theorem~\ref{prop:corr} which is
828: probably the most important result of our paper.
829:
830: Although the problems solved by Pan were slightly different, he uses
831: the same equivalence --- Theorem~\ref{prop:corr}. This proves that
832: our conclusions about applicability of the \index{correcting
833: term}correcting term are perfectly valid.
834:
835: In~\citez{pan02} Pan
836: considers three other \index{canonical form}canonical forms of
837: stochastic nonlinear systems, namely the \index{noise-prone strict
838: feedback form}noise-prone strict feedback form, \index{zero dynamics
839: canonical form}zero dynamics canonical form and \index{observer
840: canonical form}observer canonical form, also not studied by us.
841:
842: %%%%%%%%%%%%%%% Section %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
843: \section{Deterministic Case}
844: \label{sec:detcase}
845:
846: In this section we recapitulate the results of the SFB and SCT exact linearization
847: theory for SISO systems. For detailed treatment and proofs we refer to
848: existing literature, above all the
849: classical monographs of~\citet{isidori85} and~\citet{nijmeijer94}. For a
850: very readable introduction to the field we refer to the seventh
851: chapter of~\citet{vidyasagar93}. The books also contain extensive
852: bibliography. The monograph of~\citet{isidori85} builds mainly on the
853: concept of relative degree. In contrast we will emphasize the approach
854: of~\citet{vidyasagar93} because the method is more suitable for the
855: stochastic case.
856:
857: \subsection{Useful Relations}
858:
859: The solution of the SFB linearization problem as presented
860: here uses the Leibniz rule
861: \begin{align}
862: \label{eq:63}
863: \lie{\lbrack f,g\rbrack }{\alpha } =
864: \lie{f}{(\lie{g}{\alpha })} - \lie{g}{ (\lie{f}{\alpha })}
865: \end{align}
866: with~$f,g$ smooth vectorfields on~$U$; $\alpha\colon U\to \RR $ is
867: a smooth function. The recursive form of the Leibniz rule allows us to
868: simplify the chains of differential equations for the
869: transformation~$T$. This can be expressed in the form of the following
870: statement:
871:
872: For all $x \in U$, $k \ge 0$ these two sets of conditions are
873: equivalent:
874:
875: \begin{align}
876: \label{eq:2}
877: \text{(i)}&\qquad&\lie{g}{\alpha } = \lie{g}{\lie{f}{\alpha }} =
878: \cdots = \lie{g}{\multilie{f}{k}{\alpha }}=0 \\
879: \label{eq:10}
880: \text{(ii)}&&\lie{g}{\alpha } = \lie{\adfg{}}{\alpha } = \cdots =
881: \lie{\adfg{k}}{\alpha }=0 .\end{align}
882:
883: Recall that the symbol~$\lie{f}{h}$ stands for the Lie derivative
884: defined by~$\lie{f}{h} = \langle f,\grad\,h \rangle = \ssumi{n} f_i(x)
885: \parby{}{x_i} h(x)$. Higher order Lie derivatives
886: can be defined recursively
887: $\multilie{f}{0}{h} = h$, $\multilie{f}{k+1}{h} =
888: \lie{f}{\multilie{f}{k}{h}}$ for~$k \ge 0$. The Lie Bracket is defined as
889: ~$[f,g] \define \parbyx{g}f-\parbyx{f}g$; there is also a recursive
890: definition:
891: \begin{equation}
892: \ad{f}{0}{g} \define g; \quad \ad{f}{k+1}{g} \define
893: \left[f,\ad{f}{k}{g}\right] \quad \text{for } k \ge 0
894: .\end{equation}
895:
896:
897: Another very important result of the differential geometry is
898: invariance of the Lie bracket under the tangent
899: transformation~$\tantra{T}$
900: (see~\citet{nijmeijer94} Proposition 2.30 \pg~50):
901:
902: Let~$T\colon U\to \RR^n$ be a diffeomorphic coordinate transformation, and~$f$ and~$g$
903: be smooth vectorfields. Then
904: \begin{align}
905: \label{eq:103}
906: \tantra{T} [f,g] = [\tantra{T} f, \tantra{T} g] .\end{align}
907:
908: \subsection{SFB Linearization}
909:
910: Every controllable linear system may be, by a linear coordinate
911: transformation, transformed to the controllable canonical form
912: (\citet{kalman}). Furthermore, this controllable canonical form can
913: be always transformed into the integrator chain by a linear
914: regular feedback. Therefore, the integrator chain is a canonical
915: form for all feedback linearizable systems. (See \citet{vidyasagar93}
916: section 7.4). Consequently, the equations of the integrator chain can be compared
917: with the equations of the nonlinear systems and the following
918: proposition can be proved:
919:
920: \begin{prop} \label{prop:d1sfb1a}
921: There is a SFB linearizing transformation~$\combinedtab$ of a SISO
922: deterministic dynamical system~\dsdef into a controllable linear
923: system if and only if there is a solution~$T_1, T_2, \dots,
924: T_n\RntoR$ to the set of partial differential equations
925: defined on~$U$
926: \begin{alignat}{2}
927: \label{eq:150}
928: \lie{f}{}{T_i} &= T_{i+1} \firstfor 1 \le i \le {n-1}\\
929: \label{eq:151}
930: \lie{g}{}{T_i} &= 0 \nextfor 1 \le i \le {n-1}\\
931: \label{eq:152}
932: \lie{g}{}{T_n} &\ne 0 .\end{alignat} Then the
933: feedback is defined as follows:
934: \begin{align}
935: \label{eq:57}
936: \alpha &=-\frac{\lie{f}{T_n}}{\lie{g}{{T_n}}}\qquad\qquad
937: \beta =\frac{1}{\lie{g}{T_n}} .\end{align}
938: \end{prop}
939: \begin{proof}
940: See \citet{vidyasagar93} equations 7.4.20--21.
941: \end{proof}
942:
943:
944: \begin{prop} \label{prop:d1sfb1}
945: The SFB linearizing transformation~$\combinedtab$ of a SISO
946: deterministic dynamical system~\dsdef into a controllable linear
947: system exists if and only if there is
948: a solution~$\lambda \RntoR$ to the set of partial differential
949: equations:
950: \begin{alignat}3
951: \label{eq:8}
952: \biglie{\adfg{i}}{\lambda }&=0\firstfor{\iva{n-2}}\\
953: \label{eq:9}
954: \biglie{\adfg{{n-1}}}{\lambda }&\not=0 .\end{alignat} The
955: linearizing transformation~$T(x)$ is given by:
956: \begin{alignat}3
957: \label{eq:11}
958: T_{i}&=\multilie{f}{{i-1}}\lambda \firstfor 1\le i\le n\\
959: \alpha &=\frac{-\multilie{f}{{n}}\lambda
960: }{\lie{g}{}\multilie{f}{{n-1}}\lambda }&\qquad\qquad&
961: \label{eq:12}
962: \beta =\frac{1}{\lie{g}{}\multilie{f}{{n-1}}\lambda }
963: .\end{alignat}
964: \end{prop}
965: \begin{proof}
966: See \citet{vidyasagar93} equations 7.4.23--33 and \citet{nijmeijer94} Corollary 6.16.
967: \end{proof}
968:
969: Finally, the geometrical conditions for the
970: existence of the linearizing transformation are studied.
971:
972: \begin{theo} \label{prop:d1sfb2}
973: A deterministic SFB linearizing transformation of~\dsdef into a
974: controllable linear system exists if and only if the
975: distribution~$\Delta_{n} \define \sspan\left\{{\adfg{i},
976: \iva{n-1}}\right\}$ is nonsingular on~$U$ and the
977: distribution~$\Delta_{n-1} \define \sspan\left\{{\adfg{i},
978: \iva{n-2}}\right\}$ is involutive on~$U$.
979: \end{theo}
980: \begin{proof}
981: See \citet{nijmeijer94} Corollary 6.17, \citet{vidyasagar93} Theorem
982: 7.4.16, \citet{isidori89} Theorem 4.2.3 .
983: \end{proof}
984:
985: \subsection{SCT Linearization}
986:
987: \begin{theo} \label{prop:s1ctt2t}
988: There is a SCT~linearizing transformation~$\sctt$ of a deterministic
989: MIMO system~\dsdefmi into a controllable linear system if and only
990: if there exists a reordering of the vectorfields~$g_1 \dots g_m$ and
991: an~$m$-tuple of integers~$\kappa_1 \le \kappa_2 \le \dots \le \kappa_m$
992: with~$\ssumi{m} \kappa_i = n$ called the \defbf{controllability
993: indexes} such that the following conditions are satisfied for
994: all~$x \in U$:
995: \begin{align}
996: \label{eq:43}
997: \text{(i)}&\qquad\dim\left(\sspan\left\{( \ad{f}{j}{g_i}(x),
998: \iva{m}, \jva{\kappa_i-1})\right\}\right) = n\\
999: \label{eq:44}
1000: \text{(ii)}&\qquad[\ad{f}{k}{g_i},\ad{f}{l}{g_j}]=0
1001: \qquad\text{for}\qquad 0 \le k+l \le \kappa_i+\kappa_j-1,\, 0 \le
1002: i,j \le m . \end{align}
1003: \end{theo}
1004: \begin{proof}
1005: See \citet{nijmeijer94} Theorem 5.3 and Corollary 5.6.
1006: \end{proof}
1007:
1008: The following corollary can be verified for SISO systems:
1009:
1010: \begin{coroll} \label{prop:s1ctt2a}
1011: For a SISO system with~$m=1$ the
1012: condition (ii) of Theorem~\ref{prop:s1ctt2t} can be simplified as
1013: follows:
1014: \begin{align}
1015: \label{eq:45}
1016: [g,\ad{f}{l}{g}] = 0, \quad l = 1, 3, 5, \dots, 2n-1, \forall x \in U
1017: .\end{align}
1018: \end{coroll}
1019: \begin{proof}
1020: See \citet{nijmeijer94} Corollary 5.6 and the text which follows.
1021: \end{proof}
1022:
1023:
1024:
1025:
1026: %%%%%%%%%%%%%%% Section %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
1027: \section{Transformations of \Ito Dynamical Systems}
1028: \label{sec:stotrans}
1029:
1030: The transformation rules of \Ito systems are motivated by the \Ito
1031: differential rule (see \eg~\citet{wong84} Section 3.3), which defines
1032: the influence of nonlinear coordinate transformations on \Ito stochastic
1033: processes.
1034:
1035: The \Ito differential rule applies to the situation where a scalar
1036: valued stochastic process~$x_t$ defined by a stochastic differential
1037: equation~$dx_t = f(x_t)\,dt + \sigma(x_t)\,dw_t$ with~$f\RtoR$ and~$\sigma\RtoR$
1038: smooth real functions and~$w_t$ a Brownian motion, is transformed
1039: by a diffeomorphic coordinate transformation~$T\colon \RR \to \RR$.
1040: Then the stochastic process~$z_t\define T(x_t)$ exists and is an \Ito
1041: process. Further, the process~$z_t$ is the solution of the stochastic
1042: differential equation
1043: \begin{equation} \label{eq:126}
1044: dz_t = \parbyx{T} {f(x_t)}\,dt + \parbyx{T} {\sigma(x_t)}\,dw_t + \itoxs\,dt
1045: .\end{equation}
1046: All details together with a proof are
1047: available for example in~\citet{karatzas}.
1048:
1049: The \Ito rule can be also derived for the multidimensional case: for
1050: the~$m$-th component of an~$n$-dimensional stochastic process the \Ito
1051: rule can be expressed as follows:
1052: \begin{multline}
1053: dz_m = \ssumi{n} \parby{T_m}{x_i} f_i\,dt + \ssum{i}{1}{n}
1054: \ssum{j}{1}{k} \parby{T_m}{x_i} \sigma_{ij}\,dw_j + \frahalf
1055: \ssum{{i,j}}{1}{n} \frac{\partial^2 T_m}{\partial x_i \partial x_j}
1056: \ssum{l}{1}{k} \sigma_{il}
1057: \sigma_{jl}\,dt \\
1058: =\lie{f}T_m\,dt + \ssum{j}{1}{k} \lie{\sigma_j}{T_m}\,dw_j +
1059: \ito{\sigma}T_m\,dt
1060: .\end{multline}
1061:
1062: For the most common case with scalar noise~$k=1$ the equation
1063: can be further simplified to:
1064: \begin{equation}
1065: dz_m =\lie{f}{T_m}\,dt + \lie{\sigma}{T_m}\,dw +
1066: \frahalf \ssum{{i,j}}{1}{n}
1067: \parbyxx{T_m}{x_i}{x_j} \sigma_{i} \sigma_{j}\,dt
1068: .\end{equation}
1069: The operator~$\ito{\sigma} T_m$ is sometimes written using
1070: matrix notation as:
1071: \begin{equation}
1072: \ito{\sigma} T_m = \frahalf \trace \left(\sigma\sigma^T \parbysec{T_m}{x}\right)
1073: .\end{equation}
1074: Generally, $\ito{\sigma}$ vanishes for linear~$T$ or zero~$\sigma$.
1075:
1076:
1077: %======== Subsection ================================================
1078: \subsection{The Correcting Term}
1079: \label{sub:corr}
1080:
1081:
1082: In this section we introduce an extremely useful equivalence
1083: between \Ito and Stratonovich systems, which allows us to use some
1084: Stratonovich linearization techniques for \Ito problems. The
1085: motivation is the following: let~\isdefmi be an \Ito system. We
1086: are looking for a Stratonovich system $\Theta_S = \ssys{\alterbar
1087: f}{\alterbar g}{\alterbar \sigma}{x}$ such that the trajectories
1088: of~$\Theta_I$ and~$\Theta_S$ are identical. The aim is to find
1089: equations relating the quantities~$\alterbar f$,~$\alterbar
1090: g$, and~$\alterbar \sigma$ with~$f$,~$g$, and~$\sigma$.
1091:
1092: \begin{defn} \label{def:corr}
1093: Let~$\Theta_{1I} = \ssys{f}{g}{\sigma}{x} \in \clmisysito$ be
1094: an~$n$-dimensional \Ito dynamical
1095: system with~$k$-dimensional Brownian
1096: motion~$w$. The vectorfield $\corr{\sigma}{x}$ whose ~$r$-th
1097: coordinate is equal to
1098: \begin{alignat}3
1099: \label{eq:5}
1100: (\corr{\sigma}{x})_r &= -\frahalf \ssum{i}{1}{n} \ssum{j}{1}{k}
1101: \parby{{\sigma_{rj}}}{{x_i}} \sigma_{ij} \firstfor 1 \le r \le n
1102: \end{alignat}
1103: is called the \defbf{correcting term}.
1104: Note that the derivative is always evaluated in the corresponding
1105: coordinate system.
1106: Further, let us define the \defbf{correcting mapping} $\Corr{\sigma} \colon \clmisysito \to \clmisysstrat$ by
1107: \begin{align}
1108: \label{eq:21}
1109: \Corr{\sigma} (f,g,\sigma,U,\origi{x}) \define
1110: (f+\corr{\sigma}{x},g,\sigma,U,\origi{x}) .\end{align}
1111: \end{defn}
1112: The general treatment of the subject can be found for example
1113: in~\citet{wong84} \pg~160 or in \citet{sagemelsa}. The following
1114: theorem describes the
1115: behavior of the correcting term under the coordinate transformation.
1116: \begin{theo} \label{prop:corr}
1117: Let~\isdef be a one-dimensional \Ito dynamical system. Let $T$ be a
1118: diffeomorphism defined on~$U$ and the symbols~$\scti{T}$ and
1119: $\scts{T}$ denote a \Ito coordinate transformation and a
1120: Stratonovich coordinate transformation induced by the same
1121: diffeomorphism~$T$ and~$\tilde\sigma = \tantra{T}{\sigma}$. Then the following diagram commutes:
1122: \begin{equation}
1123: \begin{CD}
1124: \label{eq:4}
1125: \Theta_{1I} @>\scti{T}>> \Theta_{2I}\\
1126: @V{\Corr{\sigma}}VV @AA{\Corr{{\tantra{T} \sigma}}^{-1}}A\\
1127: \Theta_{1S} @>\scts{T}>> \Theta_{2S}\\
1128: \end{CD}
1129: .\end{equation}
1130: In other words:
1131: \begin{align}
1132: \label{eq:19}
1133: \scti{T} &= {\Corr{{\tilde\sigma}}{}}^{-1} \compose \scts{T}
1134: \compose \Corr{\sigma}{} \quad\text{and} \\
1135: \label{eq:20}
1136: \scts{T} &= \Corr{{\tilde\sigma}}{} \compose \scti{T}
1137: \compose {\Corr{\sigma}{}}^{-1}
1138: . \end{align}
1139:
1140: The notation~$\Corr{{\sigma}}{}^{-1}$ is used to denote the
1141: inverse mapping
1142: \begin{align}
1143: \label{eq:23}
1144: {\Corr{\sigma}{}}^{-1} (f,g,\sigma,U,\origi{x}) \define
1145: (f-\corr{\sigma}{x},g,\sigma,U,\origi{x})
1146: .\end{align}
1147: \end{theo}
1148:
1149: \begin{proof}
1150: The correcting term~$\corr{\sigma}{x}\RntoRn$
1151: is equal to
1152: \begin{equation}
1153: \corr{\sigma}{x} = -\corrx
1154: .\end{equation}
1155: The transformations specified in the diagram~\eqref{eq:4} will be
1156: evaluated in the following order:
1157: \begin{equation}
1158: \begin{CD}
1159: \label{eq:6}
1160: \Theta_{1I} @>({\operatorname a})>> \Theta_{2I} \\
1161: @V({\operatorname b})VV \\
1162: \Theta_{1S} @>({\operatorname c})>> \Theta_{2S}
1163: @>({\operatorname d})>> \Theta_{3I}\\
1164: \end{CD}
1165: \end{equation}
1166: We want to prove the equivalence of~$\Theta_{2I}$ and~$\Theta_{3I}$.
1167: The symbols (a) and (c) denote the \Ito and the Stratonovich
1168: coordinate transformations, respectively; the
1169: symbols (b) and (d) stand for the correcting
1170: mapping and its inverse. Note that the systems~$\Theta_{2I}$,
1171: $\Theta_{2S}$, and $\Theta_{3I}$ are defined in the~$z$-coordinate
1172: systems. Further, let
1173: \begin{align}
1174: \label{eq:243}
1175: \tilde\sigma&\define\trav{\sigma}\\
1176: \kappa&\define \tantra{T} \corr{\sigma}{x} = -\trav{(\corrx)}\\
1177: \origi{z}&\define T(\origi{x}) .\end{align} Then
1178: \begin{align}
1179: \text{(a)}&\qquad \Theta_{2I} =\bigssys{\trav{f} + \itoxs }{
1180: \trav{g}}{ \tilde\sigma }{z}\\
1181: \text{(b)}&\qquad \Theta_{1S} =\bigssys{f - \corrx }{ g }{
1182: \sigma }{x} \\
1183: \text{(c)}&\qquad \Theta_{2S} =\bigssys{\trav{\left(f-\corrx\right)}
1184: }{ \trav{g} }{
1185: \trav{\sigma} }{z}\\
1186: \text{(d)}&\qquad \Theta_{3I} =\bigssys{\trav{f} + \kappa + \frahalf
1187: \parbyz{\tilde\sigma}{\tilde\sigma} }{ \trav{g} }{ \tilde\sigma
1188: }{z}
1189: .\end{align}
1190:
1191: All the terms in (a) are equivalent to the respective terms in (d)
1192: except for the drift terms containing functions of~$\sigma$. Therefore,
1193: we continue comparing these terms only. For (a):
1194:
1195: \begin{align}
1196: \label{eq:37}
1197: L &\define \itoxs .\end{align} For (d):
1198: \begin{multline}
1199: \label{eq:38}
1200: R \define \kappa + \corrxx{{\tilde\sigma}}{z} = \kappa + \frahalf
1201: \parbyz{} \left( \parbyx{T} \sigma \right) \parbyx{T}\sigma = \kappa +
1202: \frahalf \parbyz{x} \parbyx{} \left( \parbyx{T} \sigma \right)
1203: \parbyx{T}\sigma = \\
1204: \kappa + \frahalf \left( \parbysec{T}{x}\sigma +
1205: \parbyx{T}\parbyx{\sigma} \right) \sigma = \kappa + \frahalf
1206: \parbysec{T}{x}\sigma^2 - \kappa= \itoxs .\end{multline} Thus~$L=R$
1207: and $\Theta_{2I} = \Theta_{3I}$.
1208: \end{proof}
1209:
1210: Theorem~\ref{prop:corr} is valid also for combined
1211: transformations:
1212: \begin{coroll} \label{prop:corrcorol}
1213: Let~\isdef, $T$, $\scti{T}$, and
1214: $\scts{T}$ have the same meaning as in Theorem~\ref{prop:corr}.
1215: Then the following diagram commutes for arbitrary regular feedback~$\feedbackab$:
1216: \begin{equation}
1217: \begin{CD}
1218: \label{eq:4000}
1219: \Theta_{1I} @>\scti{T}>> \Theta_{2I} @>\feedbackab>> \Theta_{4I}\\
1220: @V{\Corr{\sigma}}VV @AA{\Corr{{\tantra{T} \sigma}}^{-1}}A @AA{\Corr{{\tantra{T} \sigma}}^{-1}}A\\
1221: \Theta_{1S} @>\scts{T}>> \Theta_{2S} @>\feedbackab>> \Theta_{4S}\\
1222: \end{CD}
1223: .\end{equation}
1224: \end{coroll}
1225:
1226: \begin{proof}
1227: We want to prove equivalence of~$\Theta_{4I}$
1228: and~${\Corr{{\tantra{T} \sigma}}^{-1}} \Theta_{4S}$.
1229:
1230: The control and dispersion vectorfields of~$\Theta_{4I}$
1231: and~$\Theta_{4S}$ are identical and they are not influenced by the
1232: correcting mapping.
1233:
1234: Using the notation of Theorem~\ref{prop:corr} we can express the
1235: drift term of~$\Theta_{4I}$ as~$\tantra{T}f + L + g\alpha $. The
1236: drift term of~${\Corr{{\tantra{T} \sigma}}^{-1}} \Theta_{4S}$
1237: is~$\tantra{T}f + R + g\alpha $. The effect of feedback is purely
1238: additive and both the systems are equal.
1239: \end{proof}
1240:
1241:
1242:
1243: At first glance the correcting term is rather
1244: surprising. How can the second derivative of~$T$ in (\ref{eq:37}) be
1245: compensated by the correcting term, which does
1246: not contain the~$T$ at all? The answer is quite simple: the second
1247: derivative is hidden in the correcting term
1248: implicitly because the correcting term depends
1249: on the coordinate system in which the system~$\Theta_{1I}$ is defined.
1250: The derivative~$\parbyx{\sigma}$ contained in the
1251: correcting term is always taken in the
1252: appropriate coordinate system. To emphasize the dependence of the
1253: correcting term on the coordinate system, we
1254: will never omit the independent variable (\eg $x$ or $z$) from the
1255: symbol~$\corr{\sigma}{x}$.
1256:
1257: Theorem~\ref{prop:corr} is valid for general multidimensional
1258: systems~\isdefmi; the proof is purely mechanical and is not presented
1259: here.
1260:
1261: Let us now turn our attention to several special cases of the
1262: correcting mapping.
1263: \begin{coroll} \label{prop:corrvectr}
1264: Let~$\Theta_I = \ssysfgx \in \clssysito(n,m,1)$ be
1265: an~$n$-dimensional stochastic dynamical system with a
1266: one-dimensional Brownian motion~$w$.
1267: The~$r$-th coordinate of the correcting
1268: term~$(\corr{\sigma}{x})_r$ is equal to
1269: \begin{equation}
1270: \label{eq:214}
1271: (\corr{\sigma}{x})_r = -\frahalf \ssum{i}{1}{n}
1272: \parby{{\sigma_{r}}}{{x_i}} \sigma_{i} = -\frahalf
1273: \lie{\sigma}{\sigma_r}
1274: \rfor{1\le r\le n}
1275: .\end{equation}
1276: \end{coroll}
1277: \begin{proof}
1278: Substitute~$k = 1$ into~\eqref{eq:5}.
1279: \end{proof}
1280: \begin{coroll}
1281: \label{prop:ic1}
1282: For systems with one-dimensional noise ($k=1$) define the matrix
1283: valued \Ito term~$\ito{\sigma}{T}$ for~$T\RntoRn$
1284: with components~$T_i$, $1\le i\le n$, as a column $n\times 1$
1285: matrix $\ito{\sigma}{T} \define \left[\ito{\sigma}{T_1},
1286: \ito{\sigma}{T_2}, \dots,\ito{\sigma}{T_n}\right]^T$.
1287:
1288: Then the relations~\eqref{eq:214} can be expressed as
1289: \begin{align}
1290: \label{eq:215}
1291: \ito{\sigma}{T} = \tantra{T} \left(\corr{\sigma}{x}\right) -
1292: \corr{{\tilde\sigma}}{z} .\end{align}
1293: \end{coroll}
1294: \begin{proof}
1295: The proof is almost identical to that of
1296: the multidimensional variant of Theorem~\ref{prop:corr}. The symbols can be
1297: identified as follows:
1298: \begin{alignat}2
1299: L_i &= \left(\ito{\sigma}{T}\right)_i \firstfor 1\le i\le n \\
1300: \kappa_i &= \left( \tantra{T} \left(\corr{\sigma}{x}\right)\right)_i \\
1301: R_i &= \left(\tantra{T} \left(\corr{\sigma}{x}\right) \right)_i -
1302: \left(\corr{{\tilde\sigma}}{z}\right)_i .\end{alignat}
1303: \end{proof}
1304: \begin{coroll}
1305: \label{prop:ic2}
1306: Assume that the conditions of Corollary~\ref{prop:ic1} hold. The
1307: relation~\eqref{eq:215} can be written as:
1308: \begin{alignat}3
1309: \label{eq:140}
1310: \frahalf \lie{\sigma}{\lie{\sigma}{T_i}} &=
1311: \ito{\sigma}{T_i} - \lie{\corr{\sigma}{x}}{T_i} \firstfor 1
1312: \le i \le n
1313: . \end{alignat}
1314: \end{coroll}
1315: \begin{proof}
1316: The formula can be expressed as:
1317: \begin{multline}
1318: \label{eq:139}
1319: \frahalf \lie{\sigma}{{\lie{\sigma}{T_i}}} = \frahalf
1320: \lie{\sigma}{ \left( \ssum{j}{1}{n} \parby{T_i}{x_j} \sigma_j
1321: \right) } = \frahalf \ssum{k}{1}{n} \sigma_k \parby{}{x_k}
1322: \left( \ssum{j}{1}{n} \parby{T_i}{x_j} \sigma_j
1323: \right) =\\
1324: \frahalf \ssum{k,j}{1}{n} \left( \sigma_j\sigma_k
1325: \parbyxx{T_i}{x_k}{x_j} +\parby{T_i}{x_j}
1326: \parby{\sigma_j}{x_k} \sigma_k \right) = \ito{\sigma}{T_i} -
1327: \lie{{\corr{\sigma}{x}}}{T_i} . \end{multline}
1328: \end{proof}
1329:
1330: %======== Subsection ================================================
1331: \subsection{Composition of Coordinate Transformations of \Ito Systems}
1332: \label{sub:stgroup}
1333:
1334: The set of all deterministic coordinate transformations~$\sctt$
1335: together with composition~$\sct{RS} \define \sct{S} \compose \sct{R}$
1336: forms a group. Obviously, this fact is a straightforward result of the
1337: behavior of the contravariant transformation and therefore an
1338: analogous statement must hold for Stratonovich systems. Surprisingly,
1339: this is valid also for \Ito systems as will be shown here. This has an
1340: important consequence: we may always find the inverse transformation
1341: to a given coordinate transformation of \Ito systems. We will prove
1342: the following assertion:
1343: \begin{theo}
1344: \label{prop:compogr}
1345:
1346: Let~$\scti{R}$, $\scti{S} \in \clsysito$ be
1347: coordinate transformations of
1348: one-dimensional \Ito systems induced by
1349: diffeomorphisms~$R$ and~$S$. Then
1350: \begin{equation}
1351: \label{eq:123}
1352: \scti{S} \compose \scti{R} = \scti{S \compose R}
1353: .\end{equation}
1354: \end{theo}
1355: \begin{proof}
1356: We will transform the system in two
1357: different ways and show that the results are equal.
1358: \begin{enumerate}
1359: \item In the first method the system~$A=(0,0,a,U,\origi{x})$ which
1360: corresponds to a differential equation~$dx = a(x)\,dw$ will be
1361: transformed twice:
1362: \begin{enumerate} \item first, by~$y=R(x)$ to~$y$
1363: coordinates \item and then the result~$B=(g,0,b,U,\origi{x})$ which
1364: corresponds to~$dy = g(y)\,dt + b(y)\,dw$
1365: by~$z=S(y)$ to~$z$ coordinates.
1366: \end{enumerate}
1367: \item The other method
1368: transforms the system~$A$ only once by~$z=T(x) = S(R(x)) = (S
1369: \compose R)(x)$.
1370: \end{enumerate}
1371: Without loss of generality, the equation~$dx = a(x)\,dw$ is assumed
1372: to have no drift term because the drift term transforms in the
1373: contravariant fashion. The derivatives will be
1374: denoted by~$\parbyx{T(x)} \definer T'$,~$\parbyx{R(x)} \definer
1375: R'$,~$\parby{S(y)}{y} \definer S'$ and similarly for~$T''$,
1376: $R''$ and $S''$. Note that the prime is always used to denote
1377: derivatives by the argument of the function.
1378:
1379: The transformation by~$R$ gives:
1380: \begin{align}
1381: \label{eq:64}
1382: dx &= a \, dw\\
1383: \label{eq:266}
1384: dy &= R' a\,dw + \frahalf a^2 R'' \,dt .\end{align} Thus the
1385: coefficients of the second SDE are defined
1386: by
1387: \begin{align}
1388: \label{eq:267}
1389: b(y) &\define (R'a) \compose R^{-1}(y)\\
1390: \label{eq:268}
1391: g(y) &\define (\frahalf a^2 R'') \compose R^{-1}(y) .\end{align}
1392:
1393: The second transformation (by~$S$) gives
1394: \begin{align}
1395: \label{eq:269}
1396: dz &= \left( S' g + \frahalf b^2 S'' \right)\,dt + S' b \,dw =\\
1397: \label{eq:270}
1398: &= \left(\frahalf a^2 S' R'' + \frahalf (R')^2 a^2 S'' \right) \,dt +
1399: S' R' a \,dw = \\
1400: \label{eq:272}
1401: &= \frahalf a^2 \left(S'R'' + (R')^2 S'' \right)\,dt + S'R' a\,dw =\\
1402: \label{eq:273}
1403: &= \frahalf a^2 T''\,dt + T' a\,dw .\end{align} The last equality
1404: follows from the fact that~$T''=S''(R')^2+S'R''$.
1405: \end{proof}
1406: One can verify the multidimensional case in the same
1407: spirit.
1408: %======== Subsection ================================================
1409: \subsection{Invariants}
1410: \label{sub:stoinvar}
1411:
1412:
1413: In the deterministic case, some useful propositions about the
1414: invariant properties, for example the Leibniz rule~\eqref{eq:63} and
1415: the relation~\eqref{eq:2}, were employed.
1416:
1417: Unfortunately, we have not found any analogy for the \Ito systems yet.
1418: To point out the main complications, we will analyze the \Ito
1419: equivalent of the Leibniz rule~\eqref{eq:63}, which is essential for
1420: reducing the order of partial differential equations in the
1421: deterministic exact linearization.
1422:
1423: If the Lie derivative~$\lie{g}{}$ is interpreted
1424: as a general first order operator
1425: \begin{align}
1426: \lie{g}{} = \ssumi{n}g_i \parby{}{x_i}
1427: \end{align}
1428: then the commutator of two such first order
1429: operators $\lie{f}{\lie{g}{}} - \lie{g}{\lie{f}{}}$ is also a first
1430: order operator~$\lie{\lbrack f,g\rbrack }{}$ (see~\eqref{eq:63}).
1431:
1432: Similarly, define the general second order operator as
1433: \begin{align}
1434: \label{eq:17}
1435: O(g,G) &\define \ssumi{n}g_i \parby{}{x_i} + \ssum{i,j}{1}{n}
1436: G_{ij}\parbyxx{}{x_i}{x_j}
1437: \end{align}
1438: where $g_i,G_{ij}\RntoR$ for $1 \le i,j \le n$. We can compute
1439: the commutator
1440: \begin{align}
1441: \label{eq:213}
1442: C(f,F,g,G) \define O(f,F)O(g,G) - O(g,G)O(f,F)
1443: \end{align} of such
1444: second order operators. If this commutator was also
1445: a second order operator (\ie there were~$\varphi$ and $\Phi$
1446: such that the operator~$C(f,F,g,G) = O(\varphi,\Phi)$), then we would
1447: be able to simplify any PDEs of stochastic
1448: transformations. (See Proposition~\ref{prop:sfbooo}).
1449:
1450: Because the operator~$O$ is linear, \ie~$O(f,F) = O(f,0) + O(0,F)$, we
1451: can split the computation into four independent, reusable parts:
1452: \begin{multline}
1453: C(f,F,g,G) = O(f,F)O(g,G) - O(g,G)O(f,F) = \\
1454: =\lie{[f,g]}{} + C(0,F,0,G) + C(f,0,0,G) + C(0,F,g,0)
1455: .\end{multline}
1456:
1457: The first term is already a first order operator. Only the second
1458: and the third terms need to be computed because the fourth term
1459: can be obtained from the third one by formal substitution. For
1460: the third term:
1461: \begin{multline}
1462: O(f,0) O(0,G) = \ssum{i}{1}{n} f_{i} \parby{}{x_i} \left(
1463: \ssum{k,l}{1}{n} G_{kl}
1464: \parbyxx{}{x_k}{x_l} \right) = \\
1465: \ssum{i,k,l}{1}{n} \left( f_{i} \parby{G_{kl}}{x_i}
1466: \parbyxx{}{x_k}{x_l} + f_{i} G_{kl} \parbyxxx{}{x_i}{x_k}{x_l}
1467: \right)
1468: .\end{multline}
1469: Further,
1470: \begin{multline}
O(0,G)O(f,0) = \ssum{k,l}{1}{n} G_{kl} \parbyxx{}{x_k}{x_l} \left(
1472: \ssum{i}{1}{n} f_i \parby{}{x_i}
1473: \right) =\\
1474: \ssum{i,k,l}{1}{n} G_{kl} \left( \parbyxx{f_i}{x_k}{x_l}
1475: \parby{}{x_i} + 2 \parby{f_i}{x_l} \parbyxx{}{x_i}{x_k} + f_i
1476: \parbyxxx{}{x_i}{x_k}{x_l} \right) .\end{multline}
1477:
1478: The intermediate results for the third and the fourth terms
1479: can be combined into
1480: \begin{multline}
1481: O(f,0) O(0,G) + O(0,F) O(g,0) - O(g,0) O(0,F) - O(0,G) O(f,0) =\\
1482: \ssum{i,k,l}{1}{n} \left( f_{i} \parby{G_{kl}}{x_i} - g_{i}
1483: \parby{F_{kl}}{x_i} + 2 F_{ki} \parby{g_l}{x_i} - 2 G_{ki}
1484: \parby{f_l}{x_i}
\right) \parbyxx{}{x_k}{x_l} \\
+ \left( F_{kl} \parbyxx{g_i}{x_k}{x_l} - G_{kl}
\parbyxx{f_i}{x_k}{x_l} \right) \parby{}{x_i} .\end{multline} All
1488: of them are first and second order operators. Now let's evaluate the
1489: second term
1490: \begin{multline}
1491: O(0,F) O(0,G) = \ssum{i,j}{1}{n} F_{ij} \parbyxx{}{x_i}{x_j} \biggl(
1492: \ssum{k,l}{1}{n} G_{kl} \parbyxx{}{x_k}{x_l} \biggr) =\\
1493: \ssum{i,j,k,l}{1}{n} \biggl( F_{ij} \parbyxx{G_{kl}}{x_i}{x_j}
1494: \parbyxx{}{x_k}{x_l} + (F_{ij} + F_{ji}) \parby{G_{kl}}{x_j}
1495: \parbyxxx{}{x_i}{x_k}{x_l} + F_{ij} G_{kl}
1496: \parbyxxxx{}{x_i}{x_j}{x_k}{x_l} \biggr) .\end{multline}
1497: \begin{multline}
1498: O(0,F) O(0,G) - O(0,G) O(0,F) = \ssum{i,j,k,l}{1}{n} \biggl( \biggl(
1499: F_{ij} \parbyxx{G_{kl}}{x_i}{x_j} - G_{ij}
1500: \parbyxx{F_{kl}}{x_i}{x_j}
1501: \biggr) \parbyxx{}{x_k}{x_l} +\\
1502: \biggl( (F_{ij} + F_{ji}) \parby{G_{kl}}{x_j} - (G_{ij} + G_{ji})
1503: \parby{F_{kl}}{x_j} \biggr) \parbyxxx{}{x_i}{x_k}{x_l} \biggr)
1504: .\end{multline} Unfortunately the last term
1505: \begin{align}
1506: \label{eq:60}
1507: \biggl( (F_{ij} + F_{ji}) \parby{G_{kl}}{x_j} - (G_{ij} + G_{ji})
1508: \parby{F_{kl}}{x_j} \biggr) \parbyxxx{}{x_i}{x_k}{x_l}
1509: \end{align}
1510: is of third order and, in general, it does not vanish. Thus we have
1511: shown that the commutator of two general second order operators is of
1512: third order. Consequently, the Leibniz rule simplifications used in
1513: the deterministic case cannot be applied to the general stochastic
1514: linearization problem.
1515:
1516:
1517:
1518:
1519: %======== Subsection ================================================
1520: \section{Stochastic Case }
1521: \label{sub:stoclass}
1522:
1523: Since there are two definitions of coordinate transformation of stochastic
1524: differential equations (\Ito, Stratonovich) and three
1525: definitions of linearity ($g,\sigma,g\sigma$), we face at least six
stochastic problems for each deterministic one. In this section we will
1527: discuss all of them giving at least partial solutions to the feedback
1528: linearization problem. We consider mainly the SISO problem except for
1529: cases where the MIMO extension is trivial.
1530:
1531: %======== Subsection ================================================
1532: \subsection{Stratonovich $g$-linearization}
1533: \label{sub:stotech}
1534:
1535:
1536: We show that the method known for deterministic systems can
1537: be applied without modifications.
1538:
1539: \begin{prop} \label{prop:stratgprop}
1540: The Stratonovich dynamical system~\ssdefmi is $g$-linearizable if and
1541: only if the deterministic system~\dsdefmi is linearizable. These two
1542: linearizing transformation{}s are equal. This holds both for SISO and
1543: MIMO systems and both for SFB and SCT linearization.
1544: \end{prop}
1545: \begin{proof}
1546: The comparison of transformation laws for deterministic and
1547: Stratonovich systems shows that the coefficients of $f$ and
1548: $g$ transform in the same way. The
1549: controllability conditions and the definition of linearity are
1550: also identical (compare Definition~\ref{def:linear} with
1551: Definition~\ref{def:linearsto}). Identical problems have
1552: identical solutions.
1553: \end{proof}
1554:
1555: %======== Subsection ================================================
1556: \subsection{Stratonovich $g\sigma$-linearization}
1557: \label{sub:ssgsigma}
1558:
1559: The Stratonovich problems are not complicated by the second order \Ito
1560: term. The transformation laws for Stratonovich systems are the same as
1561: the deterministic transformation laws, therefore many results of the
1562: deterministic linearization theory can be used.
1563:
1564: For example, the stochastic SCT $g\sigma$-linearization of a
1565: Stratonovich system is equivalent to the linearization of a
1566: deterministic, non-square MIMO system with two inputs and a single
1567: output. The SFB problem, which is studied in this section, is not as
1568: simple as the SCT one because the feedback influences only the control
1569: input~$u$ (Figure~\ref{fig:picassym}). The ``dispersion input'' is not
1570: a part of the feedback. Consequently, in order to solve the
1571: Stratonovich SFB $g\sigma$-linearization, we have to deal with a
1572: combined deterministic SFB-SCT problem.
1573: \psfig{fig:picassym}{Asymmetry of SFB $g\sigma$-Linearization}{picassym}
1574:
1575: \subsubsection{Canonical Form}
Recall that we require~$g$-controllability of the resulting system.
1577:
1578: Since this is a Stratonovich problem, the transformed
1579: vectorfields~$\tilde f$ and~$\tilde g$ do not depend on the dispersion
1580: vectorfield~$\sigma$. Therefore, the {\em control part\/} and the {\em
1581: dispersion part\/} can be studied independently.
1582:
Any~$g$-linear system can be transformed into an integrator chain by a
1584: combination of a linear coordinate transformation and linear
1585: feedback. Therefore, if we set~$\sigma=0$, the canonical form is the
1586: integrator chain.
1587:
In general, the dispersion vectorfield~$\tilde \sigma$ is assumed to
be an arbitrary constant vectorfield~$\tilde \sigma(x)_i=s_i$, $1\le i\le n$
(see Definition~\ref{def:linearsto}), and this form is preserved by arbitrary linear
transformations. Therefore the canonical form can be written as:
1592: \begin{align}
1593: \label{eq:1000}
1594: \tilde f_i(x) &= x_{i+1} \firstfor 1\le i\le n-1\\
1595: \tilde f_n(x) &= 0\\
1596: \tilde g_i(x) &= 0 \firstfor 1\le i\le n-1\\
1597: \tilde g_n(x) &= 1\\
1598: \label{eq:1077}
1599: \tilde \sigma_i(x) &= s_i \firstfor 1\le i\le n
1600: .\end{align}
1601:
1602: We can compare this canonical form with the equations which
1603: define the transformed system~$\tilde \Theta$.
1604:
1605: \begin{prop} \label{prop:s1sfb1a}
1606: There is a SFB $g\sigma$-linearizing transformation
1607: of the SISO Stratonovich system
1608: \ssdef into a~$g$-controllable linear system if and only if
1609: there is a solution~$\lambda \RntoR$ of the set of partial differential equations:
1610: \begin{alignat}3
1611: \label{eq:7}
1612: \biglie{\adfg{i}}{\lambda }&=0\firstfor 0 \le i \le n-2\\
1613: \label{eq:13}
1614: \biglie{\adfg{{n-1}}}{\lambda }&\ne 0\\
1615: \label{eq:14}
1616: \biglie{\ad{f}{i}{\sigma}}{\lambda }&=s'_{i+1} \nextfor 0 \le i \le
1617: n-1
1618: \end{alignat}
1619: such that~$s'_i \in \RR$ are constants on~$U$ for $1 \le i \le n$.
1620: Then the linearizing transformation is given by:
1621: \begin{alignat}3
1622: \label{eq:22}
1623: T_i&=\multilie{f}{{i-1}}\lambda \firstfor 1\le i\le n\\
1624: \alpha &=\frac{-\multilie{f}{{n}}\lambda
1625: }{\lie{g}{}\multilie{f}{{n-1}}\lambda } &\qquad\qquad&
1626: \label{eq:28}
1627: \beta =\frac{1}{\lie{g}{}\multilie{f}{{n-1}}\lambda }
1628: .\end{alignat}
1629: \end{prop}
1630: \begin{proof}
Assume that~$\Theta_S$ is transformed by~$\combinedtab$ into
$\tilde \Theta \define \left(\tilde f,\tilde g,\tilde
\sigma,T(U),T(\origi{x})\right)$ where the~$i$-th components
of~$\tilde f$, $\tilde g$, and~$\tilde \sigma$ can be expressed as:~$\tilde f_i =
\lie{f}{T_i}$, $\tilde g_i =
\lie{g}{T_i}$, $\tilde \sigma_i =
\lie{\sigma}{T_i}$. Moreover, the feedback is defined by~$ u = \alpha + \beta v $.
The equations of~$\tilde \Theta$ can be compared to
the equations of the canonical form~\eqref{eq:1000}--\eqref{eq:1077}.
1640: \begin{alignat}{3}
1641: \label{eq:160}
1642: \lie{f}{T_i} &= T_{i+1} \firstfor 1 \le i \le n-1\\
1643: \label{eq:161}
1644: \lie{g}{T_i} &= 0 \nextfor 1 \le i \le n-1\\
1645: \label{eq:162}
1646: \lie{g}{T_n} &= 1/\beta \ne 0 \\
1647: \label{eq:163}
1648: \lie{f}{T_n} &= -\alpha /\beta .\end{alignat}
1649:
1650: The
1651: relations~\eqref{eq:7}, \eqref{eq:13}, \eqref{eq:22}, and~\eqref{eq:28} are equivalent to
1652: relations~\eqref{eq:8}-\eqref{eq:12} from
1653: Proposition~\ref{prop:d1sfb1}. The relation~\eqref{eq:14} can be
1654: verified in a similar way:
1655: \begin{alignat}{3}
1656: \label{eq:165}
1657: \lie{\sigma}{T_i} &= s_{i} \firstfor 1 \le i \le n
1658: \end{alignat}
thus by~\eqref{eq:160}
1660: \begin{alignat}{3}
1661: \label{eq:254}
1662: \lie{\sigma}{\lie{f}{T_i}} &= s_{i+1} \firstfor 1 \le i \le n-1
1663: \end{alignat}
and by~\eqref{eq:63}
1665: \begin{alignat}{3}
1666: \label{eq:255}
1667: \lie{\sigma}{\lie{f}{T_i}} &= \lie{f}{\lie{\sigma}{T_i}}
1668: -\lie{[f,\sigma]}{T_i} \firstfor 1 \le i \le n-1
1669: \end{alignat}
1670: since the Lie derivative of a constant is zero:
1671: \begin{alignat}{3}
1672: \label{eq:256} \lie{f}{\lie{\sigma}{T_i}} &= \lie{f}{s_i} = 0\\
1673: s_{i+1} \define \lie{\sigma}{\lie{f}{T_i}} &=
1674: -\lie{[f,\sigma]}{T_i} \firstfor 1 \le i \le n-1 .\end{alignat}
1675: The equations~\eqref{eq:14} are obtained by successive application of
1676: this relation. The symbols~$s_i$ are equal to~$s'_{i}$ except for the signs.
1677: \end{proof}
1678:
1679: \subsubsection{Conditions for the Control Part}
1680:
1681: The necessary conditions for linearizability of the {\em control
1682: part\/} of~$\Theta$ (\ie the system~$\left(f,g,0,U,\origi{x}
1683: \right)$) can be expressed in geometrical form. We intentionally omit
1684: the dispersion part, using the fact that the resulting system must be
1685: linear when the noise is zero.
1686:
1687: Further, the class of all solutions of this subproblem will be
1688: called~$C$. This class can be studied to find if some member
1689: of~$C$ linearizes the {\em dispersion part\/} of the system.
1690:
1691: We can find a geometrical criterion similar to the conditions of
1692: Proposition~\ref{prop:d1sfb2}. In this case these conditions are
1693: necessary but not sufficient since also \eqref{eq:14} must be
1694: satisfied.
1695:
1696: \begin{prop}
1697: \label{prop:s1sfb1}
SFB~$g\sigma$-linearizing transformation of the Stratonovich system
$\Theta_S$ into a~$g\sigma$-controllable
linear system exists only if the distribution~$\distrofg{n-2}$ is
involutive and the distribution~$\distrofg{n-1}$ is $n$-dimensional.
1702: \end{prop}
1703: \begin{proof}
1704: This theorem is equivalent to Proposition~\ref{prop:d1sfb2} which is
1705: a direct consequence of Proposition~\ref{prop:d1sfb1a} which
1706: corresponds to Proposition~\ref{prop:s1sfb1a}.
1707: \end{proof}
1708:
1709:
1710: \subsubsection{Condition for the Dispersion Part}
1711: \label{prop:cftdp}
1712: The conditions of Proposition~\ref{prop:s1sfb1} can be written
1713: in matrix form. We are looking for~$T_1 = \lambda\RntoR$ such that
1714: \begin{align}
1715: \label{eq:189}
1716: \left[\,\,\begin{matrix}
1717: \adfg{0}\\
1718: \adfg{1}\\
1719: \vdots\\
1720: \adfg{n-2}\\
1721: \end{matrix}\,\,\right]
1722: \quad \left[\,\,\begin{matrix}
1723: \parby{\lambda }{x_1}\\
1724: \parby{\lambda }{x_2}\\
1725: \vdots\\
1726: \parby{\lambda }{x_n}\\
1727: \end{matrix}\,\,\right]
1728: = \left[0\right]
1729: .\end{align}
1730:
1731:
1732: The vectors~$ \adfg{0} \dots \adfg{n-2}$ are written in coordinates
1733: as~$1\times n$ rows. The first matrix is~$(n-1)\times n$. Moreover it is
1734: required that
1735: \begin{equation}
1736: \label{eq:1020}
1737: \biglie{\adfg{n-1}}{\lambda}
1738: \end{equation} is nonzero.
1739:
1740: We will use the algorithm for SFB deterministic linearization (see
Section~\ref{sec:detcase}) to find such a transformation~$\lambda$. Then we will
1742: verify if the conditions for linearity of the dispersion part of the
1743: system~\eqref{eq:14} are also valid. There are~$n$ additional linearity
1744: conditions ($s_i$ are constants):
1745:
1746: \begin{align}
1747: \label{eq:1001}
1748: \left[\,\,\begin{matrix}
1749: \ad{f}{0}{\sigma}\\
1750: \ad{f}{1}{\sigma}\\
1751: \vdots\\
1752: \ad{f}{n-1}{\sigma}\\
1753: \end{matrix}\,\,\right]
1754: \quad \left[\,\,\begin{matrix}
1755: \parby{\lambda }{x_1}\\
1756: \parby{\lambda }{x_2}\\
1757: \vdots\\
1758: \parby{\lambda }{x_n}\\
1759: \end{matrix}\,\,\right]=
1760: \left[\,\,\begin{matrix}
1761: s_1\\
1762: s_2\\
1763: \vdots\\
1764: s_n\\
1765: \end{matrix}\,\,\right]
1766: .\end{align}
1767:
In the deterministic case we were satisfied with an {\em arbitrary\/}
solution~$\lambda $ to the equations~\eqref{eq:189}
and~\eqref{eq:1020}. In this stochastic case we must find the class
1771: of {\em all\/} solutions and then check if this class contains the
1772: solution for the~$\sigma$ part~\eqref{eq:1001}. Details depend on the
1773: methods used for solving the set of PDEs.
1774:
1775: This result is summarized in the following
1776: algorithm:
1777:
1778: \begin{itemize}
\item{Find the distributions $\Delta_k \define \sspan\left\{\adfg{i},\ 0\le i \le k-1\right\}$ for $k=n-1$ and $k=n$.}
1780: \item{Verify that $\dim(\Delta_{n})$ is $n$.}
1781: \item{Verify that $\Delta_{n-1}$ is
1782: involutive (see \citet{nijmeijer94} Remark following Definition 2.39)
1783: otherwise no linearizing
1784: transformation exists.}
\item{Find all~$\lambda$ satisfying~\eqref{eq:189} and~\eqref{eq:1020} by solving
PDEs~\eqref{eq:192}; denote by~$C$ the set of all
such functions.}
1788: \item{Verify that there is a~$\lambda_1\in
1789: C$ such that the conditions~\eqref{eq:1001} are
1790: satisfied, otherwise no linearizing
1791: transformation exists.}
1792: \item{Compute $T$,$\alpha $,$\beta $ from
1793: \eqref{eq:160} -- \eqref{eq:163}.}
1794: \end{itemize}
1795:
1796: Now, we can illustrate one possible practical approach which
1797: worked for several simple problems solved by us (see the example in
1798: Section~\ref{sub:appcrane}).
1799:
1800: First we can compute the kernel of the matrix~$M_g$ to find the
1801: form~$\omega = \left[ \omega_1, \omega_2, \dots, \omega_n
1802: \right]^T$ which satisfies~$M_g \omega = 0$, \ie~$\omega$ is
1803: perpendicular to~$M_g$. In modern computer algebra systems there is a
1804: single command for this.
1805:
1806: Proposition~\ref{prop:s1sfb1} assumes that~$n$
1807: vectorfields~$\Delta_{n} \define \distrofg{n-1}$ form an~$n$
1808: dimensional space. The vectorfields~$\Delta_{n-1} \define
1809: \distrofg{n-2}$ are chosen from them and consequently must form
1810: an~$(n-1)$-dimensional space. Thus their kernel~$d\lambda $ is
1811: exactly one dimensional and arbitrary~$\omega' = c(x)\omega(x)$ also
1812: belongs to the kernel ($c(x)$ is a scalar).
1813:
1814: But not every~$\omega'$ that is perpendicular to~$M_g$ is a
1815: solution to the original linearization problem. The
1816: function~$\omega'$ must be an exact one-form \ie there must be
1817: a scalar function~$\lambda $ such that~$d \lambda =
1818: c(x)\omega(x)$. The Frobenius theorem guarantees that
1819: if~$\Delta_{n-1}$ is involutive, then there is always~$c(x)\in\RR$
1820: such that~$c(x)\omega(x)$ is the exact one-form.
1821:
A necessary condition for a one-form~$\omega =
\ssumi{n} \omega_i \, dx_i$ to be exact is
1824: \begin{equation}
1825: \label{eq:102}
1826: \parby{\omega_i}{x_j} = \parby{\omega_j}{x_i} \qquad \text{for}
1827: \qquad 1 \le i,j \le n
1828: .\end{equation}
1829:
1830: Hence for every~$1\le i,j \le
1831: n$
1832: \begin{alignat}{3}
1833: \parby{}{x_j}\left(c(x)\omega_i \right) &=
1834: \parby{}{x_i}\left(c(x)\omega_j \right),\end{alignat} thus for
1835: every~$1\le i,j \le n$
1836: \begin{alignat}{3}
1837: \label{eq:192}
1838: \parby{c(x)}{x_i}\omega_j - \parby{c(x)}{x_j}\omega_i + c(x)
1839: \left( \parby{\omega_j}{x_i} - \parby{\omega_i}{x_j} \right) = 0
.\end{alignat} The latter condition is a set of linear PDEs, with
unknown~$c(x)$, which are guaranteed to have a solution by the
involutiveness of~$\Delta_{n-1}$ (the Frobenius theorem).
1843:
1844: In our computations the equation~\eqref{eq:192} was in a simple form
which allowed us to determine all the solutions easily. More complicated
1846: cases will require more sophisticated analysis.
1847:
1848:
1849:
1850: %======== Subsection ================================================
1851: \subsection{\Ito $g\sigma$-linearization}
1852: \label{sub:isgsigma}
1853:
1854:
1855: In the previous subsection we tried to find~$g\sigma$-linearizations
1856: for Stratonovich dynamical systems. Once this is done, the
1857: correcting mapping can be used to
1858: construct \Ito $g\sigma$-linearizing
1859: transformation. This method works for both the
1860: SFB and the
1861: SCT case.
1862:
1863: Given an \Ito system~$\Theta_I$, the corresponding
1864: Stratonovich system $\Theta_S$ can be
1865: obtained using the correcting mapping
1866: $\Theta_S = \Corr{\sigma}\left({\Theta_I}\right)$. Afterward, the Stratonovich
1867: $g\sigma$-linearization algorithm can be applied giving a
1868: linear system~$\Theta_{2S}$. Due to linearity of the
dispersion
1870: vectorfield~$\tilde \sigma$ of~$\Theta_{2S}$, the
1871: correcting term~$\corr{{\tilde \sigma}}{z}$ of
1872: the backward transformation~${\Corr{{\tilde \sigma}}{}}^{-1}$
1873: vanishes.
1874:
1875:
1876: \begin{theo} \label{prop:gsigmaprop}
1877: The SFB
1878: $g\sigma$-linearizing
1879: transformation~$\combinedz_I$ of the~\Ito dynamical system \isdefmi,
1880: $f(\origi{x})=0$, $\corr{\sigma}{\origi{x}}=0$, into a $g\sigma$-controllable linear
1881: system exists if and
1882: only if there is a SFB
1883: $g\sigma$-linearizing
1884: transformation~$\combinedz_S$ of the Stratonovich dynamical
1885: system
1886:
1887: \begin{align}
1888: \label{eq:24}
1889: \Theta_S &= \ssys{\alterbar f}{g}{\sigma}{x} =
1890: \Corr{\sigma}{(\Theta_I)}\\
1891: \alterbar f &= f + \corr{\sigma}{x}
1892: .\end{align}
1893: Moreover~$\combinedz_I = \combinedz_S \compose \Corr{\sigma}{}$.
1894:
1895: \end{theo}
1896: \begin{proof}[Proof (sufficiency)]
1897: We use the properties of the correcting term
1898: (Subsection \ref{sub:corr}). Assume that there is a
mapping~$\combinedz_S$ which transforms $\Theta_S$ into a linear
$g$-controllable system $(Ax,B,S,U,0)$. By~(\ref{eq:19})
1901: \begin{align}
1902: \label{eq:248}
1903: \combinedz_I = \Corr{{\tilde\sigma}}{}^{-1} \compose \combinedz_S
1904: \compose \Corr{\sigma}{}
1905: .\end{align}
1906: The backward correcting
1907: transformation $\Corr{{\tilde \sigma}}^{-1}$ is identity because the correcting term
1908: of a linear mapping $\corr{{\tilde \sigma}}{x}$ is zero. Thus~$
1909: \combinedz_I = \combinedz_S \compose \Corr{\sigma}{} $
and~$\combinedz_I (\Theta_{I})$ equals $(Ax,B,S,U,0)$, which is
1911: linear and~$g$-controllable by assumption.
1912: \end{proof}
1913: \begin{proof}[Proof (necessity)]
1914: Assume that there is the \Ito transformation~$\combinedz_I$ which
1915: linearizes $\Theta_I$ and by~(\ref{eq:24}) $\Theta_I =
1916: {\Corr{\sigma}{}}^{-1}(\Theta_S)$. Construct Stratonovich
1917: linearization by~$\combinedz_S = \combinedz_I \compose
1918: {\Corr{\sigma}{}}^{-1} $. Hence~$\combinedz_I$ linearizes
1919: ${\Corr{\sigma}{}}^{-1}(\Theta_S)$ and~$\combinedz_S$
1920: linearizes~$\Theta_S$ into the same linear and controllable system
1921: as~$\combinedz_I$.
1922: \end{proof}
1923:
1924:
1925:
1926: %======== Subsection ================================================
1927: \subsection{\Ito~$g$-linearization}
1928: \label{sub:sfbig}
1929:
The \Ito $g$-linearization problem is probably the most complicated
variant of exact linearization studied in this paper. The drift
vectorfield of an \Ito dynamical system transformed by a coordinate
transformation~$\sctt$ consists of two terms: the transformed
vectorfield~$\tantra{T} f$ and the \Ito term~$\ito{\sigma}$. We
require that the sum of these terms is linear, thus the
nonlinearity of the drift~$\tantra{T}f$ must compensate for the \Ito
term. Since the \Ito term acts on~$T$ as a second order
differential operator, this problem generates a set of second order
1939: partial differential equations. One can attempt to use simplifications
1940: as in the deterministic linearization, namely, the recursive Leibniz
1941: rule~\eqref{eq:10}. Unfortunately, this approach does not work for the
1942: stochastic case. In general, the \Ito equations cannot be easily
1943: simplified by commutators because the commutator of second order
1944: operators is not a second order operator but a third order operator
1945: (see Subsection~\ref{sub:stoinvar}).
1946:
1947: Nevertheless, there are special cases for which simpler conditions
1948: can be found. The most important special case (commuting $g$
1949: and $\sigma$) will be studied here.
1950:
1951: \subsubsection{Canonical Form ---$n$ unknowns}
1952:
1953: The canonical form for the $g$-linearization
is the integrator chain with a nonlinear dispersion
1955: \begin{align}
1956: \label{eq:1007}
1957: \tilde f_i(x) &= x_{i+1} \firstfor 1\le i\le n-1\\
1958: \label{eq:1008}
1959: \tilde f_n(x) &= 0\\
1960: \label{eq:1009}
1961: \tilde g_i(x) &= 0 \firstfor 1\le i\le n-1\\
1962: \label{eq:1010}
1963: \tilde g_n(x) &= 1
1964: .\end{align}
1965: Assume that there is a~$g$-linear
1966: system~$\Theta_I = (Ax,B,\sigma(x),U,\origi{x})$. Then the drift part
1967: of~$\Theta_I$ can be transformed by a {\em linear} transformation into
1968: the integrator chain. This is because the \Ito term of a linear
1969: transformation vanishes.
1970:
1971: The equations which define~$T$ can be obtained by comparing this
1972: canonical form with the equations of~$\tilde \Theta$.
1973:
1974: \begin{prop} \label{prop:s1sfb2}
1975: Let~\isdef be an \Ito dynamical system with~$f(\origi{x})=0$ such
1976: that~$\corr{\sigma}{\origi{x}}=0$. There is a SFB~$g$-linearizing
1977: transformation~$\combinedtab$ of the system~$\Theta_{I}$ into a
1978: ~$g$-controllable linear system if and only if there is a solution
1979: $T_i\RntoR$, $1\le i \le n$, to the set of partial differential
1980: equations defined on~$U$:
1981: \begin{alignat}{3}
1982: \label{eq:50}
1983: T_{i+1}&=\lie{f}{T_i}+\ito{\sigma}{T_i} \firstfor 1\le i\le{n-1}\\
1984: \label{eq:51}
1985: \lie{g}{T_i}&=0 \nextfor 1\le i\le{n-1}\\
1986: \label{eq:52}
1987: \lie{g}{T_n}&\not=0 .\end{alignat} The symbol~$\ito{\sigma}$
1988: denotes the \Ito operator (see Definition~\ref{eq:16}). The
1989: feedback can be constructed as:
1990: \begin{align}
1991: \label{eq:53}
1992: \alpha &=-\frac{(\lie{f}{T_n}+\ito{\sigma}{T_n})}{\lie{g}{}T_n}
1993: \qquad\qquad \beta =\frac{1}{\lie{g}{T_n}}
1994: .\end{align}
1995: \end{prop}
1996: \begin{proof}
1997:
1998: The~$i$-th components
of~$\tilde f$, $\tilde g$, and~$\tilde \sigma$ are:~$\tilde f_i =
2000: \lie{f}{T_i} + \ito{\sigma}{T_i}$, $\tilde g_i =
2001: \lie{g}{T_i}$, $\tilde \sigma_i =
2002: \lie{\sigma}{T_i}$.
2003: The partial differential equations \eqref{eq:50}, \eqref{eq:51}
2004: and \eqref{eq:52} are obtained by comparison of \eqref{eq:86}-\eqref{eq:89}
2005: with the equations~\eqref{eq:1007}-\eqref{eq:1010}.
2006: \end{proof}
2007: \subsubsection{PDEs of single unknown}
2008:
2009: One can attempt to reduce the equations~\eqref{eq:50},
2010: \eqref{eq:51}, and~\eqref{eq:52}, to a set of equations of a
2011: single unknown, similarly to the results of Proposition \ref{prop:d1sfb1}.
2012:
2013: \begin{coroll}
2014: \label{prop:sfbooo} Define the general second order
2015: operator~$O(f,F)$ as in~\eqref{eq:17}. The exponential notation
2016: for~$O$ will be defined recursively: $O^0(f,F)T \define T$ and
2017: $O^{l+1}(f,F)T \define O(f,F)O^l(f,F)T$ for~$l \ge 0$. Next, define
2018: \begin{align} F_{ij} \define \frahalf \sigma_i \sigma_j .
2019: \end{align} Then the set of partial differential equations~\eqref{eq:50}-\eqref{eq:52} of~$n$ unknowns has a
2020: solution if and only if there is a
2021: solution~$\lambda \RntoR$ defined on~$U$ to the set of
2022: PDEs of single unknown:
2023: \begin{alignat}{3} \label{eq:153}
2024: O(g,0)O^i(f,F)\lambda &=0\firstfor 0\le i\le n-2\\
2025: \label{eq:154} O(g,0)O^{n-1}(f,F)\lambda &\ne 0 . \end{alignat}
2026: The original solution and the feedback
2027: can be found as \begin{alignat}{3}
2028: T_i&=O^{i-1}(f,F)\lambda \firstfor 1 \le i \le n\\
2029: \label{eq:58} \alpha &= -
\frac{O^{n}(f,F)\lambda }{O(g,0)O^{n-1}(f,F)\lambda } \quad\quad \beta =
\frac{1}{O(g,0)O^{n-1}(f,F)\lambda } . \end{alignat}
2032: \end{coroll}
2033: \begin{proof}
2034: Since~$T_1=\lambda $ and by definition
2035: of~$\ito{\sigma}{}$ \eqref{eq:16} and~$O$~\eqref{eq:17}:
2036: \begin{alignat}3
2037: \label{eq:264}
2038: O(f,F)T_i &= \lie{f}{T_i} + \ito{\sigma}{T_i} \firstfor 1\le i\le n\\
2039: \label{eq:265}
2040: O(g,0)T_i &=\lie{g}{T_i} \nextfor 1\le i\le n ;
2041: \end{alignat} then~$T_{i+1} = O(f,F)T_i$ by~\eqref{eq:50} and
2042: $T_i = O^{i-1}(f,F)T_1 = O^{i-1}(f,F)\lambda $. Similarly
the equation \eqref{eq:53} implies~\eqref{eq:58}.
2044: \end{proof}
2045:
Note that for the deterministic case~$\sigma=0$, the
2047: operators~$O(g,0)$ and~$O(g,0)O^i(f,F)$ degenerate
2048: to~$\lie{g}{}$ and to~$\lie{g}{}\multilie{f}{i}{}$ respectively,
2049: thus the result is the same as that of Proposition~\ref{prop:d1sfb1}.
2050:
2051: In general, the equations of the system are of an order up to~$2n$ and
2052: cannot be reduced to a lower order. The
2053: commutator of two second order operators is of third
2054: order as was pointed out by~\eqref{eq:60}. In particular, for~$i=1$ we
2055: have to evaluate~$C(g,0,f,F) \definer O(a,A)$, which {\em is\/} of
2056: second order due to the fact that~$G=0$. But starting from~$i=2$ the
2057: commutator~$C(f,F,a,A) = C(f,F,C(g,0,f,F))$ is of
2058: third order.
2059:
2060: \subsubsection{Correcting Term}
2061:
2062: The same problem can be reformulated using conversion to the
2063: Stratonovich formalism. One can compute the drift vectorfield~$\alterbar f$
2064: of the equivalent Stratonovich system by applying the
2065: correcting term~$\alterbar f \define f +
2066: \corr{\sigma}{x}$. Then the Stratonovich system~$\ssys{\alterbar
2067: f}{g}{\sigma}{x}$ may be transformed, by a suitable transformation,
2068: to such a form~$(\tilde f,\tilde g,\tilde \sigma,T(U),0)$ that after
2069: applying the backward correcting
2070: term~$-\corr{{\tilde \sigma}}{z}$ the resulting \Ito system will be
2071: linear.
2072:
2073: Compare this formulation with the~$g\sigma$-linearization where the
2074: backward correcting term vanished due to
2075: linearity of~$\tilde \sigma$. This does not happen with
2076: the~$g$-linearization, and the backward correcting term is a part of the equations.
2077:
2078: In general, it may be difficult to solve these equations. Nevertheless
2079: there are special cases when the solution can be obtained. See for example
Section~\ref{sub:appcrane}. Another important case (commuting $g$
and~$\sigma$) is studied below.
2082:
2083: \begin{coroll} \label{prop:s1sfb3}
2084: The equations of Proposition~\ref{prop:s1sfb2} are equivalent to~$n$
2085: partial differential equations:
2086: \begin{alignat}3
2087: \label{eq:143}
2088: T_{i+1}&=\lie{\alterbar f}{T_i} -\corr{{\alterbar \sigma}}{z}=\\
2089: &\lie{\alterbar f}{T_i} + \frahalf \lie{\sigma}{\lie{\sigma}{T_i}} \firstfor 1 \le i \le{n-1}\\
2090: \label{eq:144}
2091: \lie{g}{T_i}&=0\nextfor 1 \le i \le{n-1}\\
2092: \label{eq:145}
2093: \lie{g}{T_n}&\not=0 .\end{alignat} Then the
2094: feedback can be constructed as
2095: \begin{align}
2096: \alpha &=-\frac{\lie{\alterbar f}{T_n} + \frahalf
2097: \lie{\sigma}{\lie{\sigma}{T_n}}}{\lie{g}{T_n}} \qquad\qquad
2098: \beta =\frac{1}{\lie{g}{T_n}} .\end{align} Where $\alterbar f
2099: \define f + \corr{\sigma}{x}$.
2100: \end{coroll}
2101: \begin{proof}
2102: The equations~\eqref{eq:143} can be obtained
2103: from~\eqref{eq:50} by applying~\eqref{eq:215}
2104: and~\eqref{eq:140}:
2105: \begin{multline}
2106: \label{eq:216}
2107: T_{i+1} = \lie{f}{T_i}+\ito{\sigma}{T_i} = \lie{\left(
2108: \alterbar f - \corr{{\alterbar \sigma}}{x} \right)}{T_i}+
2109: \ito{\sigma}{T_i} = \\
2110: \lie{\alterbar f}{T_i} - \lie{\corr{{\alterbar
2111: \sigma}}{x}}{T_i} + \ito{\sigma}{T_i} = \lie{\alterbar
2112: f}{T_i} + \frahalf\lie{\sigma}{\lie{\sigma}{T_i}}
2113: .\end{multline}
2114:
2115: The other equations are adopted from Proposition~\ref{prop:s1sfb2}.
2116: The set of PDEs of~$n$ unknowns can be transformed into a set
2117: of PDEs of a single unknown~$\lambda =T_1$, but
2118: the order of the equation will be~$2n-1$.
2119: \end{proof}
2120:
2121: \begin{rem} \label{prop:s1sfb4}
2122: Observe that the set of~$n$ second order partial differential
equations~\eqref{eq:143}--\eqref{eq:145} defined in
Corollary~\ref{prop:s1sfb3} can be transformed, by introducing
2125: new variables~$S_i = \lie{\sigma}{T_i}$, to the following system
2126: of~$2n-1$ first order partial differential equations for~$1 \le i
2127: \le {n-1}$:
2128: \begin{alignat}3
2129: \label{eq:146}
2130: \lie{g}{T_i}&=0\\
2131: \label{eq:147}
2132: \lie{\sigma}{T_i}-S_i&=0\\
2133: \label{eq:148}
2134: \lie{{\alterbar f}}{T_i} + \frahalf\lie{\sigma}{S_i}&=T_{i+1}\\
2135: \label{eq:149}
2136: \lie{g}{T_n}&\not=0 .\end{alignat} $T_i$
2137: and~$S_i\RntoR$ are unknown real valued functions defined on $U$.
2138: \end{rem}
2139:
2140: \subsubsection{Systems with Commuting $g$ and $\sigma$}
2141: There is a special case of \Ito dynamical systems for which the
2142: solution is completely known and can be computed using
2143: only first order PDEs.
2144:
2145: \begin{theo}
2146: \label{prop:ssfbco}
2147: Let~\isdef be a SISO \Ito dynamical system. If the
2148: vectorfield~$\sigma$ commutes with all vectorfields~$\ad{{\alterbar
2149: f}}{i}{g}$ for~$0\le i\le n-1$, \ie ~$[\ad{{\alterbar
2150: f}}{i}{g},\sigma]=0$, where $\alterbar f
2151: \define f + \corr{\sigma}{x}$, then the \Ito system is $g$-linearizable if and
2152: only if the distribution
2153: \begin{align}
2154: \alterbar \Delta_{n} \define
2155: \sspan\left\{{\ad{{\alterbar f}} {i}{g}, \iva{n-1}}\right\}
2156: \end{align}
2157: is
2158: nonsingular on~$U$ and the distribution
2159: \begin{align}
2160: \alterbar \Delta_{n-1}
2161: \define \sspan\left\{{\ad{{\alterbar f}}{i}{g}, \iva{n-2}}\right\}
2162: \end{align}
is involutive on~$U$. If these conditions hold, then there exists a
solution~$\lambda \RntoR$ to the set of partial differential
equations
\begin{align}
\label{eq:77}
\biglie{\ad{{\alterbar f}}{i}{g}}{\lambda }&=0\rfor{\iva{n-2}}\\
\label{eq:78}
\biglie{\ad{{\alterbar f}}{{n-1}}{g}}{\lambda }&\not=0 ,\end{align}
and the linearizing transformation is given by:
2172: \begin{alignat}3
2173: \label{eq:79}
2174: T_1&=\lambda \\
2175: \label{eq:80}
2176: T_{i+1}&= \lie{\alterbar f}{T_i} + \frahalf
2177: \lie{\sigma}{\lie{\sigma}{T_i}} \firstfor 1
2178: \le i \le{n-1}\\
2179: \alpha &=\frac{-\multilie{\alterbar f}{{n}}\lambda
2180: }{\lie{g}{}\multilie{\alterbar f}{{n-1}}\lambda } &\qquad\qquad&
2181: \label{eq:81}
2182: \beta =\frac{1}{\lie{g}{}\multilie{\alterbar f}{{n-1}}\lambda }
2183: .\end{alignat}
2184: \end{theo}
2185: \begin{proof}
We will apply the Leibniz rule to the relation~\eqref{eq:143} of
Corollary~\ref{prop:s1sfb3} to expand the
term~$\lie{g}{T_{i+1}}$ for~$1\le i\le n-1$
2189: \begin{multline}
2190: \label{eq:195}
2191: \lie{g}{T_{i+1}} = \lie{g}{ \left( \lie{{\alterbar f}}{T_i}+
2192: \frahalf \lie{\sigma}{\lie{\sigma}{T_i}} \right) } =
2193: \lie{g}{\lie{{\alterbar f}}{T_i}} + \frahalf
2194: \lie{g}{\lie{\sigma}{\lie{\sigma}{T_i}}}
2195: =\\
2196: \lie{{\alterbar f}}{\lie{g}{T_i}} - \lie{[\alterbar f,g]}{T_i}
2197: + \frahalf \lie{\sigma}{\lie{g}{\left(\lie{\sigma}{T_i}\right)}}
2198: - \frahalf \lie{[\sigma,g]}{\left(\lie{\sigma}{T_i}\right)}
2199: =\\
2200: 0 - \lie{[\alterbar f,g]}{T_i} + \frahalf \lie{\sigma}{ \left(
2201: \lie{\sigma}{\lie{g}{T_i}} - \lie{[\sigma,g]}{T_i} \right)
2202: } - \frahalf \left( \lie{\sigma}{\lie{[\sigma,g]}{T_i}} -
2203: \lie{[\sigma,[\sigma,g]]}{T_i} \right)
2204: =\\
2205: -\lie{[\alterbar f,g]}{T_i} + 0 - \frahalf
2206: \lie{\sigma}{\lie{[\sigma,g]}{T_i}} + \frahalf
2207: \lie{[\sigma,[\sigma,g]]}{T_i} .\end{multline} If the
2208: vectorfields~$g$ and~$\sigma$ commute, then the second and
2209: third terms vanish. If, moreover, $[\sigma,[\alterbar f,g]] = 0$ then
2210: \begin{alignat}{3}
2211: \label{eq:257}
2212: \lie{g}{{T_{i+2}}} &= - \lie{{[\alterbar f,g]}}{ \left(
2213: \lie{{\alterbar f}}{T_i} + \frahalf
2214: \lie{\sigma}{\lie{\sigma}{T_i}} \right)} = \lie{{[\alterbar
2215: f,[\alterbar f,g]]}}{T_i} .\end{alignat} In general
2216: if~$[\sigma,\ad{{\alterbar f}}{i}{g}]=0$ for~$0\le i\le n-1$ then
2217: \begin{alignat}{3}
2218: \label{eq:258}
\lie{g}{T_{k+1}} &= (-1)^k \lie{\ad{{\alterbar f}}{k}{g}}{T_1}
2220: .\end{alignat}
2221:
2222: Thus the equations~\eqref{eq:143} and \eqref{eq:144} will be
2223: equivalent to
2224: \begin{alignat}{3}
2225: \label{eq:193}
2226: \biglie{\ad{{\alterbar f}}{i}{g}}{\lambda }&=0\firstfor{\iva{n-2}}\\
2227: \label{eq:194}
2228: \biglie{\ad{{\alterbar f}}{{n-1}}{g}}{\lambda }&\not=0
,\end{alignat} which are of the same form as the equations of
Proposition~\ref{prop:d1sfb1}; consequently, the conditions
from Proposition~\ref{prop:d1sfb2} can be used.
2232: \end{proof}
2233:
2234:
2235:
2236: %======== Subsection ================================================
2237: \subsection{\Ito and Stratonovich $\sigma$-linearization}
2238: \label{sub:sfbchsigma}
2239:
2240:
2241: The stochastic SFB $\sigma$-linearization problem is similar to
2242: deterministic SCT linearization.
2243: The dispersion
2244: vectorfield~$\sigma$ transforms in the same way as deterministic
2245: drift vectorfields do. Consequently, no \Ito term
2246: complicates the transformation. Moreover, the \Ito and
2247: Stratonovich cases are equivalent.
2248:
2249: On the other hand, in the SFB $\sigma$-linearization we are free to
2250: choose the feedback~$\feedbackab$ that perturbs the
2251: drift
2252: vectorfield~$f$ into~$\tilde f = f + g \alpha $.
2253:
2254: \psfig{fig:sigmasfb}{Ito and Stratonovich
2255: $\sigma$-linearization}{sigmasfb}
2256: \begin{prop} \label{prop:sfsigma}
2257: Let~$\Theta$ be a SISO stochastic
2258: system~$\Theta = \ssysfgx$. There is a
2259: SFB $\sigma$-linearizing
2260: transformation~$\combinedtab$ into a $\sigma$-controllable linear
2261: system if and only if there is a smooth
2262: feedback function~$\alpha \RntoR$ such that the
2263: deterministic system~$\dsys{f+g\alpha }{\sigma}{x}$ has a
2264: SCT
2265: linearizing
transformation~$\sctt$. Equivalently, there must be
an~$\alpha $ such that the modified odd bracket condition
2268: \begin{equation}
2269: \label{eq:59}
[\sigma,\ad{f+g \alpha }{l}{\sigma}]=0 \qquad\text{for}\qquad l = 1,3,\dots,2n-1
2271: \end{equation}
is satisfied (see~\eqref{eq:45}). The resulting combined
transformation is the composition of the coordinate transformation~$\sctt$ and the
feedback~$\feedbackab$, where~$\beta $ is an arbitrary
function of~$x$; for instance,~$\beta = 1$.
2276: \end{prop}
2277: \begin{proof}
Compare the definition of linearity of a deterministic system with
the definition of
$\sigma$-linearity. The system is $\sigma$-linearizable if and only if the
deterministic system~$\dsys{f+g\alpha }{\sigma}{x}$ is
SCT linearizable (see Corollary~\ref{prop:s1ctt2a}).
2283:
It is evident that the function~$\beta $ (see
Figure~\ref{fig:sigmasfb}) has no effect on the dispersion part and
can be chosen arbitrarily. (It should be nonzero, however, for otherwise the system would
be $g$-uncontrollable.)
2288: \end{proof}
2289:
2290:
2291: The condition~\eqref{eq:59} can be expressed in terms of
2292: derivatives of $\alpha $ using bracket
2293: relations known from differential geometry. For example, for~$l=1$:
\begin{align}
\label{eq:156}
[\sigma,[f+g \alpha ,\sigma ]] &= [\sigma, [f,\sigma ]+[g \alpha
,\sigma ]] = [\sigma,[f,\sigma ]]+[\sigma,[g \alpha ,\sigma ]]\\
&=[\sigma,[f,\sigma ]] + \alpha [\sigma,[g,\sigma ]]
+ 2 \left(\lie{\sigma}{\alpha }\right) [g,\sigma ]
- g \lie{\sigma}{\lie{\sigma}{\alpha }}
.\end{align}
The other conditions for~$l=3,5,7,\dots$ can be expressed in a similar
way, for example by a computer using symbolic algebra tools, giving
a set of~$n$ partial
differential equations of order up to~$2n$. The
problem is not very interesting from the practical point of view.
2305:
2306:
%======== Section ===================================================
2308: \section{Example---Crane}
2309: \label{sub:appcrane}
2310:
2311:
In this section the methods of stochastic exact linearization are
demonstrated on an example---control of a crane under
the influence of random disturbances. The description of the plant was
adopted from~\citet{ackermann93}, where the model of a crane linearized
by approximate methods was studied. Unlike Ackermann, we control the
same system using the exact model. Moreover, the influence of random
disturbances is added. \psfig{fig:crane1}{Crane}{crane1} Consider the
crane of Figure~\ref{fig:crane1}, which can be used, for example, for
loading containers into a ship. The hook must
be automatically placed at a given position.
Feedback control is needed in order to dampen
the motion before the hook is lowered into the ship. The input signal
is the force~$u$ that accelerates the crab. The crab mass is~$m_C$,
the mass of the load is~$m_L$, the rope length is~$l$, and the
gravitational acceleration is~$g$.
2327:
2328: We assume that the driving motor has no nonlinearities, there is no
2329: friction or slip, no elasticity of the rope and no damping
2330: of the pendulum (\eg from air drag). We will define four state
variables: the rope angle~$x_1$ (in radians), the angular velocity~$x_2
2332: = \dot x_1$, the position of the crab~$x_3$, and the velocity of
2333: the crab~$x_4 = \dot x_3$. As shown in~\citez{ackermann93}, the
2334: plant is described by two second order differential equations:
2335: \begin{align}
2336: \label{eq:72}
2337: u &= (m_L + m_C) \ddot x_3 + m_L l ( \ddot x_1 \cos x_1 - \dot x_1^2
2338: \sin
2339: x_1) \\
2340: \label{eq:73}
2341: 0 &=m_L \ddot x_3 \cos x_1 + m_L l \ddot x_1 + m_L g \sin x_1
2342: .\end{align}
Additionally, we assume that the load is under the influence of a random
disturbance, which can be modeled as a white noise
process. The disturbance (wind) is horizontal, has zero mean, and
can be described by the \Ito differential~$dw$:
2347: \begin{align}
2348: \label{eq:74}
2349: dx_2 = \frac{F \cos x_1}{m_L l}\,dw,\end{align} where~$F$ is a
2350: constant having the physical unit of force.
2351:
We used the symbolic algebra system \Mathematica to handle the
computations. The complete \Mathematica worksheet can be downloaded
from the web page of the author, \hyref{http://www.tenzor.cz/sladecek}.
2355:
2356: \Mathematica was used to solve the equations of the system for
2357: unknown values~$\dot x_2$ and~$\dot x_4$ (angular and
2358: positional acceleration). Values of vectorfields~$f$, $g$, and
2359: $\sigma$ were derived as follows:
2360:
\begin{align}
\label{eq:76}
f &= \left[ x_2, -\frac{\sin x_1 \left( g (m_L+m_C) + l m_L x_2^2 \cos
x_1 \right) }
{l (m_C + m_L - m_L \cos^2 x_1) }, x_4,
\frac{m_L \sin x_1 \left( g \cos x_1 + l x_2^2 \right) }
{m_C + m_L - m_L \cos^2 x_1 }\right]^T\\
g &= \left[ 0, -\frac{\cos x_1 }
{l (m_C + m_L - m_L \cos^2 x_1) }, 0,
\frac{1}{m_C + m_L - m_L \cos^2 x_1 }\right]^T\\
\sigma &= \left[0, \frac{F \cos x_1}{m_L l},0,0 \right]^T
.\end{align}
2370:
2371:
2372: The state space model is shown in Figure~\ref{fig:crane2}. We can see
2373: that the positional state variables~$x_3$ and~$x_4$ are isolated from
the angular state variables~$x_1$ and~$x_2$. In what follows, we
concentrate on the angular variables, assuming that the load is to be
stabilized no matter where the crane is. Consequently, we obtain only
a two-dimensional system on which the exact linearization techniques can
2378: be demonstrated. \psfig{fig:crane2}{The State Space Model of
2379: Crane}{crane2}
2380:
2381: Next, consider the random disturbances. Because the
2382: correcting term~$\corr{\sigma}{x}$ is zero,
2383: there is no difference in using either the
2384: \Ito or the Stratonovich integral. In case of more ``nonlinear'' noise, one of
2385: the integrals must be selected. If the \Ito model is chosen,
2386: Theorem~\ref{prop:gsigmaprop} must be applied.
2387:
2388: Now we evaluate the conditions of Proposition~\ref{prop:s1sfb1}
2389: to check that the system is linearizable. In fact, we must only
2390: evaluate the non-singularity condition because every one-dimensional
2391: distribution is involutive, and the
integrability is satisfied automatically. To this
end, we will compute the null space (kernel) of the
matrix~$[[f,g],g]$, which is trivial, and therefore the matrix is
nonsingular. We conclude that the {\em deterministic\/}
SFB problem is solvable.
2397:
Notice that the system is already in the integrator chain form and
2399: hence~$\lambda = x_1$ satisfies this condition. Therefore, the
2400: {\em deterministic\/} system is linearizable by feedback only, with no
2401: state space transformation at all, \ie $z=T(x)=x$.
2402:
2403: This choice of the output function~$\lambda $ is natural but does
2404: not cancel the nonlinearity in the dispersion coefficient~$\sigma$.
2405: For this purpose, we must use the algorithm of Section~\ref{prop:cftdp} to construct
2406: another nontrivial coordinate transformation~$T$.
2407:
2408: To obtain this transformation, we must find the space of all
2409: functions~$\lambda $ satisfying conditions for
2410: feedback linearity~\eqref{eq:7}. Observe
2411: that~$\lie{g}{\lambda }$ must be zero hence
2412: \begin{align}
2413: \label{eq:75}
2414: \parby{\lambda }{x_1} g_1 + \parby{\lambda }{x_2} g_2 &= 0
2415: .\end{align}
2416:
Since~$g_1=0$ and~$g_2 \ne 0$ in a
neighborhood of~$x_0$, we have
$\parby{\lambda }{x_2} = 0$ and $\lambda = c_1(x_1)$ is a
function of~$x_1$ only (\ie without~$x_2$). The coordinate transformation is $T =
\left[\lambda ,\lie{f}{\lambda } \right]^T$. We want to select
$c_1(x_1)$ such that the dispersion
2423: vectorfield~$\tilde \sigma \define \tantra{T}\sigma$ in the new
2424: coordinate system~$z=T(x)$ will be constant:
2425: \begin{align}
2426: \label{eq:70}
2427: \parby{c_1(x_1)}{x_1} \frac{F \cos x_1}{m_L l} = \text{constant}
2428: .\end{align}
2429:
2430: We decided to define the constant as~${F}/{(m_L l)}$, therefore
2431: \begin{align}
2432: \label{eq:221}
2433: \parby{c_1}{x_1} &= \frac{1}{\cos x_1}
2434: \end{align}
2435: and
2436: \begin{multline}
2437: \label{eq:71}
2438: T_1 = \lambda = c_1(x_1) = \int \frac{1}{\cos x_1} \, d x_1 =\\
2439: -\ln \left( \cos \frahalf{x_1} - \sin \frahalf{x_1} \right) +\ln
2440: \left( \cos \frahalf{x_1} + \sin \frahalf{x_1} \right)
2441: .\end{multline}
2442: \begin{align}
2443: \label{eq:222}
2444: T_2 = \lie{f}{\lambda } &= x_2 \sec x_1
2445: .\end{align}
2446:
Finally, we can compute the feedback from~\eqref{eq:28}. In the
\Mathematica worksheet we validate the results by computing~$\tilde \Theta
= \combinedtab \ssysfgx $. The computation showed that the
system~$\ssys{\hat f}{\hat g}{\hat \sigma}{x}$ is in the integrator
chain form in the~$z$ coordinate chart.
2452:
2453:
\begin{multline}
b=\frac{1}{l \left( m_C + m_L \left( \sin (x_1) \right)^2 \right)}\\
a=\tan ({x_1}) \left( \sec (x_1)\,x_2^2 -
b\,g\, ( m_C + m_L ) + l\,m_L\,{x_2}\cos ({x_1}) \right)
.\end{multline}
2459:
2460:
2461: \section{Conclusion}
2462:
2463: \subsection{Main Results}
2464:
2465: \begin{romanenu}
2466:
\item The structure of the stochastic linearization problem is much richer
than the structure of the deterministic one. Two definitions of coordinate
transformation exist and there are differences between the $g$-, $\sigma$-,
and~$g\sigma$-linearization.
2471:
2472: \item In the case of \Ito integrals, the coordinate transformation
2473: laws are of second order (the \Ito rule).
2474:
There is a large difference between
$g\sigma$-linearization and $g$-linearization. In the former case the
effect of the \Ito term can be reduced to a first order operator and
consequently the problem is solvable by differential geometry. On the
other hand, in the latter case there is no easy method to eliminate
the \Ito term and a set of second order partial differential
equations must be solved to get the linearizing transformation.
2482:
2483:
2484: \item We have given (at least partial) solutions to all
2485: SISO SFB problems. The results are listed in Table~\ref{tab:sfb}.
2486:
2487: \begin{table}[htpb]
2488: \begin{center}
2489: \begin{tabular}{llll}
2490: \hline
2491: Linearization&$g$&$g\sigma$&$\sigma$\\
2492: \hline
2493: Deterministic&\reftpropag{prop:d1sfb2}&&\\
2494: Stratonovich &\refppropag{prop:stratgprop}
2495: &\reftpropag{prop:s1sfb1}
2496: &\refppropag{prop:sfsigma}\\
2497: \Ito&\refcorol{prop:sfbooo}
2498: &\reftpropag{prop:gsigmaprop}
2499: &\refppropag{prop:sfsigma}\\
2500: \hline
2501:
2502: \end{tabular}
2503: \caption{Overview of results --- SISO SFB case}
2504: \label{tab:sfb}
2505: \end{center}
2506: \end{table}
2507:
2508: \item \Ito linearization problems can be approached by means of the
2509: correcting term. The \Ito differential
2510: equation can be converted to the Stratonovich equation
2511: whose behavior under coordinate transformations is simpler.
2512: This method is only partially applicable to the $g$-linearization.
2513: \item An important special case was identified for the \Ito
2514: $g$-linearization. The case is characterized by commuting control
2515: vectorfields~$g$ and dispersion
2516: vectorfields~$\sigma$. Solutions can be found
2517: using first order methods.
2518: \item Computer algebra proved to be a useful tool for solving exact
2519: linearization problems.
2520: \item Industrial applications of the exact linearization in general
2521: are still unlikely, mainly due to complexity, sensitivity, and
2522: limited robustness of the control laws designed by the method.
2523: \end{romanenu}
2524:
2525: \subsection{Future Research}
2526:
2527: \begin{romanenu}
\item Find a solution to the \Ito~$g$-linearization problem in the general
case, including geometric criteria, using second order geometry.
2530: \item Analyze the computability issues; implement a universal symbolic
2531: algebra toolbox for the problem.
2532: \item Solve the SCT problem.
2533: \item Extend the results to the MIMO systems.
2534: \item Extend the results to the input-output problems and
2535: linearization of autonomous systems. Work out the applications of
2536: nonlinear filtering.
\item Perhaps some of the results can be used as a starting
point for approaching a more general class of problems, such as the problems
of disturbance decoupling, input invariance of stochastic
nonlinear systems, or problems of reachability and
observability.
2542:
2543: \end{romanenu}
2544:
2545:
2546: \bibliography{sladecek}
2547: \bibliographystyle{plainnat}
2548:
2549:
2550: \end{document}
2551: \endinput
2552:
2553:
2554: % LocalWords: ftn Appendices
2555:
2556:
2557:
2558: