math0501035/main.tex
1: \documentclass[11pt]{article}
2: 
3: \usepackage{amssymb,amsmath,latexsym}
4: 
5: %\usepackage{showkeys}
6: 
7: \input psfig.sty
8: \psfull
9: 
10: \topmargin      0.25truein
11: \oddsidemargin  0.0truein
12: \evensidemargin 0.0truein
13: \textheight     8.5truein
14: \textwidth      6.5truein
15: 
16: \footskip       0.6truein
17: \headheight     0.0truein
18: \headsep        0.0truein
19: \parskip 0.3cm
20: 
21: \begin{document}
22: 
23: \newtheorem{lemma}{Lemma}
24: \newtheorem{theorem}{Theorem}
25: \newtheorem{corollary}{Corollary}
26: \newtheorem{definition}{Definition}
27: \newtheorem{example}{Example}
28: \newtheorem{proposition}{Proposition}
29: \newtheorem{condition}{Condition}
30: 
31: \newcommand{\bea}{\begin{eqnarray}}
32: \newcommand{\eea}{\end{eqnarray}}
33: \newcommand{\beaa}{\begin{eqnarray*}}
34: \newcommand{\eeaa}{\end{eqnarray*}}
35: \newcommand{\ben}{\begin{enumerate}}
36: \newcommand{\een}{\end{enumerate}}
37: \newcommand{\bi}{\begin{itemize}}
38: \newcommand{\ei}{\end{itemize}}
39: 
40: \newcommand{\lip}{\langle}
41: \newcommand{\lan}{\langle}
42: \newcommand{\rip}{\rangle}
43: \newcommand{\ran}{\rangle}
44: \newcommand{\uu}{\underline}
45: \newcommand{\oo}{\overline}
46: \newcommand{\til}{\tilde}
47: 
48: \newcommand{\La}{\Lambda}
49: \newcommand{\la}{\lambda}
50: \newcommand{\eps}{\epsilon}
51: \newcommand{\vph}{\varphi}
52: \newcommand{\al}{\alpha}
53: \newcommand{\bet}{\beta}
54: \newcommand{\gam}{\gamma}
55: \newcommand{\Gam}{\Gamma}
56: \newcommand{\kap}{\kappa}
57: \newcommand{\Del}{\Delta}
58: \newcommand{\Th}{\Theta}
59: \newcommand{\s}{\sigma}
60: \newcommand{\sig}{\sigma}
61: \newcommand{\Sig}{\Sigma}
62: \newcommand{\del}{\delta}
63: \newcommand{\om}{\omega}
64: \newcommand{\Om}{\Omega}
65: 
66: \newcommand{\N}{{\mathbb N}}
67: \newcommand{\R}{{\mathbb R}}
68: \newcommand{\Z}{{\mathbb Z}}
69: \newcommand{\bbeta}{{\text{\boldmath$\beta$}}}
70: \newcommand{\bdel}{\delta}
71: \newcommand{\bgamma}{\gamma}
72: \newcommand{\bnu}{\nu}
73: \newcommand{\bDel}{\Delta}
74: \newcommand{\y}{y}
75: \newcommand{\x}{x}
76: \newcommand{\X}{X}
77: \newcommand{\bu}{u}
78: \newcommand{\e}{e}
79: \newcommand{\m}{m}
80: \newcommand{\M}{M}
81: \newcommand{\p}{p}
82: \newcommand{\q}{q}
83: \newcommand{\bv}{v}
84: \newcommand{\z}{z}
85: 
86: \newcommand{\calA}{{\cal A}}
87: \newcommand{\calB}{{\cal B}}
88: \newcommand{\calC}{{\cal C}}
89: \newcommand{\calD}{{\cal D}}
90: \newcommand{\calF}{{\cal F}}
91: \newcommand{\calG}{{\cal G}}
92: \newcommand{\calH}{{\cal H}}
93: \newcommand{\calJ}{{\cal J}}
94: \newcommand{\calL}{{\cal L}}
95: \newcommand{\calM}{{\cal M}}
96: \newcommand{\calP}{{\cal P}}
97: \newcommand{\calS}{{\cal S}}
98: \newcommand{\calT}{{\cal T}}
99: \newcommand{\calU}{{\cal U}}
100: \newcommand{\calV}{{\cal V}}
101: \newcommand{\calX}{{\cal X}}
102: \newcommand{\calY}{{\cal Y}}
103: 
104: \newcommand{\proof}{\noindent {\bf Proof:\ }}
105: \newcommand{\proofOf}[1]{\noindent {\bf Proof of #1:\ }}
106: \newcommand{\remark}{\noindent {\bf Remark:\ }}
107: \newcommand{\remarks}{\noindent {\bf Remarks:\ }}
108: \newcommand{\note}{\noindent {\bf Note:\ }}
109: \newcommand{\esssup}{{\rm ess}\sup}
110: \newcommand{\essinf}{{\rm ess}\inf}
111: \newcommand{\pl}{\partial}
112: \newcommand{\noi}{\noindent}
113: \newcommand{\goto}{\to}
114: \newcommand{\ink}{\rule{.5\baselineskip}{.55\baselineskip}}
115: \newcommand{\qed}{\rule{.5\baselineskip}{.55\baselineskip}}
116: 
117: \def\ve{\varepsilon}
118: \def\vr{\varrho}
119: 
120: \newcommand{\diag}{{\rm diag}}
121: \newcommand{\trace}{{\rm trace}}
122: \newcommand{\tr}{{\rm tr}}
123: \newcommand{\w}{\wedge}
124: \newcommand{\dint}{\int\!\!\!\int}
125: \newcommand{\lt}{\left}
126: \newcommand{\rt}{\right}
127: \newcommand{\dist}{{\rm dist}}
128: 
129: \newcommand{\policy}{{u}}
130: \def\OBdry{\partial_o}
131: \def\CBdry{\partial_c}
132: \newcommand{\Sfrac}[2]{{{#1}\slash {#2}}}
133: 
134: \newcommand{\mean}[1]{\langle#1\rangle}
135: 
136: \date{August 14, 2003}
137: \title{
138: Explicit solution for a network control problem\\
139: in the large deviation regime\thanks{This
140: research  was supported in part by the United States--Israel Binational
141: Science Foundation (BSF 1999179)}}
142: \author{Rami Atar\footnote{Department of Electrical Engineering,
143: Technion -- Israel Institute of Technology,
144: Haifa 32000, Israel.
145: {\tt atar@ee.technion.ac.il}.
146: Research of this author also supported
147: in part by the fund for promotion of research at the Technion.},
148: Paul Dupuis\footnote{Lefschetz Center for Dynamical Systems,
149: Division of Applied Mathematics,
150: Brown University,
151: Providence,  R.I.\  02912.
152: {\tt dupuis@dam.brown.edu}.
153: Research of this author also supported in part by
154: the National
155: Science Foundation (NSF-DMS-0072004, NSF-ECS-9979250) and the Army Research Office 
156: (DAAD19-02-1-0425).}
157: \ and Adam Shwartz\footnote{Department of Electrical Engineering,
158: Technion -- Israel Institute of Technology,
159: Haifa 32000, Israel.
160: {\tt adam@ee.technion.ac.il}.
161: Research of this author also supported
162: in part by INTAS grant 265, and in part by the fund for promotion
163: of research at the Technion.}\\[.2in]
164:  }
165: 
166: \maketitle
167: 
168: \begin{abstract}
169: We consider optimal control of a stochastic network, where service is controlled to prevent buffer overflow.
170: We use a risk-sensitive escape time criterion,
171: which in comparison to the ordinary escape time criteria heavily penalizes exits which occur on short time intervals.
172: A limit as the buffer sizes tend to infinity is considered.  In~\cite{ads} we showed that, for a large class of networks,
173: the limit of the normalized cost agrees with the value function of a differential game.  In this game, one player controls the service discipline 
174: (who to serve and whether to serve),
175: and the other player chooses arrival and service rates in the network.
176: The game's value is characterized in \cite{ads} as the unique solution
177: to a Hamilton-Jacobi-Bellman Partial Differential Equation (PDE). 
178: In the current paper we apply this general theory to the important case of a network of queues in tandem.
179: Our main results are: (i) the construction of an explicit solution to the corresponding PDE,  and (ii) drawing out the implications for optimal risk-sensitive and robust regulation of the network.
180: In particular, the following general principle can be extracted.
181: To avoid buffer overflow there is a natural competition between two tendencies.
182: One may choose to serve a particular queue, since that will help prevent its own buffer from overflowing, or one may prefer to stop service, with the goal of preventing overflow of buffers further down the line.
183: The solution to the PDE indicates the optimal choice between these two, specifying
184: the parts of the state space where each queue must be
185: served (so as not to lose optimality), and where it can idle.
186: Referring to those queues which must be served
187: as bottlenecks, one can use the solution to the PDE to explicitly
188: calculate the bottleneck queues as a function of
189: the system's state, in terms of a simple set of equations.
190: \end{abstract}
191: 
192: %\vspace{\baselineskip}
193: \noindent
194: {\it 1991 Mathematics Subject Classification.}
195: Primary 60F10, 60K25;
196: Secondary 49N70, 93E20.
197: 
198: 
199: \section{Introduction}
200: 
201: In a previous work \cite{ads}
202: we considered a stochastic control problem for a Markovian queueing network
203: with deterministic routing, where the service stations may provide service to
204: one or more queues, with each queue being limited by a finite buffer. The control refers to the service
205: discipline at the service stations, and the cost involves the time till one of the
206: queues first reaches its buffer limit. Such a problem can be regarded as the control of
207: a Markov process up to the time it exits a domain, the domain being the rectangle
208: associated with the buffer sizes. The cost is chosen so as to obtain a risk-sensitive
209: (or rare-event) control problem: one considers $E_xe^{-c\s}$ as a criterion
210: to be minimized, where $c>0$ is fixed and $\s$ denotes the exit time (the time when any
211: one of the buffers first overflows).
212: Such a criterion penalizes short exit times more heavily
213: than ordinary escape time criteria (such as $E_x\s$, a criterion to be maximized).
214: While the main result of \cite{ads} is the characterization of a limiting problem as the buffer sizes tend to infinity,
215: the current work focuses on finding explicit solutions to this limit problem and on the
216: interpretation thereof.
217: 
218: There are at least two motivations for the use of risk-sensitive criteria when designing 
219: policies for the control of a network.
220: The first is that in many communication networks performance is measured in terms of
221: the occurrence of rare but critical events.
222: Buffer overflow is a principal example of such an event.
223: The second motivation follows from the connection between risk-sensitive
224: controls and robust controls. Indeed, as discussed in \cite{dupjampet},
225: the optimization of a single fixed stochastic network with respect to a 
226: risk-sensitive cost criteria automatically produces controls with specific and 
227: predictable robust properties. In particular,
228: these controls give good performance for a family of perturbed network models 
229: (where the perturbation is around the design model and the size of the 
230: perturbation is measured by relative entropy), and with respect to a 
231: corresponding ordinary (i.e., not risk-sensitive) cost.
232: 
233: In many problems, one considers the limit of the risk-sensitive problem as a scaling parameter 
234: of the system converges, in the hope that the limit model is more tractable.
235: This is the path followed in \cite{ads}, in the asymptotic regime
236: where time is accelerated and buffer lengths are enlarged by a factor $n$.
237: The limit of the normalized cost was characterized both as the value function of
238: a differential game, and as the solution to a corresponding nonlinear PDE.
239: Both interpretations are important and useful. 
240: It is the interpretation as the value function of a differential game that is key in quantifying the robust aspects of the resulting control policy.
241: However, because the PDE gives a necessary and sufficient characterization of the (a priori unknown) value function,
242: it can provide qualitative information on the structure of the value function and the optimal controls.
243: In particularly favorable circumstances one can go even further,
244: and use the PDE for exact calculation and control policy synthesis.
245: Indeed,
246: if one can by any means guess a proper parametric form of the value function,
247: then it is sometimes possible to use the PDE to verify that this is the correct form,
248: and identify the unknown parameters in the representation for the value function.
249: The instances in the control theory literature where this has been carried out are few and far between,
250: especially when the state space of the system has dimension greater than two.
251: However, 
252: important information is obtained from these instances on the structure of optimal controls.
253: 
254: 
255: 
256: In this paper the focus is on applying the PDE obtained in \cite{ads} in the manner just described.
257: In particular, we treat in detail the general case of a tandem queueing network, and construct an explicit solution to the PDE.  
258: In a system of queues in tandem, each server offers service to exactly one queue, and therefore
259: the service control refers simply to whether each station should provide service or remain idle. 
260: Naturally, it is important to provide service to a queue in order to keep
261: it from reaching the buffer limit. On the other hand, if the next buffer in line is nearly full,
262: it might be necessary to idle the first queue in order to keep the second from overflowing.
263: Besides factoring in how close all buffers are to their respective limits,
264: one must consider the mean service rates and the likelihood of significant deviations from those mean service rates.  Is it likely that the next queue down will stall and simply stop serving for a while?
265: It is also possible that one will have to look even further ahead,
266: and consider buffers further downstream.
267: 
268: Although the optimal control problem for the Markovian queueing system is fully described
269: by a dynamic programming equation \cite{ads}, such equations are typically solved numerically.
270: It is hard to extract any global structural information from the exact equation,
271: and even a numerical solution may not be feasible when buffers are large or the dimension of the state space is moderate. 
272: As discussed previously, the solution to the PDE for the limiting problem turns out to simplify things
273: significantly. Roughly speaking, the PDE indicates the following structure of
274: the asymptotic optimally controlled
275: network. In the interior of the domain
276: (i.e., when all buffers are away from their maximum capacity), and depending on the state of the system,
277: service must be provided at
278: certain service stations, while other stations may idle without causing loss of optimality.
279: In that sense, the limit problem sharpens the control policy by emphasizing
280: the importance of serving those `bottleneck' buffers
281: (it is crucial to serve the bottleneck buffers, and completely
282: unimportant to serve the others).
283: The identification of the bottlenecks is nontrivial, and indeed queues with the smallest service rate are not necessarily  bottlenecks.
284: Instead, as hinted above, identification of the bottlenecks must include consideration of at least the following: (i) the relative closeness of all buffers to their maximum value,
285: (ii) relative mean service rates,
286: and (iii) relative uncertainties in the service rates.
287: We identify a system of algebraic equations whose solution identifies all bottlenecks.
288: 
289: 
290: There is relatively little work on risk-sensitive and robust control of networks.
291: Ball et.\ al.\ have considered a robust formulation for network problems
292: arising in vehicular traffic \cite{balday2}, where the cost structure is qualitatively
293: different. Dupuis studies a robust control problem for networks in a deterministic setting
294: and obtains explicit solutions for the value function \cite{dup}.
295: The cost there is, in a sense, antipodal to the one considered in the current work,
296: namely the time till the system becomes empty (a criterion to be minimized).
297: For other recent work on queueing control in a large deviation regime
298: see Stolyar and Ramanan \cite{storam}, where a
299: single server non-Markovian system (with quite general stationary increments input flows)
300: is studied, and a particularly simple scheduling control policy is shown
301: to be asymptotically optimal (see also an extension of the work in
302: Stolyar~\cite{sto}).
303: 
304: The paper is organized as follows.
305: Section 2 introduces the model and the PDE and states the main result.
306: Section 3 contains discussion and interpretation.
307: In Section 4 we prove the main result.
308: 
309: Notation:
310: The symbol $\vee $ stands for
311: maximum, while $\w $ stands for minimum. Denote scalar product between two
312: vectors as $ \x \cdot \y $.
313: For integers $i\le j$, let $[i,j]\doteq\{1,\ldots,j\}$.
314: 
315: 
316: \section{Model and preliminaries}
317: 
318: \noi\uu{\bf The queueing network control problem.}
319: %
320: We consider the following tandem network.
321: There are $J$ queues and $J$ servers. Customers present at queue $i$
322: at a certain time are said to be of class $i$ at that time.
323: Customers arrive to queue $1$ according to a
324: Poisson process of rate $\la\ge0$. Service at queue $i$ is provided by
325: server $i$ at exponential time
326: with parameter $ \mu_i>0$, mutually independent and independent of the
327: arrivals.
328: After a customer is served by server $i$, it moves to queue
329: $r(i)$, where $r(i) = i+1 $, $i=1,\ldots,J-1$, $ r(J) = 0$,
330: and $i=0$ is used to denote the ``outside''.
331: The state of the network is the vector of queue lengths, denoted
332: by $\X$.
333: Let $\{ \e_i;i=1,\ldots,J\} $ denote the unit coordinate vectors,
334: let $\e_0 = 0 $ and denote
335: \begin{equation}\label{egam}
336: \bgamma_i=\e_i-\e_{r(i)}.
337: \end{equation}
338: Note that $\bgamma_i=\e_i-\e_{i+1}$ for $i=1,\ldots,J-1$, $\bgamma_J
339: =\e_J$, and that
340: following service to queue $i$ the state changes by $-\bgamma_i$.
341: The control is specified by the vector $ u =(u_1,...,u_J)$,
342: where $u_i=1$ if customers in queue $i$ are given service and $u_i=0$
343: otherwise.
344: We next consider the scaled process $\X^n$ under the scaling
345: which accelerates time by a factor of $n$ and down-scales space by
346: the same factor. We are interested in a
347: risk-sensitive cost functional that is associated with
348: exit from a bounded set.
349: Let $G$ be the rectangle defined through
350: \begin{equation}\label{def:G}
351:  G=\{(x_1,\ldots,x_J): 0\le x_1<z_1;\ 0\le x_i\le z_i, \,
352: i = 2 , \ldots , J \},
353: \end{equation}
354: for some $z_i>0$, $i=1,\ldots,J$.
355: Note that $G$ contains parts of, but not all of its boundary.
356: Let
357: \[
358: \sigma^n \doteq \inf \{t:\X^n(t) \not \in G \}.
359: \]
360: %
361: The control problem is to minimize the cost
362: $E_\x e^{-nc\sigma^n}$, where $E_\x$ denotes expectation starting
363: from $\x$, and $c>0$ is a constant.
364: With this cost structure ``risk-sensitivity'' means that atypically 
365: short exit times are weighted heavily by the cost.
366: As a result, even if exit within short time
367: occurs with small probability, it may have a noticeable effect on the cost,
368: and thus a ``good'' control will attempt to avoid such events
369: as much as possible.
370: 
371: %
372: Although this paper do not directly treat the
373: stochastic control problem but the corresponding PDE, we give here the precise
374: formulation of the former, for completeness.
375: For each $n$, the state space is $G^n \doteq n^{-1}\Z_+^J \cap G$. 
376: The control (or action) space is given by 
377: $$
378:  U \doteq \left\{(u_i), i=1,\ldots,J: 0 \le u_i\le1, \
379:  i=1,\ldots,J\right\}.
380: $$
381: One considers state processes $\X^n$ that are similar
382: to those defined for the original queueing network,
383: except that time is accelerated (equivalently, arrival and service rates
384: are multiplied) by a scaling parameter $n$, and space is scaled
385: down by the same factor. More precisely, for $u\in U$ and $f:\Z_+^J\to\R$,
386: let
387: $$
388: \calL^uf(\x)=\la [f(\x+\e_1)-f(\x)]
389: +\sum_{i=1}^Ju_i\mu_i1_{\{\x-\bgamma_i\in\Z_+^J\}}[f(\x-\bgamma_i)-f(\x)],
390: \quad \x\in\Z_+^J.
391: $$
392: For $n\in\N$ let
393: $$
394: \calL^{n,u}f(\x)=n\calL^ug(n\x),
395: $$
396: where $f:n^{-1}\Z_+^J\to\R$ and $g(\cdot)=f(n^{-1}\cdot)$.
397: A {\em controlled Markov process} starting from $\x\in G^n$
398: will consist of a complete filtered
399: probability space $(\Om,\calF,(\calF_t),P_x^{n,u})$,
400: a state process $\X^n$ taking values in  $G^n$ and
401: a control process $u$ taking values in  $U$,
402: such that $\X^n$ is adapted to $\calF_t$,
403: $u$ is measurable and adapted to $\calF_t$,
404: $P_\x^{u,n}(\X^n(0)=\x)=1$,
405: and for every function $f:G^n\to\R$
406: \[
407: f(\X^n(t))-\int_0^t\calL^{n,u(s)}f(\X^n(s))ds
408: \]
409: is an $\calF_t$-martingale.
410: $E_\x^{n,u}$ denotes expectation with respect to $P_\x^{n,u}$.
411: For a parameter $c>0$,
412: the value function for the stochastic control problem is 
413: defined by
414: \begin{equation}\label{eq:control}
415:   V^n(\x) \doteq -\inf n^{-1}\log E_\x^{u,n}e^{-nc\sig_n},
416:   \quad \x\in G^n,
417: \end{equation}
418: where the infimum is over all controlled Markov processes.
419: 
420: 
421: 
422: 
423: \noi\uu{\bf The domain and its boundary.}
424: It is possible for the controller to prevent any but the first queue
425: from exceeding $ z_i $, simply by turning off service to the preceding
426: queue. However, the controller cannot prevent overflow of the first queue.
427: Although it is in principle possible that the dynamics
428: could exit through the portion of the boundary defined by queues
429: $ 2 , \ldots , J$, it is always optimal for
430: the controller to not allow this.
431: Consider the simple two-class network illustrated in Figure \ref{fig1}.
432: The controller can prevent exit through the dashed portion of the 
433: boundary simply by stopping service at the first queue. 
434: As a consequence, there are in general three different types
435: of boundary--the constraining boundary due to non-negativity constraints on queue length,
436: the part of the boundary where exit can be blocked, and the remainder.
437: These three types of boundary behavior result
438: in the PDE in three types of boundary conditions.
439: The three portions of the boundary are explicitly given as
440: $$
441: \pl_c G=\{(x_1,\ldots,x_J): 0\le x_1<z_1,\ \mbox{ and }\ x_i=z_i\ \mbox{for
442: some}\,i> 1\}
443: $$
444: $$
445: \pl_o G=\{(x_1,\ldots,x_J): x_1=z_1, \ \mbox{ and}\ 0\le x_i\le z_i\ \mbox{for
446: all}\ i>1\}
447: $$
448: $$
449: \pl_+G= \{(x_1,\ldots,x_J):
450: \mbox{$x_i<z_i$ for all $i$, and $x_i=0$ for some $i$}\}.
451: $$
452: Note that $\pl_cG$, $\pl_oG$ and $\pl_+G$
453: partition the boundary $\pl G$ of $G$.
454: Also, $\pl_cG\subset G$ while $\pl_oG\cap G=\emptyset$.
455: As usual, we will denote $G^o=G\setminus\pl G$
456: and $\bar G=G\cup\pl G$.
457: 
458: 
459: \begin{figure}
460: \centerline{
461: \begin{tabular}{cc}
462: \psfig{file=fig_net_1.eps}\qquad\qquad\qquad
463: \psfig{file=fig_ex_1.eps}
464: \end{tabular}
465: }
466: \caption{
467: A simple queueing network, a rectangular domain and three
468: types of boundary.
469: Full line: $~$ \hfill $\pl_+G$, dashed line: $\pl_cG$,
470: and dotted line: $\pl_oG$
471: \hfill $~$ }
472: \label{fig1}
473: \end{figure}
474: 
475: 
476: 
477: \noi\uu{\bf The Hamiltonian, PDE and viscosity solutions.}
478: %
479: It is a standard fact that the value functions $V^n$
480: of the stochastic control problem considered above can be characterized
481: by a dynamic programming equation. The results of \cite{ads}
482: show that also the limit of $V^n$ as $n\to\infty$
483: can be characterized by a certain equation, namely a Hamilton-Jacobi-Bellman
484: PDE, that can in fact be regarded as the dynamic programming equation
485: for a certain deterministic game problem. For details on this PDE
486: we need some notation (the reader is referred to \cite{ads} for details
487: on the game).
488: Let $l:\R\to\R_+\cup\{+\infty\}$
489: be defined as
490: $$
491:  l(x)\doteq \lt\{\begin{array}{ll}x\log x-x+1 & x\ge0,  \\ +\infty & x<0,
492:      \end{array}\rt.
493: $$
494: where $0\log0\doteq0$.
495: Define
496: \begin{equation}
497: \label{em}
498:  \M =\{m=(\bar\la,\bar\mu_1,\ldots,\bar\mu_J):
499: \bar\la \geq 0 ,\ \bar \mu_i \geq 0 \}.
500: \end{equation}
501: For $ u\in U$ and $ m\in \M$ define
502: \begin{align*}
503: v ( u, m)    & \doteq \bar \lambda \e_1 - \sum_{i=1}^J
504:                u_i \bar\mu_i \bgamma_i, \\
505: \rho( u, m) & \doteq \lambda l\left( \frac{\bar{\lambda}}{
506: \lambda}\right) +\sum_{i=1}^{J}u_i\mu _il\left( \frac{\bar{\mu}_i}
507: {\mu_i}\right),
508: \end{align*}
509: where $\bgamma_i$ are as in \eqref{egam}.
510: Let
511: \begin{align}\label{def:H1}
512: H(p, u, m) &= c+ p\cdot v ( u, m)+\rho( u, m)\\ \notag
513: &=
514: c+
515: \lt[\bar\la p_1+\la l\lt(\frac{\bar\la}{\la}\rt)\rt]
516: +\sum_{i=1}^J u_i
517: \lt[-\bar\mu_i\bgamma_i\cdot \p+\mu_i l\lt(\frac{\bar\mu_i}{\mu_i}\rt)\rt]
518: \end{align}
519: and let the Hamiltonian be defined as
520: \begin{equation}\label{def:H}
521:  H(p)=\sup_{ u\in U}\inf_{ m\in\M}H(p,u,m)=\inf_{m\in \M}\sup_{u\in U}
522: H(p, u, m),
523: \end{equation}
524: where the last identity, expressing the {\it Isaacs Condition} is proved in \cite{ads}.
525: %
526: The following simplification in the structure of 
527: the Hamiltonian will be useful.
528: Using convexity and the fact that the slope of $l$ at $0^+$ is
529: $-\infty$, the minimum over $ m$ is attained
530: at $\bar\la=\la e^{-p_1}$, $\bar\mu_i=\mu_i e^{\bgamma_i\cdot \p}$.
531: A straightforward calculation then shows that
532: \begin{align}\notag
533: H(\p, u)\doteq \inf_m H(\p, u, m) &=
534: c+[(\la-\bar\la)+u_i(\mu_i-\bar\mu_i)]\\
535: &=
536: c+\la(1-e^{-p_1})
537: +\sum_{i=1}^Ju_i\mu_i(1-e^{\bgamma_i\cdot \p}).
538: \label{eq:116}
539: \end{align}
540: Define $ I (\x) = \{ i : x_i = 0 \} $.
541: The PDE of interest is the following.
542: \begin{equation}\label{eq:pde}
543: \lt\{
544: \begin{array}{ll}
545:  H(DV(\x))=0, & \x\in G^o,\\ \\
546:  DV(\x)\cdot \bgamma_i=0, & i\in I(\x),\ \x\in\pl_+G ,\\ \\
547:  V(\x)=0, & \x\in\OBdry G.
548: \end{array}\rt.
549: \end{equation}
550: Since typically such equations do not possess classical solutions,
551: the framework of viscosity solutions is useful (see \cite{barcap}).
552: This framework allows
553: for functions that are merely continuous to be regarded as solutions.
554: For $\x\in G$,
555: the set of superdifferentials $D^+V(\x)$ and the set of subdifferentials
556: $D^-V(\x)$ are defined as
557: \begin{equation}\label{def:Dplus}
558: D^+V(\x)=\lt\{\p:\limsup_{\y\to \x}\frac{V(\y)-V(\x)-\p\cdot(\y-\x)}{|\y-\x|}\le0\rt\},
559: \end{equation}
560: \begin{equation}\label{def:Dminus}
561: D^-V(\x)=\lt\{\p:\liminf_{\y\to \x}\frac{V(\y)-V(\x)-\p\cdot(\y-\x)}{|\y-\x|}\ge0\rt\}.
562: \end{equation}
563: 
564: \begin{definition}
565: $V$ is a viscosity solution to (\ref{eq:pde}) if
566: \begin{equation}\label{eq:up}
567: H(\p)\vee\max_{i\in I(\x)}\p\cdot\bgamma_i\ge0, \quad
568: \p\in D^+V(\x),\ \x\in G,
569: \end{equation}
570: \begin{equation}\label{eq:down}
571: H(\p)\w\min_{i\in I(\x)}\p\cdot\bgamma_i\le0, \quad
572: \p\in D^-V(\x),\ \x\in G\setminus\pl_cG,
573: \end{equation}
574: and $V(\x)=0$ for $\x\in\pl_oG$.
575: \end{definition}
576: The following is a special case of Theorem 2 of \cite{ads}.
577: \begin{theorem}\label{th:main}
578: There exists a unique Lipschitz viscosity solution $V$ to (\ref{eq:pde}).
579: Moreover,
580: if $\x_n\in G^n$, $n\in\N$ are such that $\x_n\to \x\in G$, then
581: $\lim_{n\to\infty}V^n(\x_n) = V(\x)$.
582: \end{theorem}
583: For $i=1,\ldots,J$, let $\beta_i$ denote the unique positive solution to
584: \begin{equation}\label{eq:100}
585: c+\la(1-e^{\beta_i})+\mu_i(1-e^{-\beta_i})=0.
586: \end{equation}
587: %
588: Set $b_i=\beta_i\sum_{j=1}^i\e_j$.
589: Our main result is the following.
590: \begin{theorem}\label{th:tandem}
591: Assume $c>0$.
592: Then the viscosity solution to the PDE (\ref{eq:pde}) is given by
593: \begin{equation}\label{eq:101}
594: V(\x )=\min_{i=1,\ldots,J}b_i\cdot(\z -\x ).
595: \end{equation}
596: \end{theorem}
597: 
598: 
599: 
600: 
601: \section{Some remarks}\label{secrems}
602: 
603: \subsection{Interpretation}
604: 
605: %
606: As commented above, it is possible to characterize
607: the value function $V^n$
608: as the solution to a dynamic programming equation on the discrete space
609: $G^n$. Moreover, if $V^n$ is available in explicit form, one can
610: use the dynamic programming equation to specify an optimal control
611: policy for the problem. The results above provide an explicit
612: expression only to the limit $V=\lim_n V^n$, and therefore we are unable
613: to specify an optimal policy for the problem with finite $n$.
614: Instead, we shall use the quantity
615: $V$ along with the HJB equation \eqref{eq:pde} to propose a policy for
616: the queueing network problem (and the corresponding value $V^n$).
617: It is plausible that the proposed policy is, in a sense,
618: asymptotically optimal as $n\to\infty$ but we do not attempt
619: to prove such a statement here.
620: Instead, the discussion below could be regarded as a natural
621: interpretation of the result.
622: Moreover, since $V$ can be considered as a good approximation to
623: $V^n$ (for large $n$), it can be used as an initial condition
624: in a value iteration procedure that calculates $V^n$ and an optimal
625: policy.
626: 
627: The solution to the PDE stated here may be interpreted as follows.
628: Let $\x $ be an interior point of $G$, and assume that
629: $V$ is differentiable at $x$.
630: The form \eqref{eq:101} implies that for some $j=j(\x)$, 
631: \begin{equation}\label{e300}
632: DV(\x)=-b_j
633: =-\beta_j\sum_{i=1}^j\e_i \, .
634: \end{equation}
635: Hence by \eqref{eq:116}, the equation $H(-b_j)=0$ has the form
636: $$
637: \sup_{u\in U}\lt[c+\la(1-e^{\beta_j})+u_j\mu_j(1-e^{-\beta_j})\rt]=0.
638: $$
639: It is seen that the supremum is attained at any $u$ for which $u_j=1$
640: and $u_i\in[0,1]$, $i\ne j$. The interpretation in terms of the service policy
641: is that it is important to serve class $j$, while optimality does not depend
642: on the service given to other classes.
643: {\em The station $j=j(x)$ can therefore be regarded as a bottleneck:}
644: it is crucial to serve station $j$ when at state $x$.
645: Since the PDE describes the limit of the stochastic control problem,
646: one expects
647: the bottleneck stations to have a similar property in the stochastic problem:
648: Although it may be optimal for all servers to not idle when the system is near
649: an interior point $\x$, it is significant for the bottleneck server
650: to work while if the other servers idle the cost is affected only by little.
651: 
652: A closer look at \eqref{e300} reveals that all bottleneck stations
653: belong to a certain set $A'$ defined below.
654: More precisely,
655: given an interior point $x$ where $V$ is differentiable
656: and denoting $y=z-x$, using \eqref{eq:101}, we see
657: that \eqref{e300} holds for $j$ if and only if $j$ satisfies
658: \begin{equation}\label{e301}
659: \beta_j(y_1+\cdots+y_j)\le\beta_i(y_1+\cdots+y_i)\quad
660: \forall\ i\ne j.
661: \end{equation}
662: We claim that
663: a necessary condition for $j$ to satisfy \eqref{e301} (for some $y$)
664: is $j\in A'$, where
665: $$
666: A'=\{k\in[1,J]:\mu_k\le\mu_l,\ \mbox{ for all } l<k\},
667: $$
668: and by convention, $1\in A'$.
669: To this end, write the explicit form of the solution to~\eqref{eq:100} as
670: \begin{equation*}
671: e^{\beta_i } = (2\la)^{-1}[ c + \lambda + \mu_i
672:                    + ( c^2 + \lambda^2 + \mu_i^2 
673:                        + 2 c ( \lambda + \mu_i) )^{1/2}] \, ,
674: \end{equation*}
675: and note that the positive solutions $\beta_i$ to
676: \eqref{eq:100} are monotone in $\mu_i$, in the sense that
677: \begin{equation}\label{eq:mon}
678: \mu_i<\mu_j\quad \Longleftrightarrow\quad \beta_i<\beta_j.
679: \end{equation}
680: If \eqref{e301} holds then $\beta_i\le\beta_j$ for $j=1,\ldots,i$,
681: and it follows from \eqref{eq:mon} that $j\in A'$.
682: 
683: It should be emphasized that the condition $j\in A'$ is only
684: necessary for $j$ to be a bottleneck, and being a bottleneck is
685: really a function of the system's state. A more complicated necessary
686: condition is given in Section \ref{sec:proof}, which is of the form
687: $j\in A(x)$.
688: One interesting and perhaps counterintuitive phenomenon is that it is possible
689: that a station is nearly empty while others are far from being empty,
690: and still it is a bottleneck.
691: 
692: 
693: In the rest of this subsection we discuss a different queueing system
694: for which a similar analysis is possible, including an explicit form
695: for the limit of the value function and a clear interpretation of
696: it regarding nearly optimal service policies for the queueing system
697: (see \cite{ads} for proof of the results quoted below).
698: Consider a single server that provides
699: service to $J$ classes (each customer requires service once).
700: Service rate to queue $i$ is exponential with rate $ \mu_i $,
701: and the arrival process to class $i$ is Poisson of parameter $\la_i>0$,
702: $i=1,\ldots,J$. All arrival and service processes are mutually independent.
703: One considers the control space
704: \[
705: U=\left \{ u: \sum_{i=1}^J u_i\le 1, u_i \ge 0, i=1,\ldots,J \right \},
706: \]
707: where $u_i$ represents the fraction of service allocated to class $i$
708: by the single server.
709: Analogously to the problem discussed above, one defines a domain
710: $G=\{(x_1,\ldots,x_J):0\le x_i< z_i,1=1,\ldots,J\}$, scaled queueing
711: processes $X^n$ and exit time $\s^n$, and attempts minimizing the cost
712: $E_xe^{-nc\s^n}$ over an appropriate class of control processes.
713: Let $V^n(x)$ denote the infimum.
714: One can then show that $\lim_nV^n(x_n)$
715: exits whenever $x_n\to x\in G$.
716: Moreover, the limit $V$ is characterized in terms of a PDE
717: of the form \eqref{eq:pde}, where now $\gamma_i=e_i$, $i=1,\ldots,J$,
718: and $H(p)=\sup_{u\in U}H(p,u)$. Here $H(p,u)$ has the form
719: (analogous to \eqref{eq:116}):
720: \begin{equation}\label{216}
721: H(\p,u)=
722: c+\sum_{i=1}^J[\la_i(1-e^{-p_i})+u_i\mu_i(1-e^{p_i})],
723: \end{equation}
724: and the limit $V(x)$
725: can be explicitly calculated provided $c$ is large enough
726: as follows.
727: For $i=1,\ldots,J$, define $ \alpha_i $ as the unique positive
728: solution to $c+\la_i(1-e^{\al_i})+\mu_i(1-e^{-\al_i})=0$, namely
729: $$
730: e^{\alpha_i } = (2\la)^{-1}[ c + \lambda + \mu_i
731:                    + (( c + \lambda + \mu_i )^2
732: 		   - 4 \lambda \mu_i)^{1/2}]\, .
733: $$
734: Then if $c$ is large enough one has
735: \begin{equation}\label{eq:form}
736: V(\x )=\min_{i=1,\ldots,J}\al_i(z_i-x_i).
737: \end{equation}
738: Let $\x$ be a point in the interior of $G$
739: where the gradient of $V$ is well defined.
740: Then the PDE is satisfied in the classical sense at this point.
741: Thus, $H(DV(\x))=H(-\al_j\e_j)=0$, where $j=j(\x)$.
742: Using \eqref{216}, the equation $H(-\al_i\e_j)=0$ takes the form
743: $$
744: \sup_{u\in U}\lt[c+\la_j(1-e^{\al_j})+
745: u_j\mu_j(1-e^{-\al_j})\rt]=0.
746: $$
747: Clearly the supremum is attained at $u_i=1_{i=j}$,
748: $i=1,\ldots,J$.
749: This means that it is optimal to serve class $j(\x)$ at the
750: state $\x$.
751: In the totally symmetric case, where $\mu_i=\mu$, $\la_i=\la$,
752: $z_i=z$ for all $i$, the solution takes the form
753: $V(\x )=\al\min_i (z-x_i)$, and the optimal
754: service discipline can be interpreted as ``serve the longest
755: queue.'' An asymmetric two dimensional example
756: is given in Figure \ref{fig:example}, where the domain $G$
757: is divided into two subdomains $G_1$ and $G_2$ in accordance
758: with the structure (\ref{eq:form}), and the optimal service
759: discipline corresponds to giving priority to
760: class $i$ when the state is within $G_i$, $i=1,2$.
761: This discipline gives priority {\em to the queue with the (weighted)
762: shortest free buffer space.}
763: 
764: 
765: 
766: \begin{figure}
767: \centerline{
768: \begin{tabular}{cc}
769: \psfig{file=fig_net_2.eps}\qquad\qquad\qquad
770: \psfig{file=fig_ex_2.eps}
771: \end{tabular}
772: }
773: \caption{Priority to class $i$ when the state is in $G_i$, $i=1,2$.}
774: \label{fig:example}
775: \end{figure}
776: 
777: 
778: 
779: \subsection{The perturbed rates}
780: 
781: In the asymptotic analysis of rare events it is often the case
782: that most of the probability mass of an event of interest
783: is concentrated on the event that the stochastic process, say $X^n$,
784: nearly follows a certain deterministic path, for large values of $n$.
785: For example,
786: the most likely way a stable M/M/1 queue overflows is by nearly
787: following a deterministic path that is the solution to a fluid model
788: in which arrival and service rates are reversed.
789: This  appears as a consequence of time-reversal arguments in~\cite{sw}.
790: For many other cases where one can compute
791: deterministic paths about which most mass is concentrated see \cite{swbook}.
792: Similarly, in the current stochastic control problem,
793: when the system operates under the optimal control most
794: contribution to the cost is obtained when the process $X^n$ nearly
795: follows a certain deterministic path. This path is now
796: the solution to a fluid model with a control $u$ and perturbed
797: arrival and service rates $m=(\bar\la,\bar\mu_1,\ldots,\bar\mu_J)$.
798: At a point $x$ where the viscosity solution $V$ to \eqref{eq:pde}
799: is differentiable, the correct values of $u$ and $m$ are those that achieve
800: the max-min in $H(DV(x))=\sup_u\inf_mH(DV(x),u,m)$ (cf.\ \eqref{def:H}).
801: 
802: We remark that in the example of
803: tandem queues the optimal perturbed rates
804: satisfy certain relations with the unperturbed rates, as shown in
805: the two equations below.
806: By \eqref{eq:116}, the relation $H(DV)=0$ implies
807: \begin{equation}\label{e302}
808: \bar\la+\sum_{i=1}^Ju_i\bar\mu_i=c+\la+\sum_{i=1}^Ju_i\mu_i \, .
809: \end{equation}
810: Moreover, by \eqref{eq:116}, by the fact that the minimum over $m$
811: is attained at
812: $\bar\la=\la e^{-p_1}$, $\bar\mu_i=\mu_i e^{\bgamma_i\cdot \p}$,
813: and using $\sum_{i=1}^J \bgamma_i = \e_1$, we have
814: \begin{equation}\label{e303}
815: \bar\la\prod_{i=1}^J\bar\mu_i=\la\prod_{i=1}^J\mu_i.
816: \end{equation}
817: Relation \eqref{e302}
818: was noticed by Avram \cite{avr}.
819: The relation \eqref{e303} appears to be new.
820: A generalization of these equations to a more general network
821: is possible and will appear elsewhere.
822: 
823: \remark An interesting relation between the roots $\al_i$ and $\beta_i$
824: and the busy cycle period was
825: pointed out to us by Boxma \cite{box}.
826: For example, if $B$ denotes the busy cycle period for an M/M/1
827: queue under the stationary distribution, then $Ee^{cB}=e^\beta$,
828: where
829: $$
830: c+\la(1-e^{\beta})+\mu(1-e^{-\beta})=0
831: $$
832: (compare with \eqref{eq:100}).
833: 
834: 
835: 
836: \section{Proof of the main result}\label{sec:proof}
837: 
838: Recall that $I(\x )=\{i\in[1,J]:x_i=0\}$, and denote
839: $B(\x )=\{i\in[1,J]:x_i=z_i\}$. Note that $I( \x )$ and $B(\x )$
840: do not intersect. Since points $\x $ for which $x_1=z_1$ are not in $G$,
841: we have $1\not\in B(\x )$ for all $\x \in G$.
842: 
843: We show that the minimum over $i=1,\ldots,J$
844: in \eqref{eq:101} can equivalently be performed over a smaller
845: (state-dependent) set. 
846: As in Section \ref{secrems}, let 
847: \begin{equation}\label{eq:112}
848: A'=\{i\in[1,J]:\mu_i\le\mu_j,\ \mbox{ for all } j<i\},
849: \end{equation}
850: and by convention let $1\in A'$.
851: Let also
852: $$
853: A(x)=\{i\in A':\text{ either $i+1\not\in B(\x)$; or 
854: $j>i$ and $[i+1,j]\subset B(\x )$
855: imply $\mu_i<\mu_j$}\}.
856: $$
857: 
858: \begin{lemma}\label{lem:1}
859: The minimum in~\eqref{eq:101} is obtained over the indices in the
860: set $A(\x)$ defined above.
861: More precisely,
862: \[
863: V(\x)=\min_{i=1,\ldots,J}b_i\cdot(\z-\x)
864: =\min_{i\in A(\x)}b_i\cdot(\z-\x) \, .
865: \]
866: \end{lemma}
867: \proof
868: Fix $ \x \in G $ and recall that $ z_1 - x_1 > 0 $.
869: If
870: \begin{equation}\label{eq:mon1}
871: b_i\cdot(\z -\x )\le\min_{j\ne i}
872: b_j\cdot(\z -\x ),
873: \end{equation}
874: then $\beta_i\le\beta_j$ for $j \in [1,i]$,
875: and it follows from \eqref{eq:mon} that $i\in A'$.
876: Thus
877: \[
878: V (\x ) = \min_{i=1,\ldots,J}b_i\cdot(\z -\x )
879: =\min_{i\in A'}b_i\cdot(\z -\x )
880: \]
881: for all $\x \in G $ (although not every $ i \in A' $ is a minimizer).
882: Fix now $i \in A'$, and suppose that
883: \begin{equation}\label{eq:assume}
884: \mbox{there is some $j>i$ so that 
885: $[i+1,j]\subset B(\x )$ and $\mu_i \geq \mu_j$.}
886: \end{equation}
887: Since $ i \in A'$, if $ i+1 \not\in A' $ then $ \mu_{i+1} > \mu_i $.
888: But then,
889: if in addition $ i+2 \not\in A' $ we have $ \mu_{i+2} > \mu_i $.
890: So, if $ k \not\in A'$ for all $ i+1 \le k \le j-1 $ then
891: $ \mu_k > \mu_i $, and together with $ \mu_j \le \mu_i $ we have
892: that $ j \in A' $. We conclude that under~\eqref{eq:assume},
893: \begin{equation}\label{eq:200}
894: \mbox{there is $k\in[i+1,j]$ such that $k\in A'$.}
895: \end{equation}
896: By~\eqref{eq:assume},
897: $\beta_i \geq \beta_j$ and so
898: \begin{equation}\label{eq:201}
899: b_i \cdot(\z -\x )\geq b_j \cdot(\z -\x ).
900: \end{equation}
901: Therefore, for $k$ as in \eqref{eq:200} and under the assumptions
902: in~\eqref{eq:assume},
903: \[
904: b_i\cdot(\z-\x)\ge b_k\cdot(\z-\x) ,
905: \]
906: and since $k\in A'$, we need not consider $i$ in the minimum.
907: As a result,
908: \eqref{eq:101} is equivalently given as
909: $$
910: V(\x )=\min_{i\in A(\x )}b_i\cdot(\z -\x ),\quad \x \in G,
911: $$
912: where $ A (\x ) $ is obtained from $ A' (\x ) $ by deleting those
913: $ i \in A' (\x ) $ which are followed by empty queues,
914: $ [ i+1 , j ] \subset B (\x ) $, and such that $\mu_i \ge \mu_j $.
915: This leaves in $ A (\x ) $ an index $i$ from $ A' (\x ) $
916: only if either $ z_{i+1} > x_{i+1} $, or 
917: $ z_{k} = x_{k} $ for $ i+1 < k \le j $ implies $ \mu_i < \mu_j $.
918: More formally,
919: \begin{align}
920: \notag
921: A(\x) &=
922: A'\setminus\{i\in A':\exists\ j>i,\ [i+1,j]\subset B(\x),\ \mu_i\ge\mu_j\}\\
923: \label{eq:113}
924: &=
925: \{i\in A':\text{ either $i+1\not\in B(\x)$; or 
926: $j>i$ and $[i+1,j]\subset B(\x )$
927: imply $\mu_i<\mu_j$}\}.
928: \end{align}
929: \qed
930: 
931: 
932: The form of the proposed solution is the minimum of smooth functions.
933: The set of superdifferentials
934: at a point where the function is not smooth
935: can be seen (using the definition \eqref{def:Dplus})
936: to consist of the convex hull of the gradients of the
937: smooth functions defining it, at that point. Also,
938: at the boundary, the fact that there are less constraints introduced
939: by \eqref{def:Dplus} on $p\in D^+V$ than there are when $x$
940: is in the interior, has an effect of enlarging the set further.
941: Thus, for example, the set of
942: superdifferentials of the zero function from $\R_+$ to $\R$ at zero
943: is $\R_+$.
944: Using these considerations and the rectangular structure
945: of the domain, one finds the general form for the superdifferential
946: as follows.
947: Let $\x \in G$ be fixed. Set $A=A(\x )$, $I=I(\x )$, $B=B(\x )$, and
948: $O=\{1,\ldots,J\}\setminus (I\cup B)$.
949: Then any element $\p \in D^+V(\x )$ is given as
950: $$
951: \p =-\sum_{i\in A}\nu_ib_i+\bdel,
952: $$
953: for some $ \{\nu_i \}$, where
954: \begin{equation}\label{eq:102}
955: \del_i\ge0,\ i\in I,\quad
956: \del_i\le0,\ i\in B,\quad
957: \del_i=0,\ i\in O,
958: \end{equation}
959: and
960: \begin{equation}\label{eq:103}
961: \nu_i\ge0,\ i\in A,\quad \nu_i=0,\ i\not\in A,\quad \sum_{i\in A}\nu_i=1.
962: \end{equation}
963: If we denote
964: \begin{equation}\label{eq:105}
965: \del_{J+1}=0,
966: \end{equation}
967: then, using \eqref{eq:116}, the Hamiltonian is expressed as
968: \begin{align}\label{eq:114}
969: \notag
970: H(\p ) &= c+\la(1-e^{-p_1})+\sum_{i=1}^J0\vee\mu_i(1-e^{\p \cdot\bgamma_i})\\
971:      &= c+\la(1-e^{\sum_{i  \in A}\nu_i\beta_i-\del_1})
972:      +\sum_{i=1}^J0\vee\mu_i(1-e^{-\nu_i\beta_i+\del_i-\del_{i+1}}).
973: \end{align}
974: 
975: \proofOf{Theorem~\ref{th:tandem}}
976: 
977: \noi\uu{\it Verifying the PDE for superdifferentials.}
978: To verify \eqref{eq:up}, it suffices to show that
979: $H(\p )\ge0$ whenever
980: $\p \in DV^+(\x )$ and 
981: $\p \cdot\bgamma_i<0$ for all $i\in I$.
982: 
983: \noi\uu{\it Step 1.} We show first that $H(\p )\ge0$ whenever
984: $\p \in DV^+(\x )$ and  $\p \cdot\bgamma_i\le0$ for all $i=1,\ldots,J$.
985: The forms of $b_i$ and $\bgamma_i=\e _i-\e_{i+1}$ imply the last inequality can be rewritten
986: \begin{equation}\label{eq:104}
987: -\nu_i\beta_i+\del_i-\del_{i+1}\le0,\ i=1,\ldots,J.
988: \end{equation}
989: In this case, \eqref{eq:114} becomes
990: \begin{equation}\label{eq:109}
991: H(\p ) = h(\bnu,\bdel)
992:  \doteq c+\la(1-e^{\sum_{i \in A}\nu_i\beta_i-\del_1})
993: +\sum_{i=1}^J\mu_i(1-e^{-\nu_i\beta_i+\del_i-\del_{i+1}}).
994: \end{equation}
995: The constraints we have put on $(\bnu,\bdel)$ define a convex
996: set $S$, namely, the set of $(\bnu,\bdel)\in\R^J\times\R^{J+1}$ satisfying
997: \eqref{eq:102}, \eqref{eq:103}, \eqref{eq:105} and \eqref{eq:104}.
998: The set $S$ is bounded for the following reasons.
999: First, since $\bnu$ is a probability vector (see \eqref{eq:103}) we have $\nu_i\in[0,1]$.
1000: Next, by \eqref{eq:102} and $1\not\in B$,
1001:  $\del_1\ge0$.
1002: Finally,
1003: it follows from \eqref{eq:104}
1004: (using the convention $\sum_s^t=0$ if $t<s$) that 
1005: $$
1006: \del_1-\sum_{j=1}^{i-1}\nu_j\beta_j
1007: \le\del_i\le\sum_{j=i}^J\nu_j\beta_j,
1008: \quad i=1,\ldots, J.
1009: $$
1010: This shows the boundedness.
1011: 
1012: The function $(\bnu,\bdel)\mapsto h(\bnu,\bdel)$ is concave, and therefore to prove $h\ge0$ on $S$ it suffices to check the inequality
1013: on the set $E$ of extreme points of $S$, which contains a finite number of
1014: points since the constraints are linear.
1015: \begin{lemma}
1016: All points $(\bnu,\bdel)\in E$ have the following form:
1017: \begin{align*}
1018: \nu_k & = 1 \quad \text{for some $k$, and} \\
1019: \del_i^{(r,k)} & =\beta_k(1_{i\ge r+1}-1_{i\ge k+1}),\quad
1020: i=1,\ldots,J,\ r=s,\ldots,t-1,
1021: \end{align*}
1022: where $ t, s $ are defined below.
1023: \end{lemma}
1024: \proof
1025: We will first obtain the general form of $\bnu$
1026: and then that of $\bdel$.
1027: 
1028: We claim that for any $(\bnu,\bdel)\in E$, $\bnu$ is of the form
1029: $\bnu=1_k$ (short for $\nu_i=1_{i=k}$, $i=1,\ldots,J$),
1030: for some $k\in A$. Assume this is false.
1031: Then there are $l,m\in A$, $l<m$, for which $\nu_l,\nu_m\in(0,1)$.
1032: We will show that
1033: there is a vector $\bDel_m$, such that replacing $(\bnu,\bdel)$ by
1034: $(\bnu',\bdel')=(\bnu-\eps \e_m,\bdel+\eps\bDel_m)$ maintains
1035: the relations \eqref{eq:102}, \eqref{eq:105} and \eqref{eq:104}
1036: for both $\eps>0$ and $\eps<0$ (provided $|\eps|$ is small).
1037: A similar statement will hold also for
1038: $(\bnu'',\bdel'')=(\bnu+\eps \e_l-\eps \e_m,\bdel-\eps\bDel_l+\eps\bDel_m)$,
1039: and as a result all of \eqref{eq:102}, \eqref{eq:103},
1040: \eqref{eq:105} and \eqref{eq:104}
1041: will hold for both $\eps>0$ and $\eps<0$, a contradiction to
1042: $(\bnu,\bdel)$ being an extreme point of $S$.
1043: The construction of $\bDel_m$ based on $(\bnu,\bdel)$
1044: can be mimicked to construct $\bDel_l$ based on $(\bnu',\bdel')$
1045: (in particular, no use is made of the fact that $\nu_i$ sum to one,
1046: but only that some of its components are within $(0,1)$),
1047: and therefore the latter construction is omitted.
1048: 
1049: Case 1: {\it Inequality \eqref{eq:104} holds as a strict inequality
1050: for $i=m$, i.e., $-\nu_m\beta_m+\del_m-\del_{m+1}<0$.}
1051: Then $-(\nu_m-\eps)\beta_m+\del_m-\del_{m+1}\le0$
1052: also holds (for both $\eps$ positive and negative),
1053: provided that $|\eps|$ is small. Here we take $\bDel_m=0$.
1054: We see that $(\bnu-\eps \e_m,\bdel)$ satisfies the requirements.
1055: 
1056: Case 2: {\it Inequality \eqref{eq:104} holds with equality
1057: for $i=m$, i.e., $-\nu_m\beta_m+\del_m-\del_{m+1}=0$.}
1058: Since $\nu_m\beta_m>0$, either $\del_m>0$ or $\del_{m+1}<0$.
1059: Assume $\del_m>0$ (the case $\del_{m+1}<0$ can be treated analogously,
1060: and is therefore omitted).
1061: Let $m'$ be the smallest $j\in[1,m]$ for which \eqref{eq:104}
1062: holds with equality for all $i\in[j,m]$. For $i\in[m',m-1]$
1063: (the set being empty and the statement void if $m'=m$)
1064: we have $-\nu_i\beta_i+\del_i-\del_{i+1}=0$, hence if
1065: $\del_{i+1}>0$ then $\del_i>0$. Together with the fact that
1066: $\del_m>0$, this shows that
1067: \begin{equation}\label{eq:108}
1068: \del_i>0,\ i\in[m',m].
1069: \end{equation}
1070: Moreover,
1071: \begin{equation}\label{eq:107}
1072: -\nu_{m'-1}\beta_{m'-1}+\del_{m'-1}-\del_{m'}<0
1073: \end{equation}
1074: (the statement being void in case that $m'=1$).
1075: Set $\bDel_m=-\beta_m\sum_{i=m'}^m \e_i$, $\bnu'=\bnu+
1076: \eps \e_{m}$, and $\bdel'=\bdel+\eps\bDel_m$.
1077: The perturbation $\eps\bDel_m$ is chosen to cancel the change in $-\nu_m\beta_m$,
1078: and to preserve the left hand side of \eqref{eq:104}
1079: for all $i>m'-1$. However, by \eqref{eq:107}
1080: the inequality is maintained for $i=m'-1$ as well, by taking
1081: $|\eps|$ sufficiently small. Similarly, by \eqref{eq:108},
1082: \eqref{eq:102} and \eqref{eq:105} are also maintained on taking
1083: $|\eps|$ small.
1084: 
1085: This completes the construction of $\bDel_m$.
1086: As described above, this leads to a contradiction, and we conclude that
1087: any extreme point $(\bnu,\bdel)\in E$ satisfies $\bnu=1_k$ for some $k\in A$.
1088: 
1089: When $\bnu=1_k$ for some $k\in A$, inequalities \eqref{eq:104} can be rewritten as
1090: $$
1091: \del_i\le\del_{i+1},\ i\ne k,\quad \del_k\le \beta_k+\del_{k+1}.
1092: \eqno{(\ref{eq:104}')}
1093: $$
1094: In particular, $0\le\del_1\le\cdots\le\del_k$.
1095: Let $s$ denote the largest $j\le k$ for which $j\in B\cup O$
1096: (and $s=0$ if there is no such $j$). 
1097: The definitions of $O$ and $B$ imply $\delta_s=0$,
1098: and thus
1099: \stepcounter{equation}
1100: $$
1101: \text{$\del_j=0$ for $1\le j\le s$.}
1102: \eqno{(\theequation a)}
1103: $$
1104: Similarly, $\del_{k+1}\le\cdots\le\del_J\le0$,
1105: and if $t$ denotes the least $j\in [k+1,J]$ for which
1106: $j\in I\cup O$ (and $t=J+1$ if empty), then
1107: $$
1108: \del_j=0,\quad t\le j\le J.
1109: \eqno{(\theequation b)}
1110: $$
1111: Hence $\bdel$ must satisfy
1112: $$
1113: \begin{cases}
1114: 0\le\del_{s+1}\le\cdots\le\del_k\le\beta_k+\del_{k+1},
1115: &
1116: \text{when $s\le k-1$},\\
1117: 0\le\del_k
1118: &
1119: \text{when $s=k$}.
1120: \end{cases}
1121: \eqno{(\theequation c)}
1122: $$
1123: In addition,
1124: $$
1125: \begin{cases}
1126: \del_{k+1}\le\cdots\le\del_{t-1}\le0,&
1127: \text{when }t\ge k+2\\
1128: \del_{k+1}\le0 &
1129: \text{when }t=k+1.
1130: \end{cases}
1131: \eqno{(\theequation d)}
1132: $$
1133: We have just shown that \eqref{eq:102}, \eqref{eq:105}
1134: and (\ref{eq:104}') imply (36$a$--$d$). On the other hand, clearly
1135: (36$a$--$d$) implies (\ref{eq:104}').
1136: Moreover, as follows directly from the definition of $s$ and $t$,
1137: \begin{equation}\label{eq:106}
1138: \text{$i\in I$ for all $i\in[s+1,k]$ and $i\in B$
1139: for all $i\in[k+1,t-1]$}.
1140: \end{equation}
1141: This shows that (36$a$--$d$) implies \eqref{eq:102} and \eqref{eq:105}.
1142: Thus \eqref{eq:102}, \eqref{eq:105} and (\ref{eq:104}')
1143: are equivalent to (36$a$--$d$).
1144: Now, the set of $\bdel$ satisfying
1145: the constraints (36$a$--$d$) is easy to analyze.
1146: In particular, it is not hard to see that it has the following
1147: $t-s$ extreme points, indexed by $k$ and $r\in[s,\ldots,t-1]$, namely
1148: \begin{equation}\label{eq:110}
1149: \del_i^{(r,k)}=\beta_k(1_{i\ge r+1}-1_{i\ge k+1}),\quad
1150: i=1,\ldots,J,\ r=s,\ldots,t-1.
1151: \end{equation}
1152: \qed
1153: 
1154: We now calculate $h$ (cf.\ \eqref{eq:109}) at each extreme point.
1155: To this end, note that if $(\bnu,\bdel)=
1156: (1_k,\bdel^{(r,k)})$ then by \eqref{eq:110}
1157: $$
1158: -\nu_i\beta_i+\del_i-\del_{i+1}=
1159: \begin{cases}
1160: -\beta_k & i=r,\\ 0 & i\ne r,
1161: \end{cases}
1162: \qquad i=1,\ldots,J,
1163: $$
1164: and
1165: $$
1166: \del_1=
1167: \begin{cases}
1168: \beta_k & r=0,\\ 0 & r>0.
1169: \end{cases}
1170: $$
1171: Substituting in \eqref{eq:109}, we have the following possibilities.
1172: If $r=0$ then $\del_i^{(r,k)}=\beta_k1_{i\in[1,k]}$
1173: thus $\sum\nu_i\beta_i-\del_1=0$, and
1174: $-\nu_i\beta_i+\del_i-\del_{i+1}=0$, $i=1,\ldots,J$. Hence
1175: $h(1_k,\bdel^{(r,k)})=c>0$.
1176: Otherwise,
1177: \begin{equation}\label{eq:111}
1178: h(1_k,\bdel^{(r,k)})=c+\la(1-e^{\beta_k})+\mu_r(1-e^{-\beta_k}).
1179: \end{equation}
1180: In case that $r=k$, the right hand side of \eqref{eq:111} vanishes owing to the definition of $\beta_k$ (see \eqref{eq:100}).
1181: In case that $r<k$, recall that $k\in A$, and in particular,
1182: $k\in A'$. By \eqref{eq:112} we therefore have $\mu_k\le\mu_r$,
1183: hence by \eqref{eq:100}, $h(1_k,\bdel^{(r,k)})\ge0$.
1184: Finally, consider the case where $k<r\le t-1$. By \eqref{eq:106},
1185: $[k+1,r]\subset B$. Since $k\in A$, \eqref{eq:113} implies
1186: that $\mu_k<\mu_r$, and we again conclude that $h(1_k,\bdel^{(r,k)})>0$.
1187: Having shown that $h(\bnu,\bdel)\ge0$ for all
1188: extreme points of the set $S$, we conclude that the inequality holds
1189: for all $(\bnu,\bdel)\in S$.
1190: 
1191: \noi\uu{\it Step 2.}
1192: We now relax the condition \eqref{eq:104}.
1193: Let then $(\bnu,\bdel)$ satisfy \eqref{eq:102}, \eqref{eq:103},
1194: \eqref{eq:105}, and assume that the inequality in \eqref{eq:104} holds
1195: for all $i\in I$ (relaxing the assumption made in Step 1, that it
1196: holds for all $1\le i\le J$). Let $P=P(\bnu,\bdel)$ denote the set of
1197: $i$ such that
1198: \begin{equation}\label{eq:130}
1199: -\nu_i\beta_i+\del_i-\del_{i+1}>0.
1200: \end{equation}
1201: If $P$ is empty then the results of Step 1 apply and $H(\p )\ge0$.
1202: Hence assume $P$ is not empty.
1203: Let $j=j(\bnu,\bdel)$ be the least element in $P$.
1204: 
1205: Note that $J\not\in P$. For if $J\in P$ then using
1206: \eqref{eq:130} and \eqref{eq:105} we find $\del_J>0$, and therefore $J\in I$. 
1207: However, we get to assume \eqref{eq:104} for all $i \in I$, which means that 
1208: $-\nu_J\beta_J+\del_J-\del_{J+1}\le0$.  This contradicts $J\in P$.
1209: 
1210: We proceed by backward induction on the value of $j(\bnu,\bdel)$.
1211: Note that the sets $B$ and $I$ depend on $x$. The argument below treats
1212: simultaneously all $x\in G$ by considering all
1213: possible sets $B$ and $I$.
1214: 
1215: \noi
1216: {\it Induction step.} Assumption: For all $(I,B,\bnu,\bdel)$
1217: satisfying \eqref{eq:102}, \eqref{eq:103}, \eqref{eq:105},
1218: such that $P(\bnu,\bdel)\cap I=\emptyset$ and $j(\bnu,\bdel)\in
1219: [i+1,i+2,\ldots,J-1]$, one has $H(\p )\ge0$.
1220: Let $(I,B,\bnu,\bdel)$ be such that $P(\bnu,\bdel)\cap I=\emptyset$
1221: and $j(\bnu,\bdel)=i$ ($i\ge1$). Then
1222: $-\nu_i\beta_i+\del_i-\del_{i+1}>0$.
1223: Modify $\del_{i+1}$ by increasing it so as to get equality i.e.,
1224: set $\del_{i+1}'>\del_{i+1}$ so that
1225: $-\nu_i\beta_i+\del_i-\del'_{i+1}=0$.
1226: This modification does not change the value of
1227: $0\vee\mu_i(1-e^{-\nu_i\beta_i+\del_i-\del_{i+1}})$
1228: (but keeps it zero), and it can only decrease (or leave unchanged)
1229: the value of
1230: $0\vee\mu_{i+1}(1-e^{-\nu_{i+1}\beta_{i+1}+\del_{i+1}-\del_{i+2}})$.
1231: Hence by \eqref{eq:114}, the value of $H(\p )$ is only decreased.
1232: At the same time, $j(\bnu,\bdel')>j(\bnu,\bdel)$.
1233: Note that in modifying $\bdel$, \eqref{eq:102} need not hold
1234: for $B$ and $I$.
1235: However, clearly there are other sets, $B'$ and $I'$
1236: with which it holds. For example,
1237: \begin{equation}\label{eq:151}
1238: B'=\{i\in[1,J]:\del'_i<0\},\quad
1239: I'=\{i\in[1,J]:\del'_i\ge0\},\quad
1240: O'=\emptyset.
1241: \end{equation}
1242: Moreover, $1\not\in B'$, since we had
1243: $1\not\in B$ and $\del_1$ was not modified.
1244: By the induction assumption we therefore obtain that $H(\p )\ge0$.
1245: 
1246: \noi {\it Induction base.} We show that for all $(I,B,\bnu,\bdel)$
1247: satisfying \eqref{eq:102}, \eqref{eq:103}, \eqref{eq:105},
1248: such that $P(\bnu,\bdel)\cap I=\emptyset$ and $j(\bnu,\bdel)=J-1$,
1249: one has $H(\p )\ge0$.
1250: We have $-\nu_{J-1}\beta_{J-1}+\del_{J-1}-\del_J>0$.
1251: Similar to before, we set
1252: $\del_J'>\del_J$ so that $-\nu_{J-1}\beta_{J-1}+\del_{J-1}-\del'_J=0$.
1253: We claim that $P(\bnu,\bdel')=\emptyset$. Indeed, since
1254: $P(\bnu,\bdel)=\{J-1\}$, clearly $P(\bnu,\bdel')\subset\{J\}$.
1255: However,
1256: \begin{align*}
1257: -\nu_J\beta_J+\del'_J &=
1258: -\nu_J\beta_J-\nu_{J-1}\beta_{J-1}+\del_{J-1}\\
1259: &\le
1260: 0,
1261: \end{align*}
1262: where we have used the fact that $J-1\in P(\bnu,\bdel)$
1263: implies $J-1\not\in I$, and hence by \eqref{eq:102} $\del_{J-1}\le0$.
1264: This shows that $P(\bnu,\bdel')=\emptyset$.
1265: As in the previous paragraph, because of the modification of $\bdel$,
1266: \eqref{eq:102} need not hold for the $I$ and $B$ we started with,
1267: but there are other sets $I'$ and $B'$ (defined e.g.\ as in \eqref{eq:151})
1268: with which it holds.
1269: The results of Step 1 therefore apply, and therefore $H(\p )\ge0$.
1270: 
1271: This completes the argument by induction and establishes
1272: \eqref{eq:up} for superdifferentials.
1273: 
1274: \noi\uu{\it Verifying the PDE for subdifferentials.}
1275: We are required to show that \eqref{eq:down} holds for
1276: $\p \in D^-V(\x )$, where $\x \in G\setminus\pl_c G$ (and hence $B(\x )=\emptyset$).
1277: Unless $D^-V(\x )$ is empty, the general form of $\p \in D^-V(\x )$, $\x \in G$ is
1278: $$
1279: \p =-b_k+\bdel,
1280: $$
1281: where $k\in A$, and
1282: \begin{equation}\label{eq:115}
1283: \del_i\le0,\ i\in I,\quad
1284: \del_i=0,\ i\not\in I.
1285: \end{equation}
1286: Here we have used the fact that $V$ is the minimum of smooth functions,
1287: and therefore away from the boundary $D^-V(\x )$ can have at most one element,
1288: equal to the gradient of any minimizing function.
1289: It suffices to show that $H(\p )\le0$ whenever $\p \cdot\bgamma_i
1290: =-1_{i=k}\beta_k+\del_i-\del_{i+1}>0$ for all
1291: $i\in I$. 
1292: Using \eqref{eq:114}, \eqref{eq:115} and \eqref{eq:100},
1293: we find
1294: \begin{align*}
1295: H(\p )
1296: &=
1297: c+\la(1-e^{\beta_k-\del_1})+\sum_{i=1}^J0\vee\mu_i(1-e^{-1_{i=k}\beta_k
1298: +\del_i-\del_{i+1}})\\
1299: &=
1300: c+\la(1-e^{\beta_k-\del_1})+\sum_{i\not\in I}\mu_i(1-e^{-1_{i=k}\beta_k
1301: -\del_{i+1}})\\
1302: &\le
1303: c+\la(1-e^{\beta_k})+\sum_{i\not\in I}\mu_i(1-e^{-1_{i=k}\beta_k})\\
1304: &\le
1305: c+\la(1-e^{\beta_k})+\mu_k(1-e^{-\beta_k})\\
1306: &=0.
1307: \end{align*}
1308: \qed
1309: 
1310: \newpage
1311: \bibliographystyle{plain}
1312: \begin{thebibliography}{99}
1313: 
1314: \bibitem{atadup2} R.~Atar and P.~Dupuis,
1315: ``A differential game with constrained dynamics."
1316: {\em Nonlinear Analysis} Vol. 51, No. 7, p. 1105--1130 (2002)
1317: 
1318: \bibitem{ads} R.~Atar, P.~Dupuis and A.~Shwartz,
1319: ``An escape time criterion for queueing networks:
1320: Asymptotic risk-sensitive control via differential games,''
1321: Math. Op. Res., to appear.
1322: 
1323: \bibitem{avr} F.~Avram,
1324: ``On asymptotic optimal control problems for stochastic networks,''
1325: preprint, 2002.
1326: 
1327: \bibitem{box} O. J. Boxma, personal communication.
1328: 
1329: \bibitem{balday2}
1330: J.~Ball, M.~Day, and P.~Kachroo,
1331: ``Robust feedback control for a single server queueing system."
1332: {\em Mathematics of Control, Signals, and Systems \bf 12}, pp.~307--345, 1999.
1333: 
1334: \bibitem{barcap}
1335: M.~Bardi and I.~Capuzzo-Dolcetta,
1336: {\em Optimal control and viscosity solutions
1337: of Hamilton-Jacobi-Bellman equations.}
1338: Birkhauser, Boston, 1997.
1339: 
1340: \bibitem{dup} P.~Dupuis,
1341: {\em Explicit solution to a robust queueing control problem.}
1342: preprint.
1343: 
1344: \bibitem{dupjampet}
1345: P.~Dupuis, M.R.~James and I.R.~Petersen.
1346: ``Robust properties of risk--sensitive control."
1347: {\em Math.\ of Control, Signals and Systems
1348: \bf 13} pp.~318--332, 2000.
1349: 
1350: \bibitem{dupkus}
1351: P.~Dupuis and H.J.~Kushner,
1352: ``Minimizing escape probabilities: a large deviations approach. "
1353: {\em SIAM J.\ Control Optim.\ \bf 27}, pp.~432--445, 1989.
1354: 
1355: \bibitem{ellkal} R.J.~Elliott and N.J.~Kalton,
1356: {\em The existence of value in differential games,}
1357: Memoirs of the American Mathematical
1358: Society No.\ 126. American Mathematical Society,
1359: Providence, R.I., iv+67 pp., 1972.
1360: 
1361: \bibitem{flesou}
1362: W.H.~Fleming and P.E.~Souganidis,
1363: ``PDE-viscosity solution approach to some problems of large deviations."
1364: {\em Ann.\ Scuola Norm.\ Sup.\ Pisa Cl.\ Sci.\ \bf 4}, pp.~171--192, 1986.
1365: 
1366: \bibitem{sw}
1367: A.~Shwartz and A.~Weiss, ``Induced rare events: analysis
1368: via large deviations and time reversal."
1369: {\em Journal of Applied Prob.\ \bf 25}, pp.~667--689, 1993.
1370: 
1371: \bibitem{swbook}
1372: A. Shwartz and A. Weiss.
1373: \newblock {\it Large Deviations for Performance Analysis: Queues,
1374: Communication
1375:   and Computing}.
1376: \newblock Chapman and Hall, New York, 1995.
1377: 
1378: \bibitem{sto}
1379: A.~Stolyar,
1380: {\em Control of end-to-end delay tails in a multiclass network:
1381: LWDF discipline optimality.} Preprint, 2000.
1382: 
1383: \bibitem{storam}
1384: A.~Stolyar and K.~Ramanan,
1385: ``Largest weighted delay first scheduling:
1386: Large deviations and optimality."
1387: {\em Ann.\ Appl.\ Probab.\ \bf 11}, pp.~1--48, 2001.
1388: 
1389: \end{thebibliography}
1390: 
1391: 
1392: \end{document}
1393: 
1394: 
1395: 
1396: