cs0503088/cs0503088
1: \documentclass[twocolumn]{IEEEtran}
2: %\documentclass[onecolumn,draft,journal,twoside,12pt]{IEEEtran}
3: \usepackage{amsmath}
4: \usepackage{latexsym}
5: \usepackage{amssymb}
6: \usepackage{bm}
7: %This version was revised based on Han's comment.
8: \newtheorem{thm}    {Theorem}%[section]
9: \newtheorem{lem}     {Lemma}%[section]
10: \newtheorem{corollary}  {Corollary}%[section]
11: \newtheorem{proposition}        {Proposition}%[section]
12: \newtheorem{rem}     {Remark}%[section]
13: \newtheorem{define}     {Definition}%[section]
14: \newtheorem{example}  {Example}%[section]
15: \def\argmax{\mathop{\rm argmax}}
16: \def\complex{\mathbb{C}}
17: \newcommand{\defeq}{\stackrel{\rm def}{=}}
18: \newcommand{\bR}{\mathbb{R}}
19: \newcommand{\bC}{\mathbb{C}}
20: \newcommand{\bN}{\mathbb{N}}
21: \newcommand{\cH}{{\cal H}}
22: \newcommand{\cS}{{\cal S}}
23: \def\cY{{\cal Y}}
24: \def\cZ{{\cal Z}}
25: \def\cN{{\cal N}}
26: \def\cM{{\cal M}}
27: \def\cD{{\cal D}}
28: \def\cU{{\cal U}}
29: \def\rE{{\rm E}}
30: \def\rP{{\rm P}}
31: \newcommand{\cC}{\mathfrak{C}}
32: %\newcommand{\cC}{{\cal C}}
33: \newcommand{\cP}{{\cal P}}
34: \newcommand{\cPn}{{\cal P}^{(n)}}
35: \newcommand{\cX}{{\cal X}}
36: \newcommand{\cXn}{{\cal X}^{(n)}}
37: \newcommand{\cXvec}{\vec{\cX}}
38: \newcommand{\cXnhat}{\hat{\cX}^{(n)}}
39: \newcommand{\cXvechat}{\vec{\hat{\cX}}}
40: \newcommand{\Tr}{{\rm Tr}\,}
41: \newcommand{\cHn}{{\cal H}^{(n)}}
42: \newcommand{\cHvec}{\vec{\cH}}
43: \newcommand{\rhon}{\rho^{(n)}}
44: \newcommand{\sigman}{\sigma^{(n)}}
45: \newcommand{\rhovec}{\vec{\bm{\rho}}}
46: \newcommand{\sigmavec}{\vec{\bm{\sigma}}}
47: \newcommand{\Phin}{\Phi^{(n)}}
48: \newcommand{\Phivec}{\vec{\bm{\Phi}}}
49: \newcommand{\cCvec}{\vec{\cC}}
50: \newcommand{\cPvec}{\vec{\cP}}
51: \newcommand{\cSvec}{\vec{\cS}}
52: \newcommand{\Pn}{P^{(n)}}
53: \newcommand{\Pnhat}{\hat{P}^{(n)}}
54: \newcommand{\Pvec}{\vec{\bm{P}}}
55: \newcommand{\bW}{{\bf W}}
56: \newcommand{\bQ}{{\bf Q}}
57: \newcommand{\bX}{{\bf X}}
58: \newcommand{\bY}{{\bf Y}}
59: \newcommand{\by}{{\bf y}}
60: \newcommand{\bp}{{\bf p}}
61: \newcommand{\Wn}{W^{(n)}}
62: \newcommand{\Xn}{X^{(n)}}
63: \newcommand{\Yn}{Y^{(n)}}
64: \newcommand{\cn}{c^{(n)}}
65: \newcommand{\cvec}{\vec{\bm{c}}}
66: \newcommand{\Kn}{K_n}
67: \newcommand{\cQ}{{\cal Q}}
68: \newcommand{\cR}{{\cal R}}
69: \newcommand{\cF}{{\cal F}}
70: \newcommand{\cFn}{{\cal F}_n}
71: \newcommand{\cFvec}{\vec{\cal F}}
72: \newcommand{\fn}{f_n}
73: \newcommand{\fvec}{\vec{\bm{f}}}
74: 
75: \newcommand{\rhonarg}[1]{\rho^{(n)}_{#1}}
76: \newcommand{\Xnarg}[1]{X^{(n)}_{#1}}
77: 
78: 
79: \newcommand{\Pe}{{\rm P_e}}
80: 
81: \makeatletter
82: \newcommand{\lleq}{\mathrel{\mathpalette\gl@align<}}
83: \newcommand{\ggeq}{\mathrel{\mathpalette\gl@align>}}
84: \newcommand{\gl@align}[2]{%\lower.1ex
85: \vbox{\baselineskip\z@skip\lineskip\z@
86: \ialign{$\m@th#1\hfil##\hfil$\crcr#2\crcr{}_{{}_{(=)}}\crcr}}}
87: \makeatother
88: 
89: \newcommand{\supD}{\overline{D}}
90: \newcommand{\infD}{\underline{D}}
91: \newcommand{\supJ}{\overline{J}}
92: \newcommand{\infJ}{\underline{J}}
93: \newcommand{\supI}{\overline{I}}
94: \newcommand{\infI}{\underline{I}}
95: \newcommand{\infH}{\underline{H}}
96: \newcommand{\supH}{\overline{H}}
97: 
98: \newcommand{\cHtensor}{{\cal H}^{\otimes n}}
99: \newcommand{\rhotensor}{\rho^{\otimes n}}
100: \newcommand{\sigmatensor}{\sigma^{\otimes n}}
101: 
102: \newcommand{\rhotvec}{\rhovec}
103: \newcommand{\sigmatvec}{\sigmavec}
104: 
105: %\newcommand{\Ptn}{P^{\times n}}
106: \newcommand{\Ptn}{\Pn}
107: \newcommand{\cXtn}{{\cX}^n}
108: %\newcommand{\Ptvec}{\overrightarrow{P^{\times}}}
109: \newcommand{\Ptvec}{\Pvec}
110: \newcommand{\Ptnhat}{\hat{P}^{\times n}}
111: 
112: %double space
113: %\renewcommand{\baselinestretch}{1.66}
114: \def\Label#1{\label{#1}\ [\ #1\ ]\ }
115: \def\Label{\label}
116: 
117: \newcommand{\spec}[1]{\left\{#1\right\}}
118: 
119: \newcommand{\ch}{W}
120: \newcommand{\chn}{W^{(n)}}
121: \newcommand{\chnhat}{\hat{W}^{(n)}}
122: \newcommand{\chvec}{\vec{\bm{W}}}
123: \newcommand{\charg}[1]{W_{#1}}
124: \newcommand{\chnarg}[1]{W^{(n)}_{#1}}
125: \newcommand{\chvecarg}[1]{\vec{\bm{W}}_{#1}}
126: \newcommand{\code}{\Phi}
127: \newcommand{\coden}{\Phi^{(n)}}
128: \newcommand{\codevarn}{\widetilde{\Phi}^{(n)}}
129: \newcommand{\codevec}{\vec{\bm{\Phi}}}
130: \newcommand{\dec}{Y}
131: \newcommand{\decn}{Y^{(n)}}
132: \newcommand{\decarg}[1]{Y_{#1}}
133: \newcommand{\decnarg}[1]{Y^{(n)}_{#1}}
134: \newcommand{\decvar}{\widetilde{Y}}
135: \newcommand{\decvarn}{\widetilde{Y}^{(n)}}
136: \newcommand{\decvararg}[1]{\widetilde{Y}_{#1}}
137: \newcommand{\decvarnarg}[1]{\widetilde{Y}^{(n)}_{#1}}
138: \newcommand{\enc}{\varphi}
139: \newcommand{\encn}{\varphi^{(n)}}
140: \newcommand{\encarg}[1]{\varphi(#1)}
141: \newcommand{\encnarg}[1]{\varphi^{(n)}(#1)}
142: \newcommand{\encvec}{\vec{\bm{\varphi}}}
143: \newcommand{\xn}{x^n}
144: \newcommand{\xvec}{\vec{\bm{x}}}
145: \newcommand{\cost}{c}
146: \newcommand{\costn}{c^{(n)}}
147: \newcommand{\costvec}{\vec{\bm{c}}}
148: 
149: \newcommand{\Pnrc}{P^{(n)}_{\rm rc}}
150: \newcommand{\Enrc}{E^{(n)}_{\rm rc}}
151: \newcommand{\En}{E^{(n)}}
152: 
153: \newcommand{\restrict}[1]{\!\!\restriction_{#1}}
154: 
155: %\date{\today}
156: \begin{document}
157: \title{General non-asymptotic and asymptotic 
158: formulas \\in channel resolvability and identification capacity\\
159: and their application to wire-tap channel}
160: 
161: \author{
162: Masahito Hayashi
163: \thanks{
164: M. Hayashi is with Quantum Computation and Information Project, ERATO, JST,
165: 5-28-3, Hongo, Bunkyo-ku, Tokyo, 113-0033, Japan.
166: (e-mail: masahito@qci.jst.go.jp)
167: The material in this paper was presented in part
168: at 2004 International Symposium on Information Theory and 
169: its Applications, Parma, Italy, October 2004.}}
170: \date{}
171: \maketitle
172: \begin{abstract}
173: Several non-asymptotic formulas 
174: are established in channel resolvability and 
175: identification capacity,
176: and they are applied to wire-tap channel.
177: By using these formulas, 
178: the $\epsilon$ capacities of
179: the above three problems are
180: considered in the 
181: most general setting, where 
182: no structural assumptions 
183: such as the stationary memoryless property are made on 
184: a channel.  
185: As a result, we solve
186: an open problem proposed in Han \& Verd\'{u}\cite{Han-V} and
187: Han \cite{Han-book}. 
188: Moreover, 
189: we obtain lower bounds of the exponents of 
190: error probability and the wire-tapper's information in wire-tap channel.
191: \end{abstract}
192: \begin{keywords}
193: identification code,
194: channel resolvability,
195: information spectrum,
196: wire-tap channel,
197: non-asymptotic setting
198: \end{keywords}
199: \section{Introduction}
200: \PARstart{I}{n} 1989,
201: Ahlswede \& Dueck \cite{Ah-D} proposed the identification 
202: code as a new framework for communication system using noisy channels.
203: However, 
204: the upper bound of the rate of the reliable identification 
205: codes was not solved in their paper.
206: In 1993, for analysis of the converse part of this problem,
207: Han \& Verd\'{u}\cite{Han-V} proposed the channel resolvability problem, 
208: in which 
209: we approximate the output distribution to a desired output distribution
210: by using a uniform input distribution with smaller support.
211: In particular, 
212: the capacity of this problem is defined as the rate of 
213: the maximal number of the size of support for 
214: every desired output distribution.
215: In order to discuss the channel resolvability problem,
216: they introduced the concepts of `general sequence of channels' and 
217: the `information spectrum method'.
218: They gave the relation between 
219: identification code and channel resolvability,
220: and succeeded in proving the converse part of
221: the capacity of identification code for the discrete memoryless channel.
222: In this method it is essential that the performances of 
223: several problems be characterized by using 
224: the probability distribution of 
225: the random variable with a form of `likelihood' function in this method. 
226: This insight is very useful for obtaining the overview of 
227: information theory\cite{Han-book}.
228: In particular, it gives a useful insight into quantum information theory
229: \cite{ON1,Nag-Hay,Hay-Nag}.
230: Therefore, Han \& Verd\'{u}'s paper\cite{Han-V} is undoubtably the landmark of 
231: information spectrum.
232: 
233: However, while Han \& Verd\'{u}'s paper gives the capacity of 
234: channel resolvability for general sequence of channels\cite{Han-V},
235: their proof of the converse part contains mistakes as is
236: recognized in section 6.3. of Han\cite{Han-book}.
237: They proved the achievability of
238: channel resolvability with the asymptotic zero error setting
239: for a general sequence of channels.
240: Concerning the converse part,
241: their proof is valid for the asymptotic $\epsilon$ error setting
242: when the general sequence of channels
243: has a strong converse property.
244: However, their proof is not valid in the general channel even in
245: the asymptotic zero error setting.
246: 
247: In this paper, we give several useful non-asymptotic formulas 
248: for identification code and channel resolvability,
249: which are divided into two parts.
250: One is the direct part of the identification code.
251: The existence of a good identification code is proved in Theorem \ref{t-1}.
252: This construction is much improved from Ahlswede \& Dueck's construction.
253: The other is the direct part of channel resolvability.
254: The existence of a good approximation regarding the output statistics
255: is proved in the two criteria, variational distance and
256: K-L divergence as in Theorem \ref{t-2}.
257: In this discussion, we derived upper bounds of 
258: the average of the variational distance and K-L divergence
259: between the output distribution of a given distribution $p$ 
260: and the output distribution of 
261: the input uniform distribution on $M$ elements of the input signal space,
262: when the $M$ elements
263: are randomly chosen with the distribution $p$ (Lemma \ref{lem-1-11}).
264: Combining Han \& Verd\'{u}'s relation between identification code and 
265: channel resolvability,
266: we derived 
267: the capacity of the channel resolvability for general sequence of channels
268: with the asymptotic zero error setting, 
269: which was conjectured by Han \& Verd\'{u}\cite{Han-V} 
270: ((\ref{1-13-1}) and (\ref{1-13-2}) of Theorem \ref{t-3}).
271: This discussion is valid even though 
272: the strong converse property does not hold.
273: 
274: As another application, we give an upper bound of the capacity of the 
275: channel resolvability for a general sequence of channels
276: with the asymptotic $\epsilon$ error.
277: As a byproduct, we show that
278: there exists a sequence of codes whose second error probability goes to $0$
279: in any general sequence of channels,
280: and only the first error probability is asymptotically related to 
281: the probability distribution of 
282: the random variable with the form of `likelihood' 
283: ((\ref{3-3-1}) and (\ref{3-3-2}) of Theorem \ref{t-3}).
284: We also derived
285: several lower bounds of exponent of channel resolvability in 
286: the stationary memoryless setting
287: with respective error criteria (Theorem \ref{t-5}).
288: 
289: Moreover, we apply our non-asymptotic formulas for channel resolvability to 
290: wire-tap channel,
291: in which there are two receivers {\it i.e.},
292: the eavesdropper and the normal receiver.
293: Wyner\cite{Wyner} introduced this wire-tap channel,
294: and proved that its capacity is greater then 
295: the difference between 
296: the normal receiver's information 
297: and the eavesdropper's information.
298: Csisz\'{a}r \& Narayan \cite{CN}
299: showed that
300: the capacity does not depend on the following two conditions 
301: for eavesdropper's information:
302: i) The eavesdropper's information must be less than $n \epsilon$ 
303: for given $ \epsilon \,> 0$, where $n$ is the number of
304: transmissions.
305: ii) The eavesdropper's information must go to $0$ exponentially.
306: However, 
307: there are no results giving an explicit lower 
308: bound of the optimal exponents of wire-tapper's information.
309: 
310: Indeed, this problem is closely related to the channel resolvability 
311: as follows.
312: In Wyner's proof \cite{Wyner}, 
313: in the asymptotic i.i.d. setting with a large enough number $M$,
314: he essentially showed that
315: when $M$ elements of the input signal space
316: are randomly chosen with a given distribution $p$,
317: the output distribution of the distribution $p$ 
318: can be approximated with a high probability by the output distribution of 
319: the input uniform distribution on the above 
320: $M$ elements of the input signal space.
321: This idea is also applied in 
322: Devetak\cite{Deve} and Winter, Nascimento \& Imai \cite{WNI}.
323: Using the same idea in the non-asymptotic setting, 
324: we can apply our formulas of channel resolvability 
325: to wire-tap channel, and
326: derive a good non-asymptotic formula for 
327: wire-tap channel (Theorem \ref{3-6}).
328: As consequences we obtain 
329: the capacity of general sequence of wire-tap channel (Theorem \ref{t-1-17}),
330: and lower bounds of the exponents 
331: of error probability and the wire-tapper's information in 
332: the stationary memoryless setting (Theorem \ref{t-7}).
333: We can expect that these results will be applied to evaluations of 
334: the security of channels.
335: 
336: Finally, we should remark that our non-asymptotic resolvability formula 
337: regarding 
338: variational distance can be regarded as 
339: essentially the same results as 
340: Oohama\cite{Oohama2}'s formula, where
341: he treated the partial resolvability.
342: Furthermore, he also derived a lower bound of exponent of 
343: channel resolvability by type method\cite{Oohama}.
344: %We compare compare our exponents with his exponents.
345: \section{Identification code in non-asymptotic setting}
346: Let $W: x \mapsto W_x$ be an arbitrary channel with the input alphabet
347: $\cX$ and the output alphabet $\cY$.
348: The identification channel code for the channel $W$
349: is defined in the following way.
350: First, let $\cN =\{ 1, \ldots, N\}$ be a set of
351: messages to be transmitted, and
352: denote by $\cP(\cX)$ the set of all probability distribution
353: over $\cX$. A transmitter prepares $N$ probability
354: distributions $Q_1, \ldots, Q_N \in \cP(\cX)$.
355: If the transmitter wants to send a message $i \in \cN$,
356: an encoder generates an input sequence $x_i \in \cX$
357: randomly subject to the probability 
358: distribution $Q_i$.
359: In this case, the output signal $y$ obeys the distribution
360: $W_{Q_i}$, where
361: the output distribution $W_p$ of a given input distribution
362: $p$ is defined as
363: \begin{align*}
364: W_p(y)\defeq \sum_{x} p(x) W_x(y).
365: \end{align*}
366: On the other hand, at the decoder side an $N$-tuple of decoders
367: is prepared.
368: For every $i=1, \ldots, N$, the $i$-th decoder judges that
369: $i \in \cN$ is transmitted if a channel output $y$ belongs to 
370: $\cD_i$, where
371: $\{ \cD_1, \ldots, \cD_N\}$ are $N$ subsets of $\cY$ in advance.
372: The $i$-th decoder judges that a message different from $i \in \cN$
373: if $y \notin \cD_i$.
374: Here, $\cD_i$ is called the {\it decoding region},
375: of the message $i$.
376: It is not required that $\cD_1, \ldots, \cD_N$ be disjoint.
377: In the identification coding problem, the $i$-th decoder 
378: is only interested in transmission of the corresponding 
379: message $i$.
380: Thus, we call the tuple of 
381: $\Phi \defeq (N,\{ Q_1, \ldots Q_N \},\{ \cD_1, \ldots, \cD_N\})$
382: an identification code of channel $W$.
383: The performance of this code can be characterized by the following three 
384: quantities.
385: One is the size $N$ of the message sent and is denoted by $|\Phi|$, and 
386: the others are the maximum values of the two-type error probabilities
387: given as:
388: \begin{align*}
389: \mu (\Phi) \defeq \max_i  W_{Q_i} (\cD_i^c) , \quad
390: \lambda (\Phi) \defeq \max_{i\neq j} W_{Q_j} (\cD_i) ,
391: \end{align*}
392: where $\cD_i^c$ is the complement set of $\cD_i$.
393: Concerning this problem, as discussed in the following theorem,
394: the `likelihood' function $\frac{W_x}{W_p}(y)
395: \defeq \frac{W_x(y)}{W_p(y)}$ suitablely characterizes
396: the performance of good identification codes.
397: \begin{thm}\Label{t-1}
398: Assume that real numbers
399: $\alpha, \alpha',\beta,\beta',\tau, \kappa \,> 0$ 
400: satisfy 
401: \begin{align}
402: &\kappa \log (\frac{1}{\tau}- 1)  \,> \log 2 +1, ~
403: 1/3 \,> \tau\,> 0,~1 \,> \kappa \,> 0,
404: \Label{3-3-5}\\
405: &1  \,> \frac{1}{\alpha} + \frac{1}{\alpha'} ,~
406: \gamma  \defeq 1 - \frac{1}{\beta}- \frac{1}{\beta'}\,> 0.
407: \Label{3-3-4}
408: \end{align}
409: Then, 
410: for any integer $M \,> 0$, any real number $C \,>0$,
411: any channel $W$,
412: and any probability distribution
413: $p \in \cP(\cX)$, 
414: there exists an identification code $\Phi$ such that
415: \begin{align*}
416: \mu(\Phi) &\le \alpha \beta \rE_{p,x}
417: W_x \left\{ y \left| \frac{W_x}{W_p}(y) \le C\right.\right\} \\
418: \lambda(\Phi) & \le \kappa + \alpha'\beta'\frac{1}{C}
419: \left\lceil \frac{M}{\gamma}\right\rceil,\quad
420: |\Phi| = 
421: \left\lfloor\frac{e^{\tau M}}{Me}\right\rfloor
422: \end{align*}
423: if
424: \begin{align}
425: \beta \rE_{p,x}
426: W_x \left\{ y \left| \frac{W_x}{W_p}(y) \le C\right.\right\}
427: +
428: \alpha'\beta'\frac{1}{C}
429: \left\lceil \frac{M}{\gamma}\right\rceil
430: < 1,\label{11-23-7-q}
431: \end{align}
432: where $\rE_{p,x}$ denotes the expectation
433: concerning random variable $x$ obeying the probability distribution $p$.
434: \end{thm}
435: In the following, we omit $x$ or $p$ in the notation $\rE_{p,x}$,
436: and abbreviate the set $\left\{ y \left| \frac{W_x}{W_p}(y) \le C\right.
437: \right\}$
438: as $\left\{ \frac{W_x}{W_p}(y) \le C\right\}$.
439: we also denote the probability
440: that the random variable $X$ belongs to
441: the set $\cD$, by $\rP_X (\cD)$ or $\rP_X \cD$.
442: If we do not need to take note of the random variable $X$,
443: we simplify it to $\rP (\cD)$ or $\rP \cD$.
444: This theorem is proven by using the following lemma.
445: 
446: \begin{lem}\Label{A-D}
447: (Ahlswede and Dueck\cite{Ah-D})
448: Let $\cM$ be an arbitrary finite set of the size $M=|\cM|$.
449: Choose constants $\tau$ and $\kappa$ satisfying the condition (\ref{3-3-5}).
450: Then there exist $N (\defeq 
451: \lfloor\frac{e^{\tau M}}{Me}\rfloor)$ subsets 
452: $A_1 , \ldots , A_N \subset \cM$
453: satisfying 
454: \begin{align}
455: |A_i|= \lfloor \tau M \rfloor ,\quad
456: |A_i \cap A_j| \,< \kappa \lfloor \tau M \rfloor (i \neq j).
457: \Label{3-3-7}
458: \end{align}
459: \end{lem}
460: 
461: \noindent
462: \quad{\it Proof of Theorem \ref{t-1}:}
463: In this proof, the subset 
464: $\cU_x \defeq \left\{  \frac{W_x}{W_p}(y) > C 
465: \right\}$ plays an important role.
466: First, we assume the existence of 
467: $M$ distinct elements $x_1, \ldots, x_M$ of $\cX$ satisfying
468: \begin{align}
469: W_{x_i} (\cU_{x_i}^c) &\le \alpha \beta \rE_p
470: W_x \left\{  \frac{W_x}{W_p}(y) \le C \right\} ,\Label{3-3-8}\\
471: W_{x_i} \left(\bigcup_{j\neq i} \cU_{x_j}\right) &\le 
472: \alpha'\beta'\frac{1}{C}
473: \left\lceil \frac{M}{\gamma}\right\rceil .\Label{3-3-9}
474: \end{align}
475: From Lemma \ref{A-D},
476: we can choose 
477: $N \defeq 
478: \lfloor\frac{e^{\tau M}}{Me}\rfloor$ subsets 
479: $A_i , \ldots, A_N$ of the set
480: $\{x_1, \ldots, x_M\}$ satisfying 
481: (\ref{3-3-7}).
482: Let $Q_i$ be 
483: the uniform distribution on the subset $A_i$ whose cardinality is
484: $\lfloor \tau M \rfloor $, that is,
485: $Q_i$ is defined as
486: \begin{align}
487: Q_i(x)\defeq \frac{1}{|A_i|} \sum_{x' \in A_i}
488: 1_{x'}(x),
489: \end{align}
490: where $1_{x'}=1_{x'}(x)$ is an indicator function
491: taking value 1 if $x=x'$ and $0$ otherwise.
492: Defining the subset $\cD_i$ as $\cD_i\defeq \cup_{x \in A_i} \cU_{x}$,
493: we evaluate
494: \begin{align*}
495: & W_{Q_i}(\cD_i) =
496: \sum_{x \in A_i}\frac{1}{|A_i|}
497: W_{x} (\cD_i)
498: \ge
499: \sum_{x \in A_i}\frac{1}{|A_i|}
500: W_{x} (\cU_x) \\
501: \ge & 1- \alpha \beta \rE_p
502: W_x \left\{  \frac{W_x}{W_p}(y) \le C\right\},\\
503: & W_{Q_i}(\cD_j)
504: = \sum_{x \in A_i}\frac{1}{|A_i|}
505: W_{x} (\cD_j) \\
506: = &
507: \sum_{x \in A_i \cap A_j }\frac{1}{|A_i|}
508: W_{x} (\cD_j)
509: +
510: \sum_{x \in A_i \cap A_j ^c }\frac{1}{|A_i|}
511: W_{x} (\cD_j)\\
512: \le &
513: \frac{|A_i \cap A_j |}{|A_i|}
514: +
515: \sum_{x \in A_i \cap A_j ^c }\frac{1}{|A_i|}
516: W_{x} \left(\bigcup_{x'\neq x} \cU_{x'}\right)\\
517: \le &
518: \kappa
519: +
520: \alpha'\beta'\frac{1}{C}
521: \lceil \frac{M}{\gamma}\rceil.
522: \end{align*}
523: Therefore, we obtain the desired argument.
524: 
525: Next, we prove the existence of $M$ elements and 
526: $M$ subsets satisfying (\ref{3-3-8}) and (\ref{3-3-9})
527: by a random coding method.
528: Let $M'$ be $\lceil \frac{M}{\gamma}\rceil$,
529: and $X=(X_1, \ldots, X_{M'})$ be $M$ independent and 
530: identical random variables 
531: subject to the probability distribution
532: $p \in\cP(\cX)$,
533: %The expectations about this probability can be calculated by using 
534: %$\cU_x \defeq \left\{  \frac{W_x}{W_p}(y) \le C \right\}$ as follows.
535: then we have
536: \begin{align*}
537: W_p(\cU_x) \le \frac{1}{C} W_x(\cU_x) \le \frac{1}{C}.
538: \end{align*}
539: Using this inequality, we obtain
540: \begin{align*}
541: & \rE_{X}
542: \frac{1}{M'}
543: \sum_{i=1}^{M'}
544: W_{X_i}
545: \left(\bigcup_{j \neq i} \cU_{X_j}\right)
546: \le 
547: \rE_{X}
548: \sum_{j=1}^{M'}
549: \frac{1}{M'}
550: \sum_{i\neq j}
551: W_{X_i}(\cU_{X_j}) \\
552: &=
553: \sum_{j=1}^{M'}
554: \rE_{X_j}
555: \frac{M'-1}{M'}
556: W_p(\cU_{X_j})
557: \le
558: \sum_{j=1}^{M'}
559: \rE_{X_j}
560: \frac{M'-1}{M'C}
561: \le \frac{M'-1}{C}.
562: \end{align*}
563: Further,
564: \begin{align*}
565: &\rE_{X}\frac{1}{M'}\sum_{i=1}^{M'}
566: W_{X_i}(\cU_{X_i}^c)
567: =
568: \sum_{i=1}^{M'}
569: \rE_{X_i}W_{X_i}\frac{(\cU_{X_i}^c)}{M'}
570: = \rE_p W_x(\cU_x^c) .
571: \end{align*}
572: Using the Markov inequality
573: $\rP_X \{ X  \,> \alpha \rE X\}\,< \frac{1}{\alpha}$,
574: {\em i.e.}, 
575: $\rP_X \{ X  \le \alpha \rE X\}\,> 1-  \frac{1}{\alpha}$,
576: we can show that
577: \begin{align*}
578: \rP_X
579: \left\{
580: \frac{1}{M'}
581: \sum_{i=1}^{M'}
582: W_{X_i}
583: \left(\bigcup_{j \neq i} \cU_{X_j}\right)
584: \le
585: \alpha' \frac{M'-1}{C}
586: \right\}
587: & \,>
588: 1- \frac{1}{\alpha'} \\
589: \rP_X
590: \left\{
591: \frac{1}{M'}\sum_{i=1}^{M'}
592: W_{X_i}(\cU_{X_i}^c)
593: \le
594: \alpha \rE_p W_x(\cU_x^c) 
595: \right\}
596: & \,>
597: 1- \frac{1}{\alpha}.
598: \end{align*}
599: Since
600: $(1- \frac{1}{\alpha'})+(1- \frac{1}{\alpha})\,>1$,
601: there exist $M$ elements
602: $x_1, \ldots, x_{M'}$ such that
603: \begin{align*}
604: \frac{1}{M'}
605: \sum_{i=1}^{M'}
606: W_{x_i}
607: \left(\bigcup_{j \neq i} \cU_{x_j}\right)
608: & \le
609: \alpha' \frac{M'-1}{C} \\
610: \frac{1}{M'}\sum_{i=1}^{M'}
611: W_{x_i}(\cU_{x_i}^c)
612: & \le
613: \alpha \rE_p W_c(\cU_x^c) .
614: \end{align*}
615: In the following, 
616: the above $M$ elements $x_1, \ldots, x_{M'}$ are fixed,
617: and we only focus on 
618: the random variable $i$ subject
619: to the uniform distribution on the set $\{1, \ldots, M' \}$.
620: Combining Markov inequality and the preceding inequalities,
621: we have
622: \begin{align*}
623: \rP_i \left\{
624: W_{x_i}
625: \left(\bigcup_{j \neq i} \cU_{x_j}\right)
626: \le \beta' \alpha' \frac{M'-1}{C} 
627: \right\}
628: & \,> 1- \frac{1}{\beta'} \\
629: \rP_i \left\{
630: W_{x_i}(\cU_{x_i}^c)
631: \le
632: \beta \alpha \rE_p W_x(\cU_x^c)\right\}
633: & \,> 1- \frac{1}{\beta} .
634: \end{align*}
635: Hence, we obtain
636: \begin{align*}
637: & \rP_i \left\{
638: \begin{array}{c}
639: W_{x_i}
640: \left(\bigcup_{j \neq i} \cU_{x_j}\right)
641: \le \beta' \alpha' \frac{M'-1}{C} ,\\
642: W_{x_i}(\cU_{x_i}^c)
643: \le
644: \beta \alpha \rE_p W_x(\cU_x^c)
645: \end{array}
646: \right\} \\
647: \,> &(1- \frac{1}{\beta} )+
648: (1- \frac{1}{\beta'})-1= \gamma,
649: \end{align*}
650: which yields
651: \begin{align*}
652: \left| \left\{
653: i\left|
654: \begin{array}{c}
655: W_{x_i}
656: \left(\bigcup_{j \neq i} \cU_{x_j}\right)
657: \le \beta' \alpha' \frac{M'-1}{C} ,\\
658: W_{x_i}(\cU_{x_i}^c)
659: \le
660: \beta \alpha \rE_p W_x(\cU_x^c)
661: \end{array}
662: \right.\right\} \right|
663: \,>  \lfloor \gamma M'\rfloor.
664: \end{align*}
665: Since
666: $\lfloor \gamma M'\rfloor
667: = \lfloor\gamma 
668: \lceil \frac{M}{\gamma} \rceil \rfloor\ge M$,
669: there exist $M$
670: elements of $\cX$ satisfying (\ref{3-3-8}) and (\ref{3-3-9}).
671: Here, one may think that these $M$ elements 
672: may not be distinct.
673: However, if $x_i= x_{i'} (i \neq i')$,
674: the relation $W_{x_i}(\cU_{x_i}^c)
675: + 
676: W_{x_i} \left(\bigcup_{j\neq i} \cU_{x_j}\right) \ge 1$
677: holds.
678: From condition (\ref{11-23-7-q}),
679: this contradicts 
680: (\ref{3-3-8}) and (\ref{3-3-9}).
681: Hence, we obtain the desired bound.
682: \endproof
683: 
684: \section{Channel resolvability in non-asymptotic setting}
685: In the channel resolvability, 
686: we choose 
687: $M$ elements $x_1, \ldots, x_M$ in the input set $\cX$ 
688: for every probability distribution $p \in \cP(\cX)$,
689: such that 
690: the output distribution of 
691: the input distribution 
692: \begin{align*}
693: \sum_{i=1}^M \frac{1}{M} 1_{x_i}
694: \end{align*}
695: close enough to 
696: the output distribution of 
697: $p$ through the channel $W$.
698: In particular, 
699: we call the distribution 
700: with the preceding form
701: an $M$-type.
702: In this setting, 
703: our purpose is to disenable
704: the receiver of the given channel $W$
705: to distinguish whether
706: the sender generates the input signal based on 
707: `the given distribution $p$'
708: or `the $M$-type $\sum_{i=1}^M \frac{1}{M} 1_{x_i}$ 
709: with a smaller number $M$'.
710: This kind of indistinguishability  
711: can not be applied to any realistic model, directly,
712: but it can be technically related to wire-tap channel.
713: In particular, 
714: we prove Lemma \ref{lem-1-11} in this section as
715: the technically essential part, but
716: this lemma is also the technically essential part
717: for the direct part of wire-tap channel.
718: %This problem does not seem to be useful,
719: %but it can be applied to the treatment of 
720: %the impossibility of the identification code as
721: %was pointed by Han-Verd\'u \cite{}.
722: %Moreover, this 
723: 
724: In the following, we call
725: the pair of the integer $M$ and
726: the $M$ elements $x_1, \ldots, x_M$ of $\cX$,
727: a resolvability code $\Psi$ with the size $|\Psi|\defeq M$.
728: The performance of a resolvability code $\Psi$
729: is characterized by its size $|\Psi|$ and
730: the variational distance
731: \begin{align*}
732: \epsilon (\Psi,W_p)
733: \defeq d\left( 
734: \sum_{i=1}^M \frac{1}{M} W_{x_i}, W_p\right),
735: \end{align*}
736: where
737: the variational distance $d(p,q)$
738: defined by
739: \begin{align*}
740: d(p,q)= \sum_y |p(y)-q(y)|,
741: \end{align*}
742: which equals the $l_1$ norm $\|p-q\|_1$.
743: Another characterization of its performance is given by 
744: K-L divergence
745: \begin{align}
746: D(\Psi,W_p )\defeq D(\sum_{i=1}^M \frac{1}{M} W_{x_i}\| W_p),
747: \Label{3-5-1}
748: \end{align}
749: where
750: $D(p\|q)\defeq \sum_y p(y)\log \frac{p(y)}{q(y)}$.
751: \begin{thm}\Label{t-2}
752: For any integer $M \,> 0$, any real number $C \,> 0$ and
753: any probability distribution $p \in \cP(\cX)$,
754: there exists a resolvability code $\Psi$ such that
755: $|\Psi|= M$ and 
756: \begin{align}
757: \epsilon (\Psi, W_p) &\le 2 \delta_{p,W,C}
758: + \sqrt{\frac{\delta_{p,W,C}'}{M}} ,
759: \Label{3-3-10}\\
760: \delta_{p,W,C}' &\le C , \nonumber
761: \end{align}
762: where $\delta_{p,W,C}
763: \defeq \rE_p W_x \left\{ \frac{W_x}{W_p}(y) \,> C\right\}$,
764: and $\delta_{p,W,C}'\defeq 
765: \rE_p \frac{W_x^2}{W_p} 
766: \left\{ \frac{W_x}{W_p}(y) \le C\right\}$.
767: If the cardinality $|\cY|$ is finite,
768: for any $0\,> t \ge -1/2$, 
769: there exists a resolvability code $\Psi'$ such that
770: $|\Psi'|=M$ and either of 
771: \begin{align}
772: D(\Psi',W_p) \le &
773: \frac{\log (1+M^t e^{\phi(t|W,p)})}{-t},\Label{6-26-1}\\
774: D(\Psi',W_p) \le & \eta(\delta_{p,W,C})+  \delta_{p,W,C}\log |\cY| + 
775: \frac{\delta_{p,W,C}'}{M}\Label{7-1-3}
776: \end{align}
777: holds, where 
778: $\eta(x)\defeq -x\log x$
779: and $\phi(t|W,p)\defeq \log \sum_y 
780: (\rE_p W_x^{1/(1+t)}(y))^{1+t}$.
781: \end{thm}
782: \begin{rem}
783: The partial resolvability version of inequality (\ref{3-3-10})
784: has been obtained by Oohama\cite{Oohama2}.
785: Inequality (\ref{3-3-10}) can be regarded as 
786: the essentially same result as Oohama's inequality.
787: \end{rem}
788: \begin{proof}
789: In the following,
790: the indicator functions 
791: $I_x$ and $I_x^c$ 
792: on the sets $\cU_x
793: =\left\{  \frac{W_x}{W_p}(y) > C \right\}$
794: and their compliment sets $\cU_x^c$
795: play important roles.
796: In our proof of Theorem \ref{t-2}, 
797: we use the random coding method, {\it i.e.},
798: we consider the $M$ independent and identical random variables 
799: $X=(X_1, \ldots, X_M)$
800: subject to $p$. 
801: Using the notations:
802: \begin{align*}
803: W_x^{\alpha}(y)&\defeq W_x(y)I_x^c(y) ,\quad
804: W_x^{\beta}(y)\defeq W_x(y)I_x(y) ,\\
805: W_p^{\alpha}(y)&\defeq \rE_p W_x^{\alpha}(y) ,\quad
806: W_p^{\beta}(y)\defeq \rE_p W_x^{\beta}(y) ,\\
807: W_X^{\alpha}(y)&\defeq \frac{1}{M} \sum_{i=1}^M W_{X_i}^{\alpha}(y), \quad
808: W_X^{\beta}(y)\defeq \frac{1}{M} \sum_{i=1}^M  W_{X_i}^{\beta}(y), \\
809: W_X^{M}(y)&\defeq W_X^{\alpha}(y)+ W_X^{\beta}(y)
810: = \frac{1}{M} \sum_{i=1}^M W_{X_i}(y),
811: \end{align*}
812: we have the following lemma.
813: \begin{lem}\Label{lem-1-11}
814: The $M$ random variables 
815: $X=(X_1, \ldots, X_M)$ satisfy the following inequality
816: \begin{align}
817: \rE_X
818: \left\| W_X^{M} - W_p \right\|_1 
819: \le & 2 \delta_{p,W,C}
820: + \sqrt{\frac{\delta_{p,W,C}'}{M}} \Label{1-11-1}\\
821: \rE_X D(W_X^{M}\|W_p) 
822: \le &
823: \frac{\log (1+ M^t e^{\phi(t|W,p)})}{-t}\Label{1-11-3}
824: \end{align}
825: for $0 \,> t \ge - \frac{1}{2}$.
826: If the cardinality $\cY$ is finite,
827: the inequality 
828: \begin{align}
829: \rE_X D(W_X^{M}\|W_p) 
830: \le & \eta(\delta_{p,W,C})+  \delta_{p,W,C}\log |\cY| + 
831: \frac{\delta_{p,W,C}'}{M} \Label{1-11-2}
832: \end{align}
833: holds.
834: \end{lem}
835: 
836: Since there exists a resolvability code $\Psi$ 
837: with the size $M$ such that 
838: \begin{align*}
839: \epsilon (\Psi,W_p)\le \rE_X
840: \left\| W_X^{M} - W_p \right\|_1 ,
841: \end{align*}
842: the inequality (\ref{1-11-1}) guarantees the existence 
843: of a resolvability code $\Psi$ satisfying (\ref{3-3-10}).
844: On the other hand, 
845: the relation $\frac{W_{x}^{\alpha}(y)}{W_p(y)}= 
846: \frac{W_{x}(y)}{W_p(y)}I_{x}^c(y)\le C$ holds.
847: Thus,
848: \begin{align*}
849: \delta_{p,W,C}'=
850: \sum_y W_x(y) \frac{W_{x}^{\alpha}(y)}{W_p(y)} \le C.
851: \end{align*}
852: Similarly, 
853: since there exists a resolvability code $\Psi$ 
854: with the size $M$ such that 
855: \begin{align*}
856: D(\Psi',W_p) \le 
857: \rE_X D(W_X^{M}\|W_p) ,
858: \end{align*}
859: the inequalities (\ref{1-11-3}) and (\ref{1-11-2}) guarantees the existence 
860: of a resolvability code $\Psi$ satisfying (\ref{6-26-1}) and (\ref{7-1-3}).
861: \end{proof}
862: \quad{\it Proof of Lemma \ref{lem-1-11}}:
863: 
864: First, we show (\ref{1-11-1}). 
865: Since 
866: \begin{align*}
867:  \delta_{p,W,C}
868: =\rE_{p,x} W_{x} (\cU_x)
869: = \rE_p \| W_x^{\beta}\|
870: = \| W_p^{\beta} \|,
871: \end{align*}
872: we can evaluate
873: \begin{align*}
874: & \rE_X
875: \left\| W_X^{M} - W_p \right\|_1 \\
876: = &
877: \rE_X
878: \left\| W_X^{\alpha} - W_p^{\alpha}
879: +W_X^{\beta} - W_p^{\beta} \right\|_1 \\
880: \le &
881: \rE_X
882: \left\| W_X^{\alpha}- W_p^{\alpha} \right\|_1 
883:  + \sum_{i=1}^M \frac{1}{M}\rE_X \left\|W_{X_i}^{\beta}\right\|_1
884: +\left\|W_p^{\beta}\right\|_1 \\
885: = &
886: \rE_X
887: \left\| W_X^{\alpha}- W_p^{\alpha} \right\|_1 
888: + 2\rE_{p,x} W_{x} (\cU_x).
889: \end{align*}
890: Next, we focus on 
891: the Schwarz inequality regarding 
892: the random variable
893: $l_X(y) \defeq \frac{W_X^{\alpha}}{W_p}(y)$
894: and the sign function $\tilde{l}_X(y)\defeq
895: \frac{l_X(y)}{|l_X(y)|}$ 
896: (we can check that $\tilde{l}_X^2=1$.),
897: then we obtain
898: \begin{align*}
899: &(\|W_p l_X\|_1 )^2= 
900: (\rE_{W_p} |l_X(y)|)^2= (\rE_{W_p} l_X (y)\tilde{l}_X(y))^2 \\
901: \le &\rE_{W_p} l_X^2(y) \rE_{W_p} \tilde{l}_X^2(y)
902: = \rE_{W_p} l_X^2(y) .
903: \end{align*}
904: Thus, the Jensen inequality yields that
905: \begin{align*}
906: \left( 
907: \rE_X
908: \left\| W_{X}^{\alpha} - W_p^{\alpha} \right\|_1
909: \right)^2
910: \le \rE_X
911: \left\| W_{X}^{\alpha} - W_p^{\alpha} \right\|_1^2
912: \le \rE_X \rE_{W_p} l_X^2 (y).
913: \end{align*}
914: Since $\rE_x \frac{W_x^{\alpha}(y)}{W_p(y)} = 
915: \frac{W_p^{\alpha}(y)}{W_p(y)}$, we have
916: \begin{align*}
917: & \rE_X \rE_{W_p} l_X^2 
918: =\rE_{W_p} \rE_X l_X^2(y) \\
919: = &
920: \rE_{W_p} \rE_X
921: \frac{1}{M^2} \sum_{i=1}^M 
922: \left(\frac{W_{X_i}^{\alpha}(y)}{W_p(y)}
923: -\frac{W_p^{\alpha}(y)}{W_p(y)}\right)^2 \\
924: = &
925: \rE_{W_p} 
926: \frac{1}{M} \rE_x
927: \left (\left(\frac{W_{x}^{\alpha}(y)}{W_p(y)}\right)^2 
928: -\left(\frac{W_p^{\alpha}(y)}{W_p(y)}\right)^2 \right)\\
929: \le &
930: \rE_x
931: \frac{1}{M} \rE_{W_p} 
932: \left(\frac{W_{x}^{\alpha}(y)}{W_p(y)}\right)^2 
933: = \frac{\delta_{p,W,C}'}{M}.
934: \end{align*}
935: Therefore, we obtain
936: \begin{align*}
937: \rE_X\left\| \sum_{i=1}^M \frac{1}{M} W_{X_i} 
938: - W_p \right\|_1 
939: \le 2 \delta_{p,W,C}
940: + \sqrt{\frac{\delta_{p,W,C}'}{M}} .
941: \end{align*}
942: Hence, we obtain (\ref{1-11-1}).
943: 
944: Next, we show (\ref{1-11-2}).
945: Since $\frac{W_X^{M}(y)}{W_p(y)} 
946: \le \frac{1}{W_p^{\beta}(y)}$,
947: by using the inequality $\log x \le x-1$,
948: we can evaluate
949: \begin{align*}
950: &\rE_X D(W_X^{M}\|W_p) \\
951: =& \rE_X \sum_y \left( W_X^{\alpha}(y)\log 
952: \frac{W_X^{M}(y)}{W_p(y)}
953: + \sum_y W_X^{\beta}(y)\log 
954: \frac{W_X^{M}(y)}{W_p(y)}\right) \\
955: \le& \rE_X \sum_y \left( W_X^{\alpha}(y)\left( 
956: \frac{W_X^{M}(y)}{W_p(y)}-1 \right)
957: + W_X^{\beta}(y)\log 
958:  \frac{1}{W_p^{\beta}(y)} \right)\\
959: =&\sum_y 
960: \rE_X W_X^{\alpha}(y)
961: \left( \frac{W_X^{M}(y)}{W_p(y)}-1 \right)
962: + \sum_y W_p^{\beta}(y)\log 
963: \frac{1}{W_p^{\beta}(y)} .
964: \end{align*}
965: Regarding the first term,
966: we can calculate
967: \begin{align*}
968: & \sum_y \rE_X W_X^{\alpha}(y)
969: \left( \frac{W_X^{M}(y)}{W_p(y)}-1 \right)\\
970: =&
971: \sum_y \rE_X \frac{1}{M^2}\sum_{i,j}
972: W_{X_i}^{\alpha}(y)
973: \left( \frac{W_{X_j}(y)}{W_p(y)}-1 \right)\\
974: = & \sum_y \frac{1}{M}\rE_{p,x}
975: W_{x}^{\alpha}(y)
976: \left( \frac{W_{x}(y)}{W_p(y)}-1 \right) \\
977: \le &\sum_y \frac{1}{M}\rE_{p,x}
978: \frac{W_{x}^{\alpha}(y)}{W_p(y)}
979: W_{x}(y) 
980: = \frac{\delta_{p,W,C}'}{M},
981: \end{align*}
982: where we use the relation $\rE_X
983: W_{X_i}^{\alpha}(y)
984: \left( \frac{W_{X_j}(y)}{W_p(y)}-1 \right)
985: =0$ for $i \neq j$.
986: Concerning the second term, 
987: letting $K\defeq \sum_y W_p^{\beta}(y)$,
988: we have 
989: \begin{align*}
990: &\sum_y W_p^{\beta}(y)\log 
991: \frac{1}{W_p^{\beta}(y)} \\
992: =&
993: - K \log K - K \sum_y \frac{W_p^{\beta}(y)}{K}
994: \log \frac{W_p^{\beta}(y)}{K}\\
995: \le &\eta( \sum_y W_p^{\beta}(y))
996: +  \sum_y W_p^{\beta}(y) \log |\cY|,
997: \end{align*}
998: because $\log |\cY|$ is the maximal entropy 
999: of the distribution on the probability space $\cY$.
1000: Since
1001: $\sum_y W_p^{\beta}(y)=
1002: \delta_{p,W,C}$, 
1003: we obtain 
1004: (\ref{1-11-2}).
1005: 
1006: Finally, we prove (\ref{1-11-3})
1007: by a different method.
1008: The quantity $\rE_X D(W_X^{M}\|W_p)$ can be regarded as
1009: the mutual information of channel
1010: $X\mapsto W_X^{M}$ with the input probability
1011: $p^M(X)$ which equals the $M$-fold i.i.d. of $p$.
1012: We can check that 
1013: the function $t \mapsto \phi(t|W^{M},p^M)$
1014: satisfies the following property:
1015: \begin{align*}
1016: \phi(0|W^{M},p^M)&= 0 \\
1017: \left.\frac{\,d \phi(t|W^{M},p^M)}{\,d t}
1018: \right|_{t=0}& = -\rE_X D(W_X^{M}\|W_p), \\
1019: \frac{\,d^2 \phi(t|W^{M},p^M)}{\,d t^2}
1020: & \ge 0 .
1021: \end{align*}
1022: Hence, its convexity guarantees
1023: the inequality
1024: $-t\, \rE_X D(W_X^{M}\|W_p) \le\phi(t|W^{M},p^M)$,
1025: which implies the inequality
1026: \begin{align}
1027: \rE_X D(W_X^{M}\|W_p)
1028: \le \frac{\phi(t|W^{M},p^M)}{-t}\Label{1-12-1}
1029: \end{align}
1030: for $0 \,> t \ge -\frac{1}{2}$.
1031: 
1032: Let $1+s= \frac{1}{1+t}$, then 
1033: $1\ge s \,> 0$ and $t= \frac{-s}{1+s}$.
1034: Since $x \mapsto x^s$ is concave,
1035: \begin{align}
1036: \rE_X (\sum_{j\neq i} W_{X_j}(y))^s 
1037: \le \bigl[\rE_X \sum_{j\neq i} W_{X_j}(y)\bigl]^s 
1038: = (M-1)^s W_p^s(y). \Label{7-4-1}
1039: \end{align}
1040: Using (\ref{7-4-1}) and the relation $(x+y)^s \le x^s + y^s$ for 
1041: two positive real numbers $x,y$, 
1042: we obtain
1043: \begin{align*}
1044: &e^{\phi(t|W^{M},p^M)}
1045: = \sum_y \left(\rE_X (W_X^{M})^{1+s}(y)\right)^{\frac{1}{1+s}}\\
1046: =& \frac{1}{M}\sum_y \Biggl(\rE_X 
1047: \sum_{i=1}^M W_{X_i}(y)
1048: \Bigl(W_{X_i}(y)+ \sum_{j\neq i} W_{X_j}(y)\Bigr)^s
1049: \Biggr)^{\frac{1}{1+s}}\\
1050: \le &\frac{1}{M}\sum_y \Biggl(\rE_X 
1051: \sum_{i=1}^M W_{X_i}(y)
1052: \Bigl(W_{X_i}^s(y)+ \Bigl(\sum_{j\neq i} W_{X_j}(y)\Bigr)^s\Bigr)
1053: \Biggr)^{\frac{1}{1+s}}\\
1054: = &\frac{1}{M}\sum_y 
1055: \Biggl(
1056: \sum_{i=1}^M \rE_X W_{X_i}^{1+s}(y)\\
1057: & \quad 
1058: +\sum_{i=1}^M \rE_X W_{X_i}(y) 
1059: \Bigl(\sum_{j\neq i} W_{X_j}(y)\Bigr)^s
1060: \Biggr)^{\frac{1}{1+s}}\\
1061: \le& \sum_y 
1062: \frac{1}{M}\left(
1063: \sum_{i=1}^M \rE_X W_{X_i}^{1+s}(y)
1064: +\sum_{i=1}^M (M-1)^s W_p^{1+s}(y)
1065: \right)^{\frac{1}{1+s}}\\
1066: =  &\frac{1}{M}\sum_y
1067: \left(M \rE_x W_{x}^{1+s}(y)
1068: +M (M-1)^s W_p^{1+s}(y)
1069: \right)^{\frac{1}{1+s}}\\
1070: \le &
1071: \frac{1}{M}\sum_y 
1072: \left(M \rE_x W_{x}^{1+s}(y)\right)^{\frac{1}{1+s}}
1073: +\left(M (M-1)^s W_p^{1+s}(y)\right)^{\frac{1}{1+s}}\\
1074: =&
1075: \sum_y 
1076: \frac{\left(\rE_x W_{x}^{1+s}(y)\right)^{\frac{1}{1+s}}}{M^{\frac{s}{1+s}}}
1077: +\Bigl(\frac{M-1}{M}\Bigr)^{\frac{s}{1+s}} W_p(y)\\
1078: \le & 1+
1079: \frac{1}{M^{\frac{s}{1+s}}} 
1080: \sum_y \left(\rE_x W_{x}^{1+s}(y)\right)^{\frac{1}{1+s}}
1081: = 1+ M^t e^{\phi(t|W,p)}.
1082: \end{align*}
1083: Since $-t$ is positive, 
1084: the desired inequality (\ref{1-11-3})
1085: follows from (\ref{1-12-1}) and the above inequality.
1086: \endproof
1087: 
1088: Next, we proceed to the relation with identification codes.
1089: In order to discuss this relation, 
1090: we focus on channel resolvability of the worst input case,
1091: and define the following values:
1092: \begin{align*}
1093: \epsilon(M,W)\defeq&
1094: \max_{p\in \cP(\cX)}
1095: \min_{\Psi:|\Psi|\le M}\epsilon(\Psi,W_p),\\
1096: D(M,W)\defeq&
1097: \max_{p\in \cP(\cX)}
1098: \min_{\Psi:|\Psi|\le M}D(\Psi,W_p),
1099: \end{align*}
1100: which satisfies 
1101: \begin{align}
1102: \epsilon(M,W)\le
1103: 2 \max_p \rE_p 
1104: W_x \left\{ \frac{W_x}{W_p}(y) \,> C\right\} + 
1105: \sqrt{\frac{C}{M}} ,
1106: \Label{3-3-3}
1107: \end{align}
1108: for any real number $C\,>0$.
1109: \begin{lem}\Label{H-V}
1110: (Han \& Verd\'{u}\cite{Han-V})
1111: If 
1112: the cardinality $|\cX|$ is finite, and if
1113: an identification code $\Phi$ and 
1114: an integer $M$
1115: satisfy 
1116: \begin{align*}
1117: 1- \mu (\Phi)-\lambda(\Phi)
1118: \,> \epsilon (M,W),
1119: \end{align*}
1120: then
1121: \begin{align}
1122: |\cX|^{M} \ge |\Phi|.\Label{3-1}
1123: \end{align}
1124: \end{lem}
1125: \begin{proof}
1126: Let the identification code $\Phi$ be a triplet
1127: $(N, \{Q_1 ,\ldots, Q_N\}, \{\cD_1,\ldots,\cD_N\})$,
1128: then 
1129: there exist $N$ $M$-types $Q_1', \ldots Q_N'$ such that
1130: \begin{align*} 
1131: d(W_{Q_i}, W_{Q_i'}) \le \epsilon (M,W).
1132: \end{align*}
1133: Since 
1134: the inequalities
1135: \begin{align*}
1136: & 2 \epsilon (M,W) + d( W_{Q_i'},  W_{Q_j'} )\\
1137: \ge & d( W_{Q_i},  W_{Q_i'} )+ d(W_{Q_j}, W_{Q_j'} )+ d(W_{Q_i'}, 
1138: W_{Q_j'} ) \\
1139: \ge &
1140: d( W_{Q_i}, W_{Q_j} ) \ge 
1141: 2(W_{Q_i}(\cD_i)-  W_{Q_j}(\cD_i)) \\
1142: \ge & 2 (1- \mu (\Phi)-\lambda(\Phi))
1143: \end{align*}
1144: hold for any $i\neq j$,
1145: we can show
1146: \begin{align*}
1147: d(W_{Q_i'}, W_{Q_j'} )\,> 0,
1148: \end{align*}
1149: which implies that $Q_i' $ is different from $Q_j'$.
1150: However, the total number of 
1151: $M$-types
1152: %input distributions with the form $\frac{1}{M}\sum_{i=1}^M 1_{x_i}$
1153: is less than $|\cX|^M$.
1154: Therefore, we obtain (\ref{3-1}).
1155: \end{proof}
1156: 
1157: 
1158: \section{Wire-tap channel in non-asymptotic setting}
1159: Next, we discuss the message transmission with the 
1160: wire-tapper who has less information than
1161: the main receiver.
1162: This problem is formulated as follows.
1163: Let $\cY$ be the probability space of the main receiver,
1164: and $\cZ$ be the space of the wire-tapper,
1165: then the main channel from the transmitter to the main receiver
1166: is described by $W^B:x \mapsto W^B_x$,
1167: and the wire-tapper channel from the transmitter to the 
1168: the wire-tapper is described by $W^E:x \mapsto W^E_x$.
1169: In this setting,
1170: the transmitter choose $M$ 
1171: distributions $Q_1, \ldots, Q_M$ on $\cX$,
1172: and he generates $x\in \cX$ subject to $Q_i$
1173: when he wants to send the message $i \in \{1, \ldots, M\}$.
1174: The normal receiver prepares $M$ disjoint subsets
1175: $\cD_1,\ldots, \cD_M$ of $\cY$ and 
1176: judges that a message is $i$ if $y$ belongs to $\cD_i$.
1177: Therefore, the triplet $(M,\{Q_1, \ldots, Q_M\},
1178: \{\cD_1,\ldots, \cD_M\})$ is called a
1179: code, and is described by $\Phi$.
1180: Its performance is given by the following quantities.
1181: One is the size $M$, which is denoted by $|\Phi|$.
1182: The second one is the average 
1183: error probability $\epsilon_B(\Phi)$:
1184: \begin{align*}
1185: \epsilon_B(\Phi)\defeq
1186: \frac{1}{M} \sum_{i=1}^M  W_{Q_i}^B (\cD_i^c),
1187: \end{align*}
1188: and the third one is the wire-tapper's information
1189: regarding the transmitted message $I_E(\Phi)$:
1190: \begin{align*} 
1191: I_E(\Phi) \defeq \sum_i \frac{1}{M} D(  W_{Q_i}^E\| W^E_{\Phi}),\quad
1192: W^E_{\Phi}  \defeq \sum_i \frac{1}{M} W_{Q_i}^E.
1193: \end{align*}
1194: A different measure of the wire-tapper's information is given 
1195: by the average variational 
1196: distance $d_E(\Phi)$:
1197: \begin{align*}
1198: d_E(\Phi)\defeq \frac{1}{M(M-1)} \sum_{i\neq j} d( W_{Q_i}^E,W_{Q_j}^E).
1199: \end{align*}
1200: \begin{thm}\Label{3-6}
1201: There exists a code $\Phi$ for any
1202: integers $L,M$,
1203: any real numbers $C, C' \,> 0$,
1204: and any probability distribution $p$ on $\cX$
1205: such that
1206: \begin{align}
1207: |\Phi| &=M \nonumber \\
1208: \epsilon_B(\Phi) & \le 3
1209: \min_{0\le s\le 1}
1210: (ML)^{s}\sum_y \left( \rE_p (W_x^B(y))^{1/(1+s)}\right)^{1+s} 
1211: \Label{3-8-1}\\
1212: \epsilon_B(\Phi) & \le 3
1213: \left(\rE_p W_x  \left\{ \frac{W_x^B}{W_p^B}(y) \le C'\right\}+
1214: \frac{ML}{C'}\right)\Label{3-8-2}\\
1215: I_E(\Phi) & \le  3
1216: \left(\eta(\delta_{p,W^E,C})+ \delta_{p,W^E,C} \log |\cZ| + 
1217: \frac{\delta_{p,W^E,C}'}{L}
1218: \right)\Label{3-6-2} \\
1219: I_E(\Phi) & \le  3
1220: \min_{0 > t \ge -1/2}
1221: \frac{\log (1+ L^t e^{\phi(t|W^E,p)})}{-t}
1222: \Label{7-1-2} \\
1223: d_E(\Phi) & \le  6
1224: \left(2 \delta_{p,W^E,C} + 
1225: \sqrt{\frac{\delta_{p,W^E,C}'}{L}}\right).\Label{3-8-12} 
1226: \end{align}
1227: \end{thm}
1228: 
1229: \begin{proof}
1230: We prove Theorem \ref{3-6}
1231: by a random coding method.
1232: Let $X=(X_{l,m})$ be $LM$ independent and identical random
1233: variables subject to the distribution $p$ on $\cX$
1234: for integers $l=1, \ldots, L$ and $m=1,\ldots,M$, and
1235: $\cD_{l,m}'(X)$ be the maximum likelihood decoder
1236: of the code $X_{l,m}$,
1237: then we can evaluate as follows by Gallager upper bound\cite{Gal}.
1238: \begin{align*}
1239: &\rE_X \frac{1}{ML}\sum_{l,m} W^B_{X_{m,l}}(\cD_{l,m}'(X)^c)\\
1240: \le & \min_{0\le s\le 1}
1241: (ML)^{s}\sum_y \left(
1242: \rE_p (W_x^B(y))^{1/(1+s)}\right)^{1+s}.
1243: \end{align*}
1244: Since the maximum likelihood decoder is better than 
1245: the code $\cD_{l,m}''(X)= 
1246: \left\{ \frac{W_x^B}{W_p^B}(y) \,> C'\right\}
1247: \setminus \cup_{(l',m')\neq (l,m)}
1248: \left\{ \frac{W_x^B}{W_p^B}(y) \,> C'\right\}$,
1249: we have another evaluation as
1250: \begin{align*}
1251: &\rE_X \frac{1}{ML}\sum_{l,m} W^B_{X_{m,l}}(\cD_{l,m}'(X)^c)\\
1252: \le 
1253: &\rE_X \frac{1}{ML}\sum_{l,m} W^B_{X_{m,l}}(\cD_{l,m}''(X)^c)\\
1254: \le &
1255: \rE_X 
1256: \frac{1}{ML}\sum_{l,m} W^B_{X_{m,l}}
1257: \left\{ \frac{W_{X_{m,l}}^B}{W_p^B}(y) \le C'\right\} \\
1258: &\quad +
1259: \rE_X 
1260: \frac{1}{ML}\sum_{l,m} W^B_{X_{m,l}}
1261: \sum_{(l',m')\neq (l,m)} 
1262: \left\{ \frac{W_{X_{m',l'}}^B}{W_p^B}(y) \le C'\right\} \\
1263: \le &
1264: \rE_{p,x} 
1265: W^B_{x}
1266: \left\{ \frac{W_x^B}{W_p^B}(y) \le C'\right\} \\
1267: & \quad +
1268: W^B_p
1269: (ML-1) \rE_{p,x} 
1270: \left\{ \frac{W_x^B}{W_p^B}(y) \le C'\right\} \\
1271: \le &
1272: \rE_{p,x} 
1273: W^B_{x}
1274: \left\{ \frac{W_x^B}{W_p^B}(y) \le C'\right\}
1275: +
1276: \frac{ML}{C'}.
1277: \end{align*}
1278: Let $Q_m(X)$ be the uniform distribution on 
1279: $\{X_{1,m},\ldots, X_{L,m}\}$,
1280: $\cD_m(X)$ be $\cup_l \cD_{l,m}'(X)$,
1281: and $\Phi(X)$ be the code
1282: $(M,\{Q_m(X)\},\{\cD_m(X)\})$,
1283: then $\rE_X \epsilon_B(\Phi(X))$ is less than 
1284: the right hand sides of (\ref{3-8-1}) and (\ref{3-8-2})
1285: because the average error probability of $\Phi(X)$
1286: is less than the one of the code 
1287: $(ML,\{X_{m,l}\},\{\cD_{l,m}'(X)\})$.
1288: 
1289: Since
1290: \begin{align*}
1291: & \sum_{m=1}^M  
1292: \frac{1}{M} D( W_{Q_m(X)}^E\|W^E_{\Phi(X)})
1293: + D(W^E_{\Phi(X)}\| W^E_p) \\
1294: = & \sum_{m=1}^M  
1295: \frac{1}{M} D( W_{Q_m(X)}^E\|W^E_p),
1296: \end{align*}
1297: we obtain
1298: \begin{align*}
1299: & \rE_X I_E(\Phi(X))
1300: = \rE_X \sum_{m=1}^M  
1301: \frac{1}{M} D( W_{Q_m(X)}^E\|W^E_{\Phi(X)}) \\
1302: \le &
1303: \rE_X \sum_{m=1}^M  
1304: \frac{1}{M} D( W_{Q_m(X)}^E\|W^E_p) \\
1305: \le &
1306: \eta(\delta_{p,W^E,C})+ \delta_{p,W^E,C} \log |\cZ| + 
1307: \frac{\delta_{p,W,C}'}{L},
1308: \end{align*}
1309: where the last inequality follows from
1310: Lemma \ref{lem-1-11}. Similarly,
1311: we can show
1312: \begin{align*}
1313: \rE_X I_E(\Phi(X)) \le\frac{\log (1+ L^t e^{\phi(t|W^E,p)})}{-t}.
1314: \end{align*}
1315: Regarding $d_E(\Phi(X))$,
1316: we can calculate 
1317: \begin{align*}
1318: &\rE_X \frac{1}{M(M-1)} \sum_{i\neq j} d( W^E_{Q_i(X)},W^E_{Q_j (X)}) \\
1319: \le &
1320: \rE_X \frac{1}{M(M-1)} \sum_{i\neq j} d( W^E_{Q_i(X)},W^E_p)
1321: + d( W^E_{Q_j(X)},W^E_p) \\
1322: =& 2
1323: \rE_X d( W^E_{Q_1(X)},W^E_p) \\
1324: \le & 2 \left(2 \delta_{p,W,C} + \sqrt{\frac{\delta_{p,W,C}'}{L}}\right).
1325: \end{align*}
1326: Using Markov inequality, we obtain
1327: \begin{align*}
1328: \rP_X \{ \epsilon_B(\Phi(X)) \le 3 \rE \epsilon_B(\Phi(X)) \}^c
1329: &\,< \frac{1}{3} \\
1330: \rP_X \{ I_E(\Phi(X)) \le 3 \rE I_E(\Phi(X))\}^c
1331: &\,< \frac{1}{3} \\
1332: \rP_X \{ d_E(\Phi(X)) \le 3 \rE d_E(\Phi(X))\}^c
1333: &\,< \frac{1}{3}.
1334: \end{align*}
1335: Therefore, there exists a code $\Phi$ satisfying desired conditions.
1336: \end{proof} 
1337: %\epsilon_B(\Phi)\le 2 \rE_p
1338: %W_x^B \left\{  \frac{W_x^B}{W_p}(y) \le C_1 \right\} 
1339: %+ (ML) W_p \left\{  \frac{W_x^B}{W_p}(y) \,> C_1 \right\},\\
1340: 
1341: \section{General asymptotic setting}
1342: \subsection{Identification code and channel resolvability}
1343: Next, we focus on an arbitrary sequence of channels
1344: $\bW=\{W^n\}_{n=1}^{\infty}$, in which $W^n$ is an arbitrary channel from 
1345: $\cX^n$ to $\cY^n$.
1346: In this setting,
1347: two-types of $(\mu,\lambda)$-identification capacities are defined by
1348: \begin{align}
1349: &D(\mu,\lambda|\bW) \nonumber \\
1350: \defeq &
1351: \sup_{\{\Phi_n\}}
1352: \left\{\left.
1353: \varliminf \frac{1}{n}\log\log |\Phi_n|
1354: \right|
1355: \varlimsup \mu (\Phi_n)\,< \mu,
1356: \varlimsup \lambda(\Phi_n)\le \lambda
1357: \right\}\nonumber\\
1358: & D^{\dagger}(\mu,\lambda|\bW) \nonumber\\
1359: \defeq & 
1360: \sup_{\{\Phi_n\}}
1361: \left\{\left.
1362: \varliminf \frac{1}{n}\log\log |\Phi_n|
1363: \right|
1364: \varliminf \mu (\Phi_n)\,< \mu,
1365: \varlimsup \lambda(\Phi_n)\le \lambda
1366: \right\}.\nonumber
1367: \end{align}
1368: However, in the case of $\mu =0$,
1369: we replace $\varlimsup \mu (\Phi_n)\,< \mu,
1370: (\varliminf \mu (\Phi_n)\,< \mu)$ by $
1371: \varlimsup \mu (\Phi_n)=0,
1372: (\varliminf \mu (\Phi_n)=0)$ at the above two definitions.
1373: On the other hand,
1374: two-types $\epsilon$-resolvability capacities are defined by
1375: \begin{align*}
1376: S(\epsilon|\bW) & \defeq
1377: \sup
1378: \left\{\left.R
1379: \right|
1380: \varlimsup \epsilon(e^{nR},W^n) \le \epsilon
1381: \right\} \\
1382: S^{\dagger}(\epsilon|\bW) & \defeq
1383: \sup
1384: \left\{\left.R
1385: \right|
1386: \varliminf \epsilon(e^{nR},W^n) \le \epsilon
1387: \right\},
1388: \end{align*}
1389: where the case of $\epsilon=2$,
1390: we replace $\le \epsilon $ by $\,< 2$ 
1391: at the above two definitions.
1392: 
1393: In the information spectrum method,
1394: the following quantities 
1395: are defined for arbitrary sequence $\bp = \{p^n\}_{n=1}^{\infty}$
1396: of input probability distributions:
1397: \begin{align*}
1398: &\overline{I}(\epsilon| \bp, \bW) \\
1399: \defeq &
1400: \inf\left\{
1401: a \left|
1402: \varlimsup \rE_{p^n}
1403: W_x^n\left\{ 
1404: \frac{1}{n}\log \frac{W_x^n}{W_{p^n}^n}(y)\,> a
1405: \right\}
1406: \le \epsilon
1407: \right.
1408: \right\}\\
1409: & \underline{I}(\epsilon| \bp, \bW)\\
1410: \defeq &
1411: \inf\left\{
1412: a \left|
1413: \varliminf \rE_{p^n}
1414: W_x^n\left\{ 
1415: \frac{1}{n}\log \frac{W_x^n}{W_{p^n}^n}(y)\,> a
1416: \right\}
1417: \le \epsilon
1418: \right.
1419: \right\},
1420: \end{align*}
1421: where the case of $\epsilon =1$,
1422: we replace $\le $ by $\,<$ at the above definitions.
1423: These quantities have another expression as
1424: \begin{align*}
1425: &\overline{I}(\epsilon| \bp, \bW) \\
1426: =& \sup \left\{
1427: a \left|
1428: \varliminf 
1429: \rE_{p^n}
1430: W_x^n\left\{ 
1431: \frac{1}{n}\log \frac{W_x^n}{W_{p^n}^n}(y)\le a
1432: \right\}
1433: \,<1- \epsilon
1434: \right.
1435: \right\}, \\
1436: &\underline{I}(\epsilon| \bp, \bW)\\
1437: =& \sup \left\{
1438: a \left|
1439: \varlimsup 
1440: \rE_{p^n}
1441: W_x^n\left\{ 
1442: \frac{1}{n}\log \frac{W_x^n}{W_{p^n}^n}(y)\le a
1443: \right\}
1444: \,<1- \epsilon
1445: \right.
1446: \right\}.
1447: \end{align*}
1448: %of $S(\epsilon|\bW) ,S^{\dagger}(\epsilon|\bW),
1449: %\underline{I}(\epsilon| \bp, \bW),$ and 
1450: %$\overline{I}(\epsilon| \bp, \bW)$.
1451: \begin{thm}\Label{t-3}
1452: Assume that $|\cX^n|= d^n$, then
1453: the above quantities satisfy the following relations.
1454: \begin{align}
1455: & \sup_{\bp} \underline{I}(\epsilon| \bp, \bW) 
1456: \le D (1-\epsilon,0|\bW)
1457: \le S^{\dagger}(\epsilon|\bW) \nonumber \\
1458: \le &\sup_{\bp} \underline{I}(\frac{\epsilon}{2}| \bp, \bW) 
1459: \Label{3-3-1}\\
1460: & \sup_{\bp} \overline{I}(\epsilon| \bp, \bW) 
1461: \le D^{\dagger} (1-\epsilon,0|\bW)
1462: \le S(\epsilon|\bW)\nonumber \\
1463: \le & \sup_{\bp} \overline{I}(\frac{\epsilon}{2}| \bp, \bW) ,
1464: \Label{3-3-2}
1465: \end{align}
1466: for any real number $0 \le \epsilon \,<1$.
1467: However, the first inequalities in (\ref{3-3-1}) and (\ref{3-3-2})
1468: hold for $0 \le \epsilon \le 1$, and 
1469: the third ones hold for $0\le \epsilon \le 2$.
1470: In particular,
1471: we obtain
1472: \begin{align}
1473: \sup_{\bp} \underline{I}(0| \bp, \bW) 
1474: &= D (1,0|\bW)
1475: = S^{\dagger}(0|\bW) \Label{1-13-1}\\
1476: \sup_{\bp} \overline{I}(0| \bp, \bW) 
1477: &= D^{\dagger} (1,0|\bW)
1478: = S(0|\bW),\Label{1-13-2}
1479: \end{align}
1480: which is desired in Han \& Verd\'{u}\cite{Han-V} and 
1481: Han\cite{Han-book}\footnote{Theorem 6 in Han and Verd\'{u}\cite{Han-V}
1482: claims that $S(0|\bW)=\sup_{\bp} \overline{I}(0| \bp, \bW) $
1483: always holds for any channel $\bW$ if the input alphabet is finite.
1484: However, the proof in \cite{Han-V} contains mistake in part, as
1485: is mentioned in section 6.3 in Han\cite{Han-book}.
1486: Therefore, it has been an open problem
1487: as to whether this inequality holds or not.}.
1488: \end{thm}
1489: This theorem indicates the existence of a code satisfying the following:
1490: The second error probability $\lambda$ is asymptotically independent for the 
1491: behavior of the distribution of the random variable of 
1492: likelihood and always goes to $0$, and only the second error 
1493: probability $\mu$ asymptotically depends on it.
1494: \begin{rem}
1495: Steinberg\cite{Steinberg} claims the inequalities 
1496: \begin{align*}
1497: \sup_{\bp} \underline{I}(\epsilon| \bp, \bW) 
1498: &\ge D (\lambda_1,\lambda_2|\bW),\\
1499: \sup_{\bp} \overline{I}(\epsilon| \bp, \bW) 
1500: &\ge D^\dagger (\lambda_1,\lambda_2|\bW)
1501: \end{align*}
1502: for $\lambda_1+\lambda_2 \,< 1- \epsilon$.
1503: If they are proved, 
1504: by combining the above inequalities and Theorem \ref{t-3},
1505: we can prove the equalities of the above inequalities
1506: in the continuous case.
1507: However, it seems that 
1508: his paper has a gap in counting the maximum number of
1509: different pairs of 
1510: a partial response and an $M'$-type measure 
1511: at the proof of Lemma 2,
1512: which is essential for these inequalities.
1513: That is,
1514: he estimated the total number of 
1515: positive functions on $\cX \times \cY$ with the form
1516: \begin{align*}
1517: f(x,y) =\frac{1}{M'}
1518: \sum_{i=1}^{M'}1_{x_i}(x) \sum_{(x',y')\in F}1_{(x',y')} (x,y),
1519: \end{align*}
1520: where $F$ is an arbitrary subset of $\cX \times \cY$.
1521: The total measure of $f$, {\it i.e.},
1522: $\sum_{(x,y)\in \cX \times \cY}f(x,y)$
1523: is not necessarily less than $1$,
1524: while he indicated that it is less than $1$.
1525: Hence, this total number cannot be bounded by 
1526: $|\cX|^{M'}$.
1527: \end{rem}
1528: \begin{proof}
1529: In order to prove the first inequalities,
1530: we choose an arbitrary real number $R \,< \sup_{\bp} 
1531: \underline{I}(\epsilon| \bp, \bW)$ and a sequence of 
1532: input probability distributions $\bp$ such that
1533: $R \,< R'\defeq \underline{I}(1- \mu | \bp, \bW)$.
1534: Substitute $M=e^{nR},C=e^{nR'},\alpha=\beta=1+\frac{2}{n},
1535: \alpha'=\beta'=\frac{1}{n+2},
1536: \tau= \frac{1}{n+2},
1537: \kappa= \frac{\log 2 +1}{\log n}$ in Theorem \ref{t-1},
1538: then the conditions (\ref{3-3-5}) and (\ref{3-3-4}) are satisfied and
1539: $\gamma= \frac{1}{n+2}$.
1540: Thus, there exists an identification code $\Phi_n$ such that
1541: \begin{align*}
1542: |\Phi_n|& = \left\lfloor \frac{e^{\frac{e^{nR}}{n+2}}}{e^{1+nR} }\right\rfloor \\
1543: \mu(\Phi_n)
1544: & \le (1+\frac{2}{n})^2 \rE_{p^n} 
1545: W_x^n\left\{ 
1546: \frac{1}{n}\log \frac{W_x^n}{W_{p^n}^n}(y)\le R'
1547: \right\} \\
1548: \lambda(\Phi_n) 
1549: & \le \frac{\log 2 +1}{\log n}+(n+2)^2 \frac{1}{e^{nR'}} 
1550: \lceil (n+2)e^{nR} \rceil \\
1551: & \cong \frac{\log 2 +1}{\log n}+(n+2)^3 e^{-n(R'-R)} .
1552: \end{align*}
1553: Therefore,
1554: we obtain 
1555: \begin{align}
1556: &\lim \frac{1}{n}\log \log |\Phi_n| = R, \nonumber \\
1557: &\varlimsup \mu(\Phi_n) \le
1558: \varlimsup \rE_{p^n} 
1559: W_x^n\left\{ 
1560: \frac{1}{n}\log \frac{W_x^n}{W_{p^n}^n}(y)\le R'
1561: \right\}\,< \mu \Label{3-2-1}\\
1562: & \lim \lambda(\Phi_n) =0, \nonumber 
1563: \end{align}
1564: which implies that
1565: $D (\mu,0|\bW) \ge R'$.
1566: Thus, we obtain the first inequality in (\ref{3-3-1})
1567: for $0 \le \epsilon \,< 1$.
1568: In the case of $\epsilon = 1$,
1569: we need to replace $\,< \mu$ by $=0$ at (\ref{3-2-1}).
1570: By replacing $\varlimsup$ by $\varliminf$ at (\ref{3-2-1}),
1571: we can similarly prove $D^{\dagger} (\mu,0|\bW) \ge 
1572: \sup_{\bp} \overline{I}(1-\mu| \bp, \bW) $.
1573: 
1574: Next,
1575: we proceed to the second inequalities.
1576: Let $R$ be an arbitrary real number such that
1577: $R\,> D(1-\epsilon,0|\bW)$.
1578: Then, there exists a sequence $\{\Phi_n\}$
1579: of identification codes
1580: such that
1581: \begin{align*}
1582: R= \varlimsup \frac{1}{n} \log \log |\Phi_n|,
1583: \varlimsup \mu (\Phi_n) < 1-\epsilon,
1584: \lim \lambda (\Phi_n)=0.
1585: \end{align*}
1586: Therefore, we can choose an integer $N$ large enough, 
1587: such that
1588: $1 - \mu(\Phi_n) -\lambda (\Phi_n) \ge
1589: 1- \varlimsup \mu (\Phi_n)\,> \epsilon$.
1590: Moreover, we choose a strictly increasing sequence $\{a_n\}$
1591: of integers such that
1592: $a_1\ge N$ and
1593: $1- \varlimsup \mu (\Phi_{a_n})\,> 
1594: \epsilon (e^{a_n R'},W^n)$,
1595: where $R'= S^{\dagger}(\epsilon, \bW)$.
1596: 
1597: Thus, Lemma \ref{H-V} yields that
1598: $(d^{a_n})^{e^{a_n R'}} \ge |\Phi_{a_n}|$,
1599: which implies that
1600: $R'\ge R$.
1601: We obtain the second inequalities in (\ref{3-3-1}).
1602: We can prove the second inequalities in (\ref{3-3-2})
1603: by choosing a strictly increasing sequence $\{a_n\}$
1604: of integers such that
1605: $1 - \mu(\Phi_{a_n}) -\lambda (\Phi_{a_n}) \ge
1606: 1- \varliminf \mu (\Phi_n)\,> \epsilon$.
1607: 
1608: Finally, we prove the third inequalities
1609: by using another expression of
1610: $\sup_{\bp}\underline{I}(\epsilon| \bp, \bW)
1611: $:
1612: \begin{align*}
1613: & \sup_{\bp}\underline{I}(\epsilon| \bp, \bW) \\
1614: = &\inf \left\{
1615: a \left|
1616: \varlimsup 
1617: \max_{p^n} \rE_{p^n}
1618: W_x^n\left\{ 
1619: \frac{1}{n}\log \frac{W_x^n}{W_{p^n}^n}(y)\,> a
1620: \right\}
1621: \le\epsilon
1622: \right.
1623: \right\}.
1624: \end{align*}
1625: Let $R$ and $R'$ be arbitrary real numbers such that
1626: $R \,>\sup_{\bp}\underline{I}(\epsilon/2| \bp, \bW)$
1627: and 
1628: $R \,>R'\,> \sup_{\bp}\underline{I}(\epsilon| \bp, \bW)$,
1629: then the inequality (\ref{3-3-3}) yields that
1630: \begin{align*}
1631: &\epsilon(e^{n R} ,W^n)\\
1632: \le &
1633: 2 \min_{p^n} \rE_{p ^n}
1634: W_x^n \left\{ \frac{1}{n} \log \frac{W_x^n}{W_{p^n}^n}(y) \,>
1635: R'\right\} + e^{-n (R-R')/2}.
1636: \end{align*}
1637: Taking the limit $\varliminf$,
1638: we obtain
1639: \begin{align}
1640: \varliminf \epsilon(e^{n R} ,W^n)
1641: \le \epsilon, \Label{3-3-6}
1642: \end{align}
1643: which implies 
1644: $S^{\dagger}(2 \epsilon, \bW) \le R$.
1645: Thus, we obtain the third inequality in (\ref{3-3-1})
1646: for $0 \le \epsilon \,< 1$.
1647: In the case of $\epsilon =2$,
1648: we need to replace $\le \epsilon$ by $\,< 1$
1649: at (\ref{3-3-6}).
1650: By replacing $\varliminf$ by $\varlimsup$ in the above,
1651: we can prove the third one in (\ref{3-3-2}).
1652: \end{proof}
1653: 
1654: \subsection{Wire-tap channel}
1655: Next, we focus on a general sequence 
1656: $(\bW^B=\{W^{B,n}\}, \bW^E=\{W^{E,n}\})$  
1657: of 
1658: wire-tap channels, and define the 
1659: following two kinds of capacities
1660: by
1661: \begin{align*}
1662: &C_d(\bW^B,\bW^E ) \\
1663: \defeq &
1664: \sup_{\{\Phi_n\}}
1665: \left\{\left.
1666: \varliminf \frac{1}{n}\log |\Phi_n|
1667: \right|
1668: \lim \epsilon_B (\Phi_n)=
1669: \lim d_E(\Phi_n)= 0
1670: \right\} \\
1671: &C_I (\bW^B,\bW^E ) \\
1672: \defeq &
1673: \sup_{\{\Phi_n\}}
1674: \left\{\left.
1675: \varliminf \frac{1}{n}\log |\Phi_n|
1676: \right|
1677: \lim \epsilon_B (\Phi_n)=
1678: \lim \frac{I_E(\Phi_n)}{n}= 0
1679: \right\} .
1680: \end{align*}
1681: %In this setting, 
1682: %the following information spectrum quantity
1683: %plays a key role.
1684: %\begin{align*}
1685: %&\underline{I}(\bp,\bW^B,\bW^E)\defeq \\
1686: %&\inf\left\{ a \left|\varliminf \rE_{p^n}
1687: %W_x^n\left\{ \frac{1}{n}
1688: %\log \frac{W_x^{B,n}(y)}{W_{p^n}^{B,n}(y)}\cdot
1689: %\frac{W_{p^n}^{E,n}(y)}{W_x^{E,n}(y)}
1690: %\,> a\right\}=0\right.\right\}.
1691: %\end{align*}
1692: 
1693: \begin{lem}\Label{t-1-11}
1694: The inequality
1695: \begin{align}
1696: C_d(\bW^B,\bW^E) 
1697: \ge \underline{I}(1|\bp,\bW^B)
1698: - \overline{I}(0|\bp,\bW^E)
1699: \Label{3-8-13}
1700: \end{align}
1701: holds for any sequence of input distributions $\bp=\{p^n\}$.
1702: Furthermore, if $|\cZ^n|= d^n$,
1703: \begin{align}
1704: C_I(\bW^B,\bW^E) 
1705: \ge \underline{I}(1|\bp,\bW^B)
1706: - \overline{I}(0|\bp,\bW^E) \Label{3-8-13-1}.
1707: \end{align}
1708: \end{lem}
1709: This theorem is an information spectrum version of Wyner's result
1710: \cite{Wyner},
1711: that will be mentioned in the next section.
1712: 
1713: \begin{proof}
1714: Let $R' \,> \overline{I}(0|\bp,\bW^E)$,
1715: $R\,< \underline{I}(1|\bp,\bW^B)- R'$ and 
1716: choose a real number $a$ such that $0\,< a \,< 
1717: \min \{\underline{I}(1|\bp,\bW^B) -(R+R'), 
1718: R'- \overline{I}(0|\bp,\bW^E)\}$.
1719: Substituting $M= e^{n R}, L=e^{n R'},
1720: C= e^{n(R'-a)}, C'=e^{n(R+R'+a)}$,
1721: we can show that the right hand side of (\ref{3-8-2}) goes to $0$,
1722: and that 
1723: \begin{align*}
1724: \delta_{p^n,W^{E,n},e^{n(R'-a)}}  \to 0 , \quad
1725: \frac{\delta_{p^n,W^{E,n},e^{n(R'-a)}}'}{e^{n R'}}  \to 0.
1726: \end{align*}
1727: Hence, 
1728: the right hand side of (\ref{3-8-12}) go to $0$.
1729: Concerning (\ref{3-6-2}),
1730: the relations
1731: \begin{align*}
1732: & \frac{1}{n}
1733: \Bigl( 
1734: \eta(\delta_{p^n,W^{E,n},e^{n(R'-a)}})+ \delta_{p,W^{E,n},e^{n(R'-a)}} 
1735: \log |\cZ^n| \\
1736: & \quad + \frac{\delta_{p^n,W^{E,n},e^{n(R'-a)}}'}{e^{n R'}}
1737: \Bigr)\\
1738: = &
1739: \frac{1}{n}
1740: \eta(\delta_{p^n,W^{E,n},e^{n(R'-a)}})+ \delta_{p,W^E,e^{n(R'-a)}}
1741: \log d \\
1742: & \quad + 
1743: \frac{1}{n}
1744: \frac{\delta_{p^n,W^{E,n},e^{n(R'-a)}}'}{e^{n R'}}\\
1745: \to & 0
1746: \end{align*}
1747: hold. Therefore, we obtain (\ref{3-8-13}) and (\ref{3-8-13-1}).
1748: \end{proof}
1749: 
1750: Conversely, we obtain the following lemma.
1751: \begin{lem}\Label{l-1-14}
1752: Let $\bQ= \{Q^n\}$ be a sequence of channels from 
1753: arbitrary set $\tilde{\cX}^n$ to the set
1754: $\cX^n$ and $\bp=\{p^n\}$ be a sequence of
1755: distributions on $\tilde{\cX}^n$.
1756: Then, the inequalities
1757: \begin{align}
1758: C_d(\bW^B,\bW^E) 
1759: \le &
1760: \sup_{\bp, \bQ}
1761: \left\{
1762: \underline{I}(1|\bp,\bW^B \bQ)- \overline{I}(0|\bp,\bW^E\bQ)
1763: \right\}\Label{1-14-4}\\
1764: C_I(\bW^B,\bW^E)
1765: \le &
1766: \sup_{\bp, \bQ}
1767: \left\{
1768: \underline{I}(1|\bp,\bW^B \bQ)- \overline{I}(0|\bp,\bW^E\bQ)
1769: \right\}\Label{1-14-5}
1770: \end{align}
1771: hold, where
1772: $\bW \bQ =\{W^{n} Q^n \}$ denotes the sequence of channels 
1773: from $\tilde{\cX}^n$ to $\cY^n$:
1774: \begin{align*}
1775: (W^n Q^n)_{\tilde{x}}(y)\defeq \sum_{x \in \cX^n} W^n_{x}(y) 
1776: Q^n_{\tilde{x}}(x)
1777: \end{align*}
1778: for a sequence of channels $\bW=\{W^n\}$ 
1779: from $\cX^n$ to $\cY^n$.
1780: \end{lem}
1781: 
1782: Hence, applying Lemma \ref{t-1-11} to the sequence of the channels 
1783: $\bW^B \bQ, \bW^E\bQ$,
1784: we obtain the following theorem.
1785: \begin{thm}\Label{t-1-17}
1786: \begin{align*}
1787: &C_d(\bW^B,\bW^E) 
1788: =C_I(\bW^B,\bW^E)  \\
1789: =& \sup_{\bp, \bQ}
1790: \left\{
1791: \underline{I}(1|\bp,\bW^B \bQ)- \overline{I}(0|\bp,\bW^E\bQ)\right\}.
1792: \end{align*}
1793: \end{thm}
1794: 
1795: \quad
1796: {\it Proof of Lemma \ref{l-1-14}:}
1797: Let $\{\Phi_n =(M_n,\{Q_1^n, \ldots, Q_{M_n}^n\},
1798: \{\cD_1^n, \ldots, \cD_{M_n}^n\})\}$ 
1799: be a sequence of codes of wire-tap channel such that
1800: \begin{align*}
1801: R= \varliminf \frac{1}{n}\log |\Phi_n|,
1802: \quad
1803: \lim \epsilon_B (\Phi_n) =0, \quad
1804: \lim d_E (\Phi_n) =0.
1805: \end{align*}
1806: Hence, Verd\'{u}-Han's result \cite{V-H} yields that
1807: the transmission capacity of the sequence of channel 
1808: $\bW^B \bQ$ is less than $\underline{I}(1|\bp,\bW^B \bQ)$,
1809: which implies 
1810: \begin{align*}
1811: R \le \underline{I}(1|\bp,\bW^B \bQ) .
1812: \end{align*}
1813: Furthermore,
1814: the property $\lim d_E (\Phi_n) =0$ implies that
1815: $S(0|\bW^E\bQ)= 0$.
1816: Hence, we have
1817: \begin{align}
1818: \overline{I}(0|\bp,\bW^E\bQ)= 0. \Label{1-17-4}
1819: \end{align}
1820: Thus, we obtain
1821: \begin{align*}
1822: R = \underline{I}(1|\bp,\bW^B \bQ)- \overline{I}(0|\bp,\bW^E\bQ),
1823: \end{align*}
1824: which implies (\ref{1-14-4}).
1825: 
1826: Next, we assume that
1827: a sequence of codes of wire-tap channel 
1828: $\{\Phi_n =(M_n,\{Q_1^n, \ldots, Q_{M_n}^n\},
1829: \{\cD_1^n, \ldots, \cD_{M_n}^n\})\}$ 
1830: satisfies that
1831: \begin{align*}
1832: R= \varliminf \frac{1}{n}\log |\Phi_n|,
1833: \quad
1834: \lim \epsilon_B (\Phi_n) =0, \quad
1835: \lim \frac{I_E (\Phi_n)}{n} =0.
1836: \end{align*}
1837: Since the mutual information 
1838: \begin{align*}
1839: I_E (\Phi_n)= \sum_{i=1}^{M_n} 
1840: \frac{1}{M_n} \rE_{(W^{E,n}Q^n)_{i},y}
1841: \log \frac{(W^{E,n}Q^n)_{i}}{
1842: \sum_{i=1}^{M_n} \frac{1}{M_n}(W^{E,n}Q^n)_{i}}(y)
1843: \end{align*}
1844: can be regarded as KL-divergence,
1845: Lemma \ref{l-1-17} yields that
1846: \begin{align*}
1847: & \sum_{i=1}^{M_n} 
1848: \frac{1}{M_n}
1849: (W^{E,n}Q^n)_{i}
1850: \left\{
1851: \frac{1}{n}\log \frac{(W^{E,n}Q^n)_{i}}{
1852: \sum_{i=1}^{M_n} \frac{1}{M_n}(W^{E,n}Q^n)_{i}}(y)
1853: \ge a \right\} \\
1854: & \le 
1855: \frac{I_E (\Phi_n) + \frac{1}{e}}{n a} \to 0
1856: \end{align*}
1857: for any $a\,> 0$.
1858: Thus, we obtain (\ref{1-17-4}).
1859: Therefore, similarly to (\ref{1-14-4}), we obtain (\ref{1-14-5}).
1860: \endproof
1861: 
1862: \begin{lem}\Label{l-1-17}
1863: Assume that $p$ and $q$ are two probability distributions
1864: on $\Omega$.
1865: Then, we have
1866: \begin{align}
1867: D(p\|q)+ \frac{1}{e}
1868: \ge \alpha 
1869: \cdot p \left\{ \log \frac{p(\omega)}{q(\omega)} \ge \alpha \right\}
1870: .\Label{1-17-1}
1871: \end{align}
1872: \end{lem}
1873: \begin{proof}
1874: We focus on the two probability distributions on 
1875: $\Omega_0 \defeq\left\{ \log \frac{p}{q}(\omega) \,< \alpha \right\}$:
1876: \begin{align*}
1877: p_0(\omega) \defeq \frac{p(\omega)}{p\{\Omega_0\}} , \quad
1878: q_0(\omega) \defeq \frac{q(\omega)}{q\{\Omega_0\}}.
1879: \end{align*}
1880: Hence,
1881: \begin{align*}
1882: &D(p\|q) = 
1883: \sum_{\omega \in \Omega_0^c} p(\omega) \log \frac{p(\omega)}{q(\omega)}
1884: + \sum_{\omega \in \Omega} p(\omega) \log \frac{p(\omega)}{q(\omega)} \\
1885: \ge & \alpha p\{\Omega_0^c\}
1886: + \sum_{\omega \in \Omega} p_0(\omega) 
1887: \left(\log \frac{p\{\Omega_0\}}{q\{\Omega_0\}}
1888: + \log \frac{p_0(\omega)}{q_0(\omega)}\right) \\
1889: = & \alpha p\{\Omega_0^c\}
1890: + p\{\Omega_0\}\log \frac{p\{\Omega_0\}}{q\{\Omega_0\}}
1891: + D(p_0\|q_0) \\
1892: \ge & \alpha p\{\Omega_0^c\}
1893: + p\{\Omega_0\}\log \frac{p\{\Omega_0\}}{q\{\Omega_0\}}
1894: \ge \alpha p\{\Omega_0^c\}
1895: + p\{\Omega_0\}\log p\{\Omega_0\}.
1896: \end{align*}
1897: Finally, the convexity of the map $x \mapsto x \log x $ guarantees that
1898: $p\{\Omega_0\}\log p\{\Omega_0\}\ge -\frac{1}{e}$.
1899: We obtain (\ref{1-17-1}).
1900: \end{proof}
1901: 
1902: \section{Exponents in stationary memoryless channel}
1903: \subsection{Channel resolvability}
1904: Next, we proceed to 
1905: the stationary memoryless 
1906: channel of a given channel $W$ as a special case.
1907: 
1908: First, we treat channel resolvability.
1909: As was shown by 
1910: Han \& Verd\'{u}\cite{Han-V} and Han \cite{Han-book},
1911: the information spectrum quantities of discrete memoryless channel of $W$
1912: is calculated as
1913: \begin{align*}
1914: \sup_{\bp}\overline{I}(\epsilon|\bp,\bW)
1915: =\sup_{\bp}\underline{I}(\epsilon|\bp,\bW)
1916: = \max_p I(p;W)
1917: \end{align*}
1918: for $1\ge \epsilon \ge 0$,
1919: where
1920: \begin{align*}
1921: I(p;W) & \defeq \rE_p D(W_x\|W_p).
1922: \end{align*}
1923: Hence, Theorem \ref{t-3} yields 
1924: \begin{align*}
1925: S(\epsilon|\bW)
1926: =S^{\dagger}(\epsilon|\bW)
1927: = \max_p I(p;W),
1928: \end{align*}
1929: which has been obtained by Han \& Verd\'{u}\cite{Han-V}.
1930: Furthermore, using Theorem \ref{t-2},
1931: we can discuss these problems 
1932: in more details by treating the following 
1933: optimal exponents:
1934: \begin{align*}
1935: & e_\epsilon (R|W,p) \\
1936: \defeq &
1937: \sup_{\{\Psi_n\}} \left\{\left. 
1938: \varliminf \frac{-1}{n}\log \epsilon (\Psi_n,W^n_{p^n}) 
1939: \right|
1940: \varlimsup \frac{1}{n}\log |\Psi_n|\le R
1941: \right\} \\
1942: & e_D (R|W,p) \\
1943: \defeq &
1944: \sup_{\{\Psi_n\}} \left\{\left. 
1945: \varliminf \frac{-1}{n}\log D (\Psi_n, W^n_{p^n}) 
1946: \right|
1947: \varlimsup \frac{1}{n}\log |\Psi_n|\le R
1948: \right\} ,\\
1949: \end{align*}
1950: and 
1951: \begin{align*}
1952: e_\epsilon (R|W) &\defeq \varliminf \frac{-1}{n}\log \epsilon (e^{nR},W^n) ,\\
1953: e_D (R|W) &\defeq \varliminf \frac{-1}{n}\log D (e^{nR},W^n) ,
1954: \end{align*}
1955: where $p^n$ is the $n$-fold identical independent distribution of
1956: $p$.
1957: As is discussed by Oohama \cite{Oohama},
1958: by using Lemma \ref{H-V}, the exponent $e_{\epsilon}(R,W)$
1959: gives a lower bound of strong converse exponent of 
1960: identification code.
1961: \begin{thm}\Label{t-5}
1962: Assume that the cardinality $|\cY|$ is finite, then
1963: \begin{align}
1964: e_\epsilon (R|W,p) & \ge
1965: \max_{1\ge s \ge 0} \left\{\frac{-\psi(s|W,p)+ sR}{1+s} \right\}
1966: \Label{3-8-7}\\
1967: e_D (R|W,p) & \ge
1968: \max_{0 \ge t \ge -1/2}\left\{ - \phi(t|W,p) - tR\right\}
1969: %\max_{1\ge s \ge 0} -\psi(s|W,p)+ sR,
1970: \Label{3-8-8} \\
1971: e_\epsilon (R|W) & \ge
1972: \max_{1\ge s \ge 0} \left\{ \frac{-\psi(s|W)+ sR}{1+s} \right\}\Label{3-9-2}\\
1973: e_D(R|W) & \ge
1974: \max_{0 \ge t \ge -1/2} \left\{ - \max_p \phi(t|W,p) - tR \right\},
1975: \Label{7-1-1}
1976: \end{align}
1977: where $\psi(s|W,p)\defeq \log \rE_p \sum_y W_x^{1+s}(y)W_p^{-s}(y)$
1978: and $\psi(s|W)\defeq \log \max_p \sum_y 
1979: \left(\rE_p W_x^{1+s}(y)\right)^{1-s}$.
1980: \end{thm}
1981: Using Pinsker's inequality
1982: $D(p\|q)\ge \|p-q\|^2$,
1983: we obtain two inequalities
1984: $\frac{1}{2}e_D (R|W,p) \le e_\epsilon (R|W,p)$ and 
1985: $\frac{1}{2}e_D(R|W) \le e_\epsilon (R|W)$,
1986: which implies different lower bounds of exponents:
1987: \begin{align}
1988: e_\epsilon (R|W,p) & \ge
1989: \frac{1}{2} \max_{0 \ge t \ge -1/2}  \left\{- \phi(t|W,p) - tR\right\}
1990: \Label{7-1-5}\\
1991: e_\epsilon (R|W) & \ge
1992: \frac{1}{2}
1993: \max_{0 \ge t \ge -1/2}  \left\{- \max_p \phi(t|W,p) - tR \right\}
1994: .\Label{7-1-6}
1995: \end{align}
1996: We can derive different lower bounds of $e_D (R|W,p)$ and $e_D (R|W)$
1997: from the inequality (\ref{7-1-3}).
1998: However, these bounds are smaller than the bound presented here.
1999: 
2000: \begin{rem}
2001: Arimoto's strong converse exponent \cite{Arimoto} of 
2002: channel coding of transmission code equals
2003: \begin{align*}
2004: \max_{0 \ge t \ge -1}  \left\{- \max_p \phi(t|W,p) - tR\right\},
2005: \end{align*}
2006: which is a bit greater than the RHS of (\ref{3-8-8})
2007: when $R$ is sufficiently large.
2008: 
2009: \end{rem}
2010: \begin{rem}
2011: By using inequality (\ref{3-3-10}) and type method,
2012: Oohama \cite{Oohama} has obtained a lower bound of $e_\epsilon (R|W)$:
2013: \begin{align*}
2014: \frac{1}{2}
2015: \max_{0 \ge t \ge -1}  \left\{- \max_p \phi(t|W,p) - tR\right\},
2016: \end{align*}
2017: which is a bit better than (\ref{7-1-6})
2018: when $R$ is sufficiently large.
2019: It is interesting that his approach
2020: is in contrast to our approach to (\ref{7-1-6}),
2021: which is based on (\ref{6-26-1}) not on (\ref{3-3-10}).
2022: \end{rem}
2023: \begin{rem}
2024: It is difficult to treat the exponent of 
2025: the sum of two error probabilities in identification code
2026: based on Theorem \ref{t-1}.
2027: For this purpose, we need a modified version of Theorem \ref{t-1}.
2028: \end{rem}
2029: 
2030: %Since $\left.\frac{\,d -\psi(s|W,p) }{\,d s}\right|_{s=0}
2031: %= \rE_p D(W_x\|W_p)$,
2032: %we can show $ \max_{s \ge 0} \frac{-\psi(s|W,p)+ sR}{1+2s} \,> 0$
2033: %and $\max_{s \ge 0} \frac{-\psi(s|W,p)+ sR}{1+s}\,> 0$
2034: %for any real number $R \,< \rE_p D(W_x\|W_p)$.
2035: The following lemma is a preparation of our proof of Theorem \ref{t-5}.
2036: 
2037: \begin{lem}\Label{3-9-1}
2038: For any $s \ge 0$ and $0 \ge t \,> -1$,
2039: the equalities
2040: \begin{align}
2041: & \max_{p \in \cP(\cX^n)} 
2042: \sum_{y^n \in \cY^n} \left (\rE_{p} (W_x^n(y^n))^{1+s} \right)^{1-s}
2043: \nonumber\\
2044: = &
2045: \left(\max_{p\in \cP(\cX)} 
2046: \sum_y \left( \rE_p W_x^{1+s}(y) \right)^{1-s}
2047: \right)^n \label{6-27-1}\\
2048: & \max_{p \in \cP(\cX^n)} 
2049: \sum_{y^n \in \cY^n} \left (\rE_{p} (W_x^n(y^n))^{\frac{1}{1+t}} \right)^{1+t}
2050: \nonumber\\
2051: = &
2052: \left(\max_{p\in \cP(\cX)} 
2053: \sum_y \left( \rE_p W_x^{\frac{1}{1+t}}(y) \right)^{1+t}
2054: \right)^n \label{7-1-4}
2055: \end{align}
2056: hold.
2057: \end{lem}
2058: \begin{proof}
2059: Since (\ref{7-1-4}) has been shown by Arimoto \cite{Arimoto}, 
2060: we prove only (\ref{6-27-1})
2061: by the same method.
2062: Since the function $f: p \mapsto 
2063: \max_{p\in \cP(\cX)} 
2064: \sum_y \left( \rE_p W_x^{1+s}(y) \right)^{1-s}$ is continuous and
2065: convex function,
2066: if and only if
2067: $f(p^*)= \max_p f(p)$,
2068: there exists a constant $\lambda$ such that
2069: \begin{align*}
2070: &\sum_y W_x^{1+s}(y) \left(
2071: \sum_x p^*(x) W_x^{1+s}(y)\right)^{-s}\\
2072: =& \frac{\partial f}{\partial p(x)}
2073: \left\{
2074: \begin{array}{cc}
2075: = \lambda & \hbox{if } p^*(x)\,> 0 \\
2076: \le \lambda & \hbox{if } p^*(x)= 0 
2077: \end{array}
2078: \right.
2079: \end{align*}
2080: Indeed, $\lambda$ is calculated as
2081: \begin{align*}
2082: \sum_x p(x) \lambda 
2083: &=
2084: \sum_x p(x) 
2085: \sum_y W_x^{1+s}(y) \left(
2086: \sum_x p^*(x) W_x^{1+s}(y)\right)^{-s}\\
2087: &=
2088: \left(
2089: \sum_x p^*(x) W_x^{1+s}(y)\right)^{1-s}.
2090: \end{align*}
2091: Thus,
2092: if and only if
2093: $f(p^*)= \max_p f(p)$,
2094: \begin{align}
2095: &\sum_y W_x^{1+s}(y) \left(
2096: \sum_x p^*(x) W_x^{1+s}(y)\right)^{-s}\nonumber \\
2097: &\left\{
2098: \begin{array}{cc}
2099: = \left(
2100: \sum_x p^*(x) W_x^{1+s}(y)\right)^{1-s} & \hbox{if } p^*(x)\,> 0 \\
2101: \le \left(
2102: \sum_x p^*(x) W_x^{1+s}(y)\right)^{1-s}& \hbox{if } p^*(x)= 0 
2103: \end{array}
2104: \right.\nonumber,
2105: \end{align}
2106: $p^*$ gives the maximum.
2107: Hence, if $p^*$ satisfies the above condition,
2108: $(p^*)^n$ also satisfies the following condition:
2109: \begin{align*}
2110: &\sum_{y^n} (W_{x^n}^n)^{1+s}(y^n) \left(
2111: \sum_{x^n} (p^*)^n(x^n) (W_{x^n}^n)^{1+s}(y^n)\right)^{-s}\nonumber \\
2112: &\left\{
2113: \begin{array}{cc}
2114: = \left(
2115: \sum_{x^n} (p^*)^n(x^n) (W_{x^n}^n)^{1+s}(y^n)\right)^{1-s}
2116: & \hbox{if } (p^*)^n(x^n)\,> 0 \\
2117: \le \left(
2118: \sum_{x^n} (p^*)^n(x^n) (W_{x^n}^n)^{1+s}(y^n)\right)^{1-s}
2119: & \hbox{if } (p^*)^n(x^n)= 0 ,
2120: \end{array}
2121: \right. 
2122: \end{align*}
2123: which is a necessary and sufficient condition for 
2124: \begin{align*}
2125: & \sum_{y^n \in \cY^n} 
2126: \left(\rE_{(p^*)^n} (W_x^n(y^n))^{1+s} \right)^{1-s}\\
2127: = &
2128: \max_{p \in \cP(\cX^n)} 
2129: \sum_{y^n \in \cY^n} 
2130: \left(\rE_{p} (W_x^n(y^n))^{1+s} \right)^{1-s}.
2131: \end{align*}
2132: It implies the equation (\ref{6-27-1}).
2133: \end{proof}
2134: 
2135: \quad{\it Proof of Theorem \ref{t-5}:}
2136: By inequality (\ref{6-26-1}) of Theorem \ref{t-2},
2137: we have
2138: \begin{align}
2139: D(e^{nR},W^^n_{p^n})
2140: &\le
2141: \frac{\log (1+ (e^{nR})^t e^{ \phi(t|W^n,p^n)})}{-t}\nonumber \\
2142: & \le
2143: \frac{(e^{nR})^t e^{ \phi(t|W^n,p^n)}}{-t}\nonumber \\
2144: & =
2145: \frac{e^{n( \phi(t|W,p)+t R)}}{-t},\label{A1}
2146: \end{align}
2147: for $0 > t \ge -1/2$, where 
2148: the second inequality follows from $\log (1+x) \le x$.
2149: From (\ref{A1}), we obtain 
2150: \begin{align}
2151: e_D(R|W,p)\ge -\phi(t|W,p)-t R
2152: \end{align}
2153: for $0 > t \ge -1/2$.
2154: Since $\phi(t|W,p)+ tR$ is 
2155: continuous for $t$,
2156: the inequality (\ref{3-8-8}) holds.
2157: By inequality (\ref{6-26-1}) and Lemma \ref{3-9-1},
2158: we have
2159: \begin{align}
2160: D(e^{nR},W^n)
2161: & \le
2162: \max_{p \in \cP(\cX^n)}
2163: \frac{\log (1+ (e^{nR})^t e^{ \phi(t|W^n,p)})}{-t}\nonumber \\
2164: & \le
2165: \frac{
2166: (e^{nR})^t \cdot
2167: \max_{p \in \cP(\cX^n)}
2168: e^{ \phi(t|W^n,p)}
2169: }{-t} \nonumber \\
2170: = &
2171: \frac{
2172: (e^{nR})^t \cdot
2173: \max_{p \in \cP(\cX)}
2174: e^{n \phi(t|W,p)}
2175: }{-t} \label{A2}
2176: \end{align}
2177: for $0 > t \ge - 1/2$.
2178: Hence, in a manner similar to the derivation of 
2179: (\ref{3-8-8}) from (\ref{A1}), we obtain (\ref{7-1-1}) from (\ref{A2}).
2180: 
2181: Next, we derive (\ref{3-8-7}) and (\ref{3-9-2}).
2182: To this end, we first derive an upper bound of 
2183: \begin{align*}
2184: 2\delta_{p,W,e^{R'}}+
2185: \sqrt{
2186: \frac{\delta'_{p,W,e^{R'}}}
2187: {e^R}}.
2188: \end{align*}
2189: For any $1\ge s \ge 0$,
2190: we choose $R'\defeq \frac{\psi(s|W,p)+R}{1+s}$.
2191: By using Markov inequality, we can evaluate 
2192: $\delta_{p,W,e^{R'}}$ and $\delta_{p,W,e^{R'}}'$ as
2193: \begin{align}
2194: & \delta_{p,W,e^{R'}}
2195: \le \rE_p \sum_{y \in 
2196: \left\{ \frac{W_x}{W_p}(y) \,> e^{R'} \right\}}
2197: W_x (y) \left(\frac{e^{- R'} W_x(y)}{W_p(y)}\right)^s
2198: \nonumber\\
2199: \le &
2200: \rE_p \sum_{y} 
2201: W_x (y) \left(\frac{ W_x(y)}{W_p(y)}\right)^s e^{- s R'} 
2202: =e^{ \psi(s|W,p)-s R'}\nonumber\\
2203: =& e^{\frac{ \psi(s|W,p)-sR}{1+s}}\label{A3}
2204: \end{align}
2205: and
2206: \begin{align}
2207: & \delta_{p,W,e^{R'}}'
2208: \le \rE_p \sum_{y \in 
2209: \left\{ \frac{W_x}{W_p}(y) \le e^{R'} \right\}}
2210: \frac{W_x (y)^2}{W_p (y)} 
2211: \left(\frac{W_p(y)}{e^{- R'} W_x(y)}\right)^{1-s}\nonumber\\
2212: \le &
2213: \rE_p \sum_{y} 
2214: W_x (y) \left(\frac{ W_x(y)}{W_p(y)}\right)^s e^{(1- s) R'} 
2215: =e^{ \psi(s|W,p)+(1- s) R'},\label{A4}
2216: \end{align}
2217: respectively.
2218: Inequality (\ref{A4}) yields
2219: \begin{align}
2220: \sqrt{\frac{\delta_{p,W,e^{R'}}'}{e^{R}}}
2221: \le e^{ \frac{\psi(s|W,p)+(1- s) R'-R }{2}}= 
2222: e^{\frac{ \psi(s|W,p)-sR}{1+s}}.\label{A5}
2223: \end{align}
2224: Combining (\ref{A3}) and (\ref{A5}), 
2225: we have
2226: \begin{align}
2227: 2\delta_{p,W,e^{R'}}+
2228: \sqrt{
2229: \frac{\delta'_{p,W,e^{R'}}}
2230: {e^R}}
2231: \le 3 e^{\frac{ \psi(s|W,p)-sR}{1+s}}.\label{A6}
2232: \end{align}
2233: Hence, (\ref{A6}) and (\ref{3-3-10}) in Theorem \ref{t-2}
2234: guarantee that
2235: \begin{align}
2236: \epsilon(e^{nR},W^n_{p^n})
2237: \le 3 e^{\frac{ \psi(s|W^n,p^n)-snR}{1+s}}
2238: = 3 e^{n\frac{ \psi(s|W,p)-sR}{1+s}}\label{A7}
2239: \end{align}
2240: for $1 \ge s \ge 0$
2241: because $\psi(s|W^n,p^n)= n \psi(s|W,p)$.
2242: Thus, (\ref{A7}) implies that
2243: \begin{align}
2244: e_\epsilon(R|W,p)
2245: \ge 
2246: \frac{-\psi(s|W,p)+sR}{1+s}\label{A8}
2247: \end{align}
2248: for $1 \ge s \ge 0$.
2249: Taking the maximum for $1 \ge s \ge 0$, 
2250: we obtain (\ref{3-8-7}).
2251: 
2252: %Similarly, by using Markov inequality, we can evaluate
2253: %\begin{align*}
2254: %\delta_{p^n,W^n,e^{nR}}
2255: %&\le e^{ n(\psi(s|W,p)-s R)}\\
2256: %\frac{\delta_{p,W,e^{nR}}}{e^{nR}}
2257: %& \le e^{ n(\psi(s|W,p)-s R)}\quad\hbox{for}\quad 1 \ge \forall s \ge 0.
2258: %\end{align*}
2259: %Thus, we obtain (\ref{3-8-8}) from (\ref{6-26-1}).
2260: 
2261: 
2262: We proceed to the proof of (\ref{3-9-2}).
2263: By inequalities (\ref{3-3-10}) and (\ref{A6}), we obtain 
2264: \begin{align}
2265: \epsilon(e^{nR},W^n)\le
2266: \max_{p \in \cP(\cX^n)}
2267: 3 e^{\frac{\psi(s|W^n,p)-snR}{1+s}}\nonumber \\
2268: =
2269: 3 e^{\frac{-snR}{1+s}}
2270: \left[
2271: \max_{p \in \cP(\cX^n)}
2272: e^{\frac{\psi(s|W^n,p)}{1+s}}
2273: \right]^{\frac{1}{1+s}}\label{A9}.
2274: \end{align}
2275: Now, we estimate an upper bound of 
2276: \begin{align}
2277: e^{\psi(s|W^n,p)}
2278: = \rE_p\sum_y W_x^{1+s}(y)W_p^{-s}(y).
2279: \end{align}
2280: Since the map $x \mapsto x^{1+s}$ is convex,
2281: we have
2282: \begin{align*}
2283: W_p(y) = \rE_p W_x(y) \ge
2284: \rE_p W_x^{1+s}(y),
2285: \end{align*}
2286: which imply that
2287: \begin{align*}
2288: W_p^{-s} (y) \le \left(\rE_p (W_x(y))^{1+s}\right)^{-s}.
2289: \end{align*}
2290: Hence, the relations
2291: \begin{align}
2292: & \rE_p \sum_y W_x^{1+s}(y)W_p^{-s} (y)
2293: = \sum_y \rE_p W_x^{1+s}(y)W_p^{-s} (y)\nonumber \\
2294: \le & \sum_y \left (\rE_p W_x^{1+s}(y) \right)^{1-s}\Label{3-12-1}
2295: \end{align}
2296: hold. Using (\ref{3-12-1}) and Lemma \ref{3-9-1}, 
2297: we can evaluate
2298: \begin{align}
2299: &\max_{p \in \cP(\cX^n)} 
2300: \rE_{p} \sum_{y\in \cY^n} W_x^n(y)^{1+s}
2301: W_{p}^n (y)^{-s} \nonumber \\
2302: \le &
2303: \max_{p \in \cP(\cX^n)} 
2304: \sum_{y \in \cY^n} \left (\rE_{p} (W_x^n(y))^{1+s} \right)^{1-s}
2305: \nonumber \\
2306: = &
2307: \left(\max_{p\in \cP(\cX)} 
2308: \sum_y \left( \rE_p W_x^{1+s}(y) \right)^{1-s}
2309: \right)^n = e^{n (\psi(s|W))}.
2310: \label{A10}
2311: \end{align}
2312: Combining (\ref{A9}) and (\ref{A10}), 
2313: we have
2314: \begin{align}
2315: \epsilon(e^{nR}, W^n)
2316: \le e^{n \frac{\psi(s|W)-sR}{1+s}},
2317: \label{A11}
2318: \end{align}
2319: for any $1 \ge s \ge 0$.
2320: In a manner similar to the derivation of (\ref{3-8-7})
2321: from (\ref{A7}), we can derive (\ref{3-9-2}) from (\ref{A11}).
2322: \endproof
2323: 
2324: 
2325: \subsection{Wire-tap channel}
2326: Next, we proceed to discrete memoryless wire-tap channel.
2327: Applying Theorem \ref{t-1-11} 
2328: to this case with the input identical and independent distribution,
2329: we obtain 
2330: \begin{align*}
2331: & C(\bW^B,\bW^E) \\
2332: \defeq &
2333: \sup_{\{\Phi_n\}}
2334: \left\{\left.
2335: \varliminf \frac{1}{n}\log\log |\Phi_n|
2336: \right|
2337: \lim \epsilon_B (\Phi_n)=
2338: \lim d_E(\Phi_n)= 0
2339: \right\} \\
2340: \ge &\sup_p \left\{I(p;W^B)- I(p;W^E)\right\},
2341: %\rE_p D(W_x^B\|W_p^B)- \rE_p D(W_x^E\|W_p^E),
2342: \end{align*}
2343: which has been obtained by Wyner \cite{Wyner}.
2344: Hence, Theorem \ref{t-1-11} can be 
2345: regarded as a general extension of Wyner's result.
2346: Moreover, using Lemma \ref{3-6},
2347: we derived several explicit lower bounds of exponents.
2348: \begin{thm}\Label{t-7}
2349: Assume that the cardinality $|\cZ|$ is finite,
2350: then there exists a sequence $\{\Phi_n\}$ of codes
2351: for any real numbers $R, R'$ and any probability distribution $p$
2352: such that
2353: \begin{align}
2354: \lim \frac{1}{n}\log |\Phi_n|& = R \nonumber \\
2355: \varliminf \frac{-1}{n}\log \epsilon_B(\Phi_n) & \ge
2356: \max_{1 \ge s \ge 0}  \left\{-\phi(s|W^B,p) - s(R+R')\right\}\Label{3-8-10} \\
2357: \varliminf \frac{-1}{n}\log I_E(\Phi_n) & \ge
2358: \max_{0\ge t \ge -1/2} \left\{ -\phi(t|W^E,p)- tR'\right\} \Label{6-8-10} \\
2359: \varliminf \frac{-1}{n}\log d_E(\Phi_n) & \ge
2360: \max_{1\ge s \ge 0} \left\{\frac{-\psi(s|W^E,p)+ sR'}{1+s}\right\}
2361: \Label{7-8-10}\\
2362: \varliminf \frac{-1}{n}\log d_E(\Phi_n) &\ge
2363: \frac{1}{2} \max_{0\ge t \ge -1/2}  \left\{-\phi(t|W^E,p)- tR'\right\}.
2364: \Label{1-12-3}
2365: \end{align}
2366: %where
2367: %$\phi(s|W,p)\defeq \log 
2368: %\sum_y \left( \rE_p (W_x(y))^{1/(1+s)}\right)^{1+s} $.
2369: Indeed, these exponents are very useful for evaluating
2370: error and wire-tapper's information
2371: for a finite $n$.
2372: \end{thm}
2373: \begin{proof}
2374: The inequality (\ref{3-8-10}) immediately follows from
2375: (\ref{3-8-1}).
2376: By using an evaluation similar to (\ref{3-8-8}),
2377: we can show (\ref{6-8-10}) from (\ref{3-6-2}).
2378: Furthermore, by using an evaluation similar to (\ref{3-8-7}),
2379: we can show (\ref{7-8-10}) from (\ref{3-8-12}).
2380: \end{proof}
2381: \section{Comparison of lower bounds of exponents}
2382: Finally, we compare the lower bounds
2383: (\ref{3-8-7}), (\ref{3-9-2}), (\ref{7-1-5}), and (\ref{7-1-6})
2384: of error exponents of channel resolvability.
2385: 
2386: \begin{thm}
2387: Assume that $\Delta \defeq R- I(p;W)$ is sufficiently small.
2388: Then, 
2389: RHSs of (\ref{3-8-7}) and (\ref{7-1-5}) 
2390: (which are lower bounds of exponent of the variational distance)
2391: are approximately
2392: calculated as
2393: \begin{align*}
2394: \hbox{RHS of } (\ref{3-8-7})~&
2395: \max_{1\ge s \ge 0} \left\{ \frac{-\psi(s|W,p)+ sR}{1+s} \right\}
2396:  \cong \frac{\Delta^2}{4 J(p;W)}\\
2397: \hbox{RHS of } (\ref{7-1-5})~&
2398: \frac{1}{2}\max_{0 \ge t \ge -1/2} \left\{ - \phi(t|W,p) - tR\right\} 
2399:  \cong \frac{\Delta^2}{8 J(p;W)}, 
2400: \end{align*}
2401: where 
2402: \begin{align*}
2403: &J(p;W) \\
2404: \defeq 
2405: &\frac{1}{2} 
2406: \left( 
2407: \rE_{p,x} \rE_{W_x,y}
2408: (\log W_x(y) - \log W_p(y))^2- I^2(p;W) \right) .
2409: \end{align*}
2410: Moreover, 
2411: RHSs of (\ref{3-9-2}) and (\ref{7-1-6}) 
2412: (which are lower bounds of exponent of the worst variational distance)
2413: are approximately
2414: calculated as
2415: \begin{align*}
2416: \hbox{RHS of } (\ref{3-9-2})~
2417: &\max_{s \ge 0}\left\{
2418: \frac{-\psi(s|W)+sR}{1+s}\right\}\\
2419: & \cong \frac{\Delta^2}{4 (J(p_0;W)+\rE_{p_0} H(W_x))}, \\
2420: \hbox{RHS of } (\ref{7-1-6})~
2421: &\frac{1}{2}\max_{0 \ge t \ge -1/2} \left\{- \max_p\phi(t|W,p) - tR\right\}\\
2422: & \cong \frac{\Delta^2}{8 J(p_0;W) },
2423: \end{align*}
2424: where $p_0 \defeq \argmax_p I(p;W)$.
2425: \end{thm}
2426: Thus, when $R$ is sufficiently close to
2427: $\max_p I(p;W)$,
2428: (\ref{3-8-7}) gives a better lower bound than
2429: (\ref{7-1-5}).
2430: Of course, this comparison can be applied to 
2431: exponents of eavesdropper's information in wire-tap channel,
2432: {\it i.e.},
2433: the comparison of RHSs of (\ref{7-8-10}) and (\ref{1-12-3}).
2434: On the other hand, 
2435: (\ref{3-9-2}) gives a better lower bound than
2436: (\ref{7-1-6}),
2437: if and only if
2438: \begin{align*}
2439: &\rE_{p_0} H(W_x)\\
2440: &\le \frac{1}{2} 
2441: \left( 
2442: \rE_{p,x} \rE_{W_x,y}
2443: (\log W_x(y) - \log W_p(y))^2
2444: - I^2(p;W) \right).
2445: \end{align*}
2446: Therefore, although $R- \max_p I(p;W)$ is small enough,
2447: the relation between 
2448: bounds (\ref{3-9-2}) and (\ref{7-1-6}) is not clear.
2449: 
2450: \begin{proof}
2451: By using a Taylor expansion, we obtain the approximations:
2452: \begin{align*}
2453: \psi(s|W,p)&\cong  I(p;W)s + J(p;W)s^2\\
2454: \phi(t|W,p)&\cong - I(p;W)t + J(p;W)t^2\\
2455: \psi(s|W) &\cong I(p_0;W) s + (J(p_0;W)+\rE_{p_0} H(W_x)) s^2,
2456: %
2457: %&\max_p \log \sum_y (\rE_p W_x(y)^{1+s})^{1/(1+s)}\\
2458: %&\cong I(p_0;W) s + J(p_0;W) s^2.
2459: \end{align*}
2460: Thus,
2461: \begin{align*}
2462: &\max_{1\ge s \ge 0} \left\{ \frac{-\psi(s|W,p)+ sR}{1+s} \right\}\\
2463: \cong &\max_{1\ge s \ge 0} \left\{ 
2464: \frac{-I(p;W)s - J(p;W)s^2+(I(p;W)+\Delta)s }{1+s}\right\} \\
2465: \cong &\max_{1\ge s \ge 0}\left\{
2466: - J(p;W)s^2 + \Delta s \right\}\cong 
2467: \frac{\Delta^2}{4 J(p;W)} \\
2468: & \max_{0 \ge t \ge -1/2} \left\{- \phi(t|W,p) - tR \right\}\\
2469: \cong & \max_{0 \ge t \ge -1/2} \left\{
2470: I(p;W)t - J(p;W)t^2 - (I(p;W)+\Delta)t \right\}\\
2471: = & \max_{0 \ge t \ge -1/2}\left\{- J(p;W)t^2 - \Delta t \right\}
2472: = \frac{\Delta^2}{4 J(p;W)}\\
2473: & \max_{s \ge 0}\left\{
2474: \frac{-\psi(s|W)+sR}{1+s}\right\} \\
2475: \cong &
2476: \max_{s \ge 0}\Biggl\{
2477:  \frac{-I(p_0;W) s - (J(p_0;W)+\rE_{p_0} H(W_x)) s^2}{1+s}\\
2478: &\qquad +\frac{s(I(p_0;W)+\Delta)}{1+s} \Biggr\}\\
2479: \cong &
2480: \max_{s \ge 0}\left\{
2481: - (J(p_0;W)+\rE_{p_0} H(W_x)) s^2 + \Delta s \right\}\\
2482: = &\frac{\Delta^2}{4 (J(p_0;W)+\rE_{p_0} H(W_x))}.
2483: %&\max_{s \ge 0} -\log \sum_y (\rE_p W_x(y)^{1+s})^{1/(1+s)}
2484: %+\frac{s}{1+s}R \\
2485: %\cong &
2486: %\max_{s \ge 0} 
2487: %-I(p_0;W) s - (J(p_0;W)+I(p;W) s^2 \\
2488: %&\qquad+(s-s^2)I(p_0;W)+s \Delta\\
2489: %= &
2490: %\max_{s \ge 0} 
2491: %- J(p_0;W) s^2 + \Delta s\\
2492: %=& \frac{\Delta^2}{4 J(p_0;W) }.
2493: \end{align*}
2494: \end{proof}
2495: 
2496: \section{Conclusion}
2497: We give several non-asymptotic formulas
2498: in identification code, channel resolvability, and
2499: wire-tap channel.
2500: Using these formulas,
2501: we give the achievable rate channel resolvability
2502: for the general channel, which had been an open problem.
2503: Also, we derived several asymptotic relations among
2504: divergence rates, capacities of identification code,
2505: and $\epsilon$ capacities of channel resolvability.
2506: 
2507: From these non-asymptotic formulas,
2508: we obtained lower bounds of error exponents of 
2509: channel resolvability in the stationary memoryless setting.
2510: Moreover, we derived lower bounds of 
2511: error probability and wire-tapper's information
2512: in the stationary memoryless setting in
2513: wire-tap channel.
2514: 
2515: Concerning the quantum setting,
2516: wire-tap channel has been discussed in the discrete memoryless channel case
2517: by Devetak \cite{Deve}, Winter {\it et. al.}\cite{WNI}
2518: and Cai \& Yeung\cite{CY},
2519: and identification codes has been discussed by Ahlswede \& Winter\cite{AW}.
2520: Hence, several quantum extensions of the results presented here
2521: can be expected.
2522: Some has been obtained by the author.
2523: And some of them have appeared in the author's textbook\cite{H-text}.
2524: Those not already presented 
2525: will appear in a forthcoming paper.
2526: 
2527: 
2528: \section*{Acknowledgments}
2529: The author would like to thank Professor Hiroshi Imai of the
2530: QCI project for support.
2531: He is grateful to Professor Yasutada Oohama for 
2532: useful discussions.
2533: He is also grateful to reviewers
2534: for their kind and useful comments.
2535: 
2536: 
2537: \bibliographystyle{IEEE}
2538: \begin{thebibliography}{1}
2539: %%%%%%%%%
2540: \bibitem{Ah-D}
2541: R. Ahlswede and G. Dueck,
2542: ``Identification via Channels,''
2543: {\em IEEE Trans. Inform. Theory}, vol.35, 15-29, 1989.
2544: %%%%%%%
2545: \bibitem{Han-V}
2546: T.S.\ Han and S.\ Verd\'{u},
2547: ``Approximation Theory of Output Statistics,''
2548: {\em IEEE Trans. Inform. Theory}, vol.39, 
2549: 752--772, 1993.
2550: %%%%%%%%%
2551: \bibitem{Han-book}
2552: T.S.\ Han, 
2553: {\em Information-Spectrum Methods in 
2554: Information Theory}, Springer-Verlag, 2003.
2555: (The original Japanese edition was published 
2556: from Baifukan-Press, Tokyo, in 1998.)  
2557: %%%%%%%%%
2558: \bibitem{Wyner}
2559: A. D. Wyner, 
2560: ``The wire-tap channel,'' 
2561: Bell. Sys. Tech. Jour., vol. 54, pp. 1355-1387, 1975.
2562: %%%%%%%%%
2563: \bibitem{Deve}
2564: I. Devetak,
2565: ``The private classical information capacity and quantum information 
2566: capacity of a quantum channel,''
2567: quant-ph/0304127 (2003).
2568: %%%%%%%%%
2569: \bibitem{WNI}
2570: A. Winter, A. C. A. Nascimento, and
2571: H. Imai,
2572: ``Commitment Capacity of Discrete Memoryless Channels,''
2573: cs.CR/0304014 (2003)
2574: %%%%%%%%%
2575: \bibitem{Gal}
2576: R.\ G.\ Gallager, 
2577: {\em Information Theory and Reliable Communication}, 
2578: John Wiley \& Sons, 1968.
2579: %%%%%%%%%
2580: %\bibitem{Maurer}
2581: %U. M. Maurer, 
2582: %``The Strong Secret Key Rate of Discrete Random Triples,'' 
2583: %Communication and Cryptography-Two Sides of One Tapestry, 
2584: %R. Blahut et al. eds.), Kluwler Academic Publishers, pp. 271-285, 1994. 
2585: %U. M. Maurer and S. Wolf, 
2586: %``Information-Theoretic Key Agreement:From Weak to Strong Secrecy for Free,'' 
2587: %Advances in Cryptology-EUROCRYPT'00, 
2588: %Lecture Notes in Computer Science, Springer-Verlag, 
2589: %vol. 1807, pp. 351-368, 2000.
2590: \bibitem{Oohama}
2591: Y. Oohama,
2592: ``Error Probability of Identification via Channels
2593: at Rates above Capacity,''
2594: In {\em Proc. of International Symposium of Information Theory},
2595: Lausanne, p. 26, 2002.
2596: \bibitem{Oohama2}
2597: Y. Oohama,
2598: ``Average Error Probability of Identification via Channels at Rates above
2599: Identification Capacity,''
2600: In {\em Proc. of International Symposium of Information Theory
2601: and Its Applications}, p. 859--862, 2002.
2602: 
2603: %\bibitem{Oohama3}
2604: %Y. Oohama,
2605: %private communication, 2004.
2606: 
2607: %%%%%%%%%
2608: \bibitem{Hay-Nag}
2609: M. Hayashi and H. Nagaoka,
2610: ``General formulas for capacity of classical-quantum channels,''
2611: {\it IEEE Trans. Inform. Theor.}, {\bf 49}, 1753-1768, 2003;
2612: quant-ph/0206186 (2002).
2613: %%%%%%%%%
2614: \bibitem{Nag-Hay}
2615: H.\ Nagaoka and M.\ Hayashi,
2616: ``An information-spectrum approach to
2617: classical and quantum hypothesis testing,''
2618: quant-ph/0206185 (2002).
2619: %%%%%%%%%
2620: \bibitem{ON1}
2621: T.\ Ogawa and H.\ Nagaoka,
2622: ``A New Proof of the Channel Coding Theorem via
2623: Hypothesis Testing in Quantum Information Theory,''
2624: {\em Proc.\ 2002 IEEE International Symposium on Information Theory},
2625: p.73. (2002);
2626: quant-ph/0208139 (2002).
2627: %%%%%%%%%
2628: \bibitem{H-text}
2629: M. Hayashi,
2630: {\em Introduction to Quantum Information Theory},
2631: (Saiensu-sha, 2004) (In Japanese);
2632: Its English version will be published from Springer in March 2006.
2633: 
2634: \bibitem{Steinberg}
2635: Y. Steinberg,
2636: ``New Converses in the Theory of Identification via Chanels,''
2637: {\it IEEE Trans. Inform. Theor.}, {\bf 44}, 984--998, 1998.
2638: 
2639: \bibitem{Arimoto}
2640: S. Arimoto,
2641: ``On the Converse to the 
2642: coding theorem for discrete memoryless channels,''
2643: {\it IEEE Trans. Inform. Theor.}, {\bf 19}, 357--359, 1973.
2644: 
2645: \bibitem{CN}
2646: I. Csisz\'{a}r, and P. Narayan, 
2647: ``Common Randomness and Secret Key Generation with a Helper,''
2648: {\it IEEE Trans. Inform. Theor.}, {\bf 46}, 344--366, 2000.
2649: \bibitem{CY}
2650: N. Cai and R. Yeung,
2651: ``Quantum Privacy and Quantum Wiretap Channels,''
2652: manuscript, 2003.
2653: \bibitem{AW}
2654: R. Ahlswede and A. Winter,
2655: ``Strong converse for identification via quantum channels,''
2656: {\it IEEE Trans. Inform. Theor.}, {\bf 48}, 569--579, 2002.
2657: 
2658: \bibitem{V-H}
2659: S.\ Verd\'{u} and T.S.\ Han, 
2660: ``A general formula for channel capacity,"
2661: {\em IEEE Trans.\ Inform.\ Theory}, 
2662: vol.40, no.4, 1147--1157, 1994.
2663: \end{thebibliography}
2664: 
2665: \begin{biography}{Masahito Hayashi} was born in Japan in 1971.
2666: He received the B. S. degree from Faculty of Sciences in Kyoto 
2667: University, Japan, in 1994
2668: and the M. S. and Ph. D. degrees in Mathematics from 
2669: Kyoto University, Japan, in 1996 and 1999, respectively.
2670: 
2671: He worked in Kyoto University as a Research Fellow of the Japan Society of the 
2672: Promotion of Science from 1998 to 2000,
2673: and worked in the 
2674: Laboratory for Mathematical Neuroscience, 
2675: Brain Science Institute, RIKEN from 2000 to 2003.
2676: In 2003, he joined 
2677: Quantum Computation and Information Project, ERATO, JST
2678: as the Research Head.
2679: He also works in 
2680: Superrobust Computation Project
2681: Information Science and Technology Strategic Core (21st Century COE by MEXT)
2682: Graduate School of Information Science and Technology
2683: The University of Tokyo
2684: as Adjunct Associate Professor from 2004.
2685: He is an Editorial Board of International Journal of Quantum Information.
2686: His research interests include quantum information theory and
2687: quantum statistical inference.
2688: \end{biography}
2689: \end{document}