astro-ph0206485/ms.tex
1: \documentclass[manuscript]{aastex}
2: \usepackage{natbib}
3: %\usepackage{psfig}
4: \bibsep 0pt
5: %\documentstyle[referee,psfig]{laa}
6: %\documentstyle[referee]{laa}
7: %\documentstyle[psfig]{laa}
8: \def\EQN{Eqn. }
9: \def\158{$\lambda 158\mu$}
10: \def\63{$\lambda 63\mu$}
11: \def\etc{{\it etc.}}
12: \def\AVbar{$<$ A$_V$ $>$}
13: \def\EBV{E$_{B-V}$}
14: \def\HH{{\rm H}_2}
15: \def\nH2{{\rm n}({\rm H}_2)}
16: \def\NH2{{\rm N}({\rm H}_2)}
17: \def\pccc{{\rm cm}^{-3}} \def\pcc{{\rm cm}^{-2}}
18: \def\NCO{N(\rm CO)}
19: \def\Tstar#1 {\mbox{${\rm T}_{\rm #1}$}}
20: \def\Tsub#1 {\mbox{${\rm T}_{\rm #1}$}}
21: \def\TK  {\Tsub K }
22: \def\TB  {\Tsub B }
23: \def\DT  {\mbox{$\Delta{\rm T}$}}
24: \def\TC  {\Tstar C }
25: \def\TL  {\Tsub L }
26: \def\Tsp {\Tsub sp }
27: \def\TA  {\Tstar A }
28: \def\Tsys{\Tstar sys }
29: \def\TheT{\Tstar T }
30: \def\TheHUP{\mbox{h$\nu$/k}}
31: \def\Texc {\Tsub exc }
32: \def\vturb{\mbox{v$_{turb}$}}
33: \def\Tmb {\Tsub mb }
34: \def\Tcmb{\Tsub cmb }
35: \def\Tcont{\Tsub cont }
36: \def\Snu{S_{\nu}}
37: \def\arcsec{\mbox{$^{\prime\prime}$}} 
38: \def\arcmin{\mbox{$^{\prime}$}}
39: \def\omet{$(1-{\rm e}^{-\tau})$}
40: \def\ometov{$(1-{\rm e}^{-\tau({\rm v})})$}
41: \def\Romet{(1-{\rm e}^{-R\tau})}
42: \def\iomet{$\int{1-e^{-\tau}}dv$} \def\itau{$\int \tau dv$}
43: \def\degr{$^{\rm o}$}
44: \def\p{$^+$}
45: \def\cotw {\mbox{$^{12}$CO}}
46: \def\coth {\mbox{$^{13}$CO}}
47: \def\coei {\mbox{C$^{18}$O}}
48: \def\as{^{\prime\prime} }
49: \def\hcop{\mbox{{HCO\p}}} 
50: \def\chp{\mbox{CH\p}}
51:  \def\cth{\mbox{C$_3$H}}
52: \def\cch{\mbox{C$_2$H}}
53: \def\cfh{\mbox{C$_4$H}} \def\CnHm{\mbox{C$_n$H$_m$}} 
54: \def\hhco{\mbox{H$_2$CO}}
55: \def\h13cop{\mbox{{H$^{13}$CO\p}}}
56: \def\nnhp{\mbox{N$_2$H\p}}
57: \def\c3h2{\mbox{C$_3$H$_2$}}
58: \def\ad{^{\rm{o}} } \def\am{^{\prime}}
59: \def\Vphi{$V_\theta(R)$} \def\R0{R$_0$} \def\Jl{{{\rm J}_l}}
60: \def\oneskip{\vskip\baselineskip} \def\mc{\mu\rm m} \def\kpc{\rm kpc}
61: \def\eg{e.g.} \def\etal{\mbox{\it et al.}} \def\deg{{}^\circ}
62: \def\ddeg{{}^\circ\kern-.1em} \def\Rsun{{R_0}} \def\Lsun{{L_0}}
63: \def\Msun{{M_0}} \def\pc{\rm pc} \def\th{{\Theta}}
64: \def\thsun{{\Theta_0}}
65: \def\kms{\mbox{km\,s$^{-1}$}}
66: \def\ps{\mbox{s$^{-1}$}}
67: \def\bll{BL Lac}
68: \def\fight{10.8}
69: \def\E#1{\,10^{#1}}
70: \def\P#1,{$\nH2\TK~=~#1\times~10^4~\pccc$~K}
71: \def\ec#1,#2,#3,{#1\,(#2)\E{#3}}
72: \def\xe{x(e)}
73: \def\Cas{Cassiopeia }
74: \def\sac{`spiral-arm' clouds}
75: \def\zoph{$\zeta$ Oph}
76: \def\methCN{\mbox{CH$_3$CN}}
77: \def\H3{\mbox{H$_3$}}
78: \def\Lya{\mbox{Ly-$\alpha$}}
79: \def\ammon{\mbox{N\H3} }
80: \def\zcg{\mbox {$\zeta^\gamma_C$}}
81: \def\DLAS{Damped Lyman-$\alpha$ systems}
82: \sloppy
83: %
84: %
85: \shorttitle{Noise in the strong-signal limit}
86: 
87: \begin{document}
88: 
89: \title{Noise and the strong signal limit in radio astronomical measurement}
90: 
91: \author{H. Liszt}
92: \affil{NRAO, 520 Edgemont Rd., Charlottesville, VA 22903-2475}
93: \email{hliszt@nrao.edu}
94: %
95: %\institute{National Radio Astronomy Observatory,
96: %           520 Edgemont Road,
97: %          Charlottesville, VA,
98: %
99: %           USA 22903-2475}
100: %
101: 
102: %\date{received \today}
103: %\offprints{H. S. Liszt}
104: %\mail{hliszt@nrao.edu}
105: %
106: \begin{abstract}
107: The random error of radioastronomical measurements is usually computed in 
108: the weak-signal limit, which assumes that the system temperature is 
109: sensibly the same on and off source, or with and without a spectral 
110: line.  This assumption is often very poor.  We give examples of common
111: situations in which it is important to distinguish the system noise
112: in signal-bearing and signal-free regions.
113: \end{abstract}
114: 
115: \keywords{methods: data analysis; methods: statistics;
116:  instrumentation: miscellaneous}
117: 
118: \section{Introduction}
119: 
120: Few experiments are performed without some attempt at estimating
121: their errors, and the random errors of measurement in radio
122: astronomy are typically determined in one general way.  Some form
123: of comparison is performed whereby samples are taken toward and 
124: away from a signal source, or with and without a spectral line.  
125: Subsequent analysis 
126: proceeds under the assumption that random errors everywhere in the
127: dataset are as given by the statistical properties manifested in the 
128: signal-free regions.  No attempt is made to measure the variances of 
129: signal-bearing and signal-free samples separately during the experiment, 
130: and, after the fact, random errors of measurement in signal-bearing 
131: samples are obscured because the form of the signal is arbitrary.  
132: Discussions of fitting and profile analysis invariably assume that 
133: measurement variances are the same with or without the signal, as 
134: for instance the Zeeman analysis of \cite{Mar95} or the fitting of 
135: functions ($e.g.$ Gaussians) by \cite{KapSmi+66} or \cite{Rie69}. 
136: Textbook discussions contain no suggestion that system noise is 
137: influenced by the presence of a signal or that samples with 
138: different variances may be interleaved in the same datastream
139:  \citep{Kra86,BurGra01,RohWil00}.
140: 
141: Yet, such treatment has been flawed for a surprisingly long time.  
142: 100 K H I lines have been routinely observed with sub-100 K receiving 
143: systems for more than 30 years.  Continuum sources whose antenna temperatures
144: exceed the equivalent noise temperature of the receiving equipment
145: have been observed even longer.  The error of measurement in signal-bearing 
146: samples is often significantly different -- with current
147: receivers it could easily be a factor of 5 at the peak of a 
148: strong galactic H I emission line -- but the difference has been ignored.
149:      
150: Error estimates determine confidence levels and even data containing 
151: strong signals can be compromised by misunderstanding of their significance; 
152: for instance,
153: when two very strong signals are differenced to detect a smaller one
154: in H I emission-absorption experiments and searches for Zeeman splitting. 
155: Considering how slowly experimental errors typically improve with the 
156: amount of time invested in an experiment, it follows that changes 
157: in the acknowledged errors of an experiment are equivalent to much 
158: larger differences in the observing time required to reach them.  
159: $A~priori$ knowledge of errors is an important 
160: element in the design of experiments and these considerations may 
161: have a significant effect on the planning of an observing session.  
162: They should be implemented in the software which supports analysis.
163: 
164: The purpose of this work is to illustrate a variety of common situations 
165: where random error is dominated by the presence of a
166: signal.  In the following section some basics of radio astronomy 
167: measurement are sketched. These are used to analyse 
168: the statistics of noise and the errors of component fitting when 
169: signals are present in emission and absorption.  The final
170: section is a brief summary with an even briefer mention of the
171: extension of these notions to aperture synthesis.
172: 
173: \section{Power, temperature and noise}
174: 
175: \subsection{Basics}
176: 
177: A temperature scale is established whereby power is compared to the 
178: classical power spectral density kT (W Hz$^{-1}$) in a resistor in 
179: thermal equilibrium at temperature T \citep{Dic46,Kra86,RohWil00}.  
180: The output power level of the telescope system is then quoted as
181: a \lq system temperature\rq , $i.e.$, k\Tsys.  The actual power 
182: density  $ h\nu/(e^{h\nu/kT}-1)+h\nu/2$ \citep{CalWel51} 
183: reduces to kT only in the Rayleigh-Jeans limit and when zero-point 
184: fluctuations are ignored.
185: 
186: In our simplified discussion we assert \Tsys\ = \TheT + \TA.  
187: \TheT\ represents everything which does not depend on any particular 
188: source or input signal and we assume that it is a constant or 
189: constant function of frequency $\nu$: possible dependencies of 
190: \TheT\ are suppressed for convenience of notation.  Observing at a
191: frequency $\nu$ entails a minimum contribution of $h\nu/k$ to \Tsys, 
192: which is included in $\TheT$.
193: 
194: \TA\ represents a signal external to the telescope.  The  equivalent 
195: temperature of a signal is its \lq antenna temperature\rq\ which by 
196: convention is related to the incident flux density 
197: S$_\nu$ (W m$^{-2}$ Hz$^{-1}$) as S$_\nu$$ = 2$ k\TA/A. The effective 
198: area A is proportional to the geometric area of the telescope aperture.
199: 
200: The signal may be confined in space or frequency, so we write 
201: \TA\ = \TA(v) where v is some combination of independent variables.
202: In the presence of signal the power density is 
203: k\Tsys(v) =  k\TheT\ + k\TA(v) and the dependence of \TA\ upon v 
204: makes \Tsys\ 
205: similarly dependent.  If v represents the pointing of the telescope,
206: added power comes and goes as the telescope moves. Alternatively, v 
207: may be velocity or frequency, and, as far as the receiver and square-law 
208: detector are concerned, the presence of  signal at some v=v\arcmin\ is 
209: not manifested at v $<>$ v\arcmin.  The passband may be translated or 
210: inverted by mixing, but the receiver 
211: and detector electronics are entirely linear in frequency.  The 
212: spectrum is not jumbled nor is it appreciably smoothed until it is 
213: integrated and channelized in the so-called \lq backend \rq 
214: \footnote{Even so, independence of adjacent 1 kHz slices of the 
215: spectrum, corresponding to 0.2 \kms\ at the H I line, requires a 
216: minimum integration time of order only 1 msec}.   In Sect. 
217: 2.7 we discuss an exception to this linearity, namely, quantization 
218: noise in digital correlator spectrometers.
219: 
220: \subsection{Passband or system noise as a measurement variance}
221: 
222: Eventually a datastream is formed from samples of \Tsys, each of duration 
223: t (say) taken over a spectral width $\Delta\nu$; this could be a spectrum, a 
224: continuum drift scan, {\it etc.}  Associated with measurement of the output 
225: power k\Tsys\ there is a variance given by the \cite{Dic46} or 
226: radiometer equation: 
227: 
228: $$\Delta{\rm T(v)}^2 = {{\Tsys^2({\rm v})}\over{{\rm N}}} = 
229:  {({\TheT + \TA({\rm v}))^2}\over{{\rm N}}} \eqno(1) $$ 
230: 
231: The dimensionless quantity N $\equiv \Delta\nu {\rm t}$ 
232: is the product of the bandwidth measured in Hz 
233: and the integration time in seconds.  Precise determination of 
234: the output power density kT within a band $\Delta \nu$ is done by averaging 
235: N independent samples.  Within a band of width $\Delta \nu$ about some 
236: frequency $\nu$, the contained frequency components beat each other down 
237: to a frequency range 0..$\Delta \nu$ so that all appear together 
238: summed within one channel of this width.
239: 
240: Radiometer noise in the output datastream is the measurement variance 
241: of the power, independent of whether that power was contributed by 
242: \TheT\ or \TA.  So the variance of the measured strength of an emission 
243: line, usually considered to be set only by \TheT, actually increases in 
244: proportion to the source strength itself, weakly for weak signals and more
245: strongly for very strong ones.
246: 
247: \subsection{Normalization and noise in real-world experiments}
248: 
249: As examples of the way that random error is affected by considerations 
250: of experimental design, we compare some common methods of data-taking.  
251: We consider that it is possible to take data ``on''- or ``off''-source; 
252: if the data are spectra, even the on-source data may have regions of 
253: the bandpass which are signal-free.
254: 
255: In the simplest case where data are taken while staring at
256: the source, the variance is given directly by \EQN 1
257: 
258: $$\Delta{\rm T(v)}^2 ~(on)~ = {({\TheT + \TA({\rm v}))^2}\over{{\rm N_{on}}}} .
259: \eqno(2a)$$ 
260: 
261: When on- and off-source data are differenced the rms is 
262: 
263: $$\Delta{\rm T(v)}^2 ~(on-off)~ = {({\TheT + \TA({\rm v}))^2 }\over{{\rm N_{on}}}} 
264:  +{{\TheT^2}\over{{\rm N_{off}}}} 
265: \eqno(2b)$$ 
266: 
267: and the rms in signal-free regions is increased relative to that at
268: the signal peak.
269: 
270: In some cases a quotient is formed from on- and off-source 
271: data: the mean off-source power level is equated to a number, 
272: $\TheT$, and data appear in the form $\TheT$(on/off) or 
273: $\TheT$(on-off)/off.  Both have the variance
274: 
275: $$\Delta{\rm T(v)}^2 ~(on/off)~ =  {({\TheT + \TA({\rm v}))^2}\over{{\rm N_{on}}}} 
276: + {({\TheT + \TA({\rm v}))^2}\over{{\rm N_{off}}}} 
277: \eqno(2c) $$ 
278: 
279: so formation of the quotient increases the rms in the 
280: signal-bearing regions relative to the case where simple 
281: differencing is done, and everwhere relative to the pure ``on'' 
282: spectrum.
283: 
284: Because of such considerations, it is not possible to calculate 
285: the random error in signal-bearing regions, even given the empirical rms
286: in the signal-free regions and the system properties which pertain to
287: them, unless it is also understood how the data were taken.
288: 
289: %\subsection{Variances of derived parameters} 
290: %
291: %\def\setxi{\lbrace x_i \rbrace}
292: %\def\ibar{\langle i \rangle} 
293: %\def\inbar{\langle i^n \rangle} 
294: %\def\meanin{\langle i^n \rangle}
295: %\def\meansqri{\langle i^2 \rangle}
296: %\def\somey{\meansqri - \ibar^2}
297: %
298: %In the simplest case, adjacent samples are independent and the 
299: %
300: %Variances of measured global properties like the 
301: %total intensity, intensity centroid, {\it etc.} follow from the usual rule 
302: %for propagation of errors of a function $F(\setxi)$ of a set of independent 
303: %random variables $\setxi$, each of which has variance $\sigma_i$ 
304: %as given for instance in the previous subsection.
305: %$var^2 (F(\setxi)) = \sum_i{\sigma_i^2} 
306: %({{\partial F(\setxi)}\over{\partial x_i}})^2 $.
307: %
308: %Defining $s \equiv \sum_i{x_i}$ and $\inbar \equiv \sum_i i^n {x_i}/s$ we 
309: %have  
310: %
311: %$$ var(s) = \sum_i {\sigma_i^2} \eqno(2a)  $$
312: %
313: %$$ var(\meanin) = 
314: % \sum_i{ {{\sigma_i^2}\over{s^2}} (i^n - \meanin)^2} \eqno(2b) $$
315: %
316: %$$ var(\ibar^n) = \sum_i{ {{\sigma_i^2 n^2}\over{s^2}} \ibar^{2(n-1)}
317: % (i-\ibar)^2} \eqno(2c) $$
318: %
319: %$$ var(disp(i)) = \sum_i{ {{\sigma_i}^2\over{4 s^2 disp(i)^2 }}
320: % (disp(i)^2-(i-\ibar)^2)^2 } \eqno(2d) $$
321: %
322: %$$ var(dsp(i)) = \sum_i{ {{\sigma_i^2 dsp(i)^2}\over{4 s^2}}
323: % (1-{{(i-\ibar)^2}\over{dsp(i)^2}})^2 } \eqno(2d) $$
324: %
325: %where $dsp(i) \equiv \sqrt{\somey}$:  \EQN\ 2d is for the 
326: %of the variance of the dispersion, which is defined as a 
327: %{\it square root}.  Derived quantities which are linear in the $\setxi$
328: %have the same variance even when the $\setxi$ are $not$
329: % independent.
330: 
331: \subsection{Emission line profiles}
332: 
333: One obvious example of the strong signal limit of a spectral line is
334: galactic atomic hydrogen.  Fig. 1 shows a typical low latitude galactic 
335: H I profile observed with a 25m telescope \citep{HarBur97} during the 
336: Leiden-Dwingeloo Sky Survey (LDSS).  In the lower panel, the scale is 
337: expanded to show how the $\pm 1 \sigma$ noise envelope varies for 
338: data taken in the form (on-off)/off with $\TheT = 36$K, a typical value 
339: during the survey.  The spectrum in Fig. 1 still has very 
340: high peak/rms signal-noise (465:1), but not nearly as good (1700:1)
341: as implied by the 0.06 K rms over the baseline regions:
342: the rms error of the integrated brightness is nearly twice
343: as high as that estimated from the baseline rms level. 
344: H I is now commonly observed with $\TheT = 15 - 25 $K.  If the 
345: same  profile were reobserved with \TheT\ = 18 K for one-fourth 
346: the amount of time (to reach the same baseline rms ), the 
347: line-generated rms error would be twice as high again.
348: 
349: From the LDSS, 
350: we find that some 41\% of the sky contains H I with a peak brightness 
351: $\TB \ge 20$K, 33\% has $\TB \ge 30$K and 27\% has $\TB \ge 40$K 
352: (for 0\degr $\le ~l~ \le $ 180\degr, 0\degr $\le ~b~ \le $ 90\degr).
353: 
354: \subsection{Profile fitting}
355: 
356: Discussions of profile fitting typically assume that the rms 
357: fluctuation is the same in every channel of a spectrum; to do otherwise
358: would introduce imponderables and greatly hinder general understanding.
359: %For instance, consider the discussion of Marshall (1995) concerning
360: %MEM reconstruction of Zeeman-splitting in strong H I spectra.  Analytic 
361: %expressions for the errors of fitting a Gaussian profile in the presence 
362: %of a constant rms are given by \cite{KapSmi+66} and \cite{Rie69}.   
363: However, datapoints having a higher rms should be accorded lower 
364: weight.
365: 
366: We did a numerical experiment, fitting pure Gaussian profiles
367: of fixed width (FWHM=$\Delta$V)and varying strength \TA(0), in the
368: presence of noise which varies following \EQN 1 (a pure ``on'' 
369: scan following the discussion of Sect. 2.3).  We constructed 
370: spectra with 1 \kms\ channels at an assumed observing frequency of 
371: 1420.40575 MHz (the $\lambda$21cm line), using \TheT = 20 K typical 
372: of modern H I receivers.  We assumed an observing time of 30 seconds, 
373: so that $\sqrt{N} = 376.9$ in \EQN  1 or $\Delta$T = 0.053 K when 
374: \TA\ = 0.  We then inserted gaussian lines having $\Delta V =
375: 10$ \kms\ and peak strengths \TA(0) = 2.5, 5.0, 10, 20, ... 160 K,
376: with the variance of the noise in accord with \EQN 1.  Ensembles
377: of such spectra were generated for each value of \TA(0) and 
378: fit to single Gaussians. The fitting was done twice for each spectrum, 
379: weighting by constant or (correctly) changing variance.
380: 
381: The results of this experiment are reported in Fig. 2.  The bottom
382: curve in each panel is the rms of the fitted parameter given by 
383: analytic formulae, which coincides with the mean {\it a posteriori} 
384: error estimate returned by fitting software which assumes a constant 
385: profile rms.  Stronger lines lead to linear 
386: improvements in fitting of the central velocity and width in this case, 
387: while the peak and profile integral fits are independent of strength; 
388: the fractional precision increases but fitting to the profile integral 
389: does not achieve higher precision than simply summing the channel values.  
390: %In the case of constant rms, all of the variances scale inversely as $\sqrt{N}$.
391: 
392: The uppermost curve in each panel is the actual rms of the parameter 
393: determination with weighting by a constant variance.  The 
394: shaded (middle) curve is the rms with proper weighting;
395: in this case, the fitting software returns accurate error estimates.  
396: Several phenomena are discernible in this diagram.  There are irremediable 
397: increases in the variances of the fitted parameters relative to the case of 
398: constant profile rms.  The precision of the fitted centroid and 
399: width improve only very slowly for strong signals, instead of linearly. 
400: Variances of the peak and integrated strengths increase in
401: absolute terms as well.  The fitting is only very slightly improved by 
402: correct weighting and the actual variances and the claimed error 
403: estimates diverge sharply if the behaviour of the noise 
404: is ignored.  This could be misconstrued as implying that the stronger 
405: lines are less purely Gaussian.
406: 
407: %$$ var^2(\TA(0)) = {\sqrt{{20\ln{2}}\over{\pi}}~
408: % {{h \DT^2}\over{\Delta V}}} \eqno(3a) $$
409: %
410: %$$ var^2(v_0) = {{1}\over{\sqrt{2\pi\ln{2}}}}~
411: % {{h \DT^2 \Delta V}\over{\TA(0)^2}} \eqno(3b) $$
412: %
413: %$$ var^2(\Delta V) = \sqrt{ {{32\ln{2}} \over{\pi}} }~ 
414: % {{h \DT^2 \Delta V} \over{\TA(0)^2} } \eqno(3c) $$
415: %
416: %$$ var^2(\int\TA dv)= \sqrt{{{9\pi}\over{8\ln{2}}}}~ h\DT^2\Delta V
417: % \eqno(3d) $$
418: 
419: %Not much intuitive meaning is usually attached to these formulae,
420: %but we see that all the variances involve the product $h\DT^2$
421: %which is essentially the inverse of the {\it time} spent on the 
422: %experiment. To measure the peak strength more precisely requires 
423: %longer time or a broader line and so forth.  The variance of the 
424: %line integral is limited by the inherent variance of the zeroth-moment 
425: %taken over the interval of the line.  Gaussian fitting by itself 
426: %cannot determine the line profile integral any better than simply 
427: %summing over the signal-bearing region (assuming an absence of other 
428: %problems).
429: 
430: %These formulae apply to fitting a single gaussian component in the 
431: %presence of constant rms error; in practice less weight must be 
432: %accorded to points with higher rms if the fitting is to achieve
433: %maximum precision.  To explore this issue we did a series of numerical 
434: %experiments whose results are reported in Fig. 2 and 3.  
435: 
436: %In each panel of Fig. 2, the uppermost curve is the variance of the
437: %fitted parameter ignoring the varying noise level.  The middle curve
438: %is the variance when the variation is recognized; the fitting is
439: %improved only slightly and variances in the data are irremidiably
440: %increased by the increased channel rms levels.  The biggest difference 
441: %comes in comparing the formal
442: %error estimates of the fits with the actual variances.  The bottom
443: %curve in each panel is the mean error estimate returned by the software
444: %when the noise variation is not recognized, and these are substantially 
445: %too small.  Such is not the case when the software models the noise
446: %in accordance with the construction of the synthetic spectra.
447: %
448: 
449: %Fig. 3 shows the $\chi ^2$ for the fits, in the case where the variation 
450: %of the noise variance is ignored (the reported $\chi ^2$ does not
451: %vary for the algorithm which properly models the noise and yields
452: %the slightly smaller variances in some panels of Fig. 2).  Judged in 
453: %these terms, the fits to stronger emission profiles are in fact reported 
454: %to be poor.    If taken seriously, they could be interpreted as implying 
455: %a progressive, significantly more non-gaussian shape for stronger lines, 
456: %(but this would be wrong).  Of course in the real world, H I lines this 
457: %strong would probably not be optically thin, or purely gaussian, in the 
458: %first place.
459: 
460: \subsection{Sensitivity of absorption measurements}
461: 
462: Staring at a continuum source characterized by an antenna temperature 
463: \TA\ = \TC\ results in a system temperature \Tsys = \TheT + \TC.  If 
464: the continuum is extinguished by a pure scatterer characterized by 
465: optical depth $\tau(v)$, it follows that
466: 
467: $$\Tsys({\rm v}) = \TheT  + \TC e^{-\tau(v)} \eqno(4) $$
468: 
469: $$\DT({\rm v}) = {{\Tsys({\rm v})}\over{\sqrt{{\rm N_{on}}}}} = 
470:  {{\TheT +\TC e^{-\tau(v)}}\over{\sqrt{{\rm N_{on}}}}} \eqno(5) $$
471: 
472: The system temperature is higher where there is no absorption.
473: \EQN 4 can be inverted to solve for the optical 
474: depth from the observed profile of \Tsys(v), $i.e.$ 
475: $\tau(v) = -\ln{((\Tsys(v)- \TheT )/\TC)}$.  Neglecting other effects,
476: the rms of the line/continuum ratio (the argument of the logarithm 
477: in this expression) is just $\sigma_{l/c} = \DT/\TC$.
478: $\sigma_{l/c}$ may be normally distributed but 
479: the logarithmic dependence of $\tau(v)$ makes its error
480: distribution noticeably asymmetric for moderate to large optical 
481: depth.  Change in the derived optical depth for a given
482: fluctuation  $\delta_{l/c}$ in the line/continuum ratio can be written
483: 
484: $$\delta\tau(v)_\mp = \tau(v) + \ln{ (e^{-\tau(v)} \pm \delta_{l/c}) } \eqno(6) $$
485: 
486: where $\pm$ and $\mp$ convey the sense of the variations.
487: Differentiation yields the rms of the derived optical depth
488: 
489: $$ \Delta\tau(v) = \sigma_{l/c} e^{\tau(v)} 
490:  [{ {\TheT+\TC e^{-\tau(v)}} \over {\TheT+\TC} }]. \eqno(7)  $$
491: 
492: %$$ var(\tau) = \sigma_{l/c} e^\tau 
493: % (1-{ {\TC(1-e^{-\tau})} \over {\TheT+\TC} }), \eqno(8). $$
494: 
495: The usual analysis sets $\tau(v) = 0$ on the right-hand side of \EQN 5
496: so that the term in brackets in \EQN 7 is unity. 
497: In Fig. 3 we plot $\delta\tau_+/\tau~ vs.~ \tau$ for different \TC,
498: taking  $\delta_{l/c} = \sigma_{l/c}$ in \EQN 6 and assuming \TheT = 20 K, 
499: $\sqrt{N} = 376.9$ as before.  In the usual analysis (upper panel) the 
500: fractional error in optical depth is minimized at $\tau \approx 1$ for
501: all \TC\ and sensitivity appears to saturate at rather small 
502: $\TC \approx \TheT$.  However, use of \EQN 7 shows that the sensitivity 
503: never saturates, in the sense that it is possible to achieve higher 
504: precision on ever-thicker lines (lower panel).  Furthermore, the error 
505: in optical depth at $\tau \approx 1$ is much smaller in the lower panel 
506: when \TC $>$ \TheT.    
507: 
508: %%3
509: %\begin{figure}
510: %\psfig{figure=tsysfig02.eps,height=4.8 cm}
511: %\caption[]{Mean and variance of $\chi^2$ for the naive fits 
512: %described in Fig. 1
513: %(see Sect. 2.2).}
514: %\end{figure}
515: 
516: Numerical experiments doing Gaussian fitting to absorption lines
517: showed (as before) that proper weighting gives slightly improved 
518: parameter variances, and much-improved error estimates.  Because
519: the rms is higher in signal-free regions, naive error estimates 
520: returned by unwitting software are too large.  Error in determining
521: the continuum level of the baseline regions of an absorption spectrum 
522: increases with \TC\ and may eventually become the limiting factor in 
523: determining the line/continuum ratio.
524: 
525: %These ideas are borne out by numerical experiments like those reported
526: %in Sec. 2.5, where large samples of fitted parameters are analyzed.  The 
527: %smaller noise in the line-bearing region greatly increases the sensitivity 
528: %when \TC/\Tsys\ is large.  Slightly smaller sample variances and 
529: %much-improved formal error estimates are obtained when fitting 
530: %is done with a realistic estimate of the channel-channel noise
531: %variations.  There is one important difference; whereas the reported
532: %$\chi^2$ increased artificially when the noise level was assumed constant
533: %in the emission simulation above, the opposite occurs for absorption
534: %because the noise is higher in the signal-free regions.  Put another
535: %way, if we compare the sample variances, the reported (formal) error 
536: %estimates from the fitting software and the computed $\chi^2$, all of
537: %these are in harmony when the fitting software accounts for the variable
538: %noise. When it does not, the sample variances are slightly higher 
539: %(the fitting process itself is less precise), the error
540: %estimates from the software are noticeably higher than the sample
541: %variances and the reported $\chi^2$ is much too small since it is
542: %normalized by the (larger) off-signal variance.
543: 
544: \subsection{Quantization noise}
545: 
546: Use of digital correlators represents a possible departure from the 
547: frequency-preserving character of the receiver and detector front-end, 
548: owing to the phenomenon of quantization noise \citep{Ben48,GwiCar+00}.  
549: Input to the 
550: correlator is bandpass filtered so that the sampling theorem may be 
551: applied to recovery of the data,  but digitization of the 
552: continuously varying input power results in a representation of the
553: signal which is very strongly {\it not} band-limited.  That portion of 
554: the power spectrum lying outside the original band is returned, in 
555: varying degree depending on the sampling rate,
556: as a form of noise.  For Nyquist sampling (sampling at 
557: a rate twice the bandwidth) all is returned. For faster sampling 
558: the return is reduced as sampling sidebands beat with weaker, 
559: further-out portions of the quantization 
560: noise spectrum.  As shown by \cite{Ben48} for a 16-level system,
561: quantization noise is steadily reduced until the sampling rate is 
562: 10 times Nyquist.
563: 
564: Thus, sampling and quantization schemes scatter input power
565: throughout the passband. Experiments using input thermal noise on
566: systems with (many) more bits than are used in radio astronomy show 
567: that the quantization noise is essentially white ({\it ibid}) but 
568: the spectral characteristics of quantization noise are very much
569: dependent on the form of the input.  Very strong, highly confined 
570: signals can produce distortions of the outlying passband.
571: Weaker signals will simply be dispersed with little
572: effect on either the noise level or shape of the passband.
573: 
574: Because of quantization noise,  even the blackest absorption line
575: will not reduce the rms to the level attained in the absence of 
576: all input signal.  \EQN 5, modified 
577: to account for quantization loss (1-$\epsilon$) in the case that strong 
578: absorption occupies a negligibly small fraction of the correlator 
579: bandpass (so that the quantization noise remains evenly distributed 
580: over the passband) is
581: 
582: $$ \Delta{\rm T} =  {{\TheT
583:   + \TC (\epsilon e^{-\tau}+(1-\epsilon))}
584: \over{\epsilon\sqrt{\rm N}}}. $$
585: 
586: Examples of quantization losses at Nyquist sampling rates are 
587: (1-$\epsilon$) =  0.36 (1-bit
588: or 2-level quantization), 0.12 (3-level) and 0.028 (9-level), so that 
589: minimum fractions $(1-\epsilon)/\epsilon$ = 0.57, 0.14 or 0.03 of the 
590: rms corresponding to the input \TC\ would unavoidably be present in 
591: each channel,  including those at the bottom of the line.  This 
592: complicates error analysis but the high efficiencies of modern 
593: correlators preserve at least some of the benefits discussed.  
594: Such considerations are another reason to prefer higher-level 
595: quantization and over-sampling schemes.
596: 
597: \section{Summary and extension to interferometry}
598: 
599: Radio astronomers frequently observe signals which 
600: are strong enough to dominate the random errors of their experiments.
601: Unfortunately, it is not always possible to recognize the effects 
602: which are induced and they are neglected.  Nonetheless, they have always 
603: been present in the data.
604: 
605: This discussion points up obvious deficiencies in extant data reduction
606: software and analysis techniques.  Perhaps less obvious is the need not
607: only for accurate calibration but also for reliable reporting on the part
608: of the telescope systems.   Measurement errors cannot be accurately assessed 
609: and accomodated in downstream data handling unless the system, continuum 
610: and line antenna temperatures are preserved, along with knowledge of the mode
611: of data-taking.  Synthesis instruments may be
612: particularly difficult in this regard.  Consider the use of the VLA
613: (say) to detect H I absorption against a continuum source at low galactic
614: latitude in the presence of an emission profile like that shown in Fig. 1.
615: The VLA does not return the total power or singledish spectra, or,
616: equivalently, the variation of \Tsys\ across the passband.  The
617: interferometer experiment {\it per se} can only succeed to the extent
618: that foreground emission disappears; only its added noise
619: contribution remains.
620: 
621: We began the discussion by pointing out that the noise contributed 
622: from sky signals in single-dish observations occurs -- ignoring 
623: sidelobes, quantization noise and the like -- at those places and/or 
624: frequencies where the sources themselves are located.  It is an 
625: interesting endeavour to try to understand the extent to which source 
626: noise in interferometer experiments is similarly localized in the output 
627: datastream.  For phased arrays it would seem possible to reproduce the 
628: single-dish mode.  For synthesis arrays \citep{AnaEke+89,CraNap89} the 
629: situation is much more complicated
630: and uncertain even in the weak signal limit.
631: 
632: %Synthesis maps are created by taking the transforms of weighted sums of 
633: %visibilities (voltage products between antenna pairs). The noise associated 
634: %with these products can be calculated on a sample-by-sample basis 
635: %(see Chap. 6 of \cite{ThoMor+01}) and the map-making procedure can be
636: %tracked (distributing noise appropriately over the region synthesized) to 
637: %derive the errors of any data product.  The cross-correlation of two
638: %independent measurements of the same signal has a slightly lower noise
639: %level than that which appears at the output of the square-law detector
640: %on a single dish: 
641: %$\Delta{\rm T(v)}^2 \propto (\TheT+\TA)^2+(f\times\TheT+\TA)^2$
642: %where f = 0 for cross-correlation and 1 for autocorrelation.
643: %The self-noise present in spectra line observations can be discussed in the 
644: %same terms, on a channel-by-channel basis.
645: 
646: \acknowledgements
647: 
648: The National Radio Astronomy Observatory is operated by AUI, Inc. under a
649: cooperative agreement with the US National Science Foundation.  I thank
650: Darrel Emerson, Tony Kerr, Robert Lucas and A. R. (Dick) Thompson for 
651: helpful comments.  Barry Clark pointed out the relevance of quantization 
652: noise and Fred Schwab provided the reference to \cite{Ben48}. This paper was 
653: put in final form while the author was enjoying the hospitality of the IAP 
654: in Paris.
655: 
656: %\bibliographystyle{apj}
657: %\bibliography{mnemonic,absorption}
658: 
659: \begin{thebibliography}{13}
660: \expandafter\ifx\csname natexlab\endcsname\relax\def\natexlab#1{#1}\fi
661: 
662: \bibitem[{{Anantharamaiah} {et~al.}(1989){Anantharamaiah}, {Ekers},
663:   {Radhakrishnan}, {Cornwell}, \& {Goss}}]{AnaEke+89}
664: {Anantharamaiah}, K.~R., {Ekers}, R.~D., {Radhakrishnan}, V., {Cornwell},
665:   T.~J., \& {Goss}, W.~M. 1989, in ASP Conf. Ser. 6: Synthesis Imaging in Radio
666:   Astronomy, ed. R.~A. {Perley}, F.~R. {Schwab}, \& A.~H. {Bridle}, 431--442
667: 
668: \bibitem[{{Bennett}(1948)}]{Ben48}
669: {Bennett}, W.~R. 1948, BSTJ, 27, 446
670: 
671: \bibitem[{{Burke} \& {Graham-Smith}(1997)}]{BurGra01}
672: {Burke}, B.~F. \& {Graham-Smith}, F. 1997, {An Introduction to Radio Astronomy}
673:   (Cambridge, U.K. ; New York : Cambridge University Press, 1997)
674: 
675: \bibitem[{{Callen} \& {Welton}(1951)}]{CalWel51}
676: {Callen}, H.~B. \& {Welton}, T.~A. 1951, Phys. Rev, 83, 1
677: 
678: \bibitem[{{Crane} \& {Napier}(1989)}]{CraNap89}
679: {Crane}, P.~C. \& {Napier}, P.~J. 1989, in ASP Conf. Ser. 6: Synthesis Imaging
680:   in Radio Astronomy, ed. R.~A. {Perley}, F.~R. {Schwab}, \& A.~H. {Bridle},
681:   139--165
682: 
683: \bibitem[{{Dicke}(1946)}]{Dic46}
684: {Dicke}, R. 1946, Rev. Sci. Inst., 17, 268
685: 
686: \bibitem[{{Gwinn} {et~al.}(2000){Gwinn}, {Carlson}, {Dougherty}, {Del Rizzo},
687:   {Reynolds}, {Jauncey}, {Tzioumis}, {Quick}, {McCulloch}, {Hirabayashi},
688:   {Kobayashi}, \& Y.}]{GwiCar+00}
689: {Gwinn}, C.~R., {Carlson}, B., {Dougherty}, S., {Del Rizzo}, D., {Reynolds},
690:   J.~E., {Jauncey}, D.~L., {Tzioumis}, A.~K., {Quick}, J., {McCulloch}, P.~M.,
691:   {Hirabayashi}, H., {Kobayashi}, H., \& Y., M. 2000, astro-ph0002064
692: 
693: \bibitem[{{Hartmann} \& {Burton}(1997)}]{HarBur97}
694: {Hartmann}, D. \& {Burton}, W.~B. 1997, Atlas of galactic neutral hydrogen
695:   (Cambridge, New York: Cambridge University Press.)
696: 
697: \bibitem[{{Kaper} {et~al.}(1966){Kaper}, {Smits}, {Schwarz}, {Takakubo}, \&
698:   {van Woerden}}]{KapSmi+66}
699: {Kaper}, H.~G., {Smits}, D.~W., {Schwarz}, U.~J., {Takakubo}, K., \& {van
700:   Woerden}, H. 1966, B. A. N., 18, 465
701: 
702: \bibitem[{{Kraus}(1986)}]{Kra86}
703: {Kraus}, J.~D. 1986, Radio astronomy (Powell, Ohio: Cygnus-Quasar Books, 1986)
704: 
705: \bibitem[{{Marshall}(1995)}]{Mar95}
706: {Marshall}, J. 1995, Mon. Not. R. Astron. Soc., 275, 217
707: 
708: %\bibitem[{{Perley} {et~al.}(1989){Perley}, {Schwab}, \& {Bridle}}]{Per89}
709: %{Perley}, R.~A., {Schwab}, F.~R., \& {Bridle}, A.~H., eds. 1989, ASP Conf. Ser.
710: %  6: Synthesis Imaging in Radio Astronomy
711: 
712: \bibitem[{{Rieu}(1969)}]{Rie69}
713: {Rieu}, N. 1969, A\&A, 1, 128
714: 
715: \bibitem[{{Rohlfs} {et~al.}(2000){Rohlfs}, {Wilson}, \&
716:   {Huettemeister}}]{RohWil00}
717: {Rohlfs}, K., {Wilson}, T.~L., \& {Huettemeister}, S. 2000, Tools of radio
718:   astronomy (New York : Springer, 2000.\ (Astronomy and astrophysics Library))
719: 
720: \end{thebibliography}
721: 
722: \clearpage
723: 
724: \begin{figure}
725: \plotone{fg1.eps}
726: \caption[]{Top: H I emission observed at (l,b) = (60\degr,$+$1.5\degr)
727: with the 25m Dwingeloo telescope by \cite{HarBur97}.  Bottom: expanded
728: view of the $\pm 1 \sigma$ noise envelope assuming $\TheT = 36$ K.}
729: \end{figure}
730: 
731: %2
732: \begin{figure}
733: \plotone{fg2.eps}
734: \caption[]{Rms error of derived gaussian fitting parameters.  Top left,
735: central velocity.  Bottom left, the FWHM, $\Delta V$.  Top right, the
736: peak line strength.  Bottom right, the profile integral.  In each panel
737: the uppermost curve is the empirically-determined rms and the bottommost 
738: curve the expected or reported rms, all for weighting by a constant
739: profile variance.  The middle curve is the parameter rms when weighting
740: by the correct noise variance.  For the other
741: assumptions used to calculate these curves, see Sect. 2.5}
742: \end{figure}
743: \clearpage
744: %3
745: \begin{figure}
746: \plotone{fg3.eps}
747: \caption[]{Fractional rms error in optical depth when a nominal 20 K system 
748: is used to observe continuum sources of varying strengths 
749: \TC, occulted by a pure scattering medium of optical depth $\tau$.  
750: These plots correspond roughly to 30 second integrations
751: in 1 \kms\ channels at 1420 MHz.  At top, \Tsys\ is assumed independent
752: of $\tau$; at bottom the dependence of \Tsys\ on $\tau$ (\EQN 7) is 
753: included.}
754: \end{figure}
755: \clearpage
756: 
757: \end{document}
758: