q-bio0503025/rfVS.bbl
1: \begin{thebibliography}{}
2: 
3: \bibitem[Alizadeh {\em et~al.}, 2000]{alizadeh}
4: Alizadeh, A.~A., Eisen, M.~B., Davis, R.~E., Ma, C., Lossos, I.~S., Rosenwald,
5:   A., Boldrick, J.~C., Sabet, H., Tran, T., Yu, X., Powell, J.~I., Yang, L.,
6:   Marti, G.~E., Moore, T., {Hudson Jr}, J., Lu, L., Lewis, D.~B., Tibshirani,
7:   R., Sherlock, G., Chan, W.~C., Greiner, T.~C., Weisenburger, D.~D., Armitage,
8:   J.~O., Warnke, R., Levy, R., Wilson, W., Grever, M.~R., Byrd, J.~C.,
9:   Botstein, D., Brown, P.~O.  \& Staudt, L.~M. (2000{\em{}}) {Distinct types of
10:   diffuse large B-cell lymphoma identified by gene expression profiling}.
11: \newblock {\em Nature, } {\bf 403}, 503--511.
12: 
13: \bibitem[Alon {\em et~al.}, 1999]{alon}
14: Alon, U., Barkai, N., Notterman, D.~A., Gish, K., Ybarra, S., Mack, D.  \&
15:   Levine, A.~J. (1999{\em{}}) {Broad patterns of gene expression revealed by
16:   clustering analysis of tumor and normal colon tissues probed by
17:   oligonucleotide arrays}.
18: \newblock {\em Proc Natl Acad Sci U S A, } {\bf 96}, 6745--6750.
19: 
20: \bibitem[Alvarez {\em et~al.}, 2005]{SaraRF}
21: Alvarez, S., Diaz-Uriarte, R., Osorio, A., Barroso, A., Melchor, L., Paz,
22:   M.~F., Honrado, E., Rodriguez, R., Urioste, M., Valle, L., Diez, O.,
23:   Cigudosa, J.~C., Dopazo, J., Esteller, M.  \& Benitez, J. (2005{\em{}}) {A
24:   Predictor Based on the Somatic Genomic Changes of the BRCA1/BRCA2 Breast
25:   Cancer Tumors Identifies the Non-BRCA1/BRCA2 Tumors with BRCA1 Promoter
26:   Hypermethylation}.
27: \newblock {\em Clin Cancer Res, } {\bf 11}, 1146--1153.
28: 
29: \bibitem[Ambroise \& McLachlan, 2002]{ambroise}
30: Ambroise, C. \& McLachlan, G.~J. (2002{\em{}}) Selection bias in gene
31:   extraction on the basis of microarray gene-expression data.
32: \newblock {\em Proc Natl Acad Sci USA, } {\bf 99} (10), 6562--6566.
33: 
34: 
35: \bibitem[Braga-Neto {\em et~al.}, 2004]{Braga-Neto.Carroll2004}
36: Braga-Neto, U., Hashimoto, R., Dougherty, E.~R., Nguyen, D.~V.  \& Carroll,
37:   R.~J. (2004{\em{}}) {Is cross-validation better than resubstitution for
38:   ranking genes?}
39: \newblock {\em Bioinformatics, } {\bf 20}, 253--258.
40: 
41: \bibitem[Breiman, 1996]{breiman-bagging}
42: Breiman, L. (1996{\em{}}) Bagging predictors.
43: \newblock {\em Machine Learning, } {\bf 24}, 123--140.
44: 
45: \bibitem[Breiman, 2001{\em{a}}]{breiman-2-cultures}
46: Breiman, L. (2001{\em{a}}) Statistical modeling: the two cultures (with
47:   discussion).
48: \newblock {\em Statistical Science, } {\bf 16}, 199--231.
49: 
50: \bibitem[Breiman, 2001{\em{b}}]{breiman-rf}
51: Breiman, L. (2001{\em{b}}) Random forests.
52: \newblock {\em Machine Learning, } {\bf 45}, 5--32.
53: 
54: \bibitem[Breiman {\em et~al.}, 1984]{cart}
55: Breiman, L., Friedman, J., Olshen, R.  \& Stone, C. (1984{\em{}}) {\em
56:   Classification and regression trees}.
57: \newblock Chapman \& Hall, New York.
58: 
59: \bibitem[Bureau {\em et~al.}, 2003]{Bureau2003}
60: Bureau, A., Dupuis, J., Hayward, B., Falls, K.  \& {Van Eerdewegh}, P.
61:   (2003{\em{}}) {Mapping complex traits using Random Forests}.
62: \newblock {\em BMC Genet, } {\bf 4 Suppl 1}, S64.
63: 
64: \bibitem[Dettling, 2004]{bag-boost}
65: Dettling, M. (2004{\em{}}) Bagboosting for tumor classification with gene
66:   expression data.
67: \newblock {\em Bioinformatics, } {\bf 20}, 3583--3593.
68: 
69: \bibitem[Dettling \& B{\"u}hlmann, 2004]{pelora}
70: Dettling, M. \& B{\"u}hlmann, P. (2004{\em{}}) Finding predictive gene groups
71:   from microarray data.
72: \newblock {\em J. Multivariate Anal., } {\bf 90}, 106--131.
73: 
74: \bibitem[D{\'\i}az-Uriarte, 2005]{Yo-azuaje} D{\'\i}az-Uriarte, R.
75:   (2005{\em{}}) Supervised methods with genomic data: a review and
76:   cautionary view. In F. Azuaje and J. Dopazo (eds.) {\em Data
77:     analysis and visualization in genomics and proteomics}. New York:
78:   Wiley pp. 193--214.
79: 
80: \bibitem[Dudoit \& Fridlyand, 2003]{dudoit-inbook} Dudoit, S. \&
81:   Fridlyand, J. (2003{\em{}}) Classification in microarray
82:   experiments.  In T. Speed (ed.) {\em Statistical analysis of gene expression
83:     microarray data}. New York: Chapman \& Hall pp. 93--158.
84: 
85: \bibitem[Dudoit {\em et~al.}, 2002]{dudoit-dlda}
86: Dudoit, S., Fridlyand, J.  \& Speed, T.~P. (2002{\em{}}) Comparison of
87:   discrimination methods for the classification of tumors using gene expression
88:   data.
89: \newblock {\em J Am Stat Assoc, } {\bf 97} (457), 77--87.
90: 
91: \bibitem[Efron \& Gong, 1983]{efron-gong}
92: Efron, B. \& Gong, G. (1983{\em{}}) 
93: A leisurely look at the bootstrap, the jackknife, and cross-validation.
94: \newblock {\em The American Statistician, } {\bf 37}, 36--48.
95: 
96: 
97: \bibitem[Efron \& Tibshirani, 1997]{632-rule}
98: Efron, B. \& Tibshirani, R.~J. (1997{\em{}}) Improvements on cross-validation:
99:   the .632+ bootstrap method.
100: \newblock {\em J. American Statistical Association, } {\bf 92}, 548--560.
101: 
102: \bibitem[Ein-Dor {\em et~al.}, 2005]{EinDor}
103: Ein-Dor, L., Kela, I., Getz, G., Givol, D.  \& Domany, E. (2005{\em{}}) Outcome
104:   signature genes in breast cancer: is there a unique set?
105: \newblock {\em Bioinformatics, } {\bf 21}, 171--178.
106: 
107: \bibitem[Faraway, 1992]{Faraway-92}
108: Faraway, J. (1992{\em{}}) On the cost of data analysis.
109: \newblock {\em Journal of Computational and Graphical Statistics, } {\bf 1},
110:   213--229.
111: 
112: \bibitem[Friedman \& Meulman, 2005]{COSA}
113: Friedman, J. \& Meulman, J. (2005{\em{}}) Clustering objects on subsets of
114:   attributes (with discussion).
115: \newblock {\em J. Royal Statistical Society, Series B, } {\bf 66}, 815--850.
116: 
117: \bibitem[Golub {\em et~al.}, 1999]{golub}
118: Golub, T.~R., Slonim, D.~K., Tamayo, P., Huard, C., Gaasenbeek, M., Mesirov,
119:   J.~P., Coller, H., Loh, M.~L., Downing, J.~R., Caligiuri, M.~A., Bloomfield,
120:   C.~D.  \& Lander, E.~S. (1999{\em{}}) Molecular classification of cancer:
121:   class discovery and class prediction by gene expression monitoring.
122: \newblock {\em Science, } {\bf 286}, 531--537.
123: 
124: \bibitem[Gunther {\em et~al.}, 2003]{Gunther.Heyes2003}
125: Gunther, E.~C., Stone, D.~J., Gerwien, R.~W., Bento, P.  \& Heyes, M.~P.
126:   (2003{\em{}}) {Prediction of clinical drug efficacy by classification of
127:   drug-induced genomic expression profiles in vitro}.
128: \newblock {\em Proc Natl Acad Sci U S A, } {\bf 100}, 9608--9613.
129: 
130: \bibitem[Harrell, 2001]{harrell-01}
131: {Harrell Jr}, F.~E. (2001{\em{}}) {\em Regression modeling strategies}.
132: \newblock Springer, New York.
133: 
134: \bibitem[Hastie {\em et~al.}, 2001]{htf-01}
135: Hastie, T., Tibshirani, R.  \& Friedman, J. (2001{\em{}}) {\em The elements of
136:   statistical learning}.
137: \newblock Springer, New York.
138: 
139: 
140: \bibitem[Herrero {\em et~al.}, 2004]{gepas2}
141: Herrero, J., Vaquerizas, J.~M., Al-Shahrour, F., Conde, L., Mateos, {\'A}., 
142: Santoyo, J., D{\'\i}az-Uriarte, R. \& Dopazo, J. (2004{\em{}}).
143: New challenges in gene expression data analysis and the extended GEPAS.
144: \newblock {\em Nucleic Acids Research, } {\bf 32} (Web Server issue), W485--W491.
145: 
146: 
147: \bibitem[Izmirlian, 2004]{Izmir2004}
148: Izmirlian, G. (2004{\em{}}) {Application of the random forest classification
149:   algorithm to a SELDI-TOF proteomics study in the setting of a cancer
150:   prevention trial}.
151: \newblock {\em Ann N Y Acad Sci, } {\bf 1020}, 154--174.
152: 
153: \bibitem[Jolliffe, 2002]{jolliffe}
154: Jolliffe, I.~T. (2002{\em{}}) {\em Principal component analysis, 2nd ed.}
155: \newblock Springer, New York.
156: 
157: \bibitem[Khan {\em et~al.}, 2001]{khan}
158: Khan, J., Wei, J.~S., Ringner, M., Saal, L.~H., Ladanyi, M., Westermann, F.,
159:   Berthold, F., Schwab, M., Antonescu, C.~R., Peterson, C.  \& Meltzer, P.~S.
160:   (2001{\em{}}) {Classification and diagnostic prediction of cancers using gene
161:   expression profiling and artificial neural networks}.
162: \newblock {\em Nat Med, } {\bf 7}, 673--679.
163: 
164: \bibitem[Liaw \& Wiener, 2002]{rf-rnews}
165: Liaw, A. \& Wiener, M. (2002{\em{}}) Classification and regression by
166:   {randomForest}.
167: \newblock {\em R News, } {\bf 2}, 18--22.
168: 
169: \bibitem[Man {\em et~al.}, 2004]{Man-rf}
170: Man, M.~Z., Dyson, G., Johnson, K.  \& Liao, B. (2004{\em{}}) {Evaluating
171:   methods for classifying expression data}.
172: \newblock {\em J Biopharm Statist, } {\bf 14}, 1065--1084.
173: 
174: \bibitem[McLachlan, 1992]{mclach-dlda}
175: McLachlan, G.~J. (1992{\em{}}) {\em Discriminant analysis and statistical
176:   pattern recognition}.
177: \newblock Wiley, New York.
178: 
179: 
180: \bibitem[Michiels {\em et~al.}, 2005]{Michielis}
181: Michiels, S., Koscielny, S. \& Hill, C. (2005). {Prediction of cancer outcome
182: with microarrays: a multiple random validation strategy.} 
183: \newblock{\em The Lancet,} {\bf 365}, 488--492.
184: 
185: \bibitem[Pan {\em et~al.}, 2005]{pan-pnas}
186: Pan, K.-H., Lih, C.-J., \& Cohen, S.~N. (2005{\em{}}) 
187: {Effects of threshold choice on the biological conclusions reached during the
188:   analysis of gene expression by DNA microarrays}.
189: \newblock {\em PNAS, } {\bf 102}, 8961--8965.
190: 
191: 
192: 
193: \bibitem[Pepe, 2003]{pepe-book}
194: Pepe, M.~S. (2003{\em{}}) {\em The statistical evaluation of medical tests for
195:   classification and prediction}.
196: \newblock Oxford University Press, Oxford.
197: 
198: %\bibitem[Pepe {\em et~al.}, 2003]{Pepe.roc}
199: %Pepe, M.~S., Longton, G., Anderson, G.~L.  \& Schummer, M. (2003{\em{}})
200: %  {Selecting differentially expressed genes from microarray experiments}.
201: %\newblock {\em Biometrics, } {\bf 59}, 133--142.
202: 
203: \bibitem[Pomeroy {\em et~al.}, 2002]{pomeroy}
204: Pomeroy, S.~L., Tamayo, P., Gaasenbeek, M., Sturla, L.~M., Angelo, M.,
205:   McLaughlin, M.~E., Kim, J.~Y., Goumnerova, L.~C., Black, P.~M., Lau, C.,
206:   Allen, J.~C., Zagzag, D., Olson, J.~M., Curran, T., Wetmore, C., Biegel,
207:   J.~A., Poggio, T., Mukherjee, S., Rifkin, R., Califano, A., Stolovitzky, G.,
208:   Louis, D.~N., Mesirov, J.~P., Lander, E.~S.  \& Golub, T.~R. (2002{\em{}})
209:   {Prediction of central nervous system embryonal tumour outcome based on gene
210:   expression}.
211: \newblock {\em Nature, } {\bf 415}, 436--442.
212: 
213: \bibitem[{R Development Core Team}, 2004]{R}
214: {R Development Core Team} (2004{\em{}}) {\em R: A language and environment for
215:   statistical computing}.
216: \newblock R Foundation for Statistical Computing, Vienna, Austria.
217: \newblock ISBN 3-900051-07-0.
218: 
219: 
220: \bibitem[Ramaswamy {\em et~al.}, 2003]{ramas-03}
221: Ramaswamy, S., Ross, K.~N., Lander, E.~S.  \& Golub, T.~R. (2003{\em{}}) A
222:   molecular signature of metastasis in primary solid tumors.
223: \newblock {\em Nature Genetics, } {\bf 33}, 49--54.
224: 
225: \bibitem[Ripley, 1996]{ripley-96}
226: Ripley, B.~D. (1996{\em{}}) {\em Pattern recognition and neural networks}.
227: \newblock Cambridge University Press, Cambridge.
228: 
229: \bibitem[Roepman {\em et~al.}, 2005]{roepman}
230: Roepman, P., Wessels, L.~F., Kettelarij, N., Kemmeren, P., Miles, A.~J.,
231:   Lijnzaad, P., Tilanus, M.~G., Koole, R., Hordijk, G.~J., {van der Vliet},
232:   P.~C., Reinders, M.~J., Slootweg, P.~J.  \& Holstege, F.~C. (2005{\em{}}) {An
233:   expression profile for diagnosis of lymph node metastases from primary head
234:   and neck squamous cell carcinomas}.
235: \newblock {\em Nat Genet, } {\bf 37}, 182--186.
236: 
237: \bibitem[Romualdi {\em et~al.}, 2003]{romualdi-03}
238: Romualdi, C., Campanaro, S., Campagna, D., Celegato, B., Cannata, N., Toppo,
239:   S., Valle, G.  \& Lanfranchi, G. (2003{\em{}}) Pattern recognition in gene
240:   expression profiling using {DNA} array: a comparative study of different
241:   statistical methods applied to cancer classification.
242: \newblock {\em Hum. Mol. Genet., } {\bf 12} (8), 823--836.
243: 
244: \bibitem[Ross {\em et~al.}, 2000]{ross}
245: Ross, D.~T., Scherf, U., Eisen, M.~B., Perou, C.~M., Rees, C., Spellman, P.,
246:   Iyer, V., Jeffrey, S.~S., {van de Rijn}, M., Waltham, M., Pergamenschikov, A.,
247:   Lee, J.~C., Lashkari, D., Shalon, D., Myers, T.~G., Weinstein, J.~N.,
248:   Botstein, D.  \& Brown, P.~O. (2000{\em{}}) Systematic variation in gene
249:   expression patterns in human cancer cell lines.
250: \newblock {\em Nature Genetics, } {\bf 24} (3), 227--235.
251: 
252: \bibitem[Schwender {\em et~al.}, 2004]{Schwender.Bolt2004}
253: Schwender, H., Zucknick, M., Ickstadt, K.  \& Bolt, H.~M. (2004{\em{}}) {A
254:   pilot study on the application of statistical classification procedures to
255:   molecular epidemiological data}.
256: \newblock {\em Toxicol Lett, } {\bf 151}, 291--299.
257: 
258: \bibitem[Simon {\em et~al.}, 2003{\em{a}}]{simon-03}
259: Simon, R., Radmacher, M.~D., Dobbin, K.  \& McShane, L.~M. (2003{\em{a}})
260:   Pitfalls in the use of {DNA} microarray data for diagnostic and prognostic
261:   classification.
262: \newblock {\em Journal of the National Cancer Institute, } {\bf 95} (1),
263:   14--18.
264: 
265: \bibitem[Simon {\em et~al.}, 2003{\em{b}}]{simon.book}
266: Simon, R.~M., Korn, E.~L., McShane, L.~M., Radmacher, M.~D., Wright, G.~W.  \&
267:   Zhao, Y. (2003{\em{b}}) {\em Design and analysis of DNA microarray
268:   investigations}.
269: \newblock Springer, New York.
270: 
271: \bibitem[Singh {\em et~al.}, 2002]{singh}
272: Singh, D., Febbo, P.~G., Ross, K., Jackson, D.~G., Manola, J., Ladd, C.,
273:   Tamayo, P., Renshaw, A.~A., D'Amico, A.~V., Richie, J.~P., Lander, E.~S.,
274:   Loda, M., Kantoff, P.~W., Golub, T.~R.  \& Sellers, W.~R. (2002{\em{}}) {Gene
275:   expression correlates of clinical prostate cancer behavior}.
276: \newblock {\em Cancer Cell, } {\bf 1}, 203--209.
277: 
278: \bibitem[Somorjai {\em et~al.}, 2003]{Somorjai2003}
279: Somorjai, R.~L., Dolenko, B.  \& Baumgartner, R. (2003{\em{}}) {Class
280:   prediction and discovery using gene microarray and proteomics mass
281:   spectroscopy data: curses, caveats, cautions}.
282: \newblock {\em Bioinformatics, } {\bf 19}, 1484--1491.
283: 
284: \bibitem[Svetnik {\em et~al.}, 2004]{svetnik} Svetnik, V., Liaw, A.,
285:   Tong, C. \& Wang, T. (2004{\em{}}) Application of Breiman's random
286:   forest to modeling structure-activity relationships of
287:   pharmaceutical molecules. In F. Roli, J. Kittler, and T. Windeatt
288:   (eds.). {\em Multiple Classifier Systems, Fifth International
289:     Workshop, MCS 2004, Proceedings, 9--11 June 2004, Cagliari, Italy.
290:     Lecture Notes in Computer Science, vol. 3077.} F. Roli, J.
291:   Kittler, and T. Windeatt (eds.).  Berlin: Springer, pp. 334--343.
292: 
293: 
294: 
295: \bibitem[Tibshirani {\em et~al.}, 2002]{shrunkenc}
296: Tibshirani, R., Hastie, T., Narasimhan, B.  \& Chu, G. (2002{\em{}}) Diagnosis
297:   of multiple cancer types by shrunken centroids of gene expression.
298: \newblock {\em Proc Natl Acad Sci USA, } {\bf 99} (10), 6567--6572.
299: 
300: \bibitem[Tierney {\em et~al.}, 2004]{snow}
301: Tierney, L., Rossini, A.~J., Li, N.  \& Sevcikova, H. (2004{\em{}}).
302: \newblock Snow: simple network of workstations.
303: \newblock Technical report
304:   URL:http://www.stat.uiowa.edu/\textasciitilde{}luke/R/cluster/cluster.html.
305: 
306: \bibitem[van~'t Veer {\em et~al.}, 2002]{vveer}
307: van~'t Veer, L.~J., Dai, H., van~de Vijver, M.~J., He, Y.~D., Hart, A. A.~M.,
308:   Mao, M., Peterse, H.~L., van~der Kooy, K., Marton, M.~J., Witteveen, A.~T.,
309:   Schreiber, G.~J., Kerkhoven, R.~M., Roberts, C., Linsley, P.~S., Bernards, R.
310:    \& Friend, S.~H. (2002{\em{}}) Gene expression profiling predicts clinical
311:   outcome of breast cancer.
312: \newblock {\em Nature, } {\bf 415}, 530--536.
313: 
314: \bibitem[Wu {\em et~al.}, 2003]{Wu.Zhao2003}
315: Wu, B., Abbott, T., Fishman, D., McMurray, W., Mor, G., Stone, K., Ward, D.,
316:   Williams, K.  \& Zhao, H. (2003{\em{}}) {Comparison of statistical methods
317:   for classification of ovarian cancer using mass spectrometry data}.
318: \newblock {\em Bioinformatics, } {\bf 19}, 1636--1643.
319: 
320: 
321: \bibitem[Yeung {\em et~al.}, 2005]{BMA-selection}
322: Yeung, K.~Y., Bumgarner, R.~E. \& Raftery, A.~E. (2005). {Bayesian model
323:   averaging: development of an improved multi-class, gene selection and
324:   classification tool for microarray data.}
325: \newblock {\em Bioinformatics,} {\bf 21}, 2394--2402.
326: 
327: \bibitem[Yu, 2004]{Rmpi}
328: Yu, H. (2004{\em{}}).
329: \newblock Rmpi: interface (wrapper) to {MPI} (message-passing interface).
330: \newblock Technical report Department of Statistics, University of Western
331:   Ontario URL:http://www.stats.uwo.ca/faculty/yu/Rmpi.
332: 
333: \end{thebibliography}
334: