1: \begin{thebibliography}{}
2:
3: \bibitem[Alizadeh {\em et~al.}, 2000]{alizadeh}
4: Alizadeh, A.~A., Eisen, M.~B., Davis, R.~E., Ma, C., Lossos, I.~S., Rosenwald,
5: A., Boldrick, J.~C., Sabet, H., Tran, T., Yu, X., Powell, J.~I., Yang, L.,
6: Marti, G.~E., Moore, T., {Hudson Jr}, J., Lu, L., Lewis, D.~B., Tibshirani,
7: R., Sherlock, G., Chan, W.~C., Greiner, T.~C., Weisenburger, D.~D., Armitage,
8: J.~O., Warnke, R., Levy, R., Wilson, W., Grever, M.~R., Byrd, J.~C.,
9: Botstein, D., Brown, P.~O. \& Staudt, L.~M. (2000{\em{}}) {Distinct types of
10: diffuse large B-cell lymphoma identified by gene expression profiling}.
11: \newblock {\em Nature, } {\bf 403}, 503--511.
12:
13: \bibitem[Alon {\em et~al.}, 1999]{alon}
14: Alon, U., Barkai, N., Notterman, D.~A., Gish, K., Ybarra, S., Mack, D. \&
15: Levine, A.~J. (1999{\em{}}) {Broad patterns of gene expression revealed by
16: clustering analysis of tumor and normal colon tissues probed by
17: oligonucleotide arrays}.
18: \newblock {\em Proc Natl Acad Sci U S A, } {\bf 96}, 6745--6750.
19:
20: \bibitem[Alvarez {\em et~al.}, 2005]{SaraRF}
21: Alvarez, S., Diaz-Uriarte, R., Osorio, A., Barroso, A., Melchor, L., Paz,
22: M.~F., Honrado, E., Rodriguez, R., Urioste, M., Valle, L., Diez, O.,
23: Cigudosa, J.~C., Dopazo, J., Esteller, M. \& Benitez, J. (2005{\em{}}) {A
24: Predictor Based on the Somatic Genomic Changes of the BRCA1/BRCA2 Breast
25: Cancer Tumors Identifies the Non-BRCA1/BRCA2 Tumors with BRCA1 Promoter
26: Hypermethylation}.
27: \newblock {\em Clin Cancer Res, } {\bf 11}, 1146--1153.
28:
29: \bibitem[Ambroise \& McLachlan, 2002]{ambroise}
30: Ambroise, C. \& McLachlan, G.~J. (2002{\em{}}) Selection bias in gene
31: extraction on the basis of microarray gene-expression data.
32: \newblock {\em Proc Natl Acad Sci USA, } {\bf 99} (10), 6562--6566.
33:
34:
35: \bibitem[Braga-Neto {\em et~al.}, 2004]{Braga-Neto.Carroll2004}
36: Braga-Neto, U., Hashimoto, R., Dougherty, E.~R., Nguyen, D.~V. \& Carroll,
37: R.~J. (2004{\em{}}) {Is cross-validation better than resubstitution for
38: ranking genes?}
39: \newblock {\em Bioinformatics, } {\bf 20}, 253--258.
40:
41: \bibitem[Breiman, 1996]{breiman-bagging}
42: Breiman, L. (1996{\em{}}) Bagging predictors.
43: \newblock {\em Machine Learning, } {\bf 24}, 123--140.
44:
45: \bibitem[Breiman, 2001{\em{a}}]{breiman-2-cultures}
46: Breiman, L. (2001{\em{a}}) Statistical modeling: the two cultures (with
47: discussion).
48: \newblock {\em Statistical Science, } {\bf 16}, 199--231.
49:
50: \bibitem[Breiman, 2001{\em{b}}]{breiman-rf}
51: Breiman, L. (2001{\em{b}}) Random forests.
52: \newblock {\em Machine Learning, } {\bf 45}, 5--32.
53:
54: \bibitem[Breiman {\em et~al.}, 1984]{cart}
55: Breiman, L., Friedman, J., Olshen, R. \& Stone, C. (1984{\em{}}) {\em
56: Classification and regression trees}.
57: \newblock Chapman \& Hall, New York.
58:
59: \bibitem[Bureau {\em et~al.}, 2003]{Bureau2003}
60: Bureau, A., Dupuis, J., Hayward, B., Falls, K. \& {Van Eerdewegh}, P.
61: (2003{\em{}}) {Mapping complex traits using Random Forests}.
62: \newblock {\em BMC Genet, } {\bf 4 Suppl 1}, S64.
63:
64: \bibitem[Dettling, 2004]{bag-boost}
65: Dettling, M. (2004{\em{}}) Bagboosting for tumor classification with gene
66: expression data.
67: \newblock {\em Bioinformatics, } {\bf 20}, 3583--3593.
68:
69: \bibitem[Dettling \& B{\"u}hlmann, 2004]{pelora}
70: Dettling, M. \& B{\"u}hlmann, P. (2004{\em{}}) Finding predictive gene groups
71: from microarray data.
72: \newblock {\em J. Multivariate Anal., } {\bf 90}, 106--131.
73:
74: \bibitem[D{\'\i}az-Uriarte, 2005]{Yo-azuaje} D{\'\i}az-Uriarte, R.
75: (2005{\em{}}) Supervised methods with genomic data: a review and
76: cautionary view. In F. Azuaje and J. Dopazo (eds.) {\em Data
77: analysis and visualization in genomics and proteomics}. New York:
78: Wiley, pp. 193--214.
79:
80: \bibitem[Dudoit \& Fridlyand, 2003]{dudoit-inbook} Dudoit, S. \&
81: Fridlyand, J. (2003{\em{}}) Classification in microarray
82: experiments. In T. Speed (ed.) {\em Statistical analysis of gene expression
83: microarray data}. New York: Chapman \& Hall, pp. 93--158.
84:
85: \bibitem[Dudoit {\em et~al.}, 2002]{dudoit-dlda}
86: Dudoit, S., Fridlyand, J. \& Speed, T.~P. (2002{\em{}}) Comparison of
87: discrimination methods for the classification of tumors using gene expression
88: data.
89: \newblock {\em J Am Stat Assoc, } {\bf 97} (457), 77--87.
90:
91: \bibitem[Efron \& Gong, 1983]{efron-gong}
92: Efron, B. \& Gong, G. (1983{\em{}})
93: A leisurely look at the bootstrap, the jackknife, and cross-validation.
94: \newblock {\em The American Statistician, } {\bf 37}, 36--48.
95:
96:
97: \bibitem[Efron \& Tibshirani, 1997]{632-rule}
98: Efron, B. \& Tibshirani, R.~J. (1997{\em{}}) Improvements on cross-validation:
99: the .632+ bootstrap method.
100: \newblock {\em J. American Statistical Association, } {\bf 92}, 548--560.
101:
102: \bibitem[Ein-Dor {\em et~al.}, 2005]{EinDor}
103: Ein-Dor, L., Kela, I., Getz, G., Givol, D. \& Domany, E. (2005{\em{}}) Outcome
104: signature genes in breast cancer: is there a unique set?
105: \newblock {\em Bioinformatics, } {\bf 21}, 171--178.
106:
107: \bibitem[Faraway, 1992]{Faraway-92}
108: Faraway, J. (1992{\em{}}) On the cost of data analysis.
109: \newblock {\em Journal of Computational and Graphical Statistics, } {\bf 1},
110: 213--229.
111:
112: \bibitem[Friedman \& Meulman, 2005]{COSA}
113: Friedman, J. \& Meulman, J. (2005{\em{}}) Clustering objects on subsets of
114: attributes (with discussion).
115: \newblock {\em J. Royal Statistical Society, Series B, } {\bf 66}, 815--850.
116:
117: \bibitem[Golub {\em et~al.}, 1999]{golub}
118: Golub, T.~R., Slonim, D.~K., Tamayo, P., Huard, C., Gaasenbeek, M., Mesirov,
119: J.~P., Coller, H., Loh, M.~L., Downing, J.~R., Caligiuri, M.~A., Bloomfield,
120: C.~D. \& Lander, E.~S. (1999{\em{}}) Molecular classification of cancer:
121: class discovery and class prediction by gene expression monitoring.
122: \newblock {\em Science, } {\bf 286}, 531--537.
123:
124: \bibitem[Gunther {\em et~al.}, 2003]{Gunther.Heyes2003}
125: Gunther, E.~C., Stone, D.~J., Gerwien, R.~W., Bento, P. \& Heyes, M.~P.
126: (2003{\em{}}) {Prediction of clinical drug efficacy by classification of
127: drug-induced genomic expression profiles in vitro}.
128: \newblock {\em Proc Natl Acad Sci U S A, } {\bf 100}, 9608--9613.
129:
130: \bibitem[Harrell, 2001]{harrell-01}
131: {Harrell Jr}, F.~E. (2001{\em{}}) {\em Regression modeling strategies}.
132: \newblock Springer, New York.
133:
134: \bibitem[Hastie {\em et~al.}, 2001]{htf-01}
135: Hastie, T., Tibshirani, R. \& Friedman, J. (2001{\em{}}) {\em The elements of
136: statistical learning}.
137: \newblock Springer, New York.
138:
139:
140: \bibitem[Herrero {\em et~al.}, 2004]{gepas2}
141: Herrero, J., Vaquerizas, J.~M., Al-Shahrour, F., Conde, L., Mateos, {\'A}.,
142: Santoyo, J., D{\'\i}az-Uriarte, R. \& Dopazo, J. (2004{\em{}}).
143: New challenges in gene expression data analysis and the extended GEPAS.
144: \newblock {\em Nucleic Acids Research, } {\bf 32 (Web Server issue)}, W485--W491.
145:
146:
147: \bibitem[Izmirlian, 2004]{Izmir2004}
148: Izmirlian, G. (2004{\em{}}) {Application of the random forest classification
149: algorithm to a SELDI-TOF proteomics study in the setting of a cancer
150: prevention trial}.
151: \newblock {\em Ann N Y Acad Sci, } {\bf 1020}, 154--174.
152:
153: \bibitem[Jolliffe, 2002]{jolliffe}
154: Jolliffe, I.~T. (2002{\em{}}) {\em Principal component analysis, 2nd ed.}
155: \newblock Springer, New York.
156:
157: \bibitem[Khan {\em et~al.}, 2001]{khan}
158: Khan, J., Wei, J.~S., Ringner, M., Saal, L.~H., Ladanyi, M., Westermann, F.,
159: Berthold, F., Schwab, M., Antonescu, C.~R., Peterson, C. \& Meltzer, P.~S.
160: (2001{\em{}}) {Classification and diagnostic prediction of cancers using gene
161: expression profiling and artificial neural networks}.
162: \newblock {\em Nat Med, } {\bf 7}, 673--679.
163:
164: \bibitem[Liaw \& Wiener, 2002]{rf-rnews}
165: Liaw, A. \& Wiener, M. (2002{\em{}}) Classification and regression by
166: randomForest.
167: \newblock {\em R News, } {\bf 2}, 18--22.
168:
169: \bibitem[Man {\em et~al.}, 2004]{Man-rf}
170: Man, M.~Z., Dyson, G., Johnson, K. \& Liao, B. (2004{\em{}}) {Evaluating
171: methods for classifying expression data}.
172: \newblock {\em J Biopharm Statist, } {\bf 14}, 1065--1084.
173:
174: \bibitem[McLachlan, 1992]{mclach-dlda}
175: McLachlan, G.~J. (1992{\em{}}) {\em Discriminant analysis and statistical
176: pattern recognition}.
177: \newblock Wiley, New York.
178:
179:
180: \bibitem[Michiels {\em et~al.}, 2005]{Michielis}
181: Michiels, S., Koscielny, S. \& Hill, C. (2005). {Prediction of cancer outcome
182: with microarrays: a multiple random validation strategy.}
183: \newblock {\em The Lancet, } {\bf 365}, 488--492.
184:
185: \bibitem[Pan {\em et~al.}, 2005]{pan-pnas}
186: Pan, K.-H., Lih, C.-J. \& Cohen, S.~N. (2005{\em{}})
187: {Effects of threshold choice on the biological conclusions reached during the
188: analysis of gene expression by DNA microarrays}.
189: \newblock {\em PNAS, } {\bf 102}, 8961--8965.
190:
191:
192:
193: \bibitem[Pepe, 2003]{pepe-book}
194: Pepe, M.~S. (2003{\em{}}) {\em The statistical evaluation of medical tests for
195: classification and prediction}.
196: \newblock Oxford University Press, Oxford.
197:
198: %\bibitem[Pepe {\em et~al.}, 2003]{Pepe.roc}
199: %Pepe, M.~S., Longton, G., Anderson, G.~L. \& Schummer, M. (2003{\em{}})
200: % {Selecting differentially expressed genes from microarray experiments}.
201: %\newblock {\em Biometrics, } {\bf 59}, 133--142.
202:
203: \bibitem[Pomeroy {\em et~al.}, 2002]{pomeroy}
204: Pomeroy, S.~L., Tamayo, P., Gaasenbeek, M., Sturla, L.~M., Angelo, M.,
205: McLaughlin, M.~E., Kim, J.~Y., Goumnerova, L.~C., Black, P.~M., Lau, C.,
206: Allen, J.~C., Zagzag, D., Olson, J.~M., Curran, T., Wetmore, C., Biegel,
207: J.~A., Poggio, T., Mukherjee, S., Rifkin, R., Califano, A., Stolovitzky, G.,
208: Louis, D.~N., Mesirov, J.~P., Lander, E.~S. \& Golub, T.~R. (2002{\em{}})
209: {Prediction of central nervous system embryonal tumour outcome based on gene
210: expression}.
211: \newblock {\em Nature, } {\bf 415}, 436--442.
212:
213: \bibitem[{R Development Core Team}, 2004]{R}
214: {R Development Core Team} (2004{\em{}}) {\em R: A language and environment for
215: statistical computing}.
216: \newblock R Foundation for Statistical Computing, Vienna, Austria.
217: \newblock ISBN 3-900051-07-0.
218:
219:
220: \bibitem[Ramaswamy {\em et~al.}, 2003]{ramas-03}
221: Ramaswamy, S., Ross, K.~N., Lander, E.~S. \& Golub, T.~R. (2003{\em{}}) A
222: molecular signature of metastasis in primary solid tumors.
223: \newblock {\em Nature Genetics, } {\bf 33}, 49--54.
224:
225: \bibitem[Ripley, 1996]{ripley-96}
226: Ripley, B.~D. (1996{\em{}}) {\em Pattern recognition and neural networks}.
227: \newblock Cambridge University Press, Cambridge.
228:
229: \bibitem[Roepman {\em et~al.}, 2005]{roepman}
230: Roepman, P., Wessels, L.~F., Kettelarij, N., Kemmeren, P., Miles, A.~J.,
231: Lijnzaad, P., Tilanus, M.~G., Koole, R., Hordijk, G.~J., {van der Vliet},
232: P.~C., Reinders, M.~J., Slootweg, P.~J. \& Holstege, F.~C. (2005{\em{}}) {An
233: expression profile for diagnosis of lymph node metastases from primary head
234: and neck squamous cell carcinomas}.
235: \newblock {\em Nat Genet, } {\bf 37}, 182--186.
236:
237: \bibitem[Romualdi {\em et~al.}, 2003]{romualdi-03}
238: Romualdi, C., Campanaro, S., Campagna, D., Celegato, B., Cannata, N., Toppo,
239: S., Valle, G. \& Lanfranchi, G. (2003{\em{}}) Pattern recognition in gene
240: expression profiling using DNA array: a comparative study of different
241: statistical methods applied to cancer classification.
242: \newblock {\em Hum. Mol. Genet., } {\bf 12} (8), 823--836.
243:
244: \bibitem[Ross {\em et~al.}, 2000]{ross}
245: Ross, D.~T., Scherf, U., Eisen, M.~B., Perou, C.~M., Rees, C., Spellman, P.,
246: Iyer, V., Jeffrey, S.~S., {van de Rijn}, M., Waltham, M., Pergamenschikov, A.,
247: Lee, J.~C., Lashkari, D., Shalon, D., Myers, T.~G., Weinstein, J.~N.,
248: Botstein, D. \& Brown, P.~O. (2000{\em{}}) Systematic variation in gene
249: expression patterns in human cancer cell lines.
250: \newblock {\em Nature Genetics, } {\bf 24} (3), 227--235.
251:
252: \bibitem[Schwender {\em et~al.}, 2004]{Schwender.Bolt2004}
253: Schwender, H., Zucknick, M., Ickstadt, K. \& Bolt, H.~M. (2004{\em{}}) {A
254: pilot study on the application of statistical classification procedures to
255: molecular epidemiological data}.
256: \newblock {\em Toxicol Lett, } {\bf 151}, 291--299.
257:
258: \bibitem[Simon {\em et~al.}, 2003{\em{a}}]{simon-03}
259: Simon, R., Radmacher, M.~D., Dobbin, K. \& McShane, L.~M. (2003{\em{a}})
260: Pitfalls in the use of DNA microarray data for diagnostic and prognostic
261: classification.
262: \newblock {\em Journal of the National Cancer Institute, } {\bf 95} (1),
263: 14--18.
264:
265: \bibitem[Simon {\em et~al.}, 2003{\em{b}}]{simon.book}
266: Simon, R.~M., Korn, E.~L., McShane, L.~M., Radmacher, M.~D., Wright, G.~W. \&
267: Zhao, Y. (2003{\em{b}}) {\em Design and analysis of DNA microarray
268: investigations}.
269: \newblock Springer, New York.
270:
271: \bibitem[Singh {\em et~al.}, 2002]{singh}
272: Singh, D., Febbo, P.~G., Ross, K., Jackson, D.~G., Manola, J., Ladd, C.,
273: Tamayo, P., Renshaw, A.~A., D'Amico, A.~V., Richie, J.~P., Lander, E.~S.,
274: Loda, M., Kantoff, P.~W., Golub, T.~R. \& Sellers, W.~R. (2002{\em{}}) {Gene
275: expression correlates of clinical prostate cancer behavior}.
276: \newblock {\em Cancer Cell, } {\bf 1}, 203--209.
277:
278: \bibitem[Somorjai {\em et~al.}, 2003]{Somorjai2003}
279: Somorjai, R.~L., Dolenko, B. \& Baumgartner, R. (2003{\em{}}) {Class
280: prediction and discovery using gene microarray and proteomics mass
281: spectroscopy data: curses, caveats, cautions}.
282: \newblock {\em Bioinformatics, } {\bf 19}, 1484--1491.
283:
284: \bibitem[Svetnik {\em et~al.}, 2004]{svetnik} Svetnik, V., Liaw, A.,
285: Tong, C. \& Wang, T. (2004{\em{}}) Application of Breiman's random
286: forest to modeling structure-activity relationships of
287: pharmaceutical molecules. In F. Roli, J. Kittler, and T. Windeatt
288: (eds.) {\em Multiple Classifier Systems, Fifth International
289: Workshop, MCS 2004, Proceedings, 9--11 June 2004, Cagliari, Italy.
290: Lecture Notes in Computer Science, vol. 3077.}
291: Berlin: Springer, pp. 334--343.
292:
293:
294:
295: \bibitem[Tibshirani {\em et~al.}, 2002]{shrunkenc}
296: Tibshirani, R., Hastie, T., Narasimhan, B. \& Chu, G. (2002{\em{}}) Diagnosis
297: of multiple cancer types by shrunken centroids of gene expression.
298: \newblock {\em Proc Natl Acad Sci USA, } {\bf 99} (10), 6567--6572.
299:
300: \bibitem[Tierney {\em et~al.}, 2004]{snow}
301: Tierney, L., Rossini, A.~J., Li, N. \& Sevcikova, H. (2004{\em{}}).
302: \newblock Snow: simple network of workstations.
303: \newblock Technical report
304: URL:http://www.stat.uiowa.edu/\textasciitilde{}luke/R/cluster/cluster.html.
305:
306: \bibitem[van~'t Veer {\em et~al.}, 2002]{vveer}
307: van~'t Veer, L.~J., Dai, H., van~de Vijver, M.~J., He, Y.~D., Hart, A. A.~M.,
308: Mao, M., Peterse, H.~L., van~der Kooy, K., Marton, M.~J., Witteveen, A.~T.,
309: Schreiber, G.~J., Kerkhoven, R.~M., Roberts, C., Linsley, P.~S., Bernards, R.
310: \& Friend, S.~H. (2002{\em{}}) Gene expression profiling predicts clinical
311: outcome of breast cancer.
312: \newblock {\em Nature, } {\bf 415}, 530--536.
313:
314: \bibitem[Wu {\em et~al.}, 2003]{Wu.Zhao2003}
315: Wu, B., Abbott, T., Fishman, D., McMurray, W., Mor, G., Stone, K., Ward, D.,
316: Williams, K. \& Zhao, H. (2003{\em{}}) {Comparison of statistical methods
317: for classification of ovarian cancer using mass spectrometry data}.
318: \newblock {\em Bioinformatics, } {\bf 19}, 1636--1643.
319:
320:
321: \bibitem[Yeung {\em et~al.}, 2005]{BMA-selection}
322: Yeung, K.~Y., Bumgarner, R.~E. \& Raftery, A.~E. (2005). {Bayesian model
323: averaging: development of an improved multi-class, gene selection and
324: classification tool for microarray data.}
325: \newblock {\em Bioinformatics,} {\bf 21}, 2394--2402.
326:
327: \bibitem[Yu, 2004]{Rmpi}
328: Yu, H. (2004{\em{}}).
329: \newblock Rmpi: interface (wrapper) to MPI (message-passing interface).
330: \newblock Technical report, Department of Statistics, University of Western
331: Ontario. URL:http://www.stats.uwo.ca/faculty/yu/Rmpi.
332:
333: \end{thebibliography}
334: