1: \begin{thebibliography}{10}
2:
3: \bibitem{srikant-association}
4: R.~Agrawal and R.~Srikant.
5: \newblock {Fast Algorithms for Mining Association Rules in Large Databases}.
6: \newblock In {\em Proceedings of the 20th International Conference on Very
7: Large Data Bases (VLDB'94)}, pages 487--499. Morgan Kaufmann, Sep 1994.
8: \newblock Santiago de Chile, Chile.
9:
10: \bibitem{model-management}
11: P.A. Bernstein, A.Y. Halevy, and R.~Pottinger.
12: \newblock {A Vision for Management of Complex Models}.
13: \newblock {\em SIGMOD Record}, Vol. 29(4):pages 55--63, Dec 2000.
14:
15: \bibitem{bradley-cacm}
16: P.S. Bradley, J.~Gehrke, R.~Ramakrishnan, and R.~Srikant.
17: \newblock {Scaling Mining Algorithms to Large Databases}.
18: \newblock {\em Communications of the ACM}, Vol. 45(8):pages 38--43, Aug 2002.
19:
20: \bibitem{cartbook}
21: L.~Breiman, J.H. Friedman, R.A. Olshen, and C.J. Stone.
22: \newblock {\em {Classification and Regression Trees}}.
23: \newblock Chapman and Hall/CRC, 1984.
24:
25: \bibitem{cover-thomas}
26: T.M. Cover and J.A. Thomas.
27: \newblock {\em {Elements of Information Theory}}.
28: \newblock John Wiley and Sons: Series in Telecommunications, 1991.
29:
30: \bibitem{fisher}
31: D.H. Fisher.
32: \newblock {Knowledge Acquisition via Incremental Conceptual Clustering}.
33: \newblock {\em Machine Learning}, Vol. 2(2):pages 139--172, 1987.
34:
35: \bibitem{clustering-categorical}
36: V.~Ganti, J.~Gehrke, and R.~Ramakrishnan.
37: \newblock {CACTUS: Clustering Categorical Data using Summaries}.
38: \newblock In {\em Proceedings of the Fifth ACM SIGKDD International Conference
39: on Knowledge Discovery and Data Mining (KDD'99)}, pages 73--83. ACM Press,
40: Aug 1999.
41: \newblock San Diego, CA.
42:
43: \bibitem{ieee-scaling}
44: V.~Ganti, J.~Gehrke, and R.~Ramakrishnan.
45: \newblock {Mining Very Large Databases}.
46: \newblock {\em IEEE Computer}, Vol. 32(8):pages 38--45, Aug 1999.
47:
48: \bibitem{gasch}
49: A.P. Gasch, P.T. Spellman, C.M. Kao, O.~Carmel-Harel, M.B. Eisen, G.~Storz,
50: D.~Botstein, and P.O. Brown.
51: \newblock {Genomic Expression Programs in the Response of Yeast Cells to
52: Environmental Changes}.
53: \newblock {\em Molecular Biology of the Cell}, Vol. 11:pages 4241--4257, 2000.
54:
55: \bibitem{dt-scaling}
56: J.~Gehrke, R.~Ramakrishnan, and V.~Ganti.
57: \newblock {RainForest: A Framework for Fast Decision Tree Construction of Large
58: Datasets}.
59: \newblock {\em Data Mining and Knowledge Discovery}, Vol. 4(2/3):pages
60: 127--162, July 2000.
61:
62: \bibitem{dissimilarity}
63: J.C. Gower and P.~Legendre.
64: \newblock {Metric and Euclidean Properties of Dissimilarity Coefficients}.
65: \newblock {\em Journal of Classification}, Vol. 3:pages 5--48, 1986.
66:
67: \bibitem{hastie-book}
68: T.~Hastie, R.~Tibshirani, and J.~Friedman.
69: \newblock {\em {The Elements of Statistical Learning: Data Mining, Inference,
70: and Prediction}}.
71: \newblock Springer, 2001.
72:
73: \bibitem{jones-furnas}
74: W.P. Jones and G.W. Furnas.
75: \newblock {Pictures of Relevance: A Geometric Analysis of Similarity Measures}.
76: \newblock {\em Journal of the American Society for Information Science}, Vol.
77: 38(6):pages 420--442, 1987.
78:
79: \bibitem{kamath-galaxies}
80: C.~Kamath, E.~Cantu-Paz, I.K. Fodor, and N.A. Tang.
81: \newblock {Classifying Bent-Double Galaxies}.
82: \newblock {\em IEEE/AIP Computing in Science and Engineering (CiSE)}, Vol.
83: 4(4):pages 52--60, Jul/Aug 2002.
84:
85: \bibitem{mackay}
86: D.J.C. MacKay.
87: \newblock {\em {Information Theory, Inference, and Learning Algorithms}}.
88: \newblock Cambridge University Press, 2003.
89:
90: \bibitem{michalski}
91: R.S. Michalski.
92: \newblock {Knowledge Acquisition through Conceptual Clustering: A Theoretical
93: Framework and Algorithm for Partitioning Data into Conjunctive Concepts}.
94: \newblock {\em International Journal of Policy Analysis and Information
95: Systems}, Vol. 4:pages 219--243, 1980.
96:
97: \bibitem{moore-lee}
98: A.W. Moore and M.S. Lee.
99: \newblock {Cached Sufficient Statistics for Efficient Machine Learning with
100: Large Datasets}.
101: \newblock {\em Journal of Artificial Intelligence Research}, Vol. 8:pages
102: 67--91, 1998.
103:
104: \bibitem{muggleton-ilp}
105: S.~Muggleton.
106: \newblock {Scientific Knowledge Discovery using Inductive Logic Programming}.
107: \newblock {\em Communications of the ACM}, Vol. 42(11):pages 42--46, Nov 1999.
108:
109: \bibitem{c45}
110: J.R. Quinlan.
111: \newblock {\em {C4.5: Programs for Machine Learning}}.
112: \newblock Morgan Kaufmann, 1993.
113:
114: \bibitem{schema-matching}
115: E.~Rahm and P.A. Bernstein.
116: \newblock {A Survey of Approaches to Automatic Schema Matching}.
117: \newblock {\em VLDB Journal}, Vol. 10(4):pages 334--350, 2001.
118:
119: \bibitem{genesis}
120: A.~Sturn, J.~Quackenbush, and Z.~Trajanoski.
121: \newblock {Genesis: Cluster Analysis of Microarray Data}.
122: \newblock {\em Bioinformatics}, Vol. 18(1):pages 207--208, 2002.
123:
124: \bibitem{profiling-classes}
125: R.E. Valdes-Perez, V.~Pericliev, and F.~Pereira.
126: \newblock {Concise, Intelligible, and Approximate Profiling of Multiple
127: Classes}.
128: \newblock {\em International Journal of Human Computer Studies}, Vol.
129: 53(3):pages 411--436, 2000.
130:
131: \bibitem{wyrick}
132: J.J. Wyrick, F.C. Holstege, E.G. Jennings, H.C. Causton, D.~Shore,
133: M.~Grunstein, E.S. Lander, and R.A. Young.
134: \newblock {Chromosomal Landscape of Nucleosome-Dependent Gene Expression and
135: Silencing in Yeast}.
136: \newblock {\em Nature}, Vol. 402:pages 418--421, 1999.
137:
138: \bibitem{zaki-non-redundant}
139: M.~Zaki.
140: \newblock {Generating Non-Redundant Association Rules}.
141: \newblock In {\em Proceedings of the Sixth ACM SIGKDD International Conference
142: on Knowledge Discovery and Data Mining (KDD'00)}, pages 34--43. ACM Press,
143: 2000.
144: \newblock Boston, MA.
145:
146: \end{thebibliography}
147: