1: \begin{thebibliography}{}
2:
3: \bibitem[\protect\citename{Cardie}1993]{Cardie:93a}
4: Claire Cardie.
5: \newblock 1993.
6: \newblock A case-based approach to knowledge acquisition for domain-specific
7: sentence analysis.
8: \newblock In {\em 11th {National Conference on Artificial Intelligence}}, pages
9: 798--803.
10:
11: \bibitem[\protect\citename{Church and Hanks}1990]{Church+Hanks:90a}
12: Kenneth~Ward Church and Patrick Hanks.
13: \newblock 1990.
14: \newblock Word association norms, mutual information, and lexicography.
15: \newblock {\em Computational Linguistics}, 16(1):22--29.
16:
17: \bibitem[\protect\citename{Church}1988]{Church:88a}
18: Kenneth~W. Church.
19: \newblock 1988.
20: \newblock A stochastic parts program and noun phrase parser for unrestricted
21: text.
22: \newblock In {\em {Second Conference on Applied Natural Language Processing}},
23: pages 136--143.
24:
25: \bibitem[\protect\citename{Cover and Thomas}1991]{Cover+Thomas:91a}
26: Thomas~M. Cover and Joy~A. Thomas.
27: \newblock 1991.
28: \newblock {\em Elements of Information Theory}.
29: \newblock John Wiley.
30:
31: \bibitem[\protect\citename{Dagan \bgroup et al.\egroup
32: }1995]{Dagan+Marcus+Markovitch:95a}
33: Ido Dagan, Shaul Marcus, and Shaul Marko\-vitch.
34: \newblock 1995.
35: \newblock Contextual word similarity and esti\-ma\-tion from sparse data.
36: \newblock {\em Computer Speech and Language}, 9:123--152.
37:
38: \bibitem[\protect\citename{Dagan \bgroup et al.\egroup
39: }1999]{Dagan+Lee+Pereira:99a}
40: Ido Dagan, Lillian Lee, and Fernando Pereira.
41: \newblock 1999.
42: \newblock Similarity-based models of cooccurrence probabilities.
43: \newblock {\em Machine Learning}, 34(1--3):43--69.
44:
45: \bibitem[\protect\citename{Essen and Steinbiss}1992]{Essen+Steinbiss:92a}
46: Ute Essen and Volker Steinbiss.
47: \newblock 1992.
48: \newblock Co-occurrence smoothing for stochastic language modeling.
49: \newblock In {\em {ICASSP 92}}, volume~1, pages 161--164.
50:
51: \bibitem[\protect\citename{Gibbons}1993]{Gibbons:93a}
52: Jean~Dickinson Gibbons.
53: \newblock 1993.
54: \newblock {\em Nonparametric Measures of Association}.
55: \newblock Number 07-091 in Sage University Paper series on Quantitative
56: Applications in the Social Sciences. Sage, Newbury Park, CA.
57:
58: \bibitem[\protect\citename{Grishman and Sterling}1993]{Grishman+Sterling:93a}
59: Ralph Grishman and John Sterling.
60: \newblock 1993.
61: \newblock Smoothing of automatically generated selectional constraints.
62: \newblock In {\em {Human Language Technology: Proceedings of the ARPA
63: Workshop}}, pages 254--259.
64:
65: \bibitem[\protect\citename{Hatzivassiloglou and
66: McKeown}1993]{Hatzivassiloglou+McKeown:93a}
67: Vasileios Hatzivassiloglou and Kathleen McKeown.
68: \newblock 1993.
69: \newblock Towards the automatic identification of adjectival scales: Clustering
70: of adjectives according to meaning.
71: \newblock In {\em 31st {Annual Meeting} of the {ACL}}, pages 172--182.
72:
73: \bibitem[\protect\citename{Hatzivassiloglou}1996]{Hatzivassiloglou:96a}
74: Vasileios Hatzivassiloglou.
75: \newblock 1996.
76: \newblock Do we need linguistics when we have statistics? {A} comparative
77: analysis of the contributions of linguistic cues to a statistical word
78: grouping system.
79: \newblock In Judith~L. Klavans and Philip Resnik, editors, {\em The Balancing
80: Act}, pages 67--94. MIT Press.
81:
82: \bibitem[\protect\citename{Hindle}1990]{Hindle:90a}
83: Don Hindle.
84: \newblock 1990.
85: \newblock Noun classification from predicate-argument structures.
86: \newblock In {\em 28th {Annual Meeting} of the {ACL}}, pages 268--275.
87:
88: \bibitem[\protect\citename{Jelinek and Mercer}1980]{Jelinek+Mercer:80a}
89: Frederick Jelinek and Robert~L. Mercer.
90: \newblock 1980.
91: \newblock Interpolated estimation of {M}arkov source parameters from sparse
92: data.
93: \newblock In {\em {Proceedings of the Workshop on Pattern Recognition in
94: Practice}}.
95:
96: \bibitem[\protect\citename{Jones and Furnas}1987]{Jones+Furnas:87a}
97: William~P. Jones and George~W. Furnas.
98: \newblock 1987.
99: \newblock Pictures of relevance.
100: \newblock {\em Journal of the American Society for Information Science},
101: 38(6):420--442.
102:
103: \bibitem[\protect\citename{Karov and Edelman}1998]{Karov+Edelman:98a}
104: Yael Karov and Shimon Edelman.
105: \newblock 1998.
106: \newblock Simi\-lar\-ity-based word sense disambiguation.
107: \newblock {\em Computational Linguistics}, 24(1):41--59.
108:
109: \bibitem[\protect\citename{Katz}1987]{Katz:87a}
110: Slava~M. Katz.
111: \newblock 1987.
112: \newblock Estimation of probabilities from sparse data for the language model
113: component of a speech recognizer.
114: \newblock {\em {IEEE} Transactions on Acoustics, Speech and Signal Processing},
115: ASSP-35(3):400--401, March.
116:
117: \bibitem[\protect\citename{Kaufman and Rousseeuw}1990]{Kaufman+Rousseeuw:90}
118: Leonard Kaufman and Peter~J. Rousseeuw.
119: \newblock 1990.
120: \newblock {\em Finding Groups in Data: An Introduction to Cluster Analysis}.
121: \newblock John Wiley and Sons.
122:
123: \bibitem[\protect\citename{Kay and R\"oscheisen}1993]{Kay+Roscheisen:93a}
124: Martin Kay and Martin R\"oscheisen.
125: \newblock 1993.
126: \newblock Text-translation alignment.
127: \newblock {\em Computational Linguistics}, 19(1):121--142.
128:
129: \bibitem[\protect\citename{Lee}1997]{Lee:thesis}
130: Lillian Lee.
131: \newblock 1997.
132: \newblock {\em Similarity-Based Approaches to Natural Language Processing}.
133: \newblock {Ph.D.} thesis, Harvard University.
134:
135: \bibitem[\protect\citename{Lin}1991]{JLin:91}
136: Jianhua Lin.
137: \newblock 1991.
138: \newblock Divergence measures based on the {S}hannon entropy.
139: \newblock {\em {IEEE} Transactions on Information Theory}, 37(1):145--151.
140:
141: \bibitem[\protect\citename{Lin}1997]{Lin:97a}
142: Dekang Lin.
143: \newblock 1997.
144: \newblock Using syntactic dependency as local context to resolve word sense
145: ambiguity.
146: \newblock In {\em 35th {Annual Meeting} of the {ACL}}, pages 64--71.
147:
148: \bibitem[\protect\citename{Lin}1998a]{Lin:98b}
149: Dekang Lin.
150: \newblock 1998a.
151: \newblock Automatic retrieval and clustering of similar words.
152: \newblock In {\em COLING-ACL '98}, pages 768--773.
153:
154: \bibitem[\protect\citename{Lin}1998b]{Lin:98a}
155: Dekang Lin.
156: \newblock 1998b.
157: \newblock An information theoretic definition of similarity.
158: \newblock In {\em {Machine Learning: Proceedings of the Fifteenth
159: International Conference (ICML '98)}}.
160:
161: \bibitem[\protect\citename{Luk}1995]{Luk:95a}
162: Alpha~K. Luk.
163: \newblock 1995.
164: \newblock Statistical sense disambiguation with relatively small corpora using
165: dictionary definitions.
166: \newblock In {\em 33rd {Annual Meeting} of the {ACL}}, pages 181--188.
167:
168: \bibitem[\protect\citename{Ng and Lee}1996]{Ng+Lee:96a}
169: Hwee~Tou Ng and Hian~Beng Lee.
170: \newblock 1996.
171: \newblock Integrating multiple knowledge sources to disambiguate word sense: An
172: exemplar-based approach.
173: \newblock In {\em 34th {Annual Meeting} of the {ACL}}, pages 40--47.
174:
175: \bibitem[\protect\citename{Ng}1997]{Ng:97b}
176: Hwee~Tou Ng.
177: \newblock 1997.
178: \newblock Exemplar-based word sense disambiguation: Some recent improvements.
179: \newblock In {\em {Second Conference on Empirical Methods in Natural Language
180: Processing (EMNLP-2)}}, pages 208--213.
181:
182: \bibitem[\protect\citename{Rao}1982]{Rao:82a}
183: C.~Radhakrishna Rao.
184: \newblock 1982.
185: \newblock Diversity: Its measurement, decomposition, apportionment and
186: analysis.
187: \newblock {\em Sankhy\={a}: The Indian Journal of Statistics}, 44(A):1--22.
188:
189: \bibitem[\protect\citename{Resnik}1995]{Resnik:95b}
190: Philip Resnik.
191: \newblock 1995.
192: \newblock Using information content to evaluate semantic similarity in a
193: taxonomy.
194: \newblock In {\em Proceedings of IJCAI-95}, pages 448--453.
195:
196: \bibitem[\protect\citename{Salton and McGill}1983]{Salton+McGill:83a}
197: Gerard Salton and Michael~J. McGill.
198: \newblock 1983.
199: \newblock {\em Introduction to Modern Information Retrieval}.
200: \newblock McGraw-Hill.
201:
202: \bibitem[\protect\citename{Smadja \bgroup et al.\egroup
203: }1996]{Smadja+McKeown+Hatzivassiloglou:96a}
204: Frank Smadja, Kathleen~R. McKeown, and Vasileios Hatzivassiloglou.
205: \newblock 1996.
206: \newblock Translating collocations for bilingual lexicons: A statistical
207: approach.
208: \newblock {\em Computational Linguistics}, 22(1):1--38.
209:
210: \bibitem[\protect\citename{Stanfill and Waltz}1986]{Stanfill+Waltz:86a}
211: Craig Stanfill and David Waltz.
212: \newblock 1986.
213: \newblock Toward memory-based reasoning.
214: \newblock {\em Communications of the {ACM}}, 29(12):1213--1228.
215:
216: \bibitem[\protect\citename{Sugawara \bgroup et al.\egroup
217: }1985]{Sugawara+al:85a}
218: K.~Sugawara, M.~Nishimura, K.~Toshioka, M.~Okochi, and T.~Kaneko.
219: \newblock 1985.
220: \newblock Isolated word recognition using hidden {Markov} models.
221: \newblock In {\em {ICASSP 85}}, pages 1--4.
222:
223: \bibitem[\protect\citename{van Rijsbergen}1979]{Rijsbergen:79a}
224: C.~J. van Rijsbergen.
225: \newblock 1979.
226: \newblock {\em Information Retrieval}.
227: \newblock Butterworths, second edition.
228:
229: \bibitem[\protect\citename{Zavrel and Daelemans}1997]{Zavrel+Daelemans:97a}
230: Jakub Zavrel and Walter Daelemans.
231: \newblock 1997.
232: \newblock Memory-based learning: Using similarity for smoothing.
233: \newblock In {\em 35th {Annual Meeting} of the {ACL}}, pages 436--443.
234:
235: \end{thebibliography}
236: