1: \begin{thebibliography}{}
2:
3: \bibitem[\protect\citeauthoryear{Backus}{Backus}{1959}]{Backus:1959}
4: Backus, J.~W. (1959).
5: \newblock {The syntax and semantics of the proposed international algebraic
6: language of the Z\"urich ACM-GAMM Conference}.
7: \newblock In {\em {Proceedings of the International Conference on Information
8: Processing}}, Paris.
9:
10: \bibitem[\protect\citeauthoryear{Baker}{Baker}{1979}]{Baker:79}
11: Baker, J.~K. (1979).
12: \newblock Trainable grammars for speech recognition.
13: \newblock In D.~Klatt and J.~Wolf (Eds.), {\em Speech Communication Papers for
14: the 97th Meeting of the Acoustical Society of America}, pp.\ 547--550.
15:
16: \bibitem[\protect\citeauthoryear{Baum}{Baum}{1972}]{Baum:72}
17: Baum, L.~E. (1972).
18: \newblock An inequality and associated maximization technique in statistical
19: estimation for probabilistic functions of {M}arkov processes.
20: \newblock {\em Inequalities\/}~{\em III}, 1--8.
21:
22: \bibitem[\protect\citeauthoryear{Booth and Thompson}{Booth and
23: Thompson}{1973}]{Booth:73}
24: Booth, T.~L. and R.~A. Thompson (1973).
25: \newblock Applying probability measures to abstract languages.
26: \newblock {\em {IEEE} Transactions on Computers\/}~{\em C-22\/}(5), 442--450.
27:
28: \bibitem[\protect\citeauthoryear{Charniak}{Charniak}{1996}]{Charniak:96}
29: Charniak, E. (1996).
30: \newblock Tree-bank grammars.
31: \newblock Technical Report CS-96-02, Brown University.
32:
33: \bibitem[\protect\citeauthoryear{Chi}{Chi}{1999}]{Chi:1999}
34: Chi, Z. (1999).
35: \newblock Statistical properties of probabilistic context-free grammars.
36: \newblock {\em Computational Linguistics\/}~{\em 25\/}(1), 131--160.
37:
38: \bibitem[\protect\citeauthoryear{Chi and Geman}{Chi and
39: Geman}{1998}]{Chi:1998b}
40: Chi, Z. and S.~Geman (1998).
41: \newblock Squibs and discussions: Estimation of probabilistic context-free
42: grammars.
43: \newblock {\em Computational Linguistics\/}~{\em 24\/}(2), 299--305.
44:
45: \bibitem[\protect\citeauthoryear{Chomsky}{Chomsky}{1956}]{Chomsky:1956}
46: Chomsky, N. (1956).
47: \newblock Three models for the description of language.
48: \newblock {\em IRE Transactions on Information Theory\/}~{\em 2\/}(3), 113--124.
49:
50: \bibitem[\protect\citeauthoryear{Cover and Thomas}{Cover and
51: Thomas}{1991}]{CoverThomas:91}
52: Cover, T.~M. and J.~A. Thomas (1991).
53: \newblock {\em Elements of Information Theory}.
54: \newblock New York: Wiley.
55:
56: \bibitem[\protect\citeauthoryear{DeGroot}{DeGroot}{1989}]{DeGroot:89}
57: DeGroot, M.~H. (1989).
58: \newblock {\em Probability and Statistics\/} (2nd ed.).
59: \newblock Addison-Wesley.
60:
61: \bibitem[\protect\citeauthoryear{Dempster, Laird, and Rubin}{Dempster
62: et~al.}{1977}]{Dempster:77}
63: Dempster, A.~P., N.~M. Laird, and D.~B. Rubin (1977).
64: \newblock Maximum likelihood from incomplete data via the {{\em EM}} algorithm.
65: \newblock {\em Journal of the Royal Statistical Society, Series B\/}~{\em 39\/}(1), 1--38.
66:
67: \bibitem[\protect\citeauthoryear{Duda, Hart, and Stork}{Duda
68: et~al.}{2001}]{Duda:01}
69: Duda, R.~O., P.~E. Hart, and D.~G. Stork (2001).
70: \newblock {\em Pattern Classification\/} (2nd ed.).
71: \newblock New York: Wiley.
72:
73: \bibitem[\protect\citeauthoryear{Hopcroft and Ullman}{Hopcroft and
74: Ullman}{1979}]{HopcroftUllman:79}
75: Hopcroft, J.~E. and J.~D. Ullman (1979).
76: \newblock {\em Introduction to Automata Theory, Languages, and Computation}.
77: \newblock Reading, MA: Addison-Wesley.
78:
79: \bibitem[\protect\citeauthoryear{Jaynes}{Jaynes}{1957}]{Jaynes:57}
80: Jaynes, E.~T. (1957).
81: \newblock Information theory and statistical mechanics.
82: \newblock {\em Physical Review\/}~{\em 106}, 620--630.
83:
84: \bibitem[\protect\citeauthoryear{Johnson}{Johnson}{1998}]{Johnson:1998}
85: Johnson, M. (1998).
86: \newblock {PCFG} models of linguistic tree representations.
87: \newblock {\em Computational Linguistics\/}~{\em 24\/}(4), 613--632.
88:
89: \bibitem[\protect\citeauthoryear{Klein and Manning}{Klein and
90: Manning}{2003}]{KleinManning:2003}
91: Klein, D. and C.~D. Manning (2003).
92: \newblock Accurate unlexicalized parsing.
93: \newblock In {\em Proceedings of {ACL-03}}, Sapporo, Japan.
94:
95: \bibitem[\protect\citeauthoryear{Lari and Young}{Lari and
96: Young}{1990}]{Lari:90}
97: Lari, K. and S.~J. Young (1990).
98: \newblock The estimation of stochastic context-free grammars using the
99: inside-outside algorithm.
100: \newblock {\em Computer Speech and Language\/}~{\em 4}, 35--56.
101:
102: \bibitem[\protect\citeauthoryear{McLachlan and Krishnan}{McLachlan and
103: Krishnan}{1997}]{McLachlan:97}
104: McLachlan, G.~J. and T.~Krishnan (1997).
105: \newblock {\em The {EM} Algorithm and Extensions}.
106: \newblock New York: Wiley.
107:
108: \bibitem[\protect\citeauthoryear{Nederhof and Satta}{Nederhof and
109: Satta}{2003}]{NederhofSatta:2003}
110: Nederhof, M.-J. and G.~Satta (2003).
111: \newblock Probabilistic parsing as intersection.
112: \newblock In {\em {Proceedings of the 8th International Workshop on Parsing
113: Technologies (IWPT-03)}}, Nancy, France.
114:
115: \bibitem[\protect\citeauthoryear{Pereira and Schabes}{Pereira and
116: Schabes}{1992}]{Pereira:92}
117: Pereira, F. and Y.~Schabes (1992).
118: \newblock Inside-outside reestimation from partially bracketed corpora.
119: \newblock In {\em Proceedings of {ACL'92}}, Newark, Delaware.
120:
121: \bibitem[\protect\citeauthoryear{Prescher}{Prescher}{2001}]{Prescher:01c}
122: Prescher, D. (2001).
123: \newblock Inside-outside estimation meets dynamic {EM}.
124: \newblock In {\em {Proceedings of the 7th International Workshop on Parsing Technologies (IWPT-01)}}, Beijing, China.
125:
126: \bibitem[\protect\citeauthoryear{Prescher}{Prescher}{2002}]{Prescher:Diss}
127: Prescher, D. (2002).
128: \newblock {\em {EM-basierte maschinelle Lernverfahren f\"ur nat\"urliche
129: Sprachen}}.
130: \newblock Ph.\ D. thesis, IMS, University of Stuttgart.
131:
132: \bibitem[\protect\citeauthoryear{Ratnaparkhi}{Ratnaparkhi}{1997}]{Rat:97Report}
133: Ratnaparkhi, A. (1997).
134: \newblock A simple introduction to maximum-entropy models for natural language
135: processing.
136: \newblock Technical report, University of Pennsylvania.
137:
138: \bibitem[\protect\citeauthoryear{S\'anchez and Bened\'{\i}}{S\'anchez and
139: Bened\'{\i}}{1997}]{Sanchez1997}
140: S\'anchez, J.~A. and J.~M. Bened\'{\i} (1997).
141: \newblock Consistency of stochastic context-free grammars from probabilistic
142: estimation based on growth transformations.
143: \newblock {\em IEEE Transactions on Pattern Analysis and Machine
144: Intelligence\/}~{\em 19\/}(9), 1052--1055.
145:
146: \bibitem[\protect\citeauthoryear{Wu}{Wu}{1983}]{Wu:83}
147: Wu, C. F.~J. (1983).
148: \newblock On the convergence properties of the {EM} algorithm.
149: \newblock {\em The Annals of Statistics\/}~{\em 11\/}(1), 95--103.
150:
151: \end{thebibliography}
152: