cs0412015/paper.bbl
1: \begin{thebibliography}{}
2: 
3: \bibitem[\protect\citeauthoryear{Backus}{Backus}{1959}]{Backus:1959}
4: Backus, J.~W. (1959).
5: \newblock {The syntax and semantics of the proposed international algebraic
6:   language of the Z\"urich ACM-GAMM Conference}.
7: \newblock In {\em {Proceedings of the International Conference on Information
8:   Processing}}, Paris.
9: 
10: \bibitem[\protect\citeauthoryear{Baker}{Baker}{1979}]{Baker:79}
11: Baker, J.~K. (1979).
12: \newblock Trainable grammars for speech recognition.
13: \newblock In D.~Klatt and J.~Wolf (Eds.), {\em Speech Communication Papers for
14:   the 97th Meeting of the Acoustical Society of America}, pp.\ 547--550.
15: 
16: \bibitem[\protect\citeauthoryear{Baum}{Baum}{1972}]{Baum:72}
17: Baum, L.~E. (1972).
18: \newblock An inequality and associated maximization technique in statistical
19:   estimation for probabilistic functions of {M}arkov processes.
20: \newblock {\em Inequalities\/}~{\em III}, 1--8.
21: 
22: \bibitem[\protect\citeauthoryear{Booth and Thompson}{Booth and
23:   Thompson}{1973}]{Booth:73}
24: Booth, T.~L. and R.~A. Thompson (1973).
25: \newblock Applying probability measures to abstract languages.
26: \newblock {\em {IEEE} Transactions on Computers\/}~{\em C-22\/}(5), 442--450.
27: 
28: \bibitem[\protect\citeauthoryear{Charniak}{Charniak}{1996}]{Charniak:96}
29: Charniak, E. (1996).
30: \newblock Tree-bank grammars.
31: \newblock Technical Report CS-96-02, Brown University.
32: 
33: \bibitem[\protect\citeauthoryear{Chi}{Chi}{1999}]{Chi:1999}
34: Chi, Z. (1999).
35: \newblock Statistical properties of probabilistic context-free grammars.
36: \newblock {\em Computational Linguistics\/}~{\em 25\/}(1), 131--160.
37: 
38: \bibitem[\protect\citeauthoryear{Chi and Geman}{Chi and
39:   Geman}{1998}]{Chi:1998b}
40: Chi, Z. and S.~Geman (1998).
41: \newblock Squibs and discussions: Estimation of probabilistic context-free
42:   grammars.
43: \newblock {\em Computational Linguistics\/}~{\em 24\/}(2), 299--305.
44: 
45: \bibitem[\protect\citeauthoryear{Chomsky}{Chomsky}{1956}]{Chomsky:1956}
46: Chomsky, N. (1956).
47: \newblock Three models for the description of language.
48: \newblock {\em IRE Transactions on Information Theory\/}~{\em 2\/}(3), 113--124.
49: 
50: \bibitem[\protect\citeauthoryear{Cover and Thomas}{Cover and
51:   Thomas}{1991}]{CoverThomas:91}
52: Cover, T.~M. and J.~A. Thomas (1991).
53: \newblock {\em Elements of Information Theory}.
54: \newblock New York: Wiley.
55: 
56: \bibitem[\protect\citeauthoryear{DeGroot}{DeGroot}{1989}]{DeGroot:89}
57: DeGroot, M.~H. (1989).
58: \newblock {\em Probability and statistics\/} (2nd ed.).
59: \newblock Addison-Wesley.
60: 
61: \bibitem[\protect\citeauthoryear{Dempster, Laird, and Rubin}{Dempster
62:   et~al.}{1977}]{Dempster:77}
63: Dempster, A.~P., N.~M. Laird, and D.~B. Rubin (1977).
64: \newblock Maximum likelihood from incomplete data via the {{\em EM}} algorithm.
65: \newblock {\em Journal of the Royal Statistical Society, Series B\/}~{\em 39\/}(1), 1--38.
66: 
67: \bibitem[\protect\citeauthoryear{Duda, Hart, and Stork}{Duda
68:   et~al.}{2001}]{Duda:01}
69: Duda, R.~O., P.~E. Hart, and D.~G. Stork (2001).
70: \newblock {\em Pattern Classification\/} (2nd ed.).
71: \newblock New York: Wiley.
72: 
73: \bibitem[\protect\citeauthoryear{Hopcroft and Ullman}{Hopcroft and
74:   Ullman}{1979}]{HopcroftUllman:79}
75: Hopcroft, J.~E. and J.~D. Ullman (1979).
76: \newblock {\em Introduction to Automata Theory, Languages, and Computation}.
77: \newblock Reading, MA: Addison-Wesley.
78: 
79: \bibitem[\protect\citeauthoryear{Jaynes}{Jaynes}{1957}]{Jaynes:57}
80: Jaynes, E.~T. (1957).
81: \newblock Information theory and statistical mechanics.
82: \newblock {\em Physical Review\/}~{\em 106}, 620--630.
83: 
84: \bibitem[\protect\citeauthoryear{Johnson}{Johnson}{1998}]{Johnson:1998}
85: Johnson, M. (1998).
86: \newblock {PCFG} models of linguistic tree representations.
87: \newblock {\em Computational Linguistics\/}~{\em 24\/}(4), 613--632.
88: 
89: \bibitem[\protect\citeauthoryear{Klein and Manning}{Klein and
90:   Manning}{2003}]{KleinManning:2003}
91: Klein, D. and C.~D. Manning (2003).
92: \newblock Accurate unlexicalized parsing.
93: \newblock In {\em Proceedings of {ACL-03}}, Sapporo, Japan.
94: 
95: \bibitem[\protect\citeauthoryear{Lari and Young}{Lari and
96:   Young}{1990}]{Lari:90}
97: Lari, K. and S.~J. Young (1990).
98: \newblock The estimation of stochastic context-free grammars using the
99:   inside-outside algorithm.
100: \newblock {\em Computer Speech and Language\/}~{\em 4}, 35--56.
101: 
102: \bibitem[\protect\citeauthoryear{McLachlan and Krishnan}{McLachlan and
103:   Krishnan}{1997}]{McLachlan:97}
104: McLachlan, G.~J. and T.~Krishnan (1997).
105: \newblock {\em The {EM} Algorithm and Extensions}.
106: \newblock New York: Wiley.
107: 
108: \bibitem[\protect\citeauthoryear{Nederhof and Satta}{Nederhof and
109:   Satta}{2003}]{NederhofSatta:2003}
110: Nederhof, M.-J. and G.~Satta (2003).
111: \newblock Probabilistic parsing as intersection.
112: \newblock In {\em {Proceedings of the 8th International Workshop on Parsing
113:   Technologies (IWPT-03)}}, Nancy, France.
114: 
115: \bibitem[\protect\citeauthoryear{Pereira and Schabes}{Pereira and
116:   Schabes}{1992}]{Pereira:92}
117: Pereira, F. and Y.~Schabes (1992).
118: \newblock Inside-outside reestimation from partially bracketed corpora.
119: \newblock In {\em Proceedings of {ACL'92}}, Newark, Delaware.
120: 
121: \bibitem[\protect\citeauthoryear{Prescher}{Prescher}{2001}]{Prescher:01c}
122: Prescher, D. (2001).
123: \newblock Inside-outside estimation meets dynamic {EM}.
124: \newblock In {\em {Proceedings of the 7th International Workshop on Parsing Technologies (IWPT-01)}}, Beijing.
125: 
126: \bibitem[\protect\citeauthoryear{Prescher}{Prescher}{2002}]{Prescher:Diss}
127: Prescher, D. (2002).
128: \newblock {\em {EM-basierte maschinelle Lernverfahren f\"ur nat\"urliche
129:   Sprachen}}.
130: \newblock Ph.D. thesis, IMS, University of Stuttgart.
131: 
132: \bibitem[\protect\citeauthoryear{Ratnaparkhi}{Ratnaparkhi}{1997}]{Rat:97Report}
133: Ratnaparkhi, A. (1997).
134: \newblock A simple introduction to maximum-entropy models for natural language
135:   processing.
136: \newblock Technical report, University of Pennsylvania.
137: 
138: \bibitem[\protect\citeauthoryear{S\'anchez and Bened\'{\i}}{S\'anchez and
139:   Bened\'{\i}}{1997}]{Sanchez1997}
140: S\'anchez, J.~A. and J.~M. Bened\'{\i} (1997).
141: \newblock Consistency of stochastic context-free grammars from probabilistic
142:   estimation based on growth transformations.
143: \newblock {\em IEEE Transactions on Pattern Analysis and Machine
144:   Intelligence\/}~{\em 19\/}(9), 1052--1055.
145: 
146: \bibitem[\protect\citeauthoryear{Wu}{Wu}{1983}]{Wu:83}
147: Wu, C.~F.~J. (1983).
148: \newblock On the convergence properties of the {EM} algorithm.
149: \newblock {\em The Annals of Statistics\/}~{\em 11\/}(1), 95--103.
150: 
151: \end{thebibliography}
152: