1: \begin{thebibliography}{}
2:
3: \bibitem[\protect\citeauthoryear{Akaike}{Akaike}{1974}]{akaike:74}
4: Akaike, H. (1974).
5: \newblock A new look at the statistical model identification.
6: \newblock {\em IEEE Transactions on Automatic Control\/}~{\bf AC--19},
7: 716--723.
8: \newblock For a reprint see E. Parzen et al. (Eds.), \emph{Selected Papers of
9: Hirotugu Akaike}, Springer Series in Statistics, 1998.
10:
11: \bibitem[\protect\citeauthoryear{Amari}{Amari}{1993}]{amari:93}
12: Amari, S. (1993).
13: \newblock Mathematical methods of neurocomputing.
14: \newblock In O.~Barndorff-Nielsen, J.~Jensen, \& W.~Kendall (Eds.), {\em
15: Networks and Chaos---Statistical and Probabilistic Aspects}, pp.\ 1--39.
16: Chapman \& Hall, London.
17:
18: \bibitem[\protect\citeauthoryear{Amari}{Amari}{1998}]{amari:98}
19: Amari, S. (1998).
20: \newblock Natural gradient works efficiently in learning.
21: \newblock {\em Neural Computation\/}~{\bf 10}, 251--276.
22:
23: \bibitem[\protect\citeauthoryear{Amari}{Amari}{2000}]{amari:00}
24: Amari, S. (2000).
25: \newblock Information geometry on hierarchical decomposition of stochastic
26: interactions.
27: \newblock Submitted to IEEE Transactions on Information Theory.
28:
29: \bibitem[\protect\citeauthoryear{Baluja \& Davies}{Baluja \&
30: Davies}{1997}]{baluja:97}
31: Baluja, S. \& S.~Davies (1997).
32: \newblock Using optimal dependency-trees for combinatorial optimization:
33: Learning the structure of the search space.
34: \newblock In {\em Proceedings of the Fourteenth International Conference on
35: Machine Learning (ICML-97)}, pp.\ 30--38.
36:
37: \bibitem[\protect\citeauthoryear{Choi, Amari, \& Cichocki}{Choi
38: et~al.}{2000}]{choi:00}
39: Choi, S., S.~Amari, \& A.~Cichocki (2000).
40: \newblock Natural gradient learning for spatio-temporal decorrelation:
41: recurrent network.
42: \newblock {\em IEICE Transactions Fundamentals\/}~{\bf E83}, 2715--2722.
43:
44: \bibitem[\protect\citeauthoryear{French}{French}{1999}]{french:99}
45: French, R.~M. (1999).
46: \newblock Catastrophic forgetting in connectionist networks.
47: \newblock {\em Trends in Cognitive Sciences\/}~{\bf 3}, 128--135.
48:
49: \bibitem[\protect\citeauthoryear{Hansen \& Ostermeier}{Hansen \&
50: Ostermeier}{2001}]{hansen:01}
51: Hansen, N. \& A.~Ostermeier (2001).
52: \newblock Completely derandomized self-adaptation in evolution strategies.
53: \newblock {\em Evolutionary Computation\/}~{\bf 9}, 159--195.
54:
55: \bibitem[\protect\citeauthoryear{Hornik, Stinchcombe, \& White}{Hornik
56: et~al.}{1989}]{hornik:89}
57: Hornik, K., M.~Stinchcombe, \& H.~White (1989).
58: \newblock Multilayer feedforward networks are universal approximators.
59: \newblock {\em Neural Networks\/}~{\bf 2}, 359--366.
60:
61: \bibitem[\protect\citeauthoryear{Jacobs, Jordan, \& Barto}{Jacobs
62: et~al.}{1990}]{jacobs:90}
63: Jacobs, R.~A., M.~I. Jordan, \& A.~G. Barto (1990).
64: \newblock Task decomposition through competition in a modular connectionist
65: architecture: The what and where vision tasks.
66: \newblock Technical Report COINS-90-27, Department of Computer and Information
67: Science, University of Massachusetts Amherst.
68:
69: \bibitem[\protect\citeauthoryear{Kearns, Mansour, Ng, \& Ron}{Kearns
70: et~al.}{1995}]{kearns:95}
71: Kearns, M., Y.~Mansour, A.~Y. Ng, \& D.~Ron (1995).
72: \newblock An experimental and theoretical comparison of model selection
73: methods.
74: \newblock In {\em Proceedings of the Workshop on Computational Learning Theory
75: (COLT-95)}. Morgan Kaufmann Publishers.
76:
77: \bibitem[\protect\citeauthoryear{Moody}{Moody}{1991}]{moody:91}
78: Moody, J. (1991).
79: \newblock The effective number of parameters: an analysis of generalization and
80: regularization in nonlinear systems.
81: \newblock In {\em Advances in Neural Information Processing Systems}, Volume~4,
82: pp.\ 847--854.
83:
84: \bibitem[\protect\citeauthoryear{M{\"u}hlenbein, Mahnig, \&
85: Rodriguez}{M{\"u}hlenbein et~al.}{1999}]{muehlenbein:99}
86: M{\"u}hlenbein, H., T.~Mahnig, \& A.~O. Rodriguez (1999).
87: \newblock Schemata, distributions and graphical models in evolutionary
88: optimization.
89: \newblock {\em Journal of Heuristics\/}~{\bf 5}, 215--247.
90:
91: \bibitem[\protect\citeauthoryear{Pelikan, Goldberg, \& Lobo}{Pelikan
92: et~al.}{1999}]{pelikan:99}
93: Pelikan, M., D.~E. Goldberg, \& F.~Lobo (1999).
94: \newblock A survey of optimization by building and using probabilistic models.
95: \newblock Technical Report IlliGAL-99018, Illinois Genetic Algorithms
96: Laboratory.
97:
98: \bibitem[\protect\citeauthoryear{Rissanen}{Rissanen}{1978}]{rissanen:78}
99: Rissanen, J. (1978).
100: \newblock Modelling by shortest data description.
101: \newblock {\em Automatica\/}~{\bf 14}, 465--471.
102:
103: \bibitem[\protect\citeauthoryear{Schuurmans}{Schuurmans}{1997}]{schuurmans:97}
104: Schuurmans, D. (1997).
105: \newblock A new metric-based approach to model selection.
106: \newblock In {\em Proceedings of the Fourteenth National Conference on
107: Artificial Intelligence (AAAI-97)}, pp.\ 552--558.
108:
109: \bibitem[\protect\citeauthoryear{Stephens \& Waelbroeck}{Stephens \&
110: Waelbroeck}{1999}]{stephens:99}
111: Stephens, C. \& H.~Waelbroeck (1999).
112: \newblock Codon bias and mutability in {HIV} sequences.
113: \newblock {\em Journal of Molecular Evolution\/}~{\bf 48}, 390--397.
114:
115: \bibitem[\protect\citeauthoryear{Toussaint}{Toussaint}{2001}]{toussaint:01}
116: Toussaint, M. (2001).
117: \newblock Neutrality and self-adaptable exploration in evolutionary search.
118: \newblock Technical Report IRINI-2001-05, Institut f{\"u}r Neuroinformatik,
119: Ruhr-Universit{\"a}t Bochum.
120:
121: \bibitem[\protect\citeauthoryear{Toussaint}{Toussaint}{2002}]{toussaint:02b}
122: Toussaint, M. (2002).
123: \newblock A neural model for multi-expert architectures.
124: \newblock In {\em Proceedings of the International Joint Conference on Neural
125: Networks (IJCNN 2002)}.
126:
127: \bibitem[\protect\citeauthoryear{Vapnik}{Vapnik}{1995}]{vapnik:95}
128: Vapnik, V.~N. (1995).
129: \newblock {\em The nature of statistical learning theory}.
130: \newblock Springer, New York.
131:
132: \bibitem[\protect\citeauthoryear{Wagner \& Altenberg}{Wagner \&
133: Altenberg}{1996}]{wagner:96}
134: Wagner, G.~P. \& L.~Altenberg (1996).
135: \newblock Complex adaptations and the evolution of evolvability.
136: \newblock {\em Evolution\/}~{\bf 50}, 967--976.
137:
138: \bibitem[\protect\citeauthoryear{Yao}{Yao}{1999}]{yao:99}
139: Yao, X. (1999).
140: \newblock Evolving artificial neural networks.
141: \newblock In {\em Proceedings of the IEEE}, Volume~87, pp.\ 1423--1447.
142:
143: \end{thebibliography}
144: