1: \begin{thebibliography}{10}
2:
3: \bibitem{hot-potato}
4: P.~Baran.
5: \newblock {On Distributed Communications Networks}.
6: \newblock {\em IEEE Transactions on Communications Systems}, Vol. CS-12:pages
7: 1--9, 1964.
8:
9: \bibitem{ddp}
10: D.P. Bertsekas.
11: \newblock {Distributed Dynamic Programming}.
12: \newblock {\em IEEE Transactions on Automatic Control}, Vol. 27:pages 610--616,
13: 1982.
14:
15: \bibitem{bertsekas-dn}
16: D.P. Bertsekas and R.~Gallager.
17: \newblock {\em Data Networks}.
18: \newblock Prentice Hall, Englewood Cliffs, NJ, 1992.
19: \newblock Second Edition.
20:
21: \bibitem{ndp-book}
22: D.P. Bertsekas and J.N. Tsitsiklis.
23: \newblock {\em Neuro-Dynamic Programming}.
24: \newblock Athena Scientific, Belmont, MA, 1996.
25:
26: \bibitem{bertsekas-pdp}
27: D.P. Bertsekas and J.N. Tsitsiklis.
28: \newblock {\em Parallel and Distributed Computation: Numerical Methods}.
29: \newblock Athena Scientific, Belmont, MA, 1997.
30:
31: \bibitem{qrouting}
32: J.~Boyan and M.~Littman.
33: \newblock {Packet Routing in Dynamically Changing Networks: A Reinforcement
34: Learning Approach}.
35: \newblock In {\em Advances in Neural Information Processing Systems 6 (NIPS6)},
36: pages 671--678. Morgan Kaufmann, San Francisco, CA, 1994.
37:
38: \bibitem{chen-druschel}
39: J.~Chen, P.~Druschel, and D.~Subramanian.
40: \newblock {A New Approach to Routing with Dynamic Metrics}.
41: \newblock In {\em Proceedings of the IEEE INFOCOM Conference on Computer
42: Communications}, pages 661--670. IEEE Press, New York, March 1999.
43:
44: \bibitem{ospf-ls}
45: R.~Coltun.
46: \newblock {OSPF: An Internet Routing Protocol}.
47: \newblock {\em ConneXions}, Vol. 3(8):pages 19--25, 1989.
48:
49: \bibitem{anytime-algo}
50: T.~Dean and M.~Boddy.
51: \newblock {An Analysis of Time-Dependent Planning}.
52: \newblock In {\em Proceedings of the Seventh National Conference on Artificial
53: Intelligence (AAAI'88)}, pages 49--54. AAAI/MIT Press, 1988.
54: \newblock St.~Paul, MN.
55:
56: \bibitem{stigmergy}
57: G.~Di~Caro and M.~Dorigo.
58: \newblock {AntNet: Distributed Stigmergetic Control for Communications
59: Networks}.
60: \newblock {\em Journal of Artificial Intelligence Research}, Vol. 9:pages
61: 317--365, 1998.
62:
63: \bibitem{MAXQ}
64: T.G. Dietterich.
65: \newblock {Hierarchical Reinforcement Learning with the MAXQ Value Function
66: Decomposition}.
67: \newblock {\em Journal of Artificial Intelligence Research}, Vol. 13:pages
68: 227--303, 2000.
69:
70: \bibitem{rl-coordination}
71: C.~Guestrin, M.~Lagoudakis, and R.~Parr.
72: \newblock {Coordinated Reinforcement Learning}.
73: \newblock In {\em Machine Learning: Proceedings of the Nineteenth International
74: Conference (ICML 2002)}, pages 227--234. Morgan Kaufmann, San Francisco, CA, July 2002.
75:
76: \bibitem{rfc1058}
77: C.~Hedrick.
78: \newblock {Routing Information Protocol}.
79: \newblock Request for Comments 1058, Network Working Group, June 1988.
80:
81: \bibitem{rl-survey}
82: L.P. Kaelbling, M.L. Littman, and A.W. Moore.
83: \newblock {Reinforcement Learning: A Survey}.
84: \newblock {\em Journal of Artificial Intelligence Research}, Vol. 4:pages
85: 237--285, 1996.
86:
87: \bibitem{rfc2453}
88: G.~Malkin.
89: \newblock {RIP Version 2}.
90: \newblock Request for Comments 2453, Network Working Group, November 1998.
91:
92: \bibitem{mccalum-thesis}
93: A.K. McCallum.
94: \newblock {\em Reinforcement Learning with Selective Perception and Hidden
95: State}.
96: \newblock PhD thesis, Department of Computer Science, University of Rochester,
97: 1995, revised 1996.
98:
99: \bibitem{rfc1247}
100: J.~Moy.
101: \newblock {OSPF Version 2}.
102: \newblock Request for Comments 1247, Network Working Group, July 1991.
103:
104: \bibitem{rfc1583}
105: J.~Moy.
106: \newblock {OSPF Version 2}.
107: \newblock Request for Comments 1583, Network Working Group, March 1994.
108:
109: \bibitem{irl}
110: A.Y. Ng and S.J. Russell.
111: \newblock {Algorithms for Inverse Reinforcement Learning}.
112: \newblock In {\em Machine Learning: Proceedings of the Seventeenth
113: International Conference (ICML 2000)}, pages 663--670. Morgan Kaufmann, San
114: Francisco, CA, June 2000.
115:
116: \bibitem{steenstrup}
117: M.~Steenstrup~(ed.).
118: \newblock {\em Routing in Communications Networks}.
119: \newblock Prentice Hall, 1995.
120:
121: \bibitem{ants}
122: D.~Subramanian, P.~Druschel, and J.~Chen.
123: \newblock {Ants and Reinforcement Learning: A Case Study in Routing in Dynamic
124: Networks}.
125: \newblock In {\em Proceedings of the Fifteenth International Joint Conference
126: on Artificial Intelligence (IJCAI'97)}, pages 832--839. Morgan Kaufmann, San
127: Francisco, CA, 1997.
128:
129: \bibitem{rl-book}
130: R.S. Sutton and A.G. Barto.
131: \newblock {\em Reinforcement Learning: An Introduction}.
132: \newblock MIT Press, Cambridge, MA, 1998.
133:
134: \bibitem{mdva}
135: S.~Vutukury and J.J. Garcia-Luna-Aceves.
136: \newblock {MDVA: A Distance-Vector Multipath Routing Protocol}.
137: \newblock In {\em Proceedings of the IEEE INFOCOM Conference on Computer
138: Communications}, pages 557--564. IEEE Press, 2001.
139:
140: \end{thebibliography}
141: