cs0207073/paper.bbl
1: \begin{thebibliography}{10}
2: 
3: \bibitem{hot-potato}
4: P.~Baran.
5: \newblock {On Distributed Communications Networks}.
6: \newblock {\em IEEE Transactions on Communications Systems}, Vol.~CS-12:pages
7:   1--9, 1964.
8: 
9: \bibitem{ddp}
10: D.P. Bertsekas.
11: \newblock {Distributed Dynamic Programming}.
12: \newblock {\em IEEE Transactions on Automatic Control}, Vol.~27:pages 610--616,
13:   1982.
14: 
15: \bibitem{bertsekas-dn}
16: D.P. Bertsekas and R.~Gallager.
17: \newblock {\em Data Networks}.
18: \newblock Prentice Hall, Englewood Cliffs, NJ, 1992.
19: \newblock Second Edition.
20: 
21: \bibitem{ndp-book}
22: D.P. Bertsekas and J.N. Tsitsiklis.
23: \newblock {\em Neuro-Dynamic Programming}.
24: \newblock Athena Scientific, Belmont, MA, 1996.
25: 
26: \bibitem{bertsekas-pdp}
27: D.P. Bertsekas and J.N. Tsitsiklis.
28: \newblock {\em Parallel and Distributed Computation: Numerical Methods}.
29: \newblock Athena Scientific, Belmont, MA, 1997.
30: 
31: \bibitem{qrouting}
32: J.~Boyan and M.~Littman.
33: \newblock {Packet Routing in Dynamically Changing Networks: A Reinforcement
34:   Learning Approach}.
35: \newblock In {\em Advances in Neural Information Processing Systems 6 (NIPS6)},
36:   pages 671--678. Morgan Kaufmann, San Francisco, CA, 1994.
37: 
38: \bibitem{chen-druschel}
39: J.~Chen, P.~Druschel, and D.~Subramanian.
40: \newblock {A New Approach to Routing with Dynamic Metrics}.
41: \newblock In {\em Proceedings of the IEEE INFOCOM Conference on Computer
42:   Communications}, pages 661--670. IEEE Press, New York, March 1999.
43: 
44: \bibitem{ospf-ls}
45: R.~Coltun.
46: \newblock {OSPF: An Internet Routing Protocol}.
47: \newblock {\em ConneXions}, Vol.~3(8):pages 19--25, 1989.
48: 
49: \bibitem{anytime-algo}
50: T.~Dean and M.~Boddy.
51: \newblock {An Analysis of Time-Dependent Planning}.
52: \newblock In {\em Proceedings of the Seventh National Conference on Artificial
53:   Intelligence (AAAI'88)}, pages 49--54. AAAI/MIT Press, 1988.
54: \newblock St.~Paul, MN.
55: 
56: \bibitem{stigmergy}
57: G.~Di~Caro and M.~Dorigo.
58: \newblock {AntNet: Distributed Stigmergetic Control for Communications
59:   Networks}.
60: \newblock {\em Journal of Artificial Intelligence Research}, Vol.~9:pages
61:   317--365, 1998.
62: 
63: \bibitem{MAXQ}
64: T.G. Dietterich.
65: \newblock {Hierarchical Reinforcement Learning with the MAXQ Value Function
66:   Decomposition}.
67: \newblock {\em Journal of Artificial Intelligence Research}, Vol.~13:pages
68:   227--303, 2000.
69: 
70: \bibitem{rl-coordination}
71: C.~Guestrin, M.~Lagoudakis, and R.~Parr.
72: \newblock {Coordinated Reinforcement Learning}.
73: \newblock In {\em Machine Learning: Proceedings of the Nineteenth International
74:   Conference (ICML 2002)}. Morgan Kaufmann, San Francisco, CA, July 2002.
75: 
76: \bibitem{rfc1058}
77: C.~Hedrick.
78: \newblock {Routing Information Protocol}.
79: \newblock Request for Comments 1058, Network Working Group, June 1988.
80: 
81: \bibitem{rl-survey}
82: L.P. Kaelbling, M.L. Littman, and A.W. Moore.
83: \newblock {Reinforcement Learning: A Survey}.
84: \newblock {\em Journal of Artificial Intelligence Research}, Vol.~4:pages
85:   237--285, 1996.
86: 
87: \bibitem{rfc2453}
88: G.~Malkin.
89: \newblock {RIP Version 2}.
90: \newblock Request for Comments 2453, Network Working Group, November 1998.
91: 
92: \bibitem{mccalum-thesis}
93: A.K. McCallum.
94: \newblock {\em Reinforcement Learning with Selective Perception and Hidden
95:   State}.
96: \newblock PhD thesis, Department of Computer Science, University of Rochester,
97:   1995, revised 1996.
98: 
99: \bibitem{rfc1247}
100: J.~Moy.
101: \newblock {OSPF Version 2}.
102: \newblock Request for Comments 1247, Network Working Group, July 1991.
103: 
104: \bibitem{rfc1583}
105: J.~Moy.
106: \newblock {OSPF Version 2}.
107: \newblock Request for Comments 1583, Network Working Group, March 1994.
108: 
109: \bibitem{irl}
110: A.Y. Ng and S.J. Russell.
111: \newblock {Algorithms for Inverse Reinforcement Learning}.
112: \newblock In {\em Machine Learning: Proceedings of the Seventeenth
113:   International Conference (ICML 2000)}, pages 663--670. Morgan Kaufmann, San
114:   Francisco, CA, June 2000.
115: 
116: \bibitem{steenstrup}
117: M.~Steenstrup~(ed.).
118: \newblock {\em Routing in Communications Networks}.
119: \newblock Prentice Hall, 1995.
120: 
121: \bibitem{ants}
122: D.~Subramanian, P.~Druschel, and J.~Chen.
123: \newblock {Ants and Reinforcement Learning: A Case Study in Routing in Dynamic
124:   Networks}.
125: \newblock In {\em Proceedings of the Fifteenth International Joint Conference
126:   on Artificial Intelligence (IJCAI'97)}, pages 832--839. Morgan Kaufmann, San
127:   Francisco, CA, 1997.
128: 
129: \bibitem{rl-book}
130: R.S. Sutton and A.G. Barto.
131: \newblock {\em Reinforcement Learning: An Introduction}.
132: \newblock MIT Press, Cambridge, MA, 1998.
133: 
134: \bibitem{mdva}
135: S.~Vutukury and J.J. Garcia-Luna-Aceves.
136: \newblock {MDVA: A Distance-Vector Multipath Routing Protocol}.
137: \newblock In {\em Proceedings of the IEEE INFOCOM Conference on Computer
138:   Communications}, pages 557--564. IEEE Press, 2001.
139: 
140: \end{thebibliography}
141: