0207:cs0207073/paper.bbl

1: \begin{thebibliography}{10}

2:

3: \bibitem{hot-potato}

4: P.~Baran.

5: \newblock {On Distributed Communications Networks}.

6: \newblock {\em IEEE Transactions on Communications Systems}, Vol. CS-12:pages

7:   1--9, 1964.

8:

9: \bibitem{ddp}

10: D.P. Bertsekas.

11: \newblock {Distributed Dynamic Programming}.

12: \newblock {\em IEEE Transactions on Automatic Control}, Vol. 27:pages 610--616,

13:   1982.

14:

15: \bibitem{bertsekas-dn}

16: D.P. Bertsekas and R.~Gallager.

17: \newblock {\em Data Networks}.

18: \newblock Prentice Hall, Englewood Cliffs, NJ, 1992.

19: \newblock Second Edition.

20:

21: \bibitem{ndp-book}

22: D.P. Bertsekas and J.N. Tsitsiklis.

23: \newblock {\em Neuro-Dynamic Programming}.

24: \newblock Athena Scientific, Belmont, MA, 1996.

25:

26: \bibitem{bertsekas-pdp}

27: D.P. Bertsekas and J.N. Tsitsiklis.

28: \newblock {\em Parallel and Distributed Computation: Numerical Methods}.

29: \newblock Athena Scientific, Belmont, MA, 1997.

30:

31: \bibitem{qrouting}

32: J.~Boyan and M.~Littman.

33: \newblock {Packet Routing in Dynamically Changing Networks: A Reinforcement

34:   Learning Approach}.

35: \newblock In {\em Advances in Neural Information Processing Systems 6 (NIPS6)},

36:   pages 671--678. Morgan Kaufmann, San Francisco, CA, 1994.

37:

38: \bibitem{chen-druschel}

39: J.~Chen, P.~Druschel, and D.~Subramanian.

40: \newblock {A New Approach to Routing with Dynamic Metrics}.

41: \newblock In {\em Proceedings of the IEEE INFOCOM Conference on Computer

42:   Communications}, pages 661--670. IEEE Press, New York, March 1999.

43:

44: \bibitem{ospf-ls}

45: R.~Coltun.

46: \newblock {OSPF: An Internet Routing Protocol}.

47: \newblock {\em ConneXions}, Vol. 3(8):pages 19--25, 1989.

48:

49: \bibitem{anytime-algo}

50: T.~Dean and M.~Boddy.

51: \newblock {An Analysis of Time-Dependent Planning}.

52: \newblock In {\em Proceedings of the Seventh National Conference on Artificial

53:   Intelligence (AAAI'88)}, pages 49--54. AAAI/MIT Press, 1988.

54: \newblock St.~Paul, MN.

55:

56: \bibitem{stigmergy}

57: G.~Di~Caro and M.~Dorigo.

58: \newblock {AntNet: Distributed Stigmergetic Control for Communications

59:   Networks}.

60: \newblock {\em Journal of Artificial Intelligence Research}, Vol. 9:pages

61:   317--365, 1998.

62:

63: \bibitem{MAXQ}

64: T.G. Dietterich.

65: \newblock {Hierarchical Reinforcement Learning with the MAXQ Value Function

66:   Decomposition}.

67: \newblock {\em Journal of Artificial Intelligence Research}, Vol. 13:pages

68:   227--303, 2000.

69:

70: \bibitem{rl-coordination}

71: C.~Guestrin, M.~Lagoudakis, and R.~Parr.

72: \newblock {Coordinated Reinforcement Learning}.

73: \newblock In {\em Machine Learning: Proceedings of the Nineteenth International

74:   Conference (ICML 2002)}. Morgan Kaufmann, San Francisco, CA, July 2002.

75:

76: \bibitem{rfc1058}

77: C.~Hedrick.

78: \newblock {Routing Information Protocol}.

79: \newblock Request for Comments 1058, Network Working Group, June 1988.

80:

81: \bibitem{rl-survey}

82: L.P. Kaelbling, M.L. Littman, and A.W. Moore.

83: \newblock {Reinforcement Learning: A Survey}.

84: \newblock {\em Journal of Artificial Intelligence Research}, Vol. 4:pages

85:   237--285, 1996.

86:

87: \bibitem{rfc2453}

88: G.~Malkin.

89: \newblock {RIP Version 2}.

90: \newblock Request for Comments 2453, Network Working Group, November 1998.

91:

92: \bibitem{mccalum-thesis}

93: A.K. McCallum.

94: \newblock {\em Reinforcement Learning with Selective Perception and Hidden

95:   State}.

96: \newblock PhD thesis, Department of Computer Science, University of Rochester,

97:   1995, revised 1996.

98:

99: \bibitem{rfc1247}

100: J.~Moy.

101: \newblock {OSPF Version 2}.

102: \newblock Request for Comments 1247, Network Working Group, July 1991.

103:

104: \bibitem{rfc1583}

105: J.~Moy.

106: \newblock {OSPF Version 2}.

107: \newblock Request for Comments 1583, Network Working Group, March 1994.

108:

109: \bibitem{irl}

110: A.Y. Ng and S.J. Russell.

111: \newblock {Algorithms for Inverse Reinforcement Learning}.

112: \newblock In {\em Machine Learning: Proceedings of the Seventeenth

113:   International Conference (ICML 2000)}, pages 663--670. Morgan Kaufmann, San

114:   Francisco, CA, June 2000.

115:

116: \bibitem{steenstrup}

117: M.~Steenstrup~(ed.).

118: \newblock {\em Routing in Communications Networks}.

119: \newblock Prentice Hall, 1995.

120:

121: \bibitem{ants}

122: D.~Subramanian, P.~Druschel, and J.~Chen.

123: \newblock {Ants and Reinforcement Learning: A Case Study in Routing in Dynamic

124:   Networks}.

125: \newblock In {\em Proceedings of the Fifteenth International Joint Conference

126:   on Artificial Intelligence (IJCAI'97)}, pages 832--839. Morgan Kaufmann, San

127:   Francisco, CA, 1997.

128:

129: \bibitem{rl-book}

130: R.S. Sutton and A.G. Barto.

131: \newblock {\em Reinforcement Learning: An Introduction}.

132: \newblock MIT Press, Cambridge, MA, 1998.

133:

134: \bibitem{mdva}

135: S.~Vutukury and J.J. Garcia-Luna-Aceves.

136: \newblock {MDVA: A Distance-Vector Multipath Routing Protocol}.

137: \newblock In {\em Proceedings of the IEEE INFOCOM Conference on Computer

138:   Communications}, pages 557--564. IEEE Press, 2001.

139:

140: \end{thebibliography}

141: