1: \begin{thebibliography}{10}
2:
3: \bibitem{Aho:1974:DACA}
4: Alfred~V. Aho, John~E. Hopcroft, and Jeffrey~D. Ullman.
5: \newblock {\em The Design and Analysis of Computer Algorithms}.
6: \newblock Addison-Wesley, 1974.
7:
8: \bibitem{1999:lapack}
9: E.~Anderson, Z.~Bai, C.~Bischof, S.~Blackford, J.~Demmel, J.~Dongarra,
10: J.~Du~Croz, A.~Greenbaum, S.~Hammarling, A.~McKenney, and D.~Sorensen.
11: \newblock {\em {LAPACK} Users' Guide}.
12: \newblock Society for Industrial and Applied Mathematics, Philadelphia, PA,
13: third edition, 1999.
14:
15: \bibitem{Bini:1994:PMCFA}
16: Dario Bini and Victor Pan.
17: \newblock {\em Polynomial and Matrix Computations, Volume 1: Fundamental
18: Algorithms}.
19: \newblock Birkh{\"a}user, Boston, 1994.
20:
21: \bibitem{Brassel:2003:eccad}
22: Morgan Brassel, Pascal Giorgi, and Cl\'ement Pernet.
23: \newblock {LUdivine}: A symbolic block {LU} factorisation for matrices over
24: finite fields using {BLAS}, April 2003.
25: \newblock Poster,
26: \url{http://ljk.imag.fr/membres/Jean-Guillaume.Dumas/FFLAS/FFLAS_Download/ludivine_poster_eccad2003.ps.gz}.
28:
29: \bibitem{BunchHopcroft:1974}
30: James~R. Bunch and John~E. Hopcroft.
31: \newblock Triangular factorization and inversion by fast matrix multiplication.
32: \newblock {\em Mathematics of Computation}, 28:231--236, 1974.
33:
34: \bibitem{Storjohann:2003:ACA}
35: Zhuliang Chen and Arne Storjohann.
36: \newblock Effective reductions to matrix multiplication, July 2003.
37: \newblock ACA'2003, 9th International Conference on Applications of Computer
38: Algebra, Raleigh, North Carolina State University, USA.
39:
40: \bibitem{Coppersmith:1990:MMAP}
41: Don Coppersmith and Shmuel Winograd.
42: \newblock Matrix multiplication via arithmetic progressions.
43: \newblock {\em Journal of Symbolic Computation}, 9(3):251--280, 1990.
44:
45: \bibitem{Courrieu:2005:FMP}
46: Pierre Courrieu.
47: \newblock Fast computation of {Moore--Penrose} inverse matrices.
48: \newblock {\em Neural Information Processing -- Letters and Reviews},
49: 8(2):25--29, August 2005.
50:
51: \bibitem{Dixon:1982:Pad}
52: John~D. Dixon.
53: \newblock Exact solution of linear equations using $p$-adic expansions.
54: \newblock {\em Numerische Mathematik}, 40:137--141, 1982.
55:
56: \bibitem{Dongarra:2003:SANS}
57: Jack Dongarra and Victor Eijkhout.
58: \newblock Self-adapting numerical software and automatic tuning of heuristics.
59: \newblock {\em Lecture Notes in Computer Science}, 2660:759--770, January 2003.
60:
61: \bibitem{Dongarra:1990:BLAS}
62: Jack~J. Dongarra, Jeremy~Du Croz, Sven Hammarling, and Iain Duff.
63: \newblock A set of level 3 {Basic Linear Algebra Subprograms}.
64: \newblock {\em Transactions on Mathematical Software}, 16(1):1--17, March 1990.
65: \newblock \url{http://doi.acm.org/10.1145/77626.79170}.
66:
67: \bibitem{Douglas:1994:gemmw}
68: C.~C. Douglas, M.~Heroux, G.~Slishman, and R.~M. Smith.
69: \newblock {GEMMW}: A portable level~3 {BLAS} {Winograd} variant of {Strassen's}
70: matrix-matrix multiply algorithm.
71: \newblock {\em Journal of Computational Physics}, 110:1--10, 1994.
72:
73: \bibitem{DumGioPer:2006:ffpack}
74: Jean-Guillaume Dumas, Pascal Giorgi, and Cl\'ement Pernet.
75: \newblock {FFLAS-FFPACK}: Finite field linear algebra subroutine/package.
76: \newblock Software, \url{http://ciel.ccsd.cnrs.fr/ciel-00000025}, February
77: 2006.
78:
79: \bibitem{jgd:2004:dotprod}
80: Jean-Guillaume Dumas.
81: \newblock Efficient dot product over finite fields.
82: \newblock In Victor~G. Ganzha, Ernst~W. Mayr, and Evgenii~V. Vorozhtsov,
83: editors, {\em Proceedings of the seventh International Workshop on Computer
84: Algebra in Scientific Computing, Yalta, Ukraine}, pages 139--154. Technische
85: {Universit\"at} {M\"unchen}, Germany, July 2004.
86:
87: \bibitem{jgd:2007:dqt}
88: Jean-Guillaume Dumas.
89: \newblock Q-adic transform revisited.
90: \newblock Technical Report 0710.0510 [cs.SC], arXiv, October 2007.
91: \newblock \url{http://hal.archives-ouvertes.fr/hal-00173894}.
92:
93: \bibitem{jgd:2002:icms}
94: Jean-Guillaume Dumas, Thierry Gautier, Mark Giesbrecht, Pascal Giorgi, Bradford
95: Hovinen, Erich Kaltofen, B.~David Saunders, Will~J. Turner, and Gilles
96: Villard.
97: \newblock {LinBox}: A generic library for exact linear algebra.
98: \newblock In Arjeh~M. Cohen, Xiao-Shan Gao, and Nobuki Takayama, editors, {\em
99: Proceedings of the 2002 International Congress of Mathematical Software,
100: Beijing, China}, pages 40--50. World Scientific Pub, August 2002.
101:
102: \bibitem{jgd:2002:fflas}
103: Jean-Guillaume Dumas, Thierry Gautier, and Cl\'ement Pernet.
104: \newblock Finite field linear algebra subroutines.
105: \newblock In Teo Mora, editor, {\em Proceedings of the 2002 International
106: Symposium on Symbolic and Algebraic Computation, Lille, France}, pages
107: 63--74. ACM Press, New York, July 2002.
108:
109: \bibitem{jgd:2004:ffpack}
110: Jean-Guillaume Dumas, Pascal Giorgi, and Cl\'ement Pernet.
111: \newblock {FFPACK}: Finite field linear algebra package.
112: \newblock In Jaime Gutierrez, editor, {\em Proceedings of the 2004
113: International Symposium on Symbolic and Algebraic Computation, Santander,
114: Spain}, pages 119--126. ACM Press, New York, July 2004.
115:
116: \bibitem{jgd:2006:atrsm}
117: Jean-Guillaume Dumas, Cl\'ement Pernet, and Jean-Louis Roch.
118: \newblock Adaptive triangular system solving.
119: \newblock In {\em Challenges in Symbolic Computation Software}, October 2006.
120: \newblock Dagstuhl Seminar proceedings 06271, paper 770.
121:
122: \bibitem{jgd:2005:charp}
123: Jean-Guillaume Dumas, Cl\'ement Pernet, and Zhendong Wan.
124: \newblock Efficient computation of the characteristic polynomial.
125: \newblock In Manuel Kauers, editor, {\em Proceedings of the 2005 International
126: Symposium on Symbolic and Algebraic Computation, Beijing, China}, pages
127: 140--147. ACM Press, New York, July 2005.
128:
129: \bibitem{DumasPernet:2007:WinoSchedule}
130: Jean-Guillaume Dumas, Cl\'ement Pernet, and Wei Zhou.
131: \newblock Memory efficient scheduling of {Strassen--Winograd}'s matrix
132: multiplication algorithm.
133: \newblock Technical report, arXiv:0707.2347v2, August 2007.
134: \newblock \url{http://arxiv.org/abs/0707.2347v2}.
135:
136: \bibitem{jgd:2002:PComp}
137: Jean-Guillaume Dumas and Jean-Louis Roch.
138: \newblock On parallel block algorithms for exact triangularizations.
139: \newblock {\em Parallel Computing}, 28(11):1531--1548, November 2002.
140:
141: \bibitem{jgd:2001:jsc}
142: Jean-Guillaume Dumas, B.~David Saunders, and Gilles Villard.
143: \newblock On efficient sparse integer matrix {Smith} normal form computations.
144: \newblock {\em Journal of Symbolic Computation}, 32(1/2):71--99, July--August
145: 2001.
146:
147: \bibitem{VonzurGathen:1999:MCA}
148: Joachim~{von zur} Gathen and J{\"u}rgen Gerhard.
149: \newblock {\em Modern Computer Algebra}.
150: \newblock Cambridge University Press, New York, NY, USA, 1999.
151:
152: \bibitem{Giorgi:2003:ACA}
153: Pascal Giorgi.
154: \newblock From {BLAS} routines to finite field exact linear algebra solutions,
155: July 2003.
156: \newblock ACA'2003, 9th International Conference on Applications of Computer
157: Algebra, Raleigh, North Carolina State University, USA.
158:
159: \bibitem{Giorgi:2003:issac}
160: Pascal Giorgi, Claude-Pierre Jeannerod, and Gilles Villard.
161: \newblock On the complexity of polynomial matrix computations.
162: \newblock In Rafael Sendra, editor, {\em Proceedings of the 2003 International
163: Symposium on Symbolic and Algebraic Computation, Philadelphia, Pennsylvania,
164: USA}, pages 135--142. ACM Press, New York, August 2003.
165:
166: \bibitem{Golub:1996:MatrixC}
167: Gene~H. Golub and Charles~F. {Van Loan}.
168: \newblock {\em Matrix computations}.
169: \newblock Johns Hopkins Studies in the Mathematical Sciences. The Johns Hopkins
170: University Press, Baltimore, MD, USA, third edition, 1996.
171:
172: \bibitem{2002:gotoblas}
173: Kazushige Goto and Robert van~de Geijn.
174: \newblock On reducing {TLB} misses in matrix multiplication.
175: \newblock Technical Report TR-2002-55, University of Texas, November 2002.
176: \newblock FLAME working note \#9.
177:
178: \bibitem{Gustavson:1998:RBD}
179: F.~Gustavson, A.~Henriksson, I.~Jonsson, and B.~K{\aa}gstr{\"o}m.
180: \newblock Recursive blocked data formats and {BLAS's} for dense linear algebra
181: algorithms.
182: \newblock {\em Lecture Notes in Computer Science}, 1541:195--206, 1998.
183:
184: \bibitem{Higham:1990:EFM}
185: Nicholas~J. Higham.
186: \newblock Exploiting fast matrix multiplication within the level 3 {BLAS}.
187: \newblock {\em Transactions on Mathematical Software}, 16(4):352--368, December 1990.
188:
189: \bibitem{Huss-Lederman:1996:ISA}
190: Steven Huss-Lederman, Elaine~M. Jacobson, Jeremy~R. Johnson, Anna Tsao, and
191: Thomas Turnbull.
192: \newblock Implementation of {Strassen}'s algorithm for matrix multiplication.
193: \newblock In {\em Supercomputing '96 Conference Proceedings:
194: November 17--22, Pittsburgh, {PA}}, New York, NY, USA and
195: Silver Spring, MD, USA, 1996. ACM Press and IEEE
196: Computer Society Press.
197: \newblock \url{http://doi.acm.org/10.1145/369028.369096}.
198:
199: \bibitem{Huss-Lederman:1996:mai}
200: Steven Huss-Lederman, Elaine~M. Jacobson, Jeremy~R. Johnson, Anna Tsao, and
201: Thomas Turnbull.
202: \newblock {Strassen}'s algorithm for matrix multiplication: Modeling, analysis,
203: and implementation.
204: \newblock Technical report, Center for Computing Sciences, November 1996.
205: \newblock CCS-TR-96-17.
206:
207: \bibitem{Ibarra:1982:LSP}
208: Oscar~H. Ibarra, Shlomo Moran, and Roger Hui.
209: \newblock A generalization of the fast {LUP} matrix decomposition algorithm and
210: applications.
211: \newblock {\em Journal of Algorithms}, 3(1):45--56, March 1982.
212:
213: \bibitem{Kaltofen:2005:CCDet}
214: Erich Kaltofen and Gilles Villard.
215: \newblock On the complexity of computing determinants.
216: \newblock {\em Computational Complexity}, 13(3--4):91--130, 2005.
217:
218: \bibitem{Kaporin:2004:TCS}
219: Igor Kaporin.
220: \newblock The aggregation and cancellation techniques as a practical tool for
221: faster matrix multiplication.
222: \newblock {\em Theoretical Computer Science}, 315(2--3):469--510, 2004.
223:
224: \bibitem{Laderman:1992:PAA}
225: Julian Laderman, Victor Pan, and Xuan-He Sha.
226: \newblock On practical algorithms for accelerated matrix multiplication.
227: \newblock {\em Linear Algebra and its Applications}, 162--164:557--588, 1992.
228:
229: \bibitem{Montgomery:1985:MMT}
230: Peter~L. Montgomery.
231: \newblock Modular multiplication without trial division.
232: \newblock {\em Mathematics of Computation}, 44(170):519--521, April 1985.
233:
234: \bibitem{Montgomery:1995:BLA}
235: Peter~L. Montgomery.
236: \newblock A block {Lanczos} algorithm for finding dependencies over $\mathrm{GF}(2)$.
237: \newblock In Louis~C. Guillou and Jean-Jacques Quisquater, editors, {\em
238: Proceedings of the 1995 International Conference on the Theory and
239: Application of Cryptographic Techniques, Saint-Malo, France}, volume 921 of
240: {\em Lecture Notes in Computer Science}, pages 106--120, May 1995.
241:
242: \bibitem{Noble:1966:MCG}
243: Ben Noble.
244: \newblock A method for computing the generalized inverse of a matrix.
245: \newblock {\em SIAM Journal on Numerical Analysis}, 3(4):582--584, December
246: 1966.
247:
248: \bibitem{Odlyzko:2000:DLPF}
249: Andrew~M. Odlyzko.
250: \newblock Discrete logarithms: The past and the future.
251: \newblock {\em Designs, Codes, and Cryptography}, 19:129--145, 2000.
252:
253: \bibitem{Pernet:2001:Winograd}
254: Cl{\'e}ment Pernet.
255: \newblock Implementation of {Winograd}'s matrix multiplication over finite
256: fields using {ATLAS} level 3 {BLAS}.
257: \newblock Technical Report RR011122, Laboratoire Informatique et Distribution,
258: July 2001.
259: \newblock
260: \url{http://ljk.imag.fr/membres/Jean-Guillaume.Dumas/FFLAS/FFLAS_Download/FFLAS_technical_report.ps.gz}.
262:
263: \bibitem{Saunders:2001:BBLS}
264: B.~D. Saunders.
265: \newblock Black box methods for least squares problems.
266: \newblock In Bernard Mourrain, editor, {\em {ISSAC} 2001: July 22--25, 2001,
267: University of Western Ontario, London, Ontario, Canada: proceedings of the
268: 2001 International Symposium on Symbolic and Algebraic Computation}, pages
269: 297--302, 2001.
270:
271: \bibitem{Shoup:NTL}
272: Victor Shoup.
273: \newblock {NTL 5.3}: A library for doing number theory, 2002.
274: \newblock \url{http://www.shoup.net/ntl}.
275:
276: \bibitem{Storjohan:2005:HighOrder}
277: Arne Storjohann.
278: \newblock The shifted number system for fast linear algebra on integer
279: matrices.
280: \newblock {\em Journal of Complexity}, 21(4):609--650, 2005.
281:
282: \bibitem{Strassen:1969:GENO}
283: Volker Strassen.
284: \newblock {Gaussian} elimination is not optimal.
285: \newblock {\em Numerische Mathematik}, 13:354--356, 1969.
286:
287: \bibitem{Whaley:2001:AEO}
288: R.~Clint Whaley, Antoine Petitet, and Jack~J. Dongarra.
289: \newblock Automated empirical optimizations of software and the {ATLAS}
290: project.
291: \newblock {\em Parallel Computing}, 27(1--2):3--35, January 2001.
292: \newblock
293: \url{http://www.netlib.org/utk/people/JackDongarra/PAPERS/atlas_pub.pdf}.
294:
295: \bibitem{Zassenhaus:1978:RHF}
296: Hans Zassenhaus.
297: \newblock A remark on the {Hensel} factorization method.
298: \newblock {\em Mathematics of Computation}, 32(141):287--292, January 1978.
299:
300: \end{thebibliography}
301: