%----------------------------------------------------------------------------
% SUBMITTED / IN PREPARATION
%----------------------------------------------------------------------------
% Keys in this section end in two underscores where the published entries
% carry a two-digit year. The keywords field tags each entry (inpreparation,
% submitted, journal); presumably it drives filtering in the consuming
% document -- confirm there.

@misc{adgj__,
  author    = {Ani Anciaux-Sedrakian and Hugo Dorfsman and Thomas Guignon and Fabienne J{\'e}z{\'e}quel and Theo Mary},
  title     = {Mixed precision {BiCGstab} solvers for the solution of large sparse linear systems},
  note      = {In preparation},
  keywords  = {inpreparation},
}

@misc{bkmr__a,
  author    = {Marc Baboulin and Oguz Kaya and Theo Mary and Matthieu Robeyns},
  title     = {Numerical stability of tree tensor network operations, and a stable rounding algorithm},
  note      = {HAL EPrint hal-04996127},
  url       = {https://hal.science/hal-04996127},
  keywords  = {submitted},
}

@misc{efmr__,
  author    = {El Arar, El-Mehdi and Silviu Filip and Theo Mary and Elisa Riccietti},
  title     = {Mixed precision accumulation for neural network inference guided by componentwise forward error analysis},
  note      = {HAL EPrint hal-04995708},
  url       = {https://hal.science/hal-04995708},
  keywords  = {submitted},
}

@misc{bglm__,
  author    = {J{\'e}r{\'e}my Berthomieu and Stef Graillat and Dimitri Lesnoff and Theo Mary},
  title     = {Multiword matrix multiplication over large finite fields in floating-point arithmetic},
  note      = {HAL EPrint hal-04917201},
  url       = {https://hal.science/hal-04917201},
  keywords  = {submitted},
}

@misc{mami__,
  author    = {Theo Mary and Mantas Mikaitis},
  title     = {Error analysis of matrix multiplication with narrow range floating-point arithmetic},
  note      = {HAL EPrint hal-04671474; to appear in \textit{SIAM J. Sci. Comput.}.},
  url       = {https://hal.science/hal-04671474},
  keywords  = {journal},
}

@misc{mary__,
  author    = {Theo Mary},
  title     = {Error analysis of {Gramian}-based low-rank approximation (and why it is not as unstable as one may think)},
  note      = {HAL EPrint hal-04554516; to appear in \textit{SIAM J. Matrix Anal. Appl.}.},
  url       = {https://hal.science/hal-04554516},
  keywords  = {journal},
}

@misc{bhmv__,
  author    = {Alfredo Buttari and Nicholas J. Higham and Theo Mary and Bastien Vieubl{\'e}},
  title     = {A modular framework for the backward error analysis of {GMRES}},
  note      = {HAL EPrint hal-04525918},
  url       = {https://hal.science/hal-04525918},
  keywords  = {submitted},
}

@misc{jema__,
  author    = {Fabienne J{\'e}z{\'e}quel and Theo Mary},
  title     = {Probabilistic estimation of the accuracy of inner products and application to stochastic validation},
  note      = {HAL EPrint hal-04554459},
  url       = {https://hal.science/hal-04554459},
  keywords  = {submitted},
}

@misc{grma__,
  author    = {Stef Graillat and Theo Mary},
  title     = {{Condense and Distill}: fast distillation of large floating-point sums via condensation},
  note      = {HAL EPrint hal-04507609; to appear in \textit{SIAM J. Sci. Comput.}.},
  url       = {https://hal.science/hal-04507609},
  keywords  = {journal},
}

@misc{bbgm__,
  author    = {Th{\'e}o Beuzeville and Alfredo Buttari and Serge Gratton and Theo Mary},
  title     = {Deterministic and probabilistic backward error analysis of neural networks in floating-point arithmetic},
  note      = {HAL EPrint hal-04663142},
  url       = {https://hal.science/hal-04663142/},
  keywords  = {submitted},
}

@misc{gmr__,
  author    = {R{\'e}mi Gribonval and Theo Mary and Elisa Riccietti},
  title     = {Optimal quantization of rank-one matrices in floating-point arithmetic---with applications to butterfly factorizations},
  note      = {HAL EPrint hal-04125381},
  url       = {https://inria.hal.science/hal-04125381},
  keywords  = {submitted},
}

@misc{bkmr__,
  author    = {Marc Baboulin and Oguz Kaya and Theo Mary and Matthieu Robeyns},
  title     = {Mixed precision iterative refinement for low-rank matrix and tensor approximations},
  note      = {HAL EPrint hal-04115337},
  url       = {https://inria.hal.science/hal-04115337},
  keywords  = {submitted},
}

%----------------------------------------------------------------------------
% PUBLISHED
%----------------------------------------------------------------------------
% NOTE(review): the journal macros used below (j-SISC, j-SIMAX, j-TOMS,
% j-IJHPCA, j-RSOS, j-AN, j-IMAJNA, j-NLAA, j-GEO, j-GJI) are not defined in
% the part of the file visible here; presumably a separate strings file
% supplies them -- confirm it is loaded before this one.

@article{bmp25,
  author    = {Alfredo Buttari and Theo Mary and Andr{\'e} Pacteau},
  title     = {Truncated {QR} factorization with pivoting in mixed precision},
  journal   = j-SISC,
  volume    = {47},
  number    = {2},
  pages     = {B382--B401},
  year      = {2025},
  doi       = {10.1137/24M1644705},
  keywords  = {journal},
}

@inproceedings{bdkm24,
  author    = {Marc Baboulin and Simplice Donfack and Oguz Kaya and Theo Mary and Matthieu Robeyns},
  title     = {Mixed precision randomized low-rank approximation with {GPU} tensor cores},
  booktitle = {Euro-Par 2024: Parallel Processing},
  year      = {2024},
  publisher = {Springer Nature Switzerland},
  address   = {Cham},
  pages     = {31--44},
  doi       = {10.1007/978-3-031-69583-4_3},
  keywords  = {proceeding},
}

@inproceedings{gjmm24a,
  author    = {Stef Graillat and Fabienne J{\'e}z{\'e}quel and Theo Mary and Rom{\'e}o Molina and Daichi Mukunoki},
  title     = {Reduced-Precision and Reduced-Exponent Formats for Accelerating Adaptive Precision Sparse Matrix-Vector Product},
  booktitle = {Euro-Par 2024: Parallel Processing},
  year      = {2024},
  publisher = {Springer Nature Switzerland},
  address   = {Cham},
  pages     = {17--30},
  doi       = {10.1007/978-3-031-69583-4_2},
  keywords  = {proceeding},
}

@article{abbg24,
  author    = {Amestoy, P. R. and Boiteau, O. and Buttari, A. and Gerest, M. and J{\'e}z{\'e}quel, F. and L'Excellent, J.-Y. and Mary, T.},
  title     = {Communication avoiding block low-rank parallel multifrontal triangular solve with many right-hand sides},
  journal   = j-SIMAX,
  volume    = {45},
  number    = {1},
  pages     = {148--166},
  year      = {2024},
  doi       = {10.1137/23M1568600},
  keywords  = {journal},
}

@article{gjmm24,
  author    = {Stef Graillat and Fabienne J{\'e}z{\'e}quel and Theo Mary and Rom{\'e}o Molina},
  title     = {Adaptive precision sparse matrix-vector product and its application to {Krylov} solvers},
  journal   = j-SISC,
  volume    = {46},
  number    = {1},
  pages     = {C30--C56},
  year      = {2024},
  doi       = {10.1137/22M1522619},
  keywords  = {journal},
}

@article{abhl24,
  author    = {Amestoy, P. R. and Buttari, A. and Higham, N. J. and L'Excellent, J.-Y. and Mary, T. and Vieubl{\'e}, B.},
  title     = {Five-precision {GMRES}-based iterative refinement},
  journal   = j-SIMAX,
  volume    = {45},
  number    = {1},
  pages     = {529--552},
  year      = {2024},
  doi       = {10.1137/23M1549079},
  keywords  = {journal},
}

@article{abhl23,
  author    = {Patrick R. Amestoy and Alfredo Buttari and Nicholas J. Higham and Jean-Yves L'Excellent and Theo Mary and Bastien Vieubl{\'e}},
  title     = {Combining Sparse Approximate Factorizations with Mixed Precision Iterative Refinement},
  journal   = j-TOMS,
  year      = {2023},
  volume    = {49},
  number    = {1},
  doi       = {10.1145/3582493},
  keywords  = {journal},
}

@article{loma23,
  author    = {Lopez, F. and Mary, T.},
  title     = {{Mixed Precision {LU} Factorization on {GPU} Tensor Cores: Reducing Data Movement and Memory Footprint}},
  journal   = j-IJHPCA,
  volume    = {37},
  number    = {2},
  pages     = {165--179},
  year      = {2023},
  doi       = {10.1177/10943420221136848},
  keywords  = {journal},
}

@article{bglm23,
  author    = {J{\'e}r{\'e}my Berthomieu and Stef Graillat and Dimitri Lesnoff and Theo Mary},
  title     = {Modular Matrix Multiplication on {GPU} for Polynomial System Solving},
  journal   = {ACM Commun. Comput. Algebra},
  volume    = {57},
  number    = {2},
  pages     = {35--38},
  year      = {2023},
  doi       = {10.1145/3614408.3614411},
  keywords  = {journal},
}

% NOTE(review): the page range of oaab23 (146--228) looks inconsistent with
% its DOI suffix (tle42030173), which suggests a first page of 173 -- confirm
% against the publisher record.
@article{oaab23,
  author    = {S. Operto and Patrick R. Amestoy and Hossein Aghamiry and Stephen Beller and Alfredo Buttari and L. Combe and Victorita Dolean and Matthieu Gerest and Gaoshan Guo and Pierre Jolivet and Jean-Yves L'Excellent and Frichnel Mamfoumbi and Theo Mary and Chiara Puglisi and Alessandra Ribodetti and Pierre-Henri Tournier},
  title     = {Is {3D} frequency-domain {FWI} of full-azimuth/long-offset {OBN} data feasible? {The Gorgon} case study},
  journal   = {Leading Edge},
  volume    = {42},
  number    = {3},
  pages     = {146--228},
  year      = {2023},
  doi       = {10.1190/tle42030173.1},
  keywords  = {journal},
}

@misc{bbgm22,
  author    = {Th{\'e}o Beuzeville and Alfredo Buttari and Serge Gratton and Theo Mary and Erkan Ulker},
  title     = {Adversarial attacks via Sequential Quadratic Programming},
  note      = {HAL EPrint hal-03752184},
  year      = {2022},
  url       = {https://hal.archives-ouvertes.fr/hal-03752184/},
  keywords  = {submitted},
}

@misc{bbgm21,
  author    = {Th{\'e}o Beuzeville and Alfredo Buttari and Serge Gratton and Theo Mary and St{\'e}phane Pralet},
  title     = {Adversarial attacks via backward error analysis},
  note      = {HAL EPrint hal-03296180},
  year      = {2021},
  url       = {https://hal.science/hal-03296180},
  keywords  = {submitted},
}

@article{cfhm22,
  author    = {Matteo Croci and Massimiliano Fasi and Nicholas J. Higham and Theo Mary and Mantas Mikaitis},
  title     = {Stochastic Rounding: {Implementation}, Error Analysis and Applications},
  journal   = j-RSOS,
  volume    = {9},
  number    = {3},
  pages     = {1--25},
  year      = {2022},
  doi       = {10.1098/rsos.211631},
  keywords  = {journal},
}

@article{hima22,
  author    = {Nicholas J. Higham and Theo Mary},
  title     = {Mixed Precision Algorithms in Numerical Linear Algebra},
  journal   = j-AN,
  volume    = {31},
  pages     = {347--414},
  year      = {2022},
  doi       = {10.1017/s0962492922000022},
  keywords  = {journal},
}

@article{abbg22,
  author    = {Amestoy, P. R. and Boiteau, O. and Buttari, A. and Gerest, M. and J{\'e}z{\'e}quel, F. and L'Excellent, J.-Y. and Mary, T.},
  title     = {Mixed Precision Low Rank Approximations and their Application to Block Low Rank {LU} Factorization},
  journal   = j-IMAJNA,
  year      = {2022},
  volume    = {43},
  number    = {4},
  pages     = {2198--2227},
  doi       = {10.1093/imanum/drac037},
  keywords  = {journal},
}

% NOTE(review): fhlm23 carries no volume, number or pages, unlike the other
% journal entries here -- add them once confirmed against the DOI.
@article{fhlm23,
  author    = {Massimiliano Fasi and Nicholas J. Higham and Florent Lopez and Theo Mary and Mantas Mikaitis},
  title     = {Matrix Multiplication in Multiword Arithmetic: {Error} Analysis and Application to {GPU} Tensor Cores},
  journal   = j-SISC,
  doi       = {10.1137/21M1465032},
  year      = {2023},
  keywords  = {journal},
}

@article{bhlm21,
  author    = {Buttari, A. and Huber, M. and Leleux, P. and Mary, T. and Ruede, U. and Wohlmuth, B.},
  title     = {{Block Low Rank Single Precision Coarse Grid Solvers for Extreme Scale Multigrid Methods}},
  journal   = j-NLAA,
  year      = {2021},
  volume    = {29},
  number    = {1},
  doi       = {10.1002/nla.2407},
  keywords  = {journal},
}

@article{abm21,
  author    = {Ashcraft, C. and Buttari, A. and Mary, T.},
  title     = {{Block Low-Rank Matrices with Shared Bases: Potential and Limitations of the BLR$^2$ Format}},
  journal   = j-SIMAX,
  year      = {2021},
  volume    = {42},
  number    = {2},
  pages     = {990--1010},
  doi       = {10.1137/20M1386451},
  keywords  = {journal},
}

@article{hima21,
  author    = {Higham, N. J. and Mary, T.},
  title     = {{Solving Block Low-Rank Linear Systems by LU Factorization is Numerically Stable}},
  journal   = j-IMAJNA,
  year      = {2021},
  volume    = {42},
  number    = {2},
  pages     = {951--980},
  doi       = {10.1093/imanum/drab020},
  keywords  = {journal},
}

@article{chm21,
  author    = {Connolly, M. P. and Higham, N. J. and Mary, T.},
  title     = {{Stochastic Rounding and its Probabilistic Backward Error Analysis}},
  journal   = j-SISC,
  year      = {2021},
  volume    = {43},
  number    = {1},
  pages     = {A566--A585},
  doi       = {10.1137/20M1334796},
  keywords  = {journal},
}

@article{hima20,
  author    = {Higham, N. J. and Mary, T.},
  title     = {{Sharper Probabilistic Backward Error Analysis for Basic Linear Algebra Kernels with Random Data}},
  journal   = j-SISC,
  year      = {2020},
  volume    = {42},
  number    = {5},
  pages     = {A3427--A3446},
  doi       = {10.1137/20M1314355},
  urldoc    = {doc/SharperProbAna.pdf},
  keywords  = {journal},
}

@article{bhlm20,
  author    = {Blanchard, P. and Higham, N. J. and Lopez, F. and Mary, T. and Pranesh, S.},
  title     = {{Mixed Precision Block Fused Multiply-Add: Error Analysis and Application to GPU Tensor Cores}},
  journal   = j-SISC,
  year      = {2020},
  volume    = {42},
  number    = {3},
  pages     = {C124--C141},
  doi       = {10.1137/19M1289546},
  keywords  = {journal},
}

@article{bhm20,
  author    = {Blanchard, P. and Higham, N. J. and Mary, T.},
  title     = {{A Class of Fast and Accurate Summation Algorithms}},
  journal   = j-SISC,
  year      = {2020},
  volume    = {42},
  number    = {3},
  pages     = {A1541--A1557},
  doi       = {10.1137/19M1257780},
  keywords  = {journal},
}

@article{jmpr19,
  author    = {Jeannerod, C.-P. and Mary, T. and Pernet, C. and Roche, D. S.},
  title     = {Improving the Complexity of Block Low-Rank Factorizations with Fast Matrix Arithmetic},
  journal   = j-SIMAX,
  year      = {2019},
  volume    = {40},
  number    = {4},
  pages     = {1478--1496},
  doi       = {10.1137/19M1255628},
  keywords  = {journal},
}

@article{hima19a,
  author    = {Higham, N. J. and Mary, T.},
  title     = {{A New Approach to Probabilistic Rounding Error Analysis}},
  journal   = j-SISC,
  year      = {2019},
  volume    = {41},
  number    = {5},
  pages     = {A2815--A2835},
  doi       = {10.1137/18M1226312},
  keywords  = {journal},
}

@article{ablm19a,
  author    = {Amestoy, P. R. and Buttari, A. and L'Excellent, J.-Y. and Mary, T.},
  title     = {{Bridging the Gap between Flat and Hierarchical Low-rank Matrix Formats: the Multilevel Block Low-Rank Format}},
  journal   = j-SISC,
  year      = {2019},
  volume    = {41},
  number    = {3},
  pages     = {A1414--A1442},
  doi       = {10.1137/18M1182760},
  keywords  = {journal},
}

@article{gcgm19,
  author    = {Gorman, C. and Chavez, G. and Ghysels, P. and Mary, T. and Rouet, F.-H. and Li, X. S.},
  title     = {{Robust and Accurate Stopping Criteria for Adaptive Randomized Sampling in Matrix-Free Hierarchically Semiseparable Construction}},
  journal   = j-SISC,
  year      = {2019},
  volume    = {41},
  number    = {5},
  pages     = {S61--S85},
  doi       = {10.1137/18M1194961},
  keywords  = {journal},
}

@article{hima19,
  author    = {Higham, N. J. and Mary, T.},
  title     = {{A New Preconditioner that Exploits Low-Rank Approximations to Factorization Error}},
  journal   = j-SISC,
  volume    = {41},
  number    = {1},
  pages     = {A59--A82},
  year      = {2019},
  doi       = {10.1137/18M1182802},
  keywords  = {journal},
}

@article{ablm19,
  author    = {Amestoy, Patrick R. and Buttari, Alfredo and L'Excellent, Jean-Yves and Mary, Theo},
  title     = {{Performance and Scalability of the Block Low-Rank Multifrontal Factorization on Multicore Architectures}},
  journal   = j-TOMS,
  volume    = {45},
  number    = {1},
  year      = {2019},
  pages     = {2:1--2:26},
  doi       = {10.1145/3242094},
  keywords  = {journal},
}

@article{ablm17,
  author    = {Amestoy, P. R. and Buttari, A. and L'Excellent, J.-Y. and Mary, T.},
  title     = {{On the Complexity of the Block Low-Rank Multifrontal Factorization}},
  journal   = j-SISC,
  volume    = {39},
  number    = {4},
  pages     = {A1710--A1740},
  year      = {2017},
  doi       = {10.1137/16M1077192},
  keywords  = {journal},
}

@article{abbl16,
  author    = {Amestoy, P. R. and Brossier, R. and Buttari, A. and L'Excellent, J.-Y. and Mary, T. and M{\'e}tivier, L. and Miniussi, A. and Operto, S.},
  title     = {{Fast 3D frequency-domain full waveform inversion with a parallel Block Low-Rank multifrontal direct solver: application to OBC data from the North Sea}},
  journal   = j-GEO,
  year      = {2016},
  volume    = {81},
  number    = {6},
  pages     = {R363--R383},
  doi       = {10.1190/geo2016-0052.1},
  keywords  = {journal},
}

@article{sjka17,
  author    = {{Shantsev}, D. V. and {Jaysaval}, P. and {de la Kethulle de Ryhove}, S. and {Amestoy}, P. R. and {Buttari}, A. and {L'Excellent}, J.-Y. and {Mary}, T.},
  title     = {{Large-scale 3D EM modeling with a Block Low-Rank multifrontal direct solver}},
  journal   = j-GJI,
  year      = {2017},
  volume    = {209},
  number    = {3},
  pages     = {1558--1571},
  doi       = {10.1093/gji/ggx106},
  keywords  = {journal},
}

@inproceedings{abfl21,
  author    = {Amestoy, P. R. and Buttari, A. and Faucher, F. and L'Excellent, J.-Y. and Mary, T.},
  title     = {Recent work on sparse direct solvers to exploit numerical and structural properties of {HDG} discretizations},
  booktitle = {14th WCCM and ECCOMAS congress 2020, Paris, France},
  month     = jan,
  year      = {2021},
  keywords  = {proceeding},
}

@inproceedings{abfg22,
  author    = {Amestoy, P. R. and Buttari, A. and Faucher, F. and Gerest, M. and L'Excellent, J.-Y. and Mary, T.},
  title     = {Mixed precision sparse direct solver applied to {3D} wave propagation},
  booktitle = {ECCOMAS congress 2022, Oslo, Norway},
  month     = jun,
  year      = {2022},
  keywords  = {proceeding},
}

@phdthesis{mary17,
  author    = {Mary, T.},
  title     = {Block Low-Rank multifrontal solvers: complexity, performance, and scalability},
  school    = {Universit{\'e} de Toulouse},
  type      = {{P}h{D} Thesis},
  month     = nov,
  year      = {2017},
  urldoc    = {doc/thesis.pdf},
  keywords  = {thesis},
}

@inproceedings{abbl15,
  title     = {{3D frequency-domain seismic modeling with a Parallel BLR multifrontal direct solver}},
  author    = {Amestoy, P. R. and Brossier, R. and Buttari, A. and L'Excellent, J.-Y. and Mary, T. and M{\'e}tivier, L. and Miniussi, A. and Operto, S. and Virieux, J. and Weisbecker, C.},
  booktitle = {International Conference Society of Exploration Geophysicists (SEG) Annual Meeting},
  address   = {New Orleans, USA},
  year      = {2015},
  month     = oct,
  doi       = {10.1190/segam2015-5811693.1},
  keywords  = {proceeding},
}

@inproceedings{abbl15a,
  title     = {{Efficient 3D frequency-domain full-waveform inversion of ocean-bottom cable data with sparse block low-rank direct solver: a real data case study from the North Sea}},
  author    = {Amestoy, P. R. and Brossier, R. and Buttari, A. and L'Excellent, J.-Y. and Mary, T. and M{\'e}tivier, L. and Miniussi, A. and Operto, S. and Ribodetti, A. and Virieux, J. and Weisbecker, C.},
  booktitle = {International Conference Society of Exploration Geophysicists (SEG) Annual Meeting},
  address   = {New Orleans, USA},
  year      = {2015},
  month     = oct,
  doi       = {10.1190/segam2015-5713962.1},
  keywords  = {proceeding},
}

@inproceedings{mykl15,
  title     = {{Performance of Random Sampling for Computing Low-rank Approximations of a Dense Matrix on GPUs}},
  author    = {Mary, T. and Yamazaki, I. and Kurzak, J. and Luszczek, P. and Tomov, S. and Dongarra, J.},
  booktitle = {SC'15 - International Conference for High Performance Computing, Networking, Storage and Analysis},
  address   = {Austin, USA},
  year      = {2015},
  month     = nov,
  doi       = {10.1145/2807591.2807613},
  keywords  = {proceeding},
}

@inproceedings{ymkt14,
  author    = {Yamazaki, I. and Mary, T. and Kurzak, J. and Tomov, S. and Dongarra, J.},
  booktitle = {2014 IEEE International Conference on Big Data},
  title     = {Access-averse framework for computing low-rank matrix approximations},
  address   = {Washington, USA},
  year      = {2014},
  month     = oct,
  doi       = {10.1109/BigData.2014.7004374},
  keywords  = {proceeding},
}

@misc{mary19,
  author    = {Mary, T.},
  title     = {Pour quelques equations de plus},
  note      = {Article de vulgarisation scientifique dans le blog Binaire de lemonde.fr},
  year      = {2019},
  url       = {http://binaire.blog.lemonde.fr/2019/02/06/il-etait-une-fois-ma-these-pour-quelques-equations-de-plus/},
  keywords  = {popular},
}