BibTeX records: James Demmel

download as .bib file

% Journal article, SIAM J. Matrix Anal. Appl. 44(1), 2023.
% "Jacobi" is braced so that sentence-casing styles keep the proper noun capitalised.
@article{DBLP:journals/siammax/Demmel23,
  author       = {Demmel, James},
  title        = {Nearly Optimal Block-{Jacobi} Preconditioning},
  journal      = {{SIAM} J. Matrix Anal. Appl.},
  volume       = {44},
  number       = {1},
  pages        = {408--413},
  year         = {2023},
  url          = {https://doi.org/10.1137/22m1504901},
  doi          = {10.1137/22M1504901},
  timestamp    = {Sun, 13 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siammax/Demmel23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, SIAM J. Matrix Anal. Appl. 44(2), 2023.
@article{DBLP:journals/siammax/DemmelGR23,
  author       = {Demmel, James and
                  Grigori, Laura and
                  Rusciano, Alexander},
  title        = {An Improved Analysis and Unified Perspective on Deterministic and
                  Randomized Low-Rank Matrix Approximation},
  journal      = {{SIAM} J. Matrix Anal. Appl.},
  volume       = {44},
  number       = {2},
  pages        = {559--591},
  year         = {2023},
  url          = {https://doi.org/10.1137/21m1391316},
  doi          = {10.1137/21M1391316},
  timestamp    = {Fri, 02 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siammax/DemmelGR23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, IPDPS 2023.
@inproceedings{DBLP:conf/ipps/ChoDKLLL23,
  author       = {Cho, Younghyun and
                  Demmel, James Weldon and
                  King, Jacob and
                  Li, Xiaoye S. and
                  Liu, Yang and
                  Luo, Hengrui},
  title        = {Harnessing the Crowd for Autotuning High-Performance Computing Applications},
  booktitle    = {{IEEE} International Parallel and Distributed Processing Symposium,
                  {IPDPS} 2023, St. Petersburg, FL, USA, May 15-19, 2023},
  pages        = {635--645},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/IPDPS54959.2023.00069},
  doi          = {10.1109/IPDPS54959.2023.00069},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/ChoDKLLL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, NeurIPS 2023; same title and authors as DBLP:journals/corr/abs-2301-12584.
% "Khatri-Rao" is braced so that sentence-casing styles keep the proper names capitalised.
@inproceedings{DBLP:conf/nips/BharadwajMMGBD23,
  author       = {Bharadwaj, Vivek and
                  Malik, Osman Asif and
                  Murray, Riley and
                  Grigori, Laura and
                  Bulu{\c{c}}, Aydin and
                  Demmel, James},
  editor       = {Oh, Alice and
                  Naumann, Tristan and
                  Globerson, Amir and
                  Saenko, Kate and
                  Hardt, Moritz and
                  Levine, Sergey},
  title        = {Fast Exact Leverage Score Sampling from {Khatri-Rao} Products with Applications
                  to Tensor Decomposition},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/959f70ee50044bed305e48e3484005a7-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BharadwajMMGBD23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2301.12584); same title and authors as DBLP:conf/nips/BharadwajMMGBD23.
% "Khatri-Rao" is braced against sentence-casing; the eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2301-12584,
  author       = {Bharadwaj, Vivek and
                  Malik, Osman Asif and
                  Murray, Riley and
                  Grigori, Laura and
                  Bulu{\c{c}}, Aydin and
                  Demmel, James},
  title        = {Fast Exact Leverage Score Sampling from {Khatri-Rao} Products with Applications
                  to Tensor Decomposition},
  journal      = {CoRR},
  volume       = {abs/2301.12584},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2301.12584},
  doi          = {10.48550/ARXIV.2301.12584},
  eprinttype   = {arXiv},
  eprint       = {2301.12584},
  timestamp    = {Wed, 01 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2301-12584.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2302.11474), 2023.
% The eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2302-11474,
  author       = {Murray, Riley and
                  Demmel, James and
                  Mahoney, Michael W. and
                  Erichson, N. Benjamin and
                  Melnichenko, Maksim and
                  Malik, Osman Asif and
                  Grigori, Laura and
                  Luszczek, Piotr and
                  Derezinski, Michal and
                  Lopes, Miles E. and
                  Liang, Tianyu and
                  Luo, Hengrui and
                  Dongarra, Jack J.},
  title        = {Randomized Numerical Linear Algebra : {A} Perspective on the Field
                  With an Eye to Software},
  journal      = {CoRR},
  volume       = {abs/2302.11474},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.11474},
  doi          = {10.48550/ARXIV.2302.11474},
  eprinttype   = {arXiv},
  eprint       = {2302.11474},
  timestamp    = {Fri, 24 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-11474.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2306.03700), 2023.
% The eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2306-03700,
  author       = {Demmel, James and
                  Dumitriu, Ioana and
                  Schneider, Ryan},
  title        = {Generalized Pseudospectral Shattering and Inverse-Free Matrix Pencil
                  Diagonalization},
  journal      = {CoRR},
  volume       = {abs/2306.03700},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.03700},
  doi          = {10.48550/ARXIV.2306.03700},
  eprinttype   = {arXiv},
  eprint       = {2306.03700},
  timestamp    = {Tue, 13 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-03700.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2306.13835), 2023.
% The eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2306-13835,
  author       = {Zou, Daniel and
                  Jin, Xinchen and
                  Yu, Xueyang and
                  Zhang, Hao and
                  Demmel, James},
  title        = {Computron: Serving Distributed Deep Learning Models with Model Parallel
                  Swapping},
  journal      = {CoRR},
  volume       = {abs/2306.13835},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.13835},
  doi          = {10.48550/ARXIV.2306.13835},
  eprinttype   = {arXiv},
  eprint       = {2306.13835},
  timestamp    = {Tue, 27 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-13835.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2308.15720), 2023.
% The eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2308-15720,
  author       = {Cho, Younghyun and
                  Demmel, James Weldon and
                  Derezinski, Michal and
                  Li, Haoyun and
                  Luo, Hengrui and
                  Mahoney, Michael W. and
                  Murray, Riley J.},
  title        = {Surrogate-based Autotuning for Randomized Sketching Algorithms in
                  Regression Problems},
  journal      = {CoRR},
  volume       = {abs/2308.15720},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.15720},
  doi          = {10.48550/ARXIV.2308.15720},
  eprinttype   = {arXiv},
  eprint       = {2308.15720},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-15720.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2310.15419), 2023.
% The eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2310-15419,
  author       = {Liang, Tianyu and
                  Murray, Riley and
                  Bulu{\c{c}}, Aydin and
                  Demmel, James},
  title        = {Fast multiplication of random dense matrices with fixed sparse matrices},
  journal      = {CoRR},
  volume       = {abs/2310.15419},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.15419},
  doi          = {10.48550/ARXIV.2310.15419},
  eprinttype   = {arXiv},
  eprint       = {2310.15419},
  timestamp    = {Tue, 31 Oct 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-15419.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2311.08316), 2023.
% "CholeskyQR" is braced so that sentence-casing styles do not flatten it to "Choleskyqr";
% the eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2311-08316,
  author       = {Melnichenko, Maksim and
                  Balabanov, Oleg and
                  Murray, Riley and
                  Demmel, James and
                  Mahoney, Michael W. and
                  Luszczek, Piotr},
  title        = {{CholeskyQR} with Randomization and Pivoting for Tall Matrices {(CQRRPT)}},
  journal      = {CoRR},
  volume       = {abs/2311.08316},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2311.08316},
  doi          = {10.48550/ARXIV.2311.08316},
  eprinttype   = {arXiv},
  eprint       = {2311.08316},
  timestamp    = {Tue, 21 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2311-08316.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper, Correctness workshop at SC 2022; same title as DBLP:journals/corr/abs-2207-09281.
@inproceedings{DBLP:conf/correctness/DemmelDGHLLLPRR22,
  author       = {Demmel, James and
                  Dongarra, Jack J. and
                  Gates, Mark and
                  Henry, Greg and
                  Langou, Julien and
                  Li, Xiaoye S. and
                  Luszczek, Piotr and
                  Pereira, Weslley S. and
                  Riedy, E. Jason and
                  Rubio{-}Gonz{\'{a}}lez, Cindy},
  editor       = {Laguna, Ignacio and
                  Rubio{-}Gonz{\'{a}}lez, Cindy},
  title        = {Proposed Consistent Exception Handling for the {BLAS} and {LAPACK}},
  booktitle    = {Sixth {IEEE/ACM} International Workshop on Software Correctness for
                  {HPC} Applications, Correctness@SC 2022, Dallas, TX, USA, November
                  13-18, 2022},
  pages        = {1--9},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/Correctness56720.2022.00006},
  doi          = {10.1109/CORRECTNESS56720.2022.00006},
  timestamp    = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/correctness/DemmelDGHLLLPRR22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, IPDPS 2022; same title and authors as DBLP:journals/corr/abs-2203-07673.
@inproceedings{DBLP:conf/ipps/BharadwajBD22,
  author       = {Bharadwaj, Vivek and
                  Bulu{\c{c}}, Aydin and
                  Demmel, James},
  title        = {Distributed-Memory Sparse Kernels for Machine Learning},
  booktitle    = {2022 {IEEE} International Parallel and Distributed Processing Symposium,
                  {IPDPS} 2022, Lyon, France, May 30 - June 3, 2022},
  pages        = {47--58},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/IPDPS53621.2022.00014},
  doi          = {10.1109/IPDPS53621.2022.00014},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ipps/BharadwajBD22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, PASC '22; same authors as the arXiv record DBLP:journals/corr/abs-2204-08279.
@inproceedings{DBLP:conf/pasc/ChenDDHH22,
  author       = {Chen, Anthony and
                  Demmel, James and
                  Dinh, Grace and
                  Haberle, Mason and
                  Holtz, Olga},
  editor       = {Robinson, Timothy},
  title        = {Communication bounds for convolutional neural networks},
  booktitle    = {{PASC} '22: Platform for Advanced Scientific Computing Conference,
                  Basel, Switzerland, June 27 - 29, 2022},
  pages        = {1:1--1:10},
  publisher    = {{ACM}},
  year         = {2022},
  url          = {https://doi.org/10.1145/3539781.3539784},
  doi          = {10.1145/3539781.3539784},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pasc/ChenDDHH22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2203.07673); same title and authors as DBLP:conf/ipps/BharadwajBD22.
% The eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2203-07673,
  author       = {Bharadwaj, Vivek and
                  Bulu{\c{c}}, Aydin and
                  Demmel, James},
  title        = {Distributed-Memory Sparse Kernels for Machine Learning},
  journal      = {CoRR},
  volume       = {abs/2203.07673},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.07673},
  doi          = {10.48550/ARXIV.2203.07673},
  eprinttype   = {arXiv},
  eprint       = {2203.07673},
  timestamp    = {Mon, 28 Mar 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-07673.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2204.08279); same authors as DBLP:conf/pasc/ChenDDHH22.
% The eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2204-08279,
  author       = {Chen, Anthony and
                  Demmel, James and
                  Dinh, Grace and
                  Haberle, Mason and
                  Holtz, Olga},
  title        = {Communication Bounds for Convolutional Neural Networks},
  journal      = {CoRR},
  volume       = {abs/2204.08279},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2204.08279},
  doi          = {10.48550/ARXIV.2204.08279},
  eprinttype   = {arXiv},
  eprint       = {2204.08279},
  timestamp    = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2204-08279.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2206.01409), 2022.
% "Bayesian" is braced so that sentence-casing styles keep it capitalised;
% the eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2206-01409,
  author       = {Luo, Hengrui and
                  Cho, Younghyun and
                  Demmel, James Weldon and
                  Li, Xiaoye S. and
                  Liu, Yang},
  title        = {Hybrid Models for Mixed Variables in {Bayesian} Optimization},
  journal      = {CoRR},
  volume       = {abs/2206.01409},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.01409},
  doi          = {10.48550/ARXIV.2206.01409},
  eprinttype   = {arXiv},
  eprint       = {2206.01409},
  timestamp    = {Fri, 03 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-01409.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2207.09281); same title as DBLP:conf/correctness/DemmelDGHLLLPRR22.
% The eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2207-09281,
  author       = {Demmel, James and
                  Dongarra, Jack J. and
                  Gates, Mark and
                  Henry, Greg and
                  Langou, Julien and
                  Li, Xiaoye S. and
                  Luszczek, Piotr and
                  da Silva Pereira, Weslley and
                  Riedy, E. Jason and
                  Rubio{-}Gonz{\'{a}}lez, Cindy},
  title        = {Proposed Consistent Exception Handling for the {BLAS} and {LAPACK}},
  journal      = {CoRR},
  volume       = {abs/2207.09281},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.09281},
  doi          = {10.48550/ARXIV.2207.09281},
  eprinttype   = {arXiv},
  eprint       = {2207.09281},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-09281.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2210.05105), 2022.
% The eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2210-05105,
  author       = {Bharadwaj, Vivek and
                  Malik, Osman Asif and
                  Murray, Riley and
                  Bulu{\c{c}}, Aydin and
                  Demmel, James},
  title        = {Distributed-Memory Randomized Algorithms for Sparse Tensor {CP} Decomposition},
  journal      = {CoRR},
  volume       = {abs/2210.05105},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.05105},
  doi          = {10.48550/ARXIV.2210.05105},
  eprinttype   = {arXiv},
  eprint       = {2210.05105},
  timestamp    = {Thu, 13 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-05105.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, CCF Trans. High Perform. Comput. 3(3), 2021.
@article{DBLP:journals/ccfthpc/YouHHVD21,
  author       = {You, Yang and
                  Huang, Jingyue and
                  Hsieh, Cho{-}Jui and
                  Vuduc, Richard W. and
                  Demmel, James},
  title        = {Communication-avoiding kernel ridge regression on parallel and distributed
                  systems},
  journal      = {{CCF} Trans. High Perform. Comput.},
  volume       = {3},
  number       = {3},
  pages        = {252--270},
  year         = {2021},
  url          = {https://doi.org/10.1007/s42514-021-00078-5},
  doi          = {10.1007/S42514-021-00078-5},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ccfthpc/YouHHVD21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Comput. Methods Appl. Math. 21(1), 2021.
@article{DBLP:journals/cmam/SolomonikD21,
  author       = {Solomonik, Edgar and
                  Demmel, James},
  title        = {Fast Bilinear Algorithms for Symmetric Tensor Contractions},
  journal      = {Comput. Methods Appl. Math.},
  volume       = {21},
  number       = {1},
  pages        = {211--231},
  year         = {2021},
  url          = {https://doi.org/10.1515/cmam-2019-0075},
  doi          = {10.1515/CMAM-2019-0075},
  timestamp    = {Tue, 23 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/cmam/SolomonikD21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, SIAM J. Sci. Comput. 43(2), 2021.
@article{DBLP:journals/siamsc/DasDFGMY21,
  author       = {Das, Swapnil and
                  Demmel, James and
                  Fountoulakis, Kimon and
                  Grigori, Laura and
                  Mahoney, Michael W. and
                  Yang, Shenghao},
  title        = {Parallel and Communication Avoiding Least Angle Regression},
  journal      = {{SIAM} J. Sci. Comput.},
  volume       = {43},
  number       = {2},
  pages        = {C154--C176},
  year         = {2021},
  url          = {https://doi.org/10.1137/19M1305720},
  doi          = {10.1137/19M1305720},
  timestamp    = {Tue, 05 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siamsc/DasDFGMY21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, SIAM J. Sci. Comput. 43(5), 2021.
@article{DBLP:journals/siamsc/SolomonikDH21,
  author       = {Solomonik, Edgar and
                  Demmel, James and
                  Hoefler, Torsten},
  title        = {Communication Lower Bounds of Bilinear Algorithms for Symmetric Tensor
                  Contractions},
  journal      = {{SIAM} J. Sci. Comput.},
  volume       = {43},
  number       = {5},
  pages        = {A3328--A3356},
  year         = {2021},
  url          = {https://doi.org/10.1137/20M1338599},
  doi          = {10.1137/20M1338599},
  timestamp    = {Fri, 03 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/siamsc/SolomonikDH21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper, IPDPS Workshops 2021; same title as DBLP:journals/corr/abs-2011-00071.
% "EfficientNets" and "ImageNet" are braced so that sentence-casing styles keep their
% internal capitals.
@inproceedings{DBLP:conf/ipps/WongpanichPDTLY21,
  author       = {Wongpanich, Arissa and
                  Pham, Hieu and
                  Demmel, James and
                  Tan, Mingxing and
                  Le, Quoc V. and
                  You, Yang and
                  Kumar, Sameer},
  title        = {Training {EfficientNets} at Supercomputer Scale: 83{\%} {ImageNet} Top-1
                  Accuracy in One Hour},
  booktitle    = {{IEEE} International Parallel and Distributed Processing Symposium
                  Workshops, {IPDPS} Workshops 2021, Portland, OR, USA, June 17-21,
                  2021},
  pages        = {947--950},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/IPDPSW52791.2021.00146},
  doi          = {10.1109/IPDPSW52791.2021.00146},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/WongpanichPDTLY21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ISCA 2021; same title as DBLP:journals/corr/abs-2105-01898.
% "CoSA" is braced so that sentence-casing styles do not flatten it to "Cosa".
@inproceedings{DBLP:conf/isca/0001KKDDWNS21,
  author       = {Huang, Qijing and
                  Kalaiah, Aravind and
                  Kang, Minwoo and
                  Demmel, James and
                  Dinh, Grace and
                  Wawrzynek, John and
                  Norell, Thomas and
                  Shao, Yakun Sophia},
  title        = {{CoSA}: Scheduling by Constrained Optimization for Spatial Accelerators},
  booktitle    = {48th {ACM/IEEE} Annual International Symposium on Computer Architecture,
                  {ISCA} 2021, Virtual Event / Valencia, Spain, June 14-18, 2021},
  pages        = {554--566},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ISCA52012.2021.00050},
  doi          = {10.1109/ISCA52012.2021.00050},
  timestamp    = {Mon, 19 Feb 2024 07:32:07 +0100},
  biburl       = {https://dblp.org/rec/conf/isca/0001KKDDWNS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, MCSoC 2021.
@inproceedings{DBLP:conf/mcsoc/ChoDLLL21,
  author       = {Cho, Younghyun and
                  Demmel, James and
                  Li, Xiaoye S. and
                  Liu, Yang and
                  Luo, Hengrui},
  title        = {Enhancing Autotuning Capability with a History Database},
  booktitle    = {14th {IEEE} International Symposium on Embedded Multicore/Many-core
                  Systems-on-Chip, MCSoC 2021, Singapore, Singapore, December 20-23,
                  2021},
  pages        = {249--257},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/MCSoC51149.2021.00044},
  doi          = {10.1109/MCSOC51149.2021.00044},
  timestamp    = {Sat, 26 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/mcsoc/ChoDLLL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, PPoPP '21.
% "GPTune" is braced so that sentence-casing styles do not flatten it to "Gptune".
@inproceedings{DBLP:conf/ppopp/0179SMZMDL21,
  author       = {Liu, Yang and
                  Sid{-}Lakhdar, Wissam M. and
                  Marques, Osni and
                  Zhu, Xinran and
                  Meng, Chang and
                  Demmel, James Weldon and
                  Li, Xiaoye S.},
  editor       = {Lee, Jaejin and
                  Petrank, Erez},
  title        = {{GPTune}: multitask learning for autotuning exascale applications},
  booktitle    = {PPoPP '21: 26th {ACM} {SIGPLAN} Symposium on Principles and Practice
                  of Parallel Programming, Virtual Event, Republic of Korea, February
                  27- March 3, 2021},
  pages        = {234--246},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://doi.org/10.1145/3437801.3441621},
  doi          = {10.1145/3437801.3441621},
  timestamp    = {Sun, 06 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ppopp/0179SMZMDL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, PPoPP '21.
@inproceedings{DBLP:conf/ppopp/HanSDY21,
  author       = {Han, Ruobing and
                  Si, Min and
                  Demmel, James and
                  You, Yang},
  editor       = {Lee, Jaejin and
                  Petrank, Erez},
  title        = {Dynamic scaling for low-precision learning},
  booktitle    = {PPoPP '21: 26th {ACM} {SIGPLAN} Symposium on Principles and Practice
                  of Parallel Programming, Virtual Event, Republic of Korea, February
                  27- March 3, 2021},
  pages        = {480--482},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://doi.org/10.1145/3437801.3441624},
  doi          = {10.1145/3437801.3441624},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ppopp/HanSDY21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ISC High Performance 2021 (Lecture Notes in Computer Science 12728).
@inproceedings{DBLP:conf/supercomputer/HanDY21,
  author       = {Han, Ruobing and
                  Demmel, James and
                  You, Yang},
  editor       = {Chamberlain, Bradford L. and
                  Varbanescu, Ana Lucia and
                  Ltaief, Hatem and
                  Luszczek, Piotr},
  title        = {Auto-Precision Scaling for Distributed Deep Learning},
  booktitle    = {High Performance Computing - 36th International Conference, {ISC}
                  High Performance 2021, Virtual Event, June 24 - July 2, 2021, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {12728},
  pages        = {79--97},
  publisher    = {Springer},
  year         = {2021},
  url          = {https://doi.org/10.1007/978-3-030-78713-4\_5},
  doi          = {10.1007/978-3-030-78713-4\_5},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/supercomputer/HanDY21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2105.01898); same title as DBLP:conf/isca/0001KKDDWNS21.
% "CoSA" is braced so that sentence-casing styles do not flatten it to "Cosa";
% the eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2105-01898,
  author       = {Huang, Qijing and
                  Kang, Minwoo and
                  Dinh, Grace and
                  Norell, Thomas and
                  Kalaiah, Aravind and
                  Demmel, James and
                  Wawrzynek, John and
                  Shao, Yakun Sophia},
  title        = {{CoSA}: Scheduling by Constrained Optimization for Spatial Accelerators},
  journal      = {CoRR},
  volume       = {abs/2105.01898},
  year         = {2021},
  url          = {https://arxiv.org/abs/2105.01898},
  eprinttype   = {arXiv},
  eprint       = {2105.01898},
  timestamp    = {Wed, 12 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-01898.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2109.07563), 2021.
% "Bayesian" is braced so that sentence-casing styles keep it capitalised;
% the eprinttype "=" is realigned with the other fields.
@article{DBLP:journals/corr/abs-2109-07563,
  author       = {Luo, Hengrui and
                  Demmel, James Weldon and
                  Cho, Younghyun and
                  Li, Xiaoye S. and
                  Liu, Yang},
  title        = {Non-smooth {Bayesian} Optimization in Tuning Problems},
  journal      = {CoRR},
  volume       = {abs/2109.07563},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.07563},
  eprinttype   = {arXiv},
  eprint       = {2109.07563},
  timestamp    = {Sat, 26 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-07563.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Knowl. Inf. Syst. 62(11), 2020.
@article{DBLP:journals/kais/YouHRWHKD20,
  author       = {You, Yang and
                  He, Yuxiong and
                  Rajbhandari, Samyam and
                  Wang, Wenhan and
                  Hsieh, Cho{-}Jui and
                  Keutzer, Kurt and
                  Demmel, James},
  title        = {Fast {LSTM} by dynamic decomposition on cloud and distributed systems},
  journal      = {Knowl. Inf. Syst.},
  volume       = {62},
  number       = {11},
  pages        = {4169--4197},
  year         = {2020},
  url          = {https://doi.org/10.1007/s10115-020-01487-8},
  doi          = {10.1007/S10115-020-01487-8},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/kais/YouHRWHKD20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, ACM Trans. Math. Softw. 46(2), 2020.
@article{DBLP:journals/toms/MarquesDV20,
  author       = {Marques, Osni and
                  Demmel, James and
                  Vasconcelos, Paulo B.},
  title        = {Bidiagonal {SVD} Computation via an Associated Tridiagonal Eigenproblem},
  journal      = {{ACM} Trans. Math. Softw.},
  volume       = {46},
  number       = {2},
  pages        = {14:1--14:25},
  year         = {2020},
  url          = {https://doi.org/10.1145/3361746},
  doi          = {10.1145/3361746},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/toms/MarquesDV20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, ACM Trans. Math. Softw. 46(3), 2020.
@article{DBLP:journals/toms/AhrensDN20,
  author       = {Ahrens, Willow and
                  Demmel, James and
                  Nguyen, Hong Diep},
  title        = {Algorithms for Efficient Reproducible Floating Point Summation},
  journal      = {{ACM} Trans. Math. Softw.},
  volume       = {46},
  number       = {3},
  pages        = {22:1--22:49},
  year         = {2020},
  url          = {https://doi.org/10.1145/3389360},
  doi          = {10.1145/3389360},
  timestamp    = {Tue, 05 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/toms/AhrensDN20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, HiPC 2020.
@inproceedings{DBLP:conf/hipc/DevarakondaD20,
  author       = {Devarakonda, Aditya and
                  Demmel, James},
  title        = {Avoiding Communication in Logistic Regression},
  booktitle    = {27th {IEEE} International Conference on High Performance Computing,
                  Data, and Analytics, HiPC 2020, Pune, India, December 16-19, 2020},
  pages        = {91--100},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/HiPC50609.2020.00023},
  doi          = {10.1109/HIPC50609.2020.00023},
  timestamp    = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/hipc/DevarakondaD20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, HPC Asia 2020.
@inproceedings{DBLP:conf/hpcasia/WongpanichYD20,
  author       = {Wongpanich, Arissa and
                  You, Yang and
                  Demmel, James},
  title        = {Rethinking the Value of Asynchronous Solvers for Distributed Deep
                  Learning},
  booktitle    = {Proceedings of the International Conference on High Performance Computing
                  in Asia-Pacific Region, {HPC} Asia 2020, Fukuoka, Japan, January 15-17,
                  2020},
  pages        = {52--60},
  publisher    = {{ACM}},
  year         = {2020},
  url          = {https://doi.org/10.1145/3368474.3368498},
  doi          = {10.1145/3368474.3368498},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/hpcasia/WongpanichYD20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICLR 2020 (OpenReview URL only; the record carries no doi field).
@inproceedings{DBLP:conf/iclr/YouLRHKBSDKH20,
  author       = {You, Yang and
                  Li, Jing and
                  Reddi, Sashank J. and
                  Hseu, Jonathan and
                  Kumar, Sanjiv and
                  Bhojanapalli, Srinadh and
                  Song, Xiaodan and
                  Demmel, James and
                  Keutzer, Kurt and
                  Hsieh, Cho{-}Jui},
  title        = {Large Batch Optimization for Deep Learning: Training {BERT} in 76
                  minutes},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=Syx4wnEtvH},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iclr/YouLRHKBSDKH20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, SPAA '20; same title and authors as DBLP:journals/corr/abs-2003-00119.
@inproceedings{DBLP:conf/spaa/DinhD20,
  author       = {Dinh, Grace and
                  Demmel, James},
  editor       = {Scheideler, Christian and
                  Spear, Michael},
  title        = {Communication-Optimal Tilings for Projective Nested Loops with Arbitrary
                  Bounds},
  booktitle    = {{SPAA} '20: 32nd {ACM} Symposium on Parallelism in Algorithms and
                  Architectures, Virtual Event, USA, July 15-17, 2020},
  pages        = {523--525},
  publisher    = {{ACM}},
  year         = {2020},
  url          = {https://doi.org/10.1145/3350755.3400275},
  doi          = {10.1145/3350755.3400275},
  timestamp    = {Sun, 12 Jul 2020 18:55:23 +0200},
  biburl       = {https://dblp.org/rec/conf/spaa/DinhD20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-00119,
  author     = {Dinh, Grace and
                Demmel, James},
  title      = {Communication-Optimal Tilings for Projective Nested Loops with Arbitrary
                Bounds},
  journal    = {CoRR},
  volume     = {abs/2003.00119},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.00119},
  eprinttype = {arXiv},
  eprint     = {2003.00119},
  timestamp  = {Tue, 10 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-00119.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2006-08517,
  author     = {You, Yang and
                Wang, Yuhui and
                Zhang, Huan and
                Zhang, Zhao and
                Demmel, James and
                Hsieh, Cho{-}Jui},
  title      = {The Limit of the Batch Size},
  journal    = {CoRR},
  volume     = {abs/2006.08517},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.08517},
  eprinttype = {arXiv},
  eprint     = {2006.08517},
  timestamp  = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-08517.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2011-00071,
  author       = {Arissa Wongpanich and
                  Hieu Pham and
                  James Demmel and
                  Mingxing Tan and
                  Quoc V. Le and
                  Yang You and
                  Sameer Kumar},
  title        = {Training {EfficientNets} at Supercomputer Scale: 83{\%} {ImageNet} Top-1
                  Accuracy in One Hour},
  journal      = {CoRR},
  volume       = {abs/2011.00071},
  year         = {2020},
  url          = {https://arxiv.org/abs/2011.00071},
  eprinttype   = {arXiv},
  eprint       = {2011.00071},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2011-00071.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2011-08281,
  author     = {Devarakonda, Aditya and
                Demmel, James},
  title      = {Avoiding Communication in Logistic Regression},
  journal    = {CoRR},
  volume     = {abs/2011.08281},
  year       = {2020},
  url        = {https://arxiv.org/abs/2011.08281},
  eprinttype = {arXiv},
  eprint     = {2011.08281},
  timestamp  = {Wed, 18 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-08281.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/siamsc/DevarakondaFDM19,
  author    = {Devarakonda, Aditya and
               Fountoulakis, Kimon and
               Demmel, James and
               Mahoney, Michael W.},
  title     = {Avoiding Communication in Primal and Dual Block Coordinate Descent
               Methods},
  journal   = {{SIAM} J. Sci. Comput.},
  volume    = {41},
  number    = {1},
  pages     = {C1--C27},
  year      = {2019},
  url       = {https://doi.org/10.1137/17M1134433},
  doi       = {10.1137/17M1134433},
  timestamp = {Thu, 30 Jul 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/siamsc/DevarakondaFDM19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/tpds/YouZHDK19,
  author       = {Yang You and
                  Zhao Zhang and
                  Cho{-}Jui Hsieh and
                  James Demmel and
                  Kurt Keutzer},
  title        = {Fast Deep Neural Network Training on Distributed Systems and Cloud
                  {TPUs}},
  journal      = {{IEEE} Trans. Parallel Distributed Syst.},
  volume       = {30},
  number       = {11},
  pages        = {2449--2462},
  year         = {2019},
  url          = {https://doi.org/10.1109/TPDS.2019.2913833},
  doi          = {10.1109/TPDS.2019.2913833},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tpds/YouZHDK19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icdm/YouHRWHKD19,
  author    = {You, Yang and
               He, Yuxiong and
               Rajbhandari, Samyam and
               Wang, Wenhan and
               Hsieh, Cho{-}Jui and
               Keutzer, Kurt and
               Demmel, James},
  editor    = {Wang, Jianyong and
               Shim, Kyuseok and
               Wu, Xindong},
  title     = {Fast {LSTM} Inference by Dynamic Decomposition on Cloud Systems},
  booktitle = {2019 {IEEE} International Conference on Data Mining, {ICDM} 2019,
               Beijing, China, November 8-11, 2019},
  pages     = {748--757},
  publisher = {{IEEE}},
  year      = {2019},
  url       = {https://doi.org/10.1109/ICDM.2019.00085},
  doi       = {10.1109/ICDM.2019.00085},
  timestamp = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icdm/YouHRWHKD19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/YouHYDKH19,
  author    = {You, Yang and
               Hseu, Jonathan and
               Ying, Chris and
               Demmel, James and
               Keutzer, Kurt and
               Hsieh, Cho{-}Jui},
  editor    = {Taufer, Michela and
               Balaji, Pavan and
               Pe{\~{n}}a, Antonio J.},
  title     = {Large-batch training for {LSTM} and beyond},
  booktitle = {Proceedings of the International Conference for High Performance Computing,
               Networking, Storage and Analysis, {SC} 2019, Denver, Colorado, USA,
               November 17-19, 2019},
  pages     = {9:1--9:16},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3295500.3356137},
  doi       = {10.1145/3295500.3356137},
  timestamp = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/YouHYDKH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1901-08256,
  author       = {Yang You and
                  Jonathan Hseu and
                  Chris Ying and
                  James Demmel and
                  Kurt Keutzer and
                  Cho{-}Jui Hsieh},
  title        = {Large-Batch Training for {LSTM} and Beyond},
  journal      = {CoRR},
  volume       = {abs/1901.08256},
  year         = {2019},
  url          = {https://arxiv.org/abs/1901.08256},
  eprinttype   = {arXiv},
  eprint       = {1901.08256},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-08256.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1904-00962,
  author       = {Yang You and
                  Jing Li and
                  Jonathan Hseu and
                  Xiaodan Song and
                  James Demmel and
                  Cho{-}Jui Hsieh},
  title        = {Reducing {BERT} Pre-Training Time from 3 Days to 76 Minutes},
  journal      = {CoRR},
  volume       = {abs/1904.00962},
  year         = {2019},
  url          = {https://arxiv.org/abs/1904.00962},
  eprinttype   = {arXiv},
  eprint       = {1904.00962},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-00962.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-11340,
  author       = {Swapnil Das and
                  Jim Demmel and
                  Kimon Fountoulakis and
                  Laura Grigori and
                  Michael W. Mahoney},
  title        = {Parallel and Communication Avoiding Least Angle Regression},
  journal      = {CoRR},
  volume       = {abs/1905.11340},
  year         = {2019},
  url          = {https://arxiv.org/abs/1905.11340},
  eprinttype   = {arXiv},
  eprint       = {1905.11340},
  timestamp    = {Wed, 12 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-11340.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1908-05792,
  author       = {Wissam M. Sid{-}Lakhdar and
                  Mohsen Mahmoudi Aznaveh and
                  Xiaoye S. Li and
                  James Weldon Demmel},
  title        = {Multitask and Transfer Learning for Autotuning Exascale Applications},
  journal      = {CoRR},
  volume       = {abs/1908.05792},
  year         = {2019},
  url          = {https://arxiv.org/abs/1908.05792},
  eprinttype   = {arXiv},
  eprint       = {1908.05792},
  timestamp    = {Mon, 19 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1908-05792.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-06524,
  author       = {Grey Ballard and
                  James Demmel and
                  Ioana Dumitriu and
                  Alexander Rusciano},
  title        = {A Generalized Randomized Rank-Revealing Factorization},
  journal      = {CoRR},
  volume       = {abs/1909.06524},
  year         = {2019},
  url          = {https://arxiv.org/abs/1909.06524},
  eprinttype   = {arXiv},
  eprint       = {1909.06524},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-06524.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-00223,
  author       = {James Demmel and
                  Laura Grigori and
                  Alexander Rusciano},
  title        = {An improved analysis and unified perspective on deterministic and
                  randomized low rank matrix approximations},
  journal      = {CoRR},
  volume       = {abs/1910.00223},
  year         = {2019},
  url          = {https://arxiv.org/abs/1910.00223},
  eprinttype   = {arXiv},
  eprint       = {1910.00223},
  timestamp    = {Fri, 04 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-00223.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1911-08907,
  author       = {Ruobing Han and
                  Yang You and
                  James Demmel},
  title        = {Auto-Precision Scaling for Distributed Deep Learning},
  journal      = {CoRR},
  volume       = {abs/1911.08907},
  year         = {2019},
  url          = {https://arxiv.org/abs/1911.08907},
  eprinttype   = {arXiv},
  eprint       = {1911.08907},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-08907.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siamsc/GrigoriCD18,
  author    = {Grigori, Laura and
               Cayrols, S{\'{e}}bastien and
               Demmel, James Weldon},
  title     = {Low Rank Approximation of a Sparse Matrix Based on {LU} Factorization
               with Column and Row Tournament Pivoting},
  journal   = {{SIAM} J. Sci. Comput.},
  volume    = {40},
  number    = {2},
  year      = {2018},
  url       = {https://doi.org/10.1137/16M1074527},
  doi       = {10.1137/16M1074527},
  timestamp = {Wed, 16 Sep 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/siamsc/GrigoriCD18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/arith/RiedyD18,
  author    = {Riedy, E. Jason and
               Demmel, James},
  title     = {Augmented Arithmetic Operations Proposed for {IEEE-754} 2018},
  booktitle = {25th {IEEE} Symposium on Computer Arithmetic, {ARITH} 2018, Amherst,
               MA, USA, June 25-27, 2018},
  pages     = {45--52},
  publisher = {{IEEE}},
  year      = {2018},
  url       = {https://doi.org/10.1109/ARITH.2018.8464813},
  doi       = {10.1109/ARITH.2018.8464813},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/arith/RiedyD18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icpp/YouZHDK18,
  author       = {Yang You and
                  Zhao Zhang and
                  Cho{-}Jui Hsieh and
                  James Demmel and
                  Kurt Keutzer},
  title        = {{ImageNet} Training in Minutes},
  booktitle    = {Proceedings of the 47th International Conference on Parallel Processing,
                  {ICPP} 2018, Eugene, OR, USA, August 13-16, 2018},
  pages        = {1:1--1:10},
  publisher    = {{ACM}},
  year         = {2018},
  url          = {https://doi.org/10.1145/3225058.3225069},
  doi          = {10.1145/3225058.3225069},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icpp/YouZHDK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icpp/SooriDBDGD18,
  author    = {Soori, Saeed and
               Devarakonda, Aditya and
               Blanco, Zachary and
               Demmel, James and
               G{\"{u}}rb{\"{u}}zbalaban, Mert and
               Dehnavi, Maryam Mehri},
  title     = {Reducing Communication in Proximal Newton Methods for Sparse Least
               Squares Problems},
  booktitle = {Proceedings of the 47th International Conference on Parallel Processing,
               {ICPP} 2018, Eugene, OR, USA, August 13-16, 2018},
  pages     = {22:1--22:10},
  publisher = {{ACM}},
  year      = {2018},
  url       = {https://doi.org/10.1145/3225058.3225131},
  doi       = {10.1145/3225058.3225131},
  timestamp = {Mon, 16 Sep 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icpp/SooriDBDGD18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ics/YouDHV18,
  author    = {You, Yang and
               Demmel, James and
               Hsieh, Cho{-}Jui and
               Vuduc, Richard W.},
  title     = {Accurate, Fast and Scalable Kernel Ridge Regression on Parallel and
               Distributed Systems},
  booktitle = {Proceedings of the 32nd International Conference on Supercomputing,
               {ICS} 2018, Beijing, China, June 12-15, 2018},
  pages     = {307--317},
  publisher = {{ACM}},
  year      = {2018},
  url       = {https://doi.org/10.1145/3205289.3205290},
  doi       = {10.1145/3205289.3205290},
  timestamp = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ics/YouDHV18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ipps/DevarakondaFDM18,
  author    = {Devarakonda, Aditya and
               Fountoulakis, Kimon and
               Demmel, James and
               Mahoney, Michael W.},
  title     = {Avoiding Synchronization in First-Order Methods for Sparse Convex
               Optimization},
  booktitle = {2018 {IEEE} International Parallel and Distributed Processing Symposium,
               {IPDPS} 2018, Vancouver, BC, Canada, May 21-25, 2018},
  pages     = {409--418},
  publisher = {{IEEE} Computer Society},
  year      = {2018},
  url       = {https://doi.org/10.1109/IPDPS.2018.00051},
  doi       = {10.1109/IPDPS.2018.00051},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/DevarakondaFDM18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/spaa/BallardDGJK18,
  author       = {Grey Ballard and
                  James Demmel and
                  Laura Grigori and
                  Mathias Jacquelin and
                  Nicholas Knight},
  editor       = {Christian Scheideler and
                  Jeremy T. Fineman},
  title        = {A {3D} Parallel Algorithm for {QR} Decomposition},
  booktitle    = {Proceedings of the 30th on Symposium on Parallelism in Algorithms
                  and Architectures, {SPAA} 2018, Vienna, Austria, July 16-18, 2018},
  pages        = {55--65},
  publisher    = {{ACM}},
  year         = {2018},
  url          = {https://doi.org/10.1145/3210377.3210415},
  doi          = {10.1145/3210377.3210415},
  timestamp    = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/spaa/BallardDGJK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-06905,
  author       = {James Demmel and
                  Grace Dinh},
  title        = {Communication-Optimal Convolutional Neural Nets},
  journal      = {CoRR},
  volume       = {abs/1802.06905},
  year         = {2018},
  url          = {https://arxiv.org/abs/1802.06905},
  eprinttype   = {arXiv},
  eprint       = {1802.06905},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-06905.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1805-00569,
  author       = {Yang You and
                  James Demmel and
                  Cho{-}Jui Hsieh and
                  Richard W. Vuduc},
  title        = {Accurate, Fast and Scalable Kernel Ridge Regression on Parallel and
                  Distributed Systems},
  journal      = {CoRR},
  volume       = {abs/1805.00569},
  year         = {2018},
  url          = {https://arxiv.org/abs/1805.00569},
  eprinttype   = {arXiv},
  eprint       = {1805.00569},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-00569.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1805-05278,
  author       = {Grey Ballard and
                  James Demmel and
                  Laura Grigori and
                  Mathias Jacquelin and
                  Nicholas Knight},
  title        = {A {3D} Parallel Algorithm for {QR} Decomposition},
  journal      = {CoRR},
  volume       = {abs/1805.05278},
  year         = {2018},
  url          = {https://arxiv.org/abs/1805.05278},
  eprinttype   = {arXiv},
  eprint       = {1805.05278},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-05278.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tpds/YouDCSV17,
  author    = {You, Yang and
               Demmel, James and
               Czechowski, Kent and
               Song, Le and
               Vuduc, Rich},
  title     = {Design and Implementation of a Communication-Optimal Classifier for
               Distributed Kernel Support Vector Machines},
  journal   = {{IEEE} Trans. Parallel Distributed Syst.},
  volume    = {28},
  number    = {4},
  pages     = {974--988},
  year      = {2017},
  url       = {https://doi.org/10.1109/TPDS.2016.2608823},
  doi       = {10.1109/TPDS.2016.2608823},
  timestamp = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/tpds/YouDCSV17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icpp/YouD17,
  author    = {You, Yang and
               Demmel, James},
  title     = {Runtime Data Layout Scheduling for Machine Learning Dataset},
  booktitle = {46th International Conference on Parallel Processing, {ICPP} 2017,
               Bristol, United Kingdom, August 14-17, 2017},
  pages     = {452--461},
  publisher = {{IEEE} Computer Society},
  year      = {2017},
  url       = {https://doi.org/10.1109/ICPP.2017.54},
  doi       = {10.1109/ICPP.2017.54},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icpp/YouD17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/YouBD17,
  author       = {Yang You and
                  Aydin Bulu{\c{c}} and
                  James Demmel},
  editor       = {Bernd Mohr and
                  Padma Raghavan},
  title        = {Scaling deep learning on {GPU} and {Knights} {Landing} clusters},
  booktitle    = {Proceedings of the International Conference for High Performance Computing,
                  Networking, Storage and Analysis, {SC} 2017, Denver, CO, USA, November
                  12-17, 2017},
  pages        = {9},
  publisher    = {{ACM}},
  year         = {2017},
  url          = {https://doi.org/10.1145/3126908.3126912},
  doi          = {10.1145/3126908.3126912},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/YouBD17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/spaa/SolomonikBDH17,
  author    = {Solomonik, Edgar and
               Ballard, Grey and
               Demmel, James and
               Hoefler, Torsten},
  editor    = {Scheideler, Christian and
               Hajiaghayi, Mohammad Taghi},
  title     = {A Communication-Avoiding Parallel Algorithm for the Symmetric Eigenvalue
               Problem},
  booktitle = {Proceedings of the 29th {ACM} Symposium on Parallelism in Algorithms
               and Architectures, {SPAA} 2017, Washington DC, USA, July 24-26, 2017},
  pages     = {111--121},
  publisher = {{ACM}},
  year      = {2017},
  url       = {https://doi.org/10.1145/3087556.3087561},
  doi       = {10.1145/3087556.3087561},
  timestamp = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/spaa/SolomonikBDH17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/SolomonikDH17,
  author       = {Edgar Solomonik and
                  James Demmel and
                  Torsten Hoefler},
  title        = {Communication Lower Bounds of Bilinear Algorithms for Symmetric Tensor
                  Contractions},
  journal      = {CoRR},
  volume       = {abs/1707.04618},
  year         = {2017},
  url          = {https://arxiv.org/abs/1707.04618},
  eprinttype   = {arXiv},
  eprint       = {1707.04618},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SolomonikDH17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1708-02983,
  author       = {Yang You and
                  Aydin Bulu{\c{c}} and
                  James Demmel},
  title        = {Scaling Deep Learning on {GPU} and {Knights} {Landing} clusters},
  journal      = {CoRR},
  volume       = {abs/1708.02983},
  year         = {2017},
  url          = {https://arxiv.org/abs/1708.02983},
  eprinttype   = {arXiv},
  eprint       = {1708.02983},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-02983.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1709-05011,
  author       = {Yang You and
                  Zhao Zhang and
                  Cho{-}Jui Hsieh and
                  James Demmel},
  title        = {100-epoch {ImageNet} Training with {AlexNet} in 24 Minutes},
  journal      = {CoRR},
  volume       = {abs/1709.05011},
  year         = {2017},
  url          = {https://arxiv.org/abs/1709.05011},
  eprinttype   = {arXiv},
  eprint       = {1709.05011},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1709-05011.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1710-08883,
  author       = {Saeed Soori and
                  Aditya Devarakonda and
                  James Demmel and
                  Mert G{\"{u}}rb{\"{u}}zbalaban and
                  Maryam Mehri Dehnavi},
  title        = {Avoiding Communication in Proximal Methods for Convex Optimization
                  Problems},
  journal      = {CoRR},
  volume       = {abs/1710.08883},
  year         = {2017},
  url          = {https://arxiv.org/abs/1710.08883},
  eprinttype   = {arXiv},
  eprint       = {1710.08883},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1710-08883.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1712-06047,
  author       = {Aditya Devarakonda and
                  Kimon Fountoulakis and
                  James Demmel and
                  Michael W. Mahoney},
  title        = {Avoiding Synchronization in First-Order Methods for Sparse Convex
                  Optimization},
  journal      = {CoRR},
  volume       = {abs/1712.06047},
  year         = {2017},
  url          = {https://arxiv.org/abs/1712.06047},
  eprinttype   = {arXiv},
  eprint       = {1712.06047},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-06047.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cse/GordonDDR16,
  author    = {Gordon, Steven I. and
               Demmel, James and
               DeStefano, Lizanne and
               Rivera, Lorna},
  title     = {Implementing a Collaborative Online Course to Extend Access to {HPC}
               Skills},
  journal   = {Comput. Sci. Eng.},
  volume    = {18},
  number    = {1},
  pages     = {73--79},
  year      = {2016},
  url       = {https://doi.org/10.1109/MCSE.2016.6},
  doi       = {10.1109/MCSE.2016.6},
  timestamp = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/cse/GordonDDR16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/siamsc/AzadBBDGSTW16,
  author    = {Azad, Ariful and
               Ballard, Grey and
               Bulu{\c{c}}, Aydin and
               Demmel, James and
               Grigori, Laura and
               Schwartz, Oded and
               Toledo, Sivan and
               Williams, Samuel},
  title     = {Exploiting Multiple Levels of Parallelism in Sparse Matrix-Matrix
               Multiplication},
  journal   = {{SIAM} J. Sci. Comput.},
  volume    = {38},
  number    = {6},
  year      = {2016},
  url       = {https://doi.org/10.1137/15M104253X},
  doi       = {10.1137/15M104253X},
  timestamp = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/siamsc/AzadBBDGSTW16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/bigdataconf/GittensDRRGKLMC16,
  author       = {Alex Gittens and
                  Aditya Devarakonda and
                  Evan Racah and
                  Michael F. Ringenburg and
                  Lisa Gerhardt and
                  Jey Kottalam and
                  Jialin Liu and
                  Kristyn J. Maschhoff and
                  Shane Canon and
                  Jatin Chhugani and
                  Pramod Sharma and
                  Jiyan Yang and
                  James Demmel and
                  Jim Harrell and
                  Venkat Krishnamurthy and
                  Michael W. Mahoney and
                  Prabhat},
  editor       = {James Joshi and
                  George Karypis and
                  Ling Liu and
                  Xiaohua Hu and
                  Ronay Ak and
                  Yinglong Xia and
                  Weijia Xu and
                  Aki{-}Hiro Sato and
                  Sudarsan Rachuri and
                  Lyle H. Ungar and
                  Philip S. Yu and
                  Rama Govindaraju and
                  Toyotaro Suzumura},
  title        = {Matrix factorizations at scale: {A} comparison of scientific data
                  analytics in {Spark} and {C+MPI} using three case studies},
  booktitle    = {2016 {IEEE} International Conference on Big Data {(IEEE} BigData 2016),
                  Washington DC, USA, December 5-8, 2016},
  pages        = {204--213},
  publisher    = {{IEEE} Computer Society},
  year         = {2016},
  url          = {https://doi.org/10.1109/BigData.2016.7840606},
  doi          = {10.1109/BigData.2016.7840606},
  timestamp    = {Fri, 19 Nov 2021 16:08:20 +0100},
  biburl       = {https://dblp.org/rec/conf/bigdataconf/GittensDRRGKLMC16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icse/Rubio-Gonzalez016,
  author    = {Rubio{-}Gonz{\'{a}}lez, Cindy and
               Nguyen, Cuong and
               Mehne, Benjamin and
               Sen, Koushik and
               Demmel, James and
               Kahan, William and
               Iancu, Costin and
               Lavrijsen, Wim and
               Bailey, David H. and
               Hough, David},
  editor    = {Dillon, Laura K. and
               Visser, Willem and
               Williams, Laurie A.},
  title     = {Floating-point precision tuning using blame analysis},
  booktitle = {Proceedings of the 38th International Conference on Software Engineering,
               {ICSE} 2016, Austin, TX, USA, May 14-22, 2016},
  pages     = {1074--1085},
  publisher = {{ACM}},
  year      = {2016},
  url       = {https://doi.org/10.1145/2884781.2884850},
  doi       = {10.1145/2884781.2884850},
  timestamp = {Thu, 31 Mar 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icse/Rubio-Gonzalez016.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ipps/CarsonDGKKSS16,
  author    = {Carson, Erin C. and
               Demmel, James and
               Grigori, Laura and
               Knight, Nicholas and
               Koanantakool, Penporn and
               Schwartz, Oded and
               Simhadri, Harsha Vardhan},
  title     = {Write-Avoiding Algorithms},
  booktitle = {2016 {IEEE} International Parallel and Distributed Processing Symposium,
               {IPDPS} 2016, Chicago, IL, USA, May 23-27, 2016},
  pages     = {648--658},
  publisher = {{IEEE} Computer Society},
  year      = {2016},
  url       = {https://doi.org/10.1109/IPDPS.2016.114},
  doi       = {10.1109/IPDPS.2016.114},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/CarsonDGKKSS16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/YouLLYDDH16,
  author    = {You, Yang and
               Lian, Xiangru and
               Liu, Ji and
               Yu, Hsiang{-}Fu and
               Dhillon, Inderjit S. and
               Demmel, James and
               Hsieh, Cho{-}Jui},
  editor    = {Lee, Daniel D. and
               Sugiyama, Masashi and
               von Luxburg, Ulrike and
               Guyon, Isabelle and
               Garnett, Roman},
  title     = {Asynchronous Parallel Greedy Coordinate Descent},
  booktitle = {Advances in Neural Information Processing Systems 29: Annual Conference
               on Neural Information Processing Systems 2016, December 5-10, 2016,
               Barcelona, Spain},
  pages     = {4682--4690},
  year      = {2016},
  url       = {https://proceedings.neurips.cc/paper/2016/hash/43e4e6a6f341e00671e123714de019a8-Abstract.html},
  timestamp = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/YouLLYDDH16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/BallardDGLOST16,
  author       = {Grey Ballard and
                  James Demmel and
                  Andrew Gearhart and
                  Benjamin Lipshitz and
                  Yishai Oltchik and
                  Oded Schwartz and
                  Sivan Toledo},
  title        = {Network Topologies and Inevitable Contention},
  booktitle    = {First International Workshop on Communication Optimizations in {HPC},
                  {COMHPC@SC} 2016, Salt Lake City, UT, USA, November 18, 2016},
  pages        = {39--52},
  publisher    = {{IEEE}},
  year         = {2016},
  url          = {https://doi.org/10.1109/COMHPC.2016.010},
  doi          = {10.1109/COMHPC.2016.010},
  timestamp    = {Sat, 19 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sc/BallardDGLOST16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SolomonikBDH16,
  author       = {Edgar Solomonik and
                  Grey Ballard and
                  James Demmel and
                  Torsten Hoefler},
  title        = {A communication-avoiding parallel algorithm for the symmetric eigenvalue
                  problem},
  journal      = {CoRR},
  volume       = {abs/1604.03703},
  year         = {2016},
  url          = {http://arxiv.org/abs/1604.03703},
  eprinttype   = {arXiv},
  eprint       = {1604.03703},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SolomonikBDH16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GittensDRRGKLMC16,
  author       = {Alex Gittens and
                  Aditya Devarakonda and
                  Evan Racah and
                  Michael F. Ringenburg and
                  Lisa Gerhardt and
                  Jey Kottalam and
                  Jialin Liu and
                  Kristyn J. Maschhoff and
                  Shane Canon and
                  Jatin Chhugani and
                  Pramod Sharma and
                  Jiyan Yang and
                  James Demmel and
                  Jim Harrell and
                  Venkat Krishnamurthy and
                  Michael W. Mahoney and
                  Prabhat},
  title        = {Matrix Factorization at Scale: a Comparison of Scientific Data Analytics
                  in {Spark} and {C+MPI} Using Three Case Studies},
  journal      = {CoRR},
  volume       = {abs/1607.01335},
  year         = {2016},
  url          = {http://arxiv.org/abs/1607.01335},
  eprinttype   = {arXiv},
  eprint       = {1607.01335},
  timestamp    = {Tue, 17 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/GittensDRRGKLMC16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/DemmelR16,
  author       = {James Demmel and
                  Alex Rusciano},
  title        = {Parallelepipeds obtaining {HBL} lower bounds},
  journal      = {CoRR},
  volume       = {abs/1611.05944},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.05944},
  eprinttype   = {arXiv},
  eprint       = {1611.05944},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/DemmelR16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/DevarakondaFDM16,
  author       = {Aditya Devarakonda and
                  Kimon Fountoulakis and
                  James Demmel and
                  Michael W. Mahoney},
  title        = {Avoiding communication in primal and dual block coordinate descent
                  methods},
  journal      = {CoRR},
  volume       = {abs/1612.04003},
  year         = {2016},
  url          = {http://arxiv.org/abs/1612.04003},
  eprinttype   = {arXiv},
  eprint       = {1612.04003},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/DevarakondaFDM16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jpdc/BallardDGJKN15,
  author       = {Grey Ballard and
                  James Demmel and
                  Laura Grigori and
                  Mathias Jacquelin and
                  Nicholas Knight and
                  Hong Diep Nguyen},
  title        = {Reconstructing {Householder} vectors from Tall-Skinny {QR}},
  journal      = {J. Parallel Distributed Comput.},
  volume       = {85},
  pages        = {3--31},
  year         = {2015},
  url          = {https://doi.org/10.1016/j.jpdc.2015.06.003},
  doi          = {10.1016/J.JPDC.2015.06.003},
  timestamp    = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jpdc/BallardDGJKN15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siammax/DemmelGGX15,
  author       = {James Demmel and
                  Laura Grigori and
                  Ming Gu and
                  Hua Xiang},
  title        = {Communication Avoiding Rank Revealing {QR} Factorization with Column
                  Pivoting},
  journal      = {{SIAM} J. Matrix Anal. Appl.},
  volume       = {36},
  number       = {1},
  pages        = {55--89},
  year         = {2015},
  url          = {https://doi.org/10.1137/13092157X},
  doi          = {10.1137/13092157X},
  timestamp    = {Tue, 26 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siammax/DemmelGGX15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siammax/CarsonD15,
  author       = {Erin C. Carson and
                  James Weldon Demmel},
  title        = {Accuracy of the s-Step {Lanczos} Method for the Symmetric Eigenproblem
                  in Finite Precision},
  journal      = {{SIAM} J. Matrix Anal. Appl.},
  volume       = {36},
  number       = {2},
  pages        = {793--819},
  year         = {2015},
  url          = {https://doi.org/10.1137/140990735},
  doi          = {10.1137/140990735},
  timestamp    = {Tue, 26 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siammax/CarsonD15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tc/DemmelN15,
  author       = {James Demmel and
                  Hong Diep Nguyen},
  title        = {Parallel Reproducible Summation},
  journal      = {{IEEE} Trans. Computers},
  volume       = {64},
  number       = {7},
  pages        = {2060--2070},
  year         = {2015},
  url          = {https://doi.org/10.1109/TC.2014.2345391},
  doi          = {10.1109/TC.2014.2345391},
  timestamp    = {Sat, 20 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tc/DemmelN15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/topc/BallardDK15,
  author       = {Grey Ballard and
                  James Demmel and
                  Nicholas Knight},
  title        = {Avoiding Communication in Successive Band Reduction},
  journal      = {{ACM} Trans. Parallel Comput.},
  volume       = {1},
  number       = {2},
  pages        = {11:1--11:37},
  year         = {2015},
  url          = {https://doi.org/10.1145/2686877},
  doi          = {10.1145/2686877},
  timestamp    = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/topc/BallardDK15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/arith/NguyenD15,
  author       = {Hong Diep Nguyen and
                  James Demmel},
  title        = {Reproducible Tall-Skinny {QR}},
  booktitle    = {22nd {IEEE} Symposium on Computer Arithmetic, {ARITH} 2015, Lyon,
                  France, June 22-24, 2015},
  pages        = {152--159},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/ARITH.2015.28},
  doi          = {10.1109/ARITH.2015.28},
  timestamp    = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl       = {https://dblp.org/rec/conf/arith/NguyenD15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ipps/YouDCSV15,
  author       = {Yang You and
                  James Demmel and
                  Kenneth Czechowski and
                  Le Song and
                  Richard W. Vuduc},
  title        = {{CA-SVM:} Communication-Avoiding Support Vector Machines on Distributed
                  Systems},
  booktitle    = {2015 {IEEE} International Parallel and Distributed Processing Symposium,
                  {IPDPS} 2015, Hyderabad, India, May 25-29, 2015},
  pages        = {847--859},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/IPDPS.2015.117},
  doi          = {10.1109/IPDPS.2015.117},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/YouDCSV15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/xsede/GordonDDR15,
  author       = {Steven I. Gordon and
                  James Demmel and
                  Lizanne DeStefano and
                  Lorna Rivera},
  editor       = {Gregory D. Peterson},
  title        = {Extending access to {HPC} skills through a blended online course},
  booktitle    = {Proceedings of the 2015 {XSEDE} Conference: Scientific Advancements
                  Enabled by Enhanced Cyberinfrastructure, St. Louis, MO, USA, July
                  26 - 30, 2015},
  pages        = {15:1--15:5},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {https://doi.org/10.1145/2792745.2792760},
  doi          = {10.1145/2792745.2792760},
  timestamp    = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/xsede/GordonDDR15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/AzadBBDGSTW15,
  author       = {Ariful Azad and
                  Grey Ballard and
                  Aydin Bulu{\c{c}} and
                  James Demmel and
                  Laura Grigori and
                  Oded Schwartz and
                  Sivan Toledo and
                  Samuel Williams},
  title        = {Exploiting Multiple Levels of Parallelism in Sparse Matrix-Matrix
                  Multiplication},
  journal      = {CoRR},
  volume       = {abs/1510.00844},
  year         = {2015},
  url          = {http://arxiv.org/abs/1510.00844},
  eprinttype   = {arXiv},
  eprint       = {1510.00844},
  timestamp    = {Thu, 06 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/AzadBBDGSTW15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/actanum/BallardCDHKS14,
  author       = {Grey Ballard and
                  Erin C. Carson and
                  James Demmel and
                  Mark Hoemmen and
                  Nicholas Knight and
                  Oded Schwartz},
  title        = {Communication lower bounds and optimal algorithms for numerical linear
                  algebra},
  journal      = {Acta Numer.},
  volume       = {23},
  pages        = {1--155},
  year         = {2014},
  url          = {https://doi.org/10.1017/S0962492914000038},
  doi          = {10.1017/S0962492914000038},
  timestamp    = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/actanum/BallardCDHKS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cacm/BallardDHS14,
  author       = {Grey Ballard and
                  James Demmel and
                  Olga Holtz and
                  Oded Schwartz},
  title        = {Communication costs of {Strassen's} matrix multiplication},
  journal      = {Commun. {ACM}},
  volume       = {57},
  number       = {2},
  pages        = {107--114},
  year         = {2014},
  url          = {https://doi.org/10.1145/2556647.2556660},
  doi          = {10.1145/2556647.2556660},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/cacm/BallardDHS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jpdc/SolomonikMHSD14,
  author       = {Edgar Solomonik and
                  Devin Matthews and
                  Jeff R. Hammond and
                  John F. Stanton and
                  James Demmel},
  title        = {A massively parallel tensor contraction framework for coupled-cluster
                  computations},
  journal      = {J. Parallel Distributed Comput.},
  volume       = {74},
  number       = {12},
  pages        = {3176--3190},
  year         = {2014},
  url          = {https://doi.org/10.1016/j.jpdc.2014.06.002},
  doi          = {10.1016/J.JPDC.2014.06.002},
  timestamp    = {Tue, 29 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jpdc/SolomonikMHSD14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siammax/CarsonD14,
  author       = {Erin C. Carson and
                  James Demmel},
  title        = {A Residual Replacement Strategy for Improving the Maximum Attainable
                  Accuracy of s-Step {Krylov} Subspace Methods},
  journal      = {{SIAM} J. Matrix Anal. Appl.},
  volume       = {35},
  number       = {1},
  pages        = {22--43},
  year         = {2014},
  url          = {https://doi.org/10.1137/120893057},
  doi          = {10.1137/120893057},
  timestamp    = {Tue, 26 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siammax/CarsonD14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siammax/BallardBDDDPSTY14,
  author       = {Grey Ballard and
                  Dulceneia Becker and
                  James Demmel and
                  Jack J. Dongarra and
                  Alex Druinsky and
                  Inon Peled and
                  Oded Schwartz and
                  Sivan Toledo and
                  Ichitaro Yamazaki},
  title        = {Communication-Avoiding Symmetric-Indefinite Factorization},
  journal      = {{SIAM} J. Matrix Anal. Appl.},
  volume       = {35},
  number       = {4},
  pages        = {1364--1406},
  year         = {2014},
  url          = {https://doi.org/10.1137/130929060},
  doi          = {10.1137/130929060},
  timestamp    = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siammax/BallardBDDDPSTY14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ics/BilmesACD14,
  author       = {Jeff A. Bilmes and
                  Krste Asanovic and
                  Chee{-}Whye Chin and
                  Jim Demmel},
  editor       = {Utpal Banerjee},
  title        = {Author retrospective for optimizing matrix multiply using {PHiPAC}:
                  a portable high-performance {ANSI} {C} coding methodology},
  booktitle    = {{ACM} International Conference on Supercomputing 25th Anniversary
                  Volume},
  pages        = {42--44},
  publisher    = {{ACM}},
  year         = {2014},
  url          = {https://doi.org/10.1145/2591635.2591656},
  doi          = {10.1145/2591635.2591656},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ics/BilmesACD14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ipps/WilliamsLASCKD14,
  author       = {Samuel Williams and
                  Mike Lijewski and
                  Ann S. Almgren and
                  Brian van Straalen and
                  Erin C. Carson and
                  Nicholas Knight and
                  James Demmel},
  title        = {s-Step {Krylov} Subspace Methods as Bottom Solvers for Geometric Multigrid},
  booktitle    = {2014 {IEEE} 28th International Parallel and Distributed Processing
                  Symposium, Phoenix, AZ, USA, May 19-23, 2014},
  pages        = {1149--1158},
  publisher    = {{IEEE} Computer Society},
  year         = {2014},
  url          = {https://doi.org/10.1109/IPDPS.2014.119},
  doi          = {10.1109/IPDPS.2014.119},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ipps/WilliamsLASCKD14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ipps/BallardDGJNS14,
  author       = {Grey Ballard and
                  James Demmel and
                  Laura Grigori and
                  Mathias Jacquelin and
                  Hong Diep Nguyen and
                  Edgar Solomonik},
  title        = {Reconstructing {Householder} Vectors from Tall-Skinny {QR}},
  booktitle    = {2014 {IEEE} 28th International Parallel and Distributed Processing
                  Symposium, Phoenix, AZ, USA, May 19-23, 2014},
  pages        = {1159--1170},
  publisher    = {{IEEE} Computer Society},
  year         = {2014},
  url          = {https://doi.org/10.1109/IPDPS.2014.120},
  doi          = {10.1109/IPDPS.2014.120},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/BallardDGJNS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/spaa/SolomonikCKD14,
  author       = {Edgar Solomonik and
                  Erin C. Carson and
                  Nicholas Knight and
                  James Demmel},
  editor       = {Guy E. Blelloch and
                  Peter Sanders},
  title        = {Tradeoffs between synchronization, communication, and computation
                  in parallel linear algebra computations},
  booktitle    = {26th {ACM} Symposium on Parallelism in Algorithms and Architectures,
                  {SPAA} '14, Prague, Czech Republic - June 23 - 25, 2014},
  pages        = {307--318},
  publisher    = {{ACM}},
  year         = {2014},
  url          = {https://doi.org/10.1145/2612669.2612671},
  doi          = {10.1145/2612669.2612671},
  timestamp    = {Thu, 24 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/spaa/SolomonikCKD14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/xsede/CarbunescuDDGAM14,
  author       = {Razvan Carbunescu and
                  Aditya Devarakonda and
                  James Demmel and
                  Steven I. Gordon and
                  Jay Alameda and
                  Susan Mehringer},
  editor       = {Scott A. Lathrop and
                  Jay Alameda},
  title        = {Architecting an autograder for parallel code},
  booktitle    = {Annual Conference of the Extreme Science and Engineering Discovery
                  Environment, {XSEDE} '14, Atlanta, GA, {USA} - July 13 - 18, 2014},
  pages        = {68:1--68:8},
  publisher    = {{ACM}},
  year         = {2014},
  url          = {https://doi.org/10.1145/2616498.2616571},
  doi          = {10.1145/2616498.2616571},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/xsede/CarbunescuDDGAM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siammax/KhabouDGG13,
  author       = {Amal Khabou and
                  James Demmel and
                  Laura Grigori and
                  Ming Gu},
  title        = {{LU} Factorization with Panel Rank Revealing Pivoting and Its Communication
                  Avoiding Version},
  journal      = {{SIAM} J. Matrix Anal. Appl.},
  volume       = {34},
  number       = {3},
  pages        = {1401--1429},
  year         = {2013},
  url          = {https://doi.org/10.1137/120863691},
  doi          = {10.1137/120863691},
  timestamp    = {Tue, 26 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siammax/KhabouDGG13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siamsc/CarsonKD13,
  author       = {Erin C. Carson and
                  Nicholas Knight and
                  James Demmel},
  title        = {Avoiding Communication in Nonsymmetric {Lanczos}-Based {Krylov} Subspace
                  Methods},
  journal      = {{SIAM} J. Sci. Comput.},
  volume       = {35},
  number       = {5},
  pages        = {S42--S61},
  year         = {2013},
  url          = {https://doi.org/10.1137/120881191},
  doi          = {10.1137/120881191},
  timestamp    = {Thu, 30 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siamsc/CarsonKD13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/arith/DemmelN13,
  author       = {James Demmel and
                  Hong Diep Nguyen},
  editor       = {Alberto Nannarelli and
                  Peter{-}Michael Seidel and
                  Ping Tak Peter Tang},
  title        = {Fast Reproducible Floating-Point Summation},
  booktitle    = {21st {IEEE} Symposium on Computer Arithmetic, {ARITH} 2013, Austin,
                  TX, USA, April 7-10, 2013},
  pages        = {163--172},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/ARITH.2013.9},
  doi          = {10.1109/ARITH.2013.9},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/arith/DemmelN13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/arith/DemmelN13a,
  author       = {James Demmel and
                  Hong Diep Nguyen},
  editor       = {Alberto Nannarelli and
                  Peter{-}Michael Seidel and
                  Ping Tak Peter Tang},
  title        = {Numerical Reproducibility and Accuracy at {ExaScale}},
  booktitle    = {21st {IEEE} Symposium on Computer Arithmetic, {ARITH} 2013, Austin,
                  TX, USA, April 7-10, 2013},
  pages        = {235--237},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/ARITH.2013.43},
  doi          = {10.1109/ARITH.2013.43},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/arith/DemmelN13a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/bigdataconf/BensonGD13,
  author       = {Austin R. Benson and
                  David F. Gleich and
                  James Demmel},
  editor       = {Xiaohua Hu and
                  Tsau Young Lin and
                  Vijay V. Raghavan and
                  Benjamin W. Wah and
                  Ricardo Baeza{-}Yates and
                  Geoffrey C. Fox and
                  Cyrus Shahabi and
                  Matthew Smith and
                  Qiang Yang and
                  Rayid Ghani and
                  Wei Fan and
                  Ronny Lempel and
                  Raghunath Nambiar},
  title        = {Direct {QR} factorizations for tall-and-skinny matrices in {MapReduce}
                  architectures},
  booktitle    = {2013 {IEEE} International Conference on Big Data {(IEEE} BigData 2013),
                  6-9 October 2013, Santa Clara, CA, {USA}},
  pages        = {264--272},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/BigData.2013.6691583},
  doi          = {10.1109/BIGDATA.2013.6691583},
  timestamp    = {Fri, 19 Nov 2021 16:08:20 +0100},
  biburl       = {https://dblp.org/rec/conf/bigdataconf/BensonGD13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ipps/DemmelEFKLSS13,
  author       = {James Demmel and
                  David Eliahu and
                  Armando Fox and
                  Shoaib Kamil and
                  Benjamin Lipshitz and
                  Oded Schwartz and
                  Omer Spillinger},
  title        = {Communication-Optimal Parallel Recursive Rectangular Matrix Multiplication},
  booktitle    = {27th {IEEE} International Symposium on Parallel and Distributed Processing,
                  {IPDPS} 2013, Cambridge, MA, USA, May 20-24, 2013},
  pages        = {261--272},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/IPDPS.2013.80},
  doi          = {10.1109/IPDPS.2013.80},
  timestamp    = {Sat, 19 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ipps/DemmelEFKLSS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ipps/SolomonikBD13,
  author       = {Edgar Solomonik and
                  Aydin Bulu{\c{c}} and
                  James Demmel},
  title        = {Minimizing Communication in All-Pairs Shortest Paths},
  booktitle    = {27th {IEEE} International Symposium on Parallel and Distributed Processing,
                  {IPDPS} 2013, Cambridge, MA, USA, May 20-24, 2013},
  pages        = {548--559},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/IPDPS.2013.111},
  doi          = {10.1109/IPDPS.2013.111},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/SolomonikBD13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ipps/Demmel13,
  author       = {James Demmel},
  title        = {Communication-Avoiding Algorithms for Linear Algebra and Beyond},
  booktitle    = {27th {IEEE} International Symposium on Parallel and Distributed Processing,
                  {IPDPS} 2013, Cambridge, MA, USA, May 20-24, 2013},
  pages        = {585},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/IPDPS.2013.123},
  doi          = {10.1109/IPDPS.2013.123},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/Demmel13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ipps/DemmelGLS13,
  author       = {James Demmel and
                  Andrew Gearhart and
                  Benjamin Lipshitz and
                  Oded Schwartz},
  title        = {Perfect Strong Scaling Using No Additional Energy},
  booktitle    = {27th {IEEE} International Symposium on Parallel and Distributed Processing,
                  {IPDPS} 2013, Cambridge, MA, USA, May 20-24, 2013},
  pages        = {649--660},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/IPDPS.2013.32},
  doi          = {10.1109/IPDPS.2013.32},
  timestamp    = {Sat, 19 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ipps/DemmelGLS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ipps/SolomonikMHD13,
  author       = {Edgar Solomonik and
                  Devin Matthews and
                  Jeff R. Hammond and
                  James Demmel},
  title        = {{Cyclops Tensor Framework}: Reducing Communication and Eliminating Load
                  Imbalance in Massively Parallel Contractions},
  booktitle    = {27th {IEEE} International Symposium on Parallel and Distributed Processing,
                  {IPDPS} 2013, Cambridge, MA, USA, May 20-24, 2013},
  pages        = {813--824},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/IPDPS.2013.112},
  doi          = {10.1109/IPDPS.2013.112},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/SolomonikMHD13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ipps/BallardBDDDPSTY13,
  author       = {Grey Ballard and
                  Dulceneia Becker and
                  James Demmel and
                  Jack J. Dongarra and
                  Alex Druinsky and
                  Inon Peled and
                  Oded Schwartz and
                  Sivan Toledo and
                  Ichitaro Yamazaki},
  title        = {Implementing a Blocked {Aasen's} Algorithm with a Dynamic Scheduler
                  on Multicore Architectures},
  booktitle    = {27th {IEEE} International Symposium on Parallel and Distributed Processing,
                  {IPDPS} 2013, Cambridge, MA, USA, May 20-24, 2013},
  pages        = {895--907},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/IPDPS.2013.98},
  doi          = {10.1109/IPDPS.2013.98},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/BallardBDDDPSTY13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ppam/KnightCD13,
  author       = {Nicholas Knight and
                  Erin C. Carson and
                  James Demmel},
  editor       = {Roman Wyrzykowski and
                  Jack J. Dongarra and
                  Konrad Karczewski and
                  Jerzy Wasniewski},
  title        = {Exploiting Data Sparsity in Parallel Matrix Powers Computations},
  booktitle    = {Parallel Processing and Applied Mathematics - 10th International Conference,
                  {PPAM} 2013, Warsaw, Poland, September 8-11, 2013, Revised Selected
                  Papers, Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {8384},
  pages        = {15--25},
  publisher    = {Springer},
  year         = {2013},
  url          = {https://doi.org/10.1007/978-3-642-55224-3\_2},
  doi          = {10.1007/978-3-642-55224-3\_2},
  timestamp    = {Thu, 24 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ppam/KnightCD13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sc/Rubio-GonzalezNNDKSBIH13,
  author       = {Cindy Rubio{-}Gonz{\'{a}}lez and
                  Cuong Nguyen and
                  Hong Diep Nguyen and
                  James Demmel and
                  William Kahan and
                  Koushik Sen and
                  David H. Bailey and
                  Costin Iancu and
                  David Hough},
  editor       = {William Gropp and
                  Satoshi Matsuoka},
  title        = {Precimonious: tuning assistant for floating-point precision},
  booktitle    = {International Conference for High Performance Computing, Networking,
                  Storage and Analysis, {SC}'13, Denver, CO, {USA} - November 17 - 21,
                  2013},
  pages        = {27:1--27:12},
  publisher    = {{ACM}},
  year         = {2013},
  url          = {https://doi.org/10.1145/2503210.2503296},
  doi          = {10.1145/2503210.2503296},
  timestamp    = {Thu, 31 Mar 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sc/Rubio-GonzalezNNDKSBIH13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/spaa/BallardBDGLST13,
  author       = {Grey Ballard and
                  Aydin Bulu{\c{c}} and
                  James Demmel and
                  Laura Grigori and
                  Benjamin Lipshitz and
                  Oded Schwartz and
                  Sivan Toledo},
  editor       = {Guy E. Blelloch and
                  Berthold V{\"{o}}cking},
  title        = {Communication optimal parallel multiplication of sparse random matrices},
  booktitle    = {25th {ACM} Symposium on Parallelism in Algorithms and Architectures,
                  {SPAA} '13, Montreal, QC, Canada - July 23 - 25, 2013},
  pages        = {222--231},
  publisher    = {{ACM}},
  year         = {2013},
  url          = {https://doi.org/10.1145/2486159.2486196},
  doi          = {10.1145/2486159.2486196},
  timestamp    = {Sat, 19 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/spaa/BallardBDGLST13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% SPAA 2013 conference paper. The proper noun Gaussian is capitalised and
% brace-protected so sentence-casing bibliography styles cannot lowercase it.
@inproceedings{DBLP:conf/spaa/BallardDLST13,
  author       = {Grey Ballard and
                  James Demmel and
                  Benjamin Lipshitz and
                  Oded Schwartz and
                  Sivan Toledo},
  editor       = {Guy E. Blelloch and
                  Berthold V{\"{o}}cking},
  title        = {Communication efficient {Gaussian} elimination with partial pivoting
                  using a shape morphing data layout},
  booktitle    = {25th {ACM} Symposium on Parallelism in Algorithms and Architectures,
                  {SPAA} '13, Montreal, QC, Canada - July 23 - 25, 2013},
  pages        = {232--240},
  publisher    = {{ACM}},
  year         = {2013},
  url          = {https://doi.org/10.1145/2486159.2486198},
  doi          = {10.1145/2486159.2486198},
  timestamp    = {Sat, 19 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/spaa/BallardDLST13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% XSEDE 2013 conference paper; author and editor names use the Last, First form.
@inproceedings{DBLP:conf/xsede/GordonADCM13,
  author    = {Gordon, Steven I. and
               Alameda, Jay and
               Demmel, James and
               Carbunescu, Razvan and
               Mehringer, Susan},
  editor    = {Wilkins{-}Diehr, Nancy},
  title     = {Providing a supported online course on parallel computing},
  booktitle = {Extreme Science and Engineering Discovery Environment: Gateway to
               Discovery, XSEDE13, San Diego, CA, {USA} - July 22 - 25, 2013},
  pages     = {60:1--60:4},
  publisher = {{ACM}},
  year      = {2013},
  url       = {https://doi.org/10.1145/2484762.2484765},
  doi       = {10.1145/2484762.2484765},
  timestamp = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/xsede/GordonADCM13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) preprint 1301.1071. MapReduce is brace-protected so that
% sentence-casing styles keep its internal capitals.
@article{DBLP:journals/corr/abs-1301-1071,
  author       = {Austin R. Benson and
                  David F. Gleich and
                  James Demmel},
  title        = {Direct {QR} factorizations for tall-and-skinny matrices in {MapReduce}
                  architectures},
  journal      = {CoRR},
  volume       = {abs/1301.1071},
  year         = {2013},
  url          = {http://arxiv.org/abs/1301.1071},
  eprinttype    = {arXiv},
  eprint       = {1301.1071},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1301-1071.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) preprint 1308.0068; author names use the Last, First form.
@article{DBLP:journals/corr/ChristDKSY13,
  author     = {Christ, Michael and
                Demmel, James and
                Knight, Nicholas and
                Scanlon, Thomas and
                Yelick, Katherine A.},
  title      = {Communication lower bounds and optimal algorithms for programs that
                reference arrays - Part 1},
  journal    = {CoRR},
  volume     = {abs/1308.0068},
  year       = {2013},
  url        = {http://arxiv.org/abs/1308.0068},
  eprinttype = {arXiv},
  eprint     = {1308.0068},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ChristDKSY13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, J. ACM 59(6), 2012; author names use the Last, First form.
@article{DBLP:journals/jacm/BallardDHS12,
  author    = {Ballard, Grey and
               Demmel, James and
               Holtz, Olga and
               Schwartz, Oded},
  title     = {Graph expansion and communication costs of fast matrix multiplication},
  journal   = {J. {ACM}},
  volume    = {59},
  number    = {6},
  pages     = {32:1--32:23},
  year      = {2012},
  url       = {https://doi.org/10.1145/2395116.2395121},
  doi       = {10.1145/2395116.2395121},
  timestamp = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jacm/BallardDHS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, SIAM J. Sci. Comput. 34(1), 2012. The page range was
% missing; this journal numbers pages with a section prefix.
@article{DBLP:journals/siamsc/DemmelGHL12,
  author       = {James Demmel and
                  Laura Grigori and
                  Mark Hoemmen and
                  Julien Langou},
  title        = {Communication-optimal Parallel and Sequential {QR} and {LU} Factorizations},
  journal      = {{SIAM} J. Sci. Comput.},
  volume       = {34},
  number       = {1},
  pages        = {A206--A239},
  year         = {2012},
  url          = {https://doi.org/10.1137/080731992},
  doi          = {10.1137/080731992},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siamsc/DemmelGHL12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, IEEE Trans. Medical Imaging 31(6), 2012. The leading
% l1 symbol is written with standard math (ell with subscript 1) instead of
% a script-font macro that needs an extra package and has no lowercase
% glyphs; the whole l1-SPIRiT token is brace-protected to keep its casing.
@article{DBLP:journals/tmi/MurphyADKVL12,
  author       = {Mark Murphy and
                  Marcus T. Alley and
                  James Demmel and
                  Kurt Keutzer and
                  Shreyas Vasanawala and
                  Michael Lustig},
  title        = {Fast {$\ell_1$-SPIRiT} Compressed Sensing
                  Parallel Imaging {MRI:} Scalable Parallel Implementation and Clinically
                  Feasible Runtime},
  journal      = {{IEEE} Trans. Medical Imaging},
  volume       = {31},
  number       = {6},
  pages        = {1250--1262},
  year         = {2012},
  url          = {https://doi.org/10.1109/TMI.2012.2188039},
  doi          = {10.1109/TMI.2012.2188039},
  timestamp    = {Thu, 18 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tmi/MurphyADKVL12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% MedAlg 2012 conference paper (LNCS 7659). The doi and url fields hold the
% raw identifier: a backslash before the underscore would end up inside the
% generated hyperlink when the field is typeset verbatim.
@inproceedings{DBLP:conf/medalg/BallardDHLS12,
  author       = {Grey Ballard and
                  James Demmel and
                  Olga Holtz and
                  Benjamin Lipshitz and
                  Oded Schwartz},
  editor       = {Guy Even and
                  Dror Rawitz},
  title        = {Graph Expansion Analysis for Communication Costs of Fast Rectangular
                  Matrix Multiplication},
  booktitle    = {Design and Analysis of Algorithms - First Mediterranean Conference
                  on Algorithms, MedAlg 2012, Kibbutz Ein Gedi, Israel, December 3-5,
                  2012. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {7659},
  pages        = {13--36},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-34862-4_2},
  doi          = {10.1007/978-3-642-34862-4_2},
  timestamp    = {Sat, 19 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/medalg/BallardDHLS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% PPoPP 2012 conference paper; author and editor names use the Last, First form.
@inproceedings{DBLP:conf/ppopp/BallardDK12,
  author    = {Ballard, Grey and
               Demmel, James and
               Knight, Nicholas},
  editor    = {Ramanujam, J. and
               Sadayappan, P.},
  title     = {Communication avoiding successive band reduction},
  booktitle = {Proceedings of the 17th {ACM} {SIGPLAN} Symposium on Principles and
               Practice of Parallel Programming, {PPOPP} 2012, New Orleans, LA, USA,
               February 25-29, 2012},
  pages     = {35--44},
  publisher = {{ACM}},
  year      = {2012},
  url       = {https://doi.org/10.1145/2145816.2145822},
  doi       = {10.1145/2145816.2145822},
  timestamp = {Sun, 12 Jun 2022 19:46:08 +0200},
  biburl    = {https://dblp.org/rec/conf/ppopp/BallardDK12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SC 2012 conference paper. The proper noun Strassen is capitalised and
% brace-protected so sentence-casing styles cannot lowercase it.
@inproceedings{DBLP:conf/sc/LipshitzBDS12,
  author       = {Benjamin Lipshitz and
                  Grey Ballard and
                  James Demmel and
                  Oded Schwartz},
  editor       = {Jeffrey K. Hollingsworth},
  title        = {Communication-avoiding parallel {Strassen}: implementation and performance},
  booktitle    = {{SC} Conference on High Performance Computing Networking, Storage
                  and Analysis, {SC} '12, Salt Lake City, UT, {USA} - November 11 -
                  15, 2012},
  pages        = {101},
  publisher    = {{IEEE/ACM}},
  year         = {2012},
  url          = {https://doi.org/10.1109/SC.2012.33},
  doi          = {10.1109/SC.2012.33},
  timestamp    = {Sat, 19 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sc/LipshitzBDS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% SC 2012 Companion poster. ScaLAPACK is brace-protected, like MKL and
% BFS/DFS in the same title, so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/sc/DemmelEFKLSS12,
  author       = {James Demmel and
                  David Eliahu and
                  Armando Fox and
                  Shoaib Kamil and
                  Benjamin Lipshitz and
                  Oded Schwartz and
                  Omer Spillinger},
  title        = {Poster: Beating {MKL} and {ScaLAPACK} at Rectangular Matrix Multiplication
                  Using the {BFS/DFS} Approach},
  booktitle    = {2012 {SC} Companion: High Performance Computing, Networking Storage
                  and Analysis, Salt Lake City, UT, USA, November 10-16, 2012},
  pages        = {1370},
  publisher    = {{IEEE} Computer Society},
  year         = {2012},
  url          = {https://doi.org/10.1109/SC.Companion.2012.195},
  doi          = {10.1109/SC.COMPANION.2012.195},
  timestamp    = {Sat, 19 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sc/DemmelEFKLSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% SC 2012 Companion contribution; the author name uses the Last, First form.
@inproceedings{DBLP:conf/sc/Demmel12,
  author    = {Demmel, Jim},
  title     = {Communication avoiding algorithms},
  booktitle = {2012 {SC} Companion: High Performance Computing, Networking Storage
               and Analysis, Salt Lake City, UT, USA, November 10-16, 2012},
  pages     = {1942--2000},
  publisher = {{IEEE} Computer Society},
  year      = {2012},
  url       = {https://doi.org/10.1109/SC.Companion.2012.351},
  doi       = {10.1109/SC.COMPANION.2012.351},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/Demmel12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SPAA 2012 brief announcement; author and editor names use the Last, First form.
@inproceedings{DBLP:conf/spaa/BallardDHLS12,
  author    = {Ballard, Grey and
               Demmel, James and
               Holtz, Olga and
               Lipshitz, Benjamin and
               Schwartz, Oded},
  editor    = {Blelloch, Guy E. and
               Herlihy, Maurice},
  title     = {Brief announcement: strong scaling of matrix multiplication algorithms
               and memory-independent communication lower bounds},
  booktitle = {24th {ACM} Symposium on Parallelism in Algorithms and Architectures,
               {SPAA} '12, Pittsburgh, PA, USA, June 25-27, 2012},
  pages     = {77--79},
  publisher = {{ACM}},
  year      = {2012},
  url       = {https://doi.org/10.1145/2312005.2312021},
  doi       = {10.1145/2312005.2312021},
  timestamp = {Sat, 19 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/spaa/BallardDHLS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SPAA 2012 conference paper. The proper noun in the possessive Strassen's
% is capitalised and the whole word brace-protected against sentence casing.
@inproceedings{DBLP:conf/spaa/BallardDHLS12a,
  author       = {Grey Ballard and
                  James Demmel and
                  Olga Holtz and
                  Benjamin Lipshitz and
                  Oded Schwartz},
  editor       = {Guy E. Blelloch and
                  Maurice Herlihy},
  title        = {Communication-optimal parallel algorithm for {Strassen's} matrix multiplication},
  booktitle    = {24th {ACM} Symposium on Parallelism in Algorithms and Architectures,
                  {SPAA} '12, Pittsburgh, PA, USA, June 25-27, 2012},
  pages        = {193--204},
  publisher    = {{ACM}},
  year         = {2012},
  url          = {https://doi.org/10.1145/2312005.2312044},
  doi          = {10.1145/2312005.2312044},
  timestamp    = {Sat, 19 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/spaa/BallardDHLS12a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% VECPAR 2012 conference paper (LNCS 7851). The doi and url fields hold the
% raw identifier: a backslash before the underscore would end up inside the
% generated hyperlink when the field is typeset verbatim.
@inproceedings{DBLP:conf/vecpar/SolomonikD12,
  author       = {Edgar Solomonik and
                  James Demmel},
  editor       = {Michel J. Dayd{\'{e}} and
                  Osni Marques and
                  Kengo Nakajima},
  title        = {Matrix Multiplication on Multidimensional Torus Networks},
  booktitle    = {High Performance Computing for Computational Science - {VECPAR} 2012,
                  10th International Conference, Kobe, Japan, July 17-20, 2012, Revised
                  Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {7851},
  pages        = {201--215},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-38718-0_21},
  doi          = {10.1007/978-3-642-38718-0_21},
  timestamp    = {Tue, 14 May 2019 10:00:36 +0200},
  biburl       = {https://dblp.org/rec/conf/vecpar/SolomonikD12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) preprint 1202.3173. The possessive Strassen's is
% brace-protected so sentence-casing styles keep the proper noun capitalised.
@article{DBLP:journals/corr/abs-1202-3173,
  author       = {Grey Ballard and
                  James Demmel and
                  Olga Holtz and
                  Benjamin Lipshitz and
                  Oded Schwartz},
  title        = {Communication-Optimal Parallel Algorithm for {Strassen's} Matrix Multiplication},
  journal      = {CoRR},
  volume       = {abs/1202.3173},
  year         = {2012},
  url          = {http://arxiv.org/abs/1202.3173},
  eprinttype    = {arXiv},
  eprint       = {1202.3173},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1202-3173.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) preprint 1202.3177; author names use the Last, First form.
@article{DBLP:journals/corr/abs-1202-3177,
  author     = {Ballard, Grey and
                Demmel, James and
                Holtz, Olga and
                Lipshitz, Benjamin and
                Schwartz, Oded},
  title      = {Strong Scaling of Matrix Multiplication Algorithms and Memory-Independent
                Communication Lower Bounds},
  journal    = {CoRR},
  volume     = {abs/1202.3177},
  year       = {2012},
  url        = {http://arxiv.org/abs/1202.3177},
  eprinttype = {arXiv},
  eprint     = {1202.3177},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1202-3177.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) preprint 1208.2451; author names use the Last, First form.
@article{DBLP:journals/corr/abs-1208-2451,
  author     = {Khabou, Amal and
                Demmel, James and
                Grigori, Laura and
                Gu, Ming},
  title      = {{LU} factorization with panel rank revealing pivoting and its communication
                avoiding version},
  journal    = {CoRR},
  volume     = {abs/1208.2451},
  year       = {2012},
  url        = {http://arxiv.org/abs/1208.2451},
  eprinttype = {arXiv},
  eprint     = {1208.2451},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1208-2451.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) preprint 1209.2184; author names use the Last, First form.
@article{DBLP:journals/corr/abs-1209-2184,
  author     = {Ballard, Grey and
                Demmel, James and
                Holtz, Olga and
                Lipshitz, Benjamin and
                Schwartz, Oded},
  title      = {Graph Expansion Analysis for Communication Costs of Fast Rectangular
                Matrix Multiplication},
  journal    = {CoRR},
  volume     = {abs/1209.2184},
  year       = {2012},
  url        = {http://arxiv.org/abs/1209.2184},
  eprinttype = {arXiv},
  eprint     = {1209.2184},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1209-2184.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, SIAM J. Matrix Anal. Appl. 32(3), 2011; names use the Last, First form.
@article{DBLP:journals/siammax/BallardDHS11,
  author    = {Ballard, Grey and
               Demmel, James and
               Holtz, Olga and
               Schwartz, Oded},
  title     = {Minimizing Communication in Numerical Linear Algebra},
  journal   = {{SIAM} J. Matrix Anal. Appl.},
  volume    = {32},
  number    = {3},
  pages     = {866--901},
  year      = {2011},
  url       = {https://doi.org/10.1137/090769156},
  doi       = {10.1137/090769156},
  timestamp = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/siammax/BallardDHS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, SIAM J. Matrix Anal. Appl. 32(4), 2011; names use the Last, First form.
@article{DBLP:journals/siammax/GrigoriDX11,
  author    = {Grigori, Laura and
               Demmel, James and
               Xiang, Hua},
  title     = {{CALU:} {A} Communication Optimal {LU} Factorization Algorithm},
  journal   = {{SIAM} J. Matrix Anal. Appl.},
  volume    = {32},
  number    = {4},
  pages     = {1317--1350},
  year      = {2011},
  url       = {https://doi.org/10.1137/100788926},
  doi       = {10.1137/100788926},
  timestamp = {Tue, 26 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/siammax/GrigoriDX11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ALENEX 2011 contribution; author and editor names use the Last, First form.
@inproceedings{DBLP:conf/alenex/Demmel11,
  author    = {Demmel, James},
  editor    = {M{\"{u}}ller{-}Hannemann, Matthias and
               Werneck, Renato Fonseca F.},
  title     = {Avoiding Communication in Numerical Linear Algebra},
  booktitle = {Proceedings of the Thirteenth Workshop on Algorithm Engineering and
               Experiments, {ALENEX} 2011, Holiday Inn San Francisco Golden Gateway,
               San Francisco, California, USA, January 22, 2011},
  pages     = {59},
  publisher = {{SIAM}},
  year      = {2011},
  url       = {https://doi.org/10.1137/1.9781611972917.6},
  doi       = {10.1137/1.9781611972917.6},
  timestamp = {Wed, 14 Nov 2018 10:52:08 +0100},
  biburl    = {https://dblp.org/rec/conf/alenex/Demmel11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Euro-Par 2011 conference paper (LNCS 6853). The token 2.5D is
% brace-protected so sentence-casing styles keep the capital D, and the doi
% and url fields hold the raw identifier without a backslash before the
% underscore, which would otherwise end up inside the generated hyperlink.
@inproceedings{DBLP:conf/europar/SolomonikD11,
  author       = {Edgar Solomonik and
                  James Demmel},
  editor       = {Emmanuel Jeannot and
                  Raymond Namyst and
                  Jean Roman},
  title        = {Communication-Optimal Parallel {2.5D} Matrix Multiplication and {LU}
                  Factorization Algorithms},
  booktitle    = {Euro-Par 2011 Parallel Processing - 17th International Conference,
                  Euro-Par 2011, Bordeaux, France, August 29 - September 2, 2011, Proceedings,
                  Part {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {6853},
  pages        = {90--109},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-23397-5_10},
  doi          = {10.1007/978-3-642-23397-5_10},
  timestamp    = {Tue, 14 May 2019 10:00:46 +0200},
  biburl       = {https://dblp.org/rec/conf/europar/SolomonikD11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Hot Chips 23 (2011) contribution. The url points at the generic doi.org
% resolver, matching the other entries, rather than a publisher-specific
% resolver host.
@inproceedings{DBLP:conf/hotchips/Demmel11,
  author       = {Jim Demmel},
  title        = {Rethinking algorithms for future architectures: Communication-avoiding
                  algorithms},
  booktitle    = {2011 {IEEE} Hot Chips 23 Symposium (HCS), Stanford, CA, USA, August
                  17-19, 2011},
  pages        = {1--63},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/HOTCHIPS.2011.7477498},
  doi          = {10.1109/HOTCHIPS.2011.7477498},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/hotchips/Demmel11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IJCNN 2011 conference paper; author names use the Last, First form.
@inproceedings{DBLP:conf/ijcnn/MizutaniD11,
  author    = {Mizutani, Eiji and
               Demmel, James},
  title     = {On improving trust-region variable projection algorithms for separable
               nonlinear least squares learning},
  booktitle = {The 2011 International Joint Conference on Neural Networks, {IJCNN}
               2011, San Jose, California, USA, July 31 - August 5, 2011},
  pages     = {397--404},
  publisher = {{IEEE}},
  year      = {2011},
  url       = {https://doi.org/10.1109/IJCNN.2011.6033249},
  doi       = {10.1109/IJCNN.2011.6033249},
  timestamp = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ijcnn/MizutaniD11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IPDPS 2011 conference paper. GPUs is brace-protected, like QR in the same
% title, so sentence-casing styles keep the acronym capitalised.
@inproceedings{DBLP:conf/ipps/AndersonBDK11,
  author       = {Michael J. Anderson and
                  Grey Ballard and
                  James Demmel and
                  Kurt Keutzer},
  title        = {Communication-Avoiding {QR} Decomposition for {GPUs}},
  booktitle    = {25th {IEEE} International Symposium on Parallel and Distributed Processing,
                  {IPDPS} 2011, Anchorage, Alaska, USA, 16-20 May, 2011 - Conference
                  Proceedings},
  pages        = {48--58},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/IPDPS.2011.15},
  doi          = {10.1109/IPDPS.2011.15},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/AndersonBDK11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IPDPS 2011 conference paper; author names use the Last, First form.
@inproceedings{DBLP:conf/ipps/BulucWOD11,
  author    = {Bulu{\c{c}}, Aydin and
               Williams, Samuel and
               Oliker, Leonid and
               Demmel, James},
  title     = {Reduced-Bandwidth Multithreaded Algorithms for Sparse Matrix-Vector
               Multiplication},
  booktitle = {25th {IEEE} International Symposium on Parallel and Distributed Processing,
               {IPDPS} 2011, Anchorage, Alaska, USA, 16-20 May, 2011 - Conference
               Proceedings},
  pages     = {721--733},
  publisher = {{IEEE}},
  year      = {2011},
  url       = {https://doi.org/10.1109/IPDPS.2011.73},
  doi       = {10.1109/IPDPS.2011.73},
  timestamp = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ipps/BulucWOD11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SC 2011 conference paper; author and editor names use the Last, First form.
@inproceedings{DBLP:conf/sc/SolomonikBD11,
  author    = {Solomonik, Edgar and
               Bhatele, Abhinav and
               Demmel, James},
  editor    = {Lathrop, Scott A. and
               Costa, Jim and
               Kramer, William},
  title     = {Improving communication performance in dense linear algebra via topology
               aware collectives},
  booktitle = {Conference on High Performance Computing Networking, Storage and Analysis,
               {SC} 2011, Seattle, WA, USA, November 12-18, 2011},
  pages     = {77:1--77:11},
  publisher = {{ACM}},
  year      = {2011},
  url       = {https://doi.org/10.1145/2063384.2063487},
  doi       = {10.1145/2063384.2063487},
  timestamp = {Fri, 03 Jul 2020 08:57:23 +0200},
  biburl    = {https://dblp.org/rec/conf/sc/SolomonikBD11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SNC 2011 contribution. The booktitle spells International in full, and the
% proper noun Vandermonde is brace-protected against sentence casing.
@inproceedings{DBLP:conf/snc/Demmel11,
  author       = {James Demmel},
  editor       = {Marc Moreno Maza},
  title        = {Accurate and efficient expression evaluation and linear algebra, or
                  why it can be easier to compute accurate eigenvalues of a {Vandermonde}
                  matrix than the accurate sum of 3 numbers},
  booktitle    = {{SNC} 2011, Proceedings of the 2011 International Workshop on Symbolic-Numeric
                  Computation, San Jose, California, USA, June 7-9, 2011},
  pages        = {2},
  publisher    = {{ACM}},
  year         = {2011},
  url          = {https://doi.org/10.1145/2331684.2331686},
  doi          = {10.1145/2331684.2331686},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/snc/Demmel11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% SPAA 2011 conference paper. The second editor's compound surname is given
% in comma form with the surname braced, so BibTeX does not split it into a
% first-name part, a von part and a one-word last name.
@inproceedings{DBLP:conf/spaa/BallardDHS11,
  author       = {Grey Ballard and
                  James Demmel and
                  Olga Holtz and
                  Oded Schwartz},
  editor       = {Rajmohan Rajaraman and
                  {Meyer auf der Heide}, Friedhelm},
  title        = {Graph expansion and communication costs of fast matrix multiplication:
                  regular submission},
  booktitle    = {{SPAA} 2011: Proceedings of the 23rd Annual {ACM} Symposium on Parallelism
                  in Algorithms and Architectures, San Jose, CA, USA, June 4-6, 2011
                  (Co-located with {FCRC} 2011)},
  pages        = {1--12},
  publisher    = {{ACM}},
  year         = {2011},
  url          = {https://doi.org/10.1145/1989493.1989495},
  doi          = {10.1145/1989493.1989495},
  timestamp    = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/spaa/BallardDHS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% SPAA 2011 brief announcement. The second editor's compound surname is
% given in comma form with the surname braced, so BibTeX does not split it
% into a first-name part, a von part and a one-word last name.
@inproceedings{DBLP:conf/spaa/BallardDG11,
  author       = {Grey Ballard and
                  James Demmel and
                  Andrew Gearhart},
  editor       = {Rajmohan Rajaraman and
                  {Meyer auf der Heide}, Friedhelm},
  title        = {Brief announcement: communication bounds for heterogeneous architectures},
  booktitle    = {{SPAA} 2011: Proceedings of the 23rd Annual {ACM} Symposium on Parallelism
                  in Algorithms and Architectures, San Jose, CA, USA, June 4-6, 2011
                  (Co-located with {FCRC} 2011)},
  pages        = {257--258},
  publisher    = {{ACM}},
  year         = {2011},
  url          = {https://doi.org/10.1145/1989493.1989531},
  doi          = {10.1145/1989493.1989531},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/spaa/BallardDG11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Encyclopedia of Parallel Computing entry. The software name SuperLU is
% brace-protected so sentence-casing styles keep its capitals, and the doi
% and url fields hold the raw identifier without a backslash before the
% underscore, which would otherwise end up inside the generated hyperlink.
@incollection{DBLP:reference/parallel/LiDGGS11,
  author       = {Xiaoye Sherry Li and
                  James Demmel and
                  John R. Gilbert and
                  Laura Grigori and
                  Meiyue Shao},
  editor       = {David A. Padua},
  title        = {{SuperLU}},
  booktitle    = {Encyclopedia of Parallel Computing},
  pages        = {1955--1962},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-0-387-09766-4_95},
  doi          = {10.1007/978-0-387-09766-4_95},
  timestamp    = {Wed, 12 Jul 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/reference/parallel/LiDGGS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) preprint 1109.1693; author names use the Last, First form.
@article{DBLP:journals/corr/abs-1109-1693,
  author     = {Ballard, Grey and
                Demmel, James and
                Holtz, Olga and
                Schwartz, Oded},
  title      = {Graph Expansion and Communication Costs of Fast Matrix Multiplication},
  journal    = {CoRR},
  volume     = {abs/1109.1693},
  year       = {2011},
  url        = {http://arxiv.org/abs/1109.1693},
  eprinttype = {arXiv},
  eprint     = {1109.1693},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1109-1693.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, SIAM J. Sci. Comput. 32(6), 2010. The proper noun
% Cholesky is brace-protected so sentence-casing styles cannot lowercase it.
@article{DBLP:journals/siamsc/BallardDHS10,
  author       = {Grey Ballard and
                  James Demmel and
                  Olga Holtz and
                  Oded Schwartz},
  title        = {Communication-optimal Parallel and Sequential {Cholesky} Decomposition},
  journal      = {{SIAM} J. Sci. Comput.},
  volume       = {32},
  number       = {6},
  pages        = {3495--3523},
  year         = {2010},
  url          = {https://doi.org/10.1137/090760969},
  doi          = {10.1137/090760969},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siamsc/BallardDHS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% SPAA 2010 brief announcement. The proper noun Cholesky is brace-protected
% against sentence casing, and the first editor's compound surname is given
% in comma form with the surname braced so BibTeX does not split it into a
% first-name part, a von part and a one-word last name.
@inproceedings{DBLP:conf/spaa/GrigoriDDP10,
  author       = {Laura Grigori and
                  Pierre{-}Yves David and
                  James Demmel and
                  Sylvain Peyronnet},
  editor       = {{Meyer auf der Heide}, Friedhelm and
                  Cynthia A. Phillips},
  title        = {Brief announcement: Lower bounds on communication for sparse {Cholesky}
                  factorization of a model problem},
  booktitle    = {{SPAA} 2010: Proceedings of the 22nd Annual {ACM} Symposium on Parallelism
                  in Algorithms and Architectures, Thira, Santorini, Greece, June 13-15,
                  2010},
  pages        = {79--81},
  publisher    = {{ACM}},
  year         = {2010},
  url          = {https://doi.org/10.1145/1810479.1810496},
  doi          = {10.1145/1810479.1810496},
  timestamp    = {Wed, 21 Nov 2018 11:15:55 +0100},
  biburl       = {https://dblp.org/rec/conf/spaa/GrigoriDDP10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) preprint 1011.3077; author names use the Last, First form.
@article{DBLP:journals/corr/abs-1011-3077,
  author     = {Ballard, Grey and
                Demmel, James and
                Dumitriu, Ioana},
  title      = {Minimizing Communication for Eigenproblems and the Singular Value
                Decomposition},
  journal    = {CoRR},
  volume     = {abs/1011.3077},
  year       = {2010},
  url        = {http://arxiv.org/abs/1011.3077},
  eprinttype = {arXiv},
  eprint     = {1011.3077},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1011-3077.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Commun. ACM 52(10), 2009; author names use the Last, First form.
@article{DBLP:journals/cacm/AsanovicBDKKKMPSWWY09,
  author    = {Asanovic, Krste and
               Bod{\'{\i}}k, Rastislav and
               Demmel, James and
               Keaveny, Tony M. and
               Keutzer, Kurt and
               Kubiatowicz, John and
               Morgan, Nelson and
               Patterson, David A. and
               Sen, Koushik and
               Wawrzynek, John and
               Wessel, David and
               Yelick, Katherine A.},
  title     = {A view of the parallel computing landscape},
  journal   = {Commun. {ACM}},
  volume    = {52},
  number    = {10},
  pages     = {56--67},
  year      = {2009},
  url       = {https://doi.org/10.1145/1562764.1562783},
  doi       = {10.1145/1562764.1562783},
  timestamp = {Thu, 13 Apr 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/cacm/AsanovicBDKKKMPSWWY09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Parallel Comput. 35(3), 2009; author names use the Last, First form.
@article{DBLP:journals/pc/WilliamsOVSYD09,
  author    = {Williams, Samuel and
               Oliker, Leonid and
               Vuduc, Richard W. and
               Shalf, John and
               Yelick, Katherine A. and
               Demmel, James},
  title     = {Optimization of sparse matrix-vector multiplication on emerging multicore
               platforms},
  journal   = {Parallel Comput.},
  volume    = {35},
  number    = {3},
  pages     = {178--194},
  year      = {2009},
  url       = {https://doi.org/10.1016/j.parco.2008.12.006},
  doi       = {10.1016/J.PARCO.2008.12.006},
  timestamp = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/pc/WilliamsOVSYD09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siamsc/DemmelHHR09,
  author       = {Demmel, James and
                  Hoemmen, Mark and
                  Hida, Yozo and
                  Riedy, E. Jason},
  title        = {Nonnegative Diagonals and High Performance on Low-Profile Matrices
                  from {Householder} {QR}},
  journal      = {{SIAM} J. Sci. Comput.},
  volume       = {31},
  number       = {4},
  pages        = {2832--2841},
  year         = {2009},
  url          = {https://doi.org/10.1137/080725763},
  doi          = {10.1137/080725763},
  timestamp    = {Thu, 30 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siamsc/DemmelHHR09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/toms/DemmelHRL09,
  author       = {Demmel, James and
                  Hida, Yozo and
                  Riedy, E. Jason and
                  Li, Xiaoye S.},
  title        = {Extra-Precise Iterative Refinement for Overdetermined Least Squares Problems},
  journal      = {{ACM} Trans. Math. Softw.},
  volume       = {35},
  number       = {4},
  pages        = {28:1--28:32},
  year         = {2009},
  url          = {https://doi.org/10.1145/1462173.1462177},
  doi          = {10.1145/1462173.1462177},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/toms/DemmelHRL09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/MohiyuddinHDY09,
  author       = {Mohiyuddin, Marghoob and
                  Hoemmen, Mark and
                  Demmel, James and
                  Yelick, Katherine A.},
  title        = {Minimizing communication in sparse matrix solvers},
  booktitle    = {Proceedings of the {ACM/IEEE} Conference on High Performance
                  Computing, {SC} 2009, November 14-20, 2009, Portland, Oregon, {USA}},
  publisher    = {{ACM}},
  year         = {2009},
  url          = {https://doi.org/10.1145/1654059.1654096},
  doi          = {10.1145/1654059.1654096},
  timestamp    = {Tue, 06 Nov 2018 16:59:29 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/MohiyuddinHDY09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/spaa/BallardDHS09,
  author       = {Ballard, Grey and
                  Demmel, James and
                  Holtz, Olga and
                  Schwartz, Oded},
  editor       = {{Meyer auf der Heide}, Friedhelm and
                  Bender, Michael A.},
  title        = {Communication-optimal parallel and sequential {Cholesky} decomposition:
                  extended abstract},
  booktitle    = {{SPAA} 2009: Proceedings of the 21st Annual {ACM} Symposium on Parallelism
                  in Algorithms and Architectures, Calgary, Alberta, Canada, August
                  11-13, 2009},
  pages        = {245--252},
  publisher    = {{ACM}},
  year         = {2009},
  url          = {https://doi.org/10.1145/1583991.1584054},
  doi          = {10.1145/1583991.1584054},
  timestamp    = {Wed, 21 Nov 2018 11:15:22 +0100},
  biburl       = {https://dblp.org/rec/conf/spaa/BallardDHS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-0902-2537,
  author       = {Ballard, Grey and
                  Demmel, James and
                  Holtz, Olga and
                  Schwartz, Oded},
  title        = {Communication-optimal Parallel and Sequential {Cholesky} Decomposition},
  journal      = {CoRR},
  volume       = {abs/0902.2537},
  year         = {2009},
  url          = {http://arxiv.org/abs/0902.2537},
  eprinttype   = {arXiv},
  eprint       = {0902.2537},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-0902-2537.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-0905-2485,
  author       = {Ballard, Grey and
                  Demmel, James and
                  Holtz, Olga and
                  Schwartz, Oded},
  title        = {Minimizing Communication in Linear Algebra},
  journal      = {CoRR},
  volume       = {abs/0905.2485},
  year         = {2009},
  url          = {http://arxiv.org/abs/0905.2485},
  eprinttype   = {arXiv},
  eprint       = {0905.2485},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-0905-2485.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jgo/NieDG08,
  author       = {Nie, Jiawang and
                  Demmel, James and
                  Gu, Ming},
  title        = {Global minimization of rational functions and the nearest {GCDs}},
  journal      = {J. Glob. Optim.},
  volume       = {40},
  number       = {4},
  pages        = {697--718},
  year         = {2008},
  url          = {https://doi.org/10.1007/s10898-006-9119-8},
  doi          = {10.1007/S10898-006-9119-8},
  timestamp    = {Fri, 11 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jgo/NieDG08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/siamjo/NieD08,
  author       = {Nie, Jiawang and
                  Demmel, James},
  title        = {Sparse {SOS} Relaxations for Minimizing Functions that are
                  Summations of Small Polynomials},
  journal      = {{SIAM} J. Optim.},
  volume       = {19},
  number       = {4},
  pages        = {1534--1558},
  year         = {2008},
  url          = {https://doi.org/10.1137/060668791},
  doi          = {10.1137/060668791},
  timestamp    = {Mon, 08 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siamjo/NieD08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/siamsc/BindelDF08,
  author       = {Bindel, David and
                  Demmel, James and
                  Friedman, Mark J.},
  title        = {Continuation of Invariant Subspaces in Large Bifurcation Problems},
  journal      = {{SIAM} J. Sci. Comput.},
  volume       = {30},
  number       = {2},
  pages        = {637--656},
  year         = {2008},
  url          = {https://doi.org/10.1137/060654219},
  doi          = {10.1137/060654219},
  timestamp    = {Thu, 30 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siamsc/BindelDF08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/siamsc/DemmelMPV08,
  author       = {Demmel, James and
                  Marques, Osni and
                  Parlett, Beresford N. and
                  V{\"{o}}mel, Christof},
  title        = {Performance and Accuracy of {LAPACK}'s Symmetric Tridiagonal Eigensolvers},
  journal      = {{SIAM} J. Sci. Comput.},
  volume       = {30},
  number       = {3},
  pages        = {1508--1526},
  year         = {2008},
  url          = {https://doi.org/10.1137/070688778},
  doi          = {10.1137/070688778},
  timestamp    = {Thu, 30 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siamsc/DemmelMPV08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/toms/HowellDFHM08,
  author       = {Howell, Gary W. and
                  Demmel, James and
                  Fulton, Charles T. and
                  Hammarling, Sven and
                  Marmol, Karen},
  title        = {Cache efficient bidiagonalization using {BLAS} 2.5 operators},
  journal      = {{ACM} Trans. Math. Softw.},
  volume       = {34},
  number       = {3},
  pages        = {14:1--14:33},
  year         = {2008},
  url          = {https://doi.org/10.1145/1356052.1356055},
  doi          = {10.1145/1356052.1356055},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/toms/HowellDFHM08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/toms/MarquesVDP08,
  author       = {Marques, Osni and
                  V{\"{o}}mel, Christof and
                  Demmel, James and
                  Parlett, Beresford N.},
  title        = {Algorithm 880: {A} testing infrastructure for symmetric tridiagonal eigensolvers},
  journal      = {{ACM} Trans. Math. Softw.},
  volume       = {35},
  number       = {1},
  pages        = {8:1--8:13},
  year         = {2008},
  url          = {https://doi.org/10.1145/1377603.1377611},
  doi          = {10.1145/1377603.1377611},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/toms/MarquesVDP08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ipps/DemmelHMY08,
  author       = {Demmel, James and
                  Hoemmen, Mark and
                  Mohiyuddin, Marghoob and
                  Yelick, Katherine A.},
  title        = {Avoiding communication in sparse matrix computations},
  booktitle    = {22nd {IEEE} International Symposium on Parallel and Distributed
                  Processing, {IPDPS} 2008, Miami, Florida USA, April 14-18, 2008},
  pages        = {1--12},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/IPDPS.2008.4536305},
  doi          = {10.1109/IPDPS.2008.4536305},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/DemmelHMY08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/GrigoriDX08,
  author       = {Grigori, Laura and
                  Demmel, James and
                  Xiang, Hua},
  title        = {Communication avoiding {Gaussian} elimination},
  booktitle    = {Proceedings of the {ACM/IEEE} Conference on High Performance Computing,
                  {SC} 2008, November 15-21, 2008, Austin, Texas, {USA}},
  pages        = {29},
  publisher    = {{IEEE/ACM}},
  year         = {2008},
  url          = {https://doi.org/10.1109/SC.2008.5214287},
  doi          = {10.1109/SC.2008.5214287},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/GrigoriDX08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/VolkovD08,
  author       = {Volkov, Vasily and
                  Demmel, James},
  title        = {Benchmarking {GPUs} to tune dense linear algebra},
  booktitle    = {Proceedings of the {ACM/IEEE} Conference on High Performance Computing,
                  {SC} 2008, November 15-21, 2008, Austin, Texas, {USA}},
  pages        = {31},
  publisher    = {{IEEE/ACM}},
  year         = {2008},
  url          = {https://doi.org/10.1109/SC.2008.5214359},
  doi          = {10.1109/SC.2008.5214359},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/VolkovD08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-0806-2159,
  author       = {Demmel, James and
                  Grigori, Laura and
                  Hoemmen, Mark and
                  Langou, Julien},
  title        = {Communication-avoiding parallel and sequential {QR} factorizations},
  journal      = {CoRR},
  volume       = {abs/0806.2159},
  year         = {2008},
  url          = {http://arxiv.org/abs/0806.2159},
  eprinttype   = {arXiv},
  eprint       = {0806.2159},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-0806-2159.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/aaecc/NishtalaVDY07,
  author       = {Nishtala, Rajesh and
                  Vuduc, Richard W. and
                  Demmel, James and
                  Yelick, Katherine A.},
  title        = {When cache blocking of sparse matrix vector multiply works and why},
  journal      = {Appl. Algebra Eng. Commun. Comput.},
  volume       = {18},
  number       = {3},
  pages        = {297--311},
  year         = {2007},
  url          = {https://doi.org/10.1007/s00200-007-0038-9},
  doi          = {10.1007/S00200-007-0038-9},
  timestamp    = {Mon, 05 Jun 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aaecc/NishtalaVDY07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/nm/DemmelDHK07,
  author       = {Demmel, James and
                  Dumitriu, Ioana and
                  Holtz, Olga and
                  Kleinberg, Robert},
  title        = {Fast matrix multiplication is stable},
  journal      = {Numerische Mathematik},
  volume       = {106},
  number       = {2},
  pages        = {199--224},
  year         = {2007},
  url          = {https://doi.org/10.1007/s00211-007-0061-6},
  doi          = {10.1007/S00211-007-0061-6},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/nm/DemmelDHK07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/nm/DemmelDH07,
  author       = {Demmel, James and
                  Dumitriu, Ioana and
                  Holtz, Olga},
  title        = {Fast linear algebra is stable},
  journal      = {Numerische Mathematik},
  volume       = {108},
  number       = {1},
  pages        = {59--91},
  year         = {2007},
  url          = {https://doi.org/10.1007/s00211-007-0114-x},
  doi          = {10.1007/S00211-007-0114-X},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/nm/DemmelDH07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/siamsc/GrigoriDL07,
  author       = {Grigori, Laura and
                  Demmel, James and
                  Li, Xiaoye S.},
  title        = {Parallel Symbolic Factorization for Sparse {LU} with Static Pivoting},
  journal      = {{SIAM} J. Sci. Comput.},
  volume       = {29},
  number       = {3},
  pages        = {1289--1314},
  year         = {2007},
  url          = {https://doi.org/10.1137/050638102},
  doi          = {10.1137/050638102},
  timestamp    = {Thu, 30 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siamsc/GrigoriDL07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ipsn/KimPCDFGT07,
  author       = {Kim, Sukun and
                  Pakzad, Shamim and
                  Culler, David E. and
                  Demmel, James and
                  Fenves, Gregory and
                  Glaser, Steven D. and
                  Turon, Martin},
  editor       = {Abdelzaher, Tarek F. and
                  Guibas, Leonidas J. and
                  Welsh, Matt},
  title        = {Health monitoring of civil infrastructures using wireless sensor networks},
  booktitle    = {Proceedings of the 6th International Conference on Information
                  Processing in Sensor Networks, {IPSN} 2007, Cambridge, Massachusetts,
                  USA, April 25-27, 2007},
  pages        = {254--263},
  publisher    = {{ACM}},
  year         = {2007},
  url          = {https://doi.org/10.1145/1236360.1236395},
  doi          = {10.1145/1236360.1236395},
  timestamp    = {Thu, 26 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ipsn/KimPCDFGT07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/WilliamsOVSYD07,
  author       = {Williams, Samuel and
                  Oliker, Leonid and
                  Vuduc, Richard W. and
                  Shalf, John and
                  Yelick, Katherine A. and
                  Demmel, James},
  editor       = {Verastegui, Becky},
  title        = {Optimization of sparse matrix-vector multiplication on emerging multicore platforms},
  booktitle    = {Proceedings of the {ACM/IEEE} Conference on High Performance
                  Networking and Computing, {SC} 2007, November 10-16, 2007, Reno,
                  Nevada, {USA}},
  pages        = {38},
  publisher    = {{ACM} Press},
  year         = {2007},
  url          = {https://doi.org/10.1145/1362622.1362674},
  doi          = {10.1145/1362622.1362674},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sc/WilliamsOVSYD07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@incollection{DBLP:reference/crc/HidaDLKGBTLLMVLRDKPB07,
  author       = {Hida, Yozo and
                  Demmel, James and
                  Langou, Julien and
                  Kurzak, Jakub and
                  Gu, Ming and
                  Buttari, Alfredo and
                  Tomov, Stanimire and
                  Luszczek, Piotr and
                  Langou, Julie and
                  Marques, Osni and
                  V{\"{o}}mel, Christof and
                  Li, Xiaoye S. and
                  Riedy, E. Jason and
                  Dongarra, Jack J. and
                  Kahan, William and
                  Parlett, Beresford N. and
                  Bindel, David},
  editor       = {Rajasekaran, Sanguthevar and
                  Reif, John H.},
  title        = {Prospectus for a Dense Linear Algebra Software Library},
  booktitle    = {Handbook of Parallel Computing - Models, Algorithms and Applications},
  publisher    = {Chapman and Hall/CRC},
  year         = {2007},
  url          = {https://doi.org/10.1201/9781420011296.ch29},
  doi          = {10.1201/9781420011296.CH29},
  timestamp    = {Fri, 28 Jul 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/reference/crc/HidaDLKGBTLLMVLRDKPB07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-0712-4027,
  author       = {Demmel, James and
                  Dumitriu, Ioana and
                  Holtz, Olga and
                  Koev, Plamen},
  title        = {Accurate and Efficient Expression Evaluation and Linear Algebra},
  journal      = {CoRR},
  volume       = {abs/0712.4027},
  year         = {2007},
  url          = {http://arxiv.org/abs/0712.4027},
  eprinttype   = {arXiv},
  eprint       = {0712.4027},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-0712-4027.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/moc/DemmelK06,
  author       = {Demmel, James and
                  Koev, Plamen},
  title        = {Accurate and efficient evaluation of {Schur} and {Jack} functions},
  journal      = {Math. Comput.},
  volume       = {75},
  number       = {253},
  pages        = {223--239},
  year         = {2006},
  url          = {https://doi.org/10.1090/S0025-5718-05-01780-1},
  doi          = {10.1090/S0025-5718-05-01780-1},
  timestamp    = {Wed, 17 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/moc/DemmelK06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/mp/NieDS06,
  author       = {Nie, Jiawang and
                  Demmel, James and
                  Sturmfels, Bernd},
  title        = {Minimizing Polynomials via Sum of Squares over the Gradient Ideal},
  journal      = {Math. Program.},
  volume       = {106},
  number       = {3},
  pages        = {587--606},
  year         = {2006},
  url          = {https://doi.org/10.1007/s10107-005-0672-6},
  doi          = {10.1007/S10107-005-0672-6},
  timestamp    = {Sat, 27 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/mp/NieDS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/toms/DemmelHKLMR06,
  author       = {Demmel, James and
                  Hida, Yozo and
                  Kahan, William and
                  Li, Xiaoye S. and
                  Mukherjee, Sonil and
                  Riedy, E. Jason},
  title        = {Error bounds from extra-precise iterative refinement},
  journal      = {{ACM} Trans. Math. Softw.},
  volume       = {32},
  number       = {2},
  pages        = {325--351},
  year         = {2006},
  url          = {https://doi.org/10.1145/1141885.1141894},
  doi          = {10.1145/1141885.1141894},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/toms/DemmelHKLMR06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/para/DemmelDPKGBHLMRVLLKBLT06,
  author       = {Demmel, James and
                  Dongarra, Jack J. and
                  Parlett, Beresford N. and
                  Kahan, William and
                  Gu, Ming and
                  Bindel, David and
                  Hida, Yozo and
                  Li, Xiaoye S. and
                  Marques, Osni and
                  Riedy, E. Jason and
                  V{\"{o}}mel, Christof and
                  Langou, Julien and
                  Luszczek, Piotr and
                  Kurzak, Jakub and
                  Buttari, Alfredo and
                  Langou, Julie and
                  Tomov, Stanimire},
  editor       = {K{\aa}gstr{\"{o}}m, Bo and
                  Elmroth, Erik and
                  Dongarra, Jack J. and
                  Wasniewski, Jerzy},
  title        = {Prospectus for the Next {LAPACK} and {ScaLAPACK} Libraries},
  booktitle    = {Applied Parallel Computing. State of the Art in Scientific Computing,
                  8th International Workshop, {PARA} 2006, Ume{\aa}, Sweden, June 18-21,
                  2006, Revised Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {4699},
  pages        = {11--23},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/978-3-540-75755-9_2},
  doi          = {10.1007/978-3-540-75755-9_2},
  timestamp    = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/para/DemmelDPKGBHLMRVLLKBLT06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/para/KatagiriVD06,
  author       = {Katagiri, Takahiro and
                  V{\"{o}}mel, Christof and
                  Demmel, James},
  editor       = {K{\aa}gstr{\"{o}}m, Bo and
                  Elmroth, Erik and
                  Dongarra, Jack J. and
                  Wasniewski, Jerzy},
  title        = {Automatic Performance Tuning for the Multi-section with Multiple Eigenvalues
                  Method for Symmetric Tridiagonal Eigenproblems},
  booktitle    = {Applied Parallel Computing. State of the Art in Scientific Computing,
                  8th International Workshop, {PARA} 2006, Ume{\aa}, Sweden, June 18-21,
                  2006, Revised Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {4699},
  pages        = {938--948},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/978-3-540-75755-9_111},
  doi          = {10.1007/978-3-540-75755-9_111},
  timestamp    = {Thu, 25 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/para/KatagiriVD06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sensys/KimPCDFGT06,
  author       = {Kim, Sukun and
                  Pakzad, Shamim and
                  Culler, David E. and
                  Demmel, James and
                  Fenves, Gregory and
                  Glaser, Steven D. and
                  Turon, Martin},
  editor       = {Campbell, Andrew T. and
                  Bonnet, Philippe and
                  Heidemann, John S.},
  title        = {Wireless sensor networks for structural health monitoring},
  booktitle    = {Proceedings of the 4th International Conference on Embedded
                  Networked Sensor Systems, SenSys 2006, Boulder, Colorado, USA,
                  October 31 - November 3, 2006},
  pages        = {427--428},
  publisher    = {{ACM}},
  year         = {2006},
  url          = {https://doi.org/10.1145/1182807.1182889},
  doi          = {10.1145/1182807.1182889},
  timestamp    = {Thu, 26 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sensys/KimPCDFGT06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-math-0603207,
  author       = {Demmel, James and
                  Dumitriu, Ioana and
                  Holtz, Olga and
                  Kleinberg, Robert},
  title        = {Fast matrix multiplication is stable},
  journal      = {CoRR},
  volume       = {abs/math/0603207},
  year         = {2006},
  url          = {http://arxiv.org/abs/math/0603207},
  eprinttype   = {arXiv},
  eprint       = {math/0603207},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-math-0603207.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-math-0612264,
  author       = {Demmel, James and
                  Dumitriu, Ioana and
                  Holtz, Olga},
  title        = {Fast linear algebra is stable},
  journal      = {CoRR},
  volume       = {abs/math/0612264},
  year         = {2006},
  url          = {http://arxiv.org/abs/math/0612264},
  eprinttype   = {arXiv},
  eprint       = {math/0612264},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-math-0612264.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jgo/NieD05,
  author       = {Nie, Jiawang and
                  Demmel, James},
  title        = {Minimum Ellipsoid Bounds for Solutions of Polynomial Systems via
                  Sum of Squares},
  journal      = {J. Glob. Optim.},
  volume       = {33},
  number       = {4},
  pages        = {511--525},
  year         = {2005},
  url          = {https://doi.org/10.1007/s10898-005-2099-2},
  doi          = {10.1007/S10898-005-2099-2},
  timestamp    = {Fri, 11 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jgo/NieD05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/siammax/DemmelK05,
  author       = {Demmel, James and
                  Koev, Plamen},
  title        = {The Accurate and Efficient Solution of a Totally Positive Generalized
                  {Vandermonde} Linear System},
  journal      = {{SIAM} J. Matrix Anal. Appl.},
  volume       = {27},
  number       = {1},
  pages        = {142--152},
  year         = {2005},
  url          = {https://doi.org/10.1137/S0895479804440335},
  doi          = {10.1137/S0895479804440335},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/siammax/DemmelK05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iccS/BindelDFGK05,
  author       = {Bindel, David and
                  Demmel, James and
                  Friedman, Mark J. and
                  Govaerts, Willy and
                  Kuznetsov, Yuri A.},
  editor       = {Sunderam, Vaidy S. and
                  van Albada, G. Dick and
                  Sloot, Peter M. A. and
                  Dongarra, Jack J.},
  title        = {Bifurcation Analysis of Large Equilibrium Systems in {Matlab}},
  booktitle    = {Computational Science - {ICCS} 2005, 5th International Conference,
                  Atlanta, GA, USA, May 22-25, 2005, Proceedings, Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {3514},
  pages        = {50--57},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/11428831_7},
  doi          = {10.1007/11428831_7},
  timestamp    = {Tue, 14 May 2019 10:00:48 +0200},
  biburl       = {https://dblp.org/rec/conf/iccS/BindelDFGK05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/dagstuhl/DemmelDH05,
  author       = {Demmel, James and
                  Dumitriu, Ioana and
                  Holtz, Olga},
  editor       = {Buchberger, Bruno and
                  Oishi, Shin'ichi and
                  Plum, Michael and
                  Rump, Siegfried M.},
  title        = {Toward accurate polynomial evaluation in rounded arithmetic (short report)},
  booktitle    = {Algebraic and Numerical Algorithms and Computer-assisted Proofs,
                  25.-30. September 2005},
  series       = {Dagstuhl Seminar Proceedings},
  volume       = {05391},
  publisher    = {Internationales Begegnungs- und Forschungszentrum f{\"{u}}r
                  Informatik (IBFI), Schloss Dagstuhl, Germany},
  year         = {2005},
  url          = {http://drops.dagstuhl.de/opus/volltexte/2006/447},
  timestamp    = {Thu, 10 Jun 2021 13:02:04 +0200},
  biburl       = {https://dblp.org/rec/conf/dagstuhl/DemmelDH05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-math-0508350,
  author       = {Demmel, James and
                  Dumitriu, Ioana and
                  Holtz, Olga},
  title        = {Toward accurate polynomial evaluation in rounded arithmetic},
  journal      = {CoRR},
  volume       = {abs/math/0508350},
  year         = {2005},
  url          = {http://arxiv.org/abs/math/0508350},
  eprinttype   = {arXiv},
  eprint       = {math/0508350},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-math-0508350.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ijhpca/VuducDB04,
  author       = {Vuduc, Richard W. and
                  Demmel, James and
                  Bilmes, Jeff A.},
  title        = {Statistical Models for Empirical Search-Based Performance Tuning},
  journal      = {Int. J. High Perform. Comput. Appl.},
  volume       = {18},
  number       = {1},
  pages        = {65--94},
  year         = {2004},
  url          = {https://doi.org/10.1177/1094342004041293},
  doi          = {10.1177/1094342004041293},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ijhpca/VuducDB04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/na/DemmelH04,
  author       = {Demmel, James and
                  Hida, Yozo},
  title        = {Fast and Accurate Floating Point Summation with Application to Computational
                  Geometry},
  journal      = {Numer. Algorithms},
  volume       = {37},
  number       = {1--4},
  pages        = {101--112},
  year         = {2004},
  url          = {https://doi.org/10.1023/B:NUMA.0000049458.99541.38},
  doi          = {10.1023/B:NUMA.0000049458.99541.38},
  timestamp    = {Sat, 25 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/na/DemmelH04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/nm/DemmelK04,
  author       = {Demmel, James and
                  Koev, Plamen},
  title        = {Accurate {SVDs} of weakly diagonally dominant {M-matrices}},
  journal      = {Numerische Mathematik},
  volume       = {98},
  number       = {1},
  pages        = {99--104},
  year         = {2004},
  url          = {https://doi.org/10.1007/s00211-004-0527-8},
  doi          = {10.1007/S00211-004-0527-8},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/nm/DemmelK04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Demmel, Hida -- journal article, SIAM J. Sci. Comput. 25(4), 2004.
@article{DBLP:journals/siamsc/DemmelH04,
  author    = {Demmel, James and Hida, Yozo},
  title     = {Accurate and Efficient Floating Point Summation},
  journal   = {{SIAM} J. Sci. Comput.},
  volume    = {25},
  number    = {4},
  pages     = {1214--1248},
  year      = {2004},
  url       = {https://doi.org/10.1137/S1064827502407627},
  doi       = {10.1137/S1064827502407627},
  timestamp = {Thu, 30 Jul 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/siamsc/DemmelH04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Lee, Vuduc, Demmel, Yelick -- conference paper, ICPP 2004.
@inproceedings{DBLP:conf/icpp/LeeVDY04,
  author    = {Lee, Benjamin C. and Vuduc, Richard W. and
               Demmel, James and Yelick, Katherine A.},
  title     = {Performance Models for Evaluation and Automatic Tuning of
               Symmetric Sparse Matrix-Vector Multiply},
  booktitle = {33rd International Conference on Parallel Processing {(ICPP} 2004),
               15-18 August 2004, Montreal, Quebec, Canada},
  pages     = {169--176},
  publisher = {{IEEE} Computer Society},
  year      = {2004},
  url       = {https://doi.org/10.1109/ICPP.2004.1327917},
  doi       = {10.1109/ICPP.2004.1327917},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icpp/LeeVDY04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Bindel, Bai, Demmel -- workshop paper, PARA 2004 (LNCS 3732).
@inproceedings{DBLP:conf/para/BindelBD04,
  author    = {Bindel, David and Bai, Zhaojun and Demmel, James},
  editor    = {Dongarra, Jack J. and Madsen, Kaj and Wasniewski, Jerzy},
  title     = {Model Reduction for {RF} {MEMS} Simulation},
  booktitle = {Applied Parallel Computing, State of the Art in Scientific
               Computing, 7th International Workshop, {PARA} 2004, Lyngby,
               Denmark, June 20-23, 2004, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {3732},
  pages     = {286--295},
  publisher = {Springer},
  year      = {2004},
  url       = {https://doi.org/10.1007/11558958\_34},
  doi       = {10.1007/11558958\_34},
  timestamp = {Tue, 14 May 2019 10:00:40 +0200},
  biburl    = {https://dblp.org/rec/conf/para/BindelBD04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Im, Bustany, Ashcraft, Demmel, Yelick -- workshop paper, PARA 2004 (LNCS 3732).
@inproceedings{DBLP:conf/para/ImBADY04,
  author    = {Im, Eun{-}Jin and Bustany, Ismail and Ashcraft, Cleve and
               Demmel, James and Yelick, Katherine A.},
  editor    = {Dongarra, Jack J. and Madsen, Kaj and Wasniewski, Jerzy},
  title     = {Performance Tuning of Matrix Triple Products Based on Matrix Structure},
  booktitle = {Applied Parallel Computing, State of the Art in Scientific
               Computing, 7th International Workshop, {PARA} 2004, Lyngby,
               Denmark, June 20-23, 2004, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {3732},
  pages     = {740--746},
  publisher = {Springer},
  year      = {2004},
  url       = {https://doi.org/10.1007/11558958\_89},
  doi       = {10.1007/11558958\_89},
  timestamp = {Thu, 25 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/para/ImBADY04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Mizutani, Demmel -- journal article, Neural Networks 16, 2003.
% The double-issue range is written with a double hyphen so it renders as an en-dash, like the pages field.
@article{DBLP:journals/nn/MizutaniD03,
  author       = {Eiji Mizutani and
                  James Demmel},
  title        = {On structure-exploiting trust-region regularized nonlinear least squares
                  algorithms for neural-network learning},
  journal      = {Neural Networks},
  volume       = {16},
  number       = {5--6},
  pages        = {745--753},
  year         = {2003},
  url          = {https://doi.org/10.1016/S0893-6080(03)00085-6},
  doi          = {10.1016/S0893-6080(03)00085-6},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/nn/MizutaniD03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Li, Demmel -- journal article, ACM Trans. Math. Softw. 29(2), 2003.
% The software name SuperLU_DIST is braced as a whole so sentence-casing styles do not lowercase it.
@article{DBLP:journals/toms/LiD03,
  author       = {Xiaoye S. Li and
                  James Demmel},
  title        = {{SuperLU\_DIST}: {A} scalable distributed-memory sparse direct solver
                  for unsymmetric linear systems},
  journal      = {{ACM} Trans. Math. Softw.},
  volume       = {29},
  number       = {2},
  pages        = {110--140},
  year         = {2003},
  url          = {https://doi.org/10.1145/779359.779361},
  doi          = {10.1145/779359.779361},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/toms/LiD03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Vuduc, Gyulassy, Demmel, Yelick -- conference paper, ICCS 2003 Part III (LNCS 2659).
% The title ends in the matrix product A-transpose times A times x, typeset as braced math so styles leave it untouched.
@inproceedings{DBLP:conf/iccS/VuducGDY03,
  author       = {Rich Vuduc and
                  Attila Gyulassy and
                  James Demmel and
                  Katherine A. Yelick},
  editor       = {Peter M. A. Sloot and
                  David Abramson and
                  Alexander V. Bogdanov and
                  Jack J. Dongarra and
                  Albert Y. Zomaya and
                  Yuri E. Gorbachev},
  title        = {Memory Hierarchy Optimizations and Performance Bounds for Sparse
                  {$A^{T}Ax$}},
  booktitle    = {Computational Science - {ICCS} 2003, International Conference, Melbourne,
                  Australia and St. Petersburg, Russia, June 2-4, 2003. Proceedings,
                  Part {III}},
  series       = {Lecture Notes in Computer Science},
  volume       = {2659},
  pages        = {705--714},
  publisher    = {Springer},
  year         = {2003},
  url          = {https://doi.org/10.1007/3-540-44863-2\_69},
  doi          = {10.1007/3-540-44863-2\_69},
  timestamp    = {Tue, 20 Jun 2023 16:27:45 +0200},
  biburl       = {https://dblp.org/rec/conf/iccS/VuducGDY03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Mizutani, Demmel -- conference paper, NIPS 2003.
% Krylov, Pearlmutter's and Hessian are braced so sentence-casing styles keep them capitalised.
@inproceedings{DBLP:conf/nips/MizutaniD03,
  author       = {Eiji Mizutani and
                  James Demmel},
  editor       = {Sebastian Thrun and
                  Lawrence K. Saul and
                  Bernhard Sch{\"{o}}lkopf},
  title        = {Iterative Scaled Trust-Region Learning in {Krylov} Subspaces via {Pearlmutter's}
                  Implicit Sparse {Hessian}-Vector Multiply},
  booktitle    = {Advances in Neural Information Processing Systems 16 [Neural Information
                  Processing Systems, {NIPS} 2003, December 8-13, 2003, Vancouver and
                  Whistler, British Columbia, Canada]},
  pages        = {209--216},
  publisher    = {{MIT} Press},
  year         = {2003},
  url          = {https://proceedings.neurips.cc/paper/2003/hash/6ee69d3769e832ec77c9584e0b7ba112-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/MizutaniD03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Li, Demmel, et al. (13 authors) -- journal article, ACM Trans. Math. Softw. 28(2), 2002.
@article{DBLP:journals/toms/LiDBHHIKKKMTTY02,
  author    = {Li, Xiaoye S. and Demmel, James and Bailey, David H. and
               Henry, Greg and Hida, Yozo and Iskandar, Jimmy and
               Kahan, William and Kang, Suh Y. and Kapur, Anil and
               Martin, Michael C. and Thompson, Brandon and
               Tung, Teresa and Yoo, Daniel J.},
  title     = {Design, implementation and testing of extended and mixed
               precision {BLAS}},
  journal   = {{ACM} Trans. Math. Softw.},
  volume    = {28},
  number    = {2},
  pages     = {152--205},
  year      = {2002},
  url       = {https://doi.org/10.1145/567806.567808},
  doi       = {10.1145/567806.567808},
  timestamp = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/toms/LiDBHHIKKKMTTY02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Bindel, Demmel, Kahan, Marques -- journal article, ACM Trans. Math. Softw. 28(2), 2002.
% Givens is a proper noun: it is capitalised and braced so no style lowercases it.
@article{DBLP:journals/toms/BindelDKM02,
  author       = {David Bindel and
                  James Demmel and
                  William Kahan and
                  Osni Marques},
  title        = {On computing {Givens} rotations reliably and efficiently},
  journal      = {{ACM} Trans. Math. Softw.},
  volume       = {28},
  number       = {2},
  pages        = {206--238},
  year         = {2002},
  url          = {https://doi.org/10.1145/567806.567809},
  doi          = {10.1145/567806.567809},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/toms/BindelDKM02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Vuduc, Demmel, Yelick, Kamil, Nishtala, Lee -- conference paper, Supercomputing 2002.
@inproceedings{DBLP:conf/sc/VuducDYKNL02,
  author    = {Vuduc, Rich and Demmel, James and Yelick, Katherine A. and
               Kamil, Shoaib and Nishtala, Rajesh and Lee, Benjamin C.},
  editor    = {Giles, Roscoe C. and Reed, Daniel A. and Kelley, Kathryn},
  title     = {Performance optimizations and bounds for sparse matrix-vector multiply},
  booktitle = {Proceedings of the 2002 {ACM/IEEE} conference on Supercomputing,
               Baltimore, Maryland, USA, November 16-22, 2002, {CD-ROM}},
  pages     = {35:1--35:35},
  publisher = {{IEEE} Computer Society},
  year      = {2002},
  url       = {https://doi.org/10.1109/SC.2002.10025},
  doi       = {10.1109/SC.2002.10025},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/VuducDYKNL02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Demmel, Diament, Malajovich -- journal article, Found. Comput. Math. 1(1), 2001.
@article{DBLP:journals/focm/DemmelDM01,
  author    = {Demmel, James and Diament, Benjamin and Malajovich, Gregorio},
  title     = {On the Complexity of Computing Error Bounds},
  journal   = {Found. Comput. Math.},
  volume    = {1},
  number    = {1},
  pages     = {101--125},
  year      = {2001},
  url       = {https://doi.org/10.1007/s10208001004},
  doi       = {10.1007/S10208001004},
  timestamp = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/focm/DemmelDM01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Drummond, Demmel, Mechoso, Robinson, Sklower, Spahr -- conference paper, ICCS 2001 Part I (LNCS 2073).
@inproceedings{DBLP:conf/iccS/DrummondDMRSS01,
  author    = {Drummond, Leroy Anthony and Demmel, James and
               Mechoso, Carlos R. and Robinson, Howard and
               Sklower, Keith and Spahr, Joseph A.},
  editor    = {Alexandrov, Vassil N. and Dongarra, Jack J. and
               Juliano, Benjoe A. and Renner, Ren{\'{e}} S. and
               Tan, Chih Jeng Kenneth},
  title     = {A Data Broker for Distributed Computing Environments},
  booktitle = {Computational Science - {ICCS} 2001, International Conference,
               San Francisco, CA, USA, May 28-30, 2001. Proceedings, Part {I}},
  series    = {Lecture Notes in Computer Science},
  volume    = {2073},
  pages     = {31--40},
  publisher = {Springer},
  year      = {2001},
  url       = {https://doi.org/10.1007/3-540-45545-0\_13},
  doi       = {10.1007/3-540-45545-0\_13},
  timestamp = {Fri, 01 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iccS/DrummondDMRSS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Vuduc, Demmel, Bilmes -- conference paper, ICCS 2001 Part I (LNCS 2073).
@inproceedings{DBLP:conf/iccS/VuducDB01,
  author    = {Vuduc, Rich and Demmel, James and Bilmes, Jeff A.},
  editor    = {Alexandrov, Vassil N. and Dongarra, Jack J. and
               Juliano, Benjoe A. and Renner, Ren{\'{e}} S. and
               Tan, Chih Jeng Kenneth},
  title     = {Statistical Models for Automatic Performance Tuning},
  booktitle = {Computational Science - {ICCS} 2001, International Conference,
               San Francisco, CA, USA, May 28-30, 2001. Proceedings, Part {I}},
  series    = {Lecture Notes in Computer Science},
  volume    = {2073},
  pages     = {117--126},
  publisher = {Springer},
  year      = {2001},
  url       = {https://doi.org/10.1007/3-540-45545-0\_21},
  doi       = {10.1007/3-540-45545-0\_21},
  timestamp = {Sun, 04 Jun 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iccS/VuducDB01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Demmel -- journal article, SIAM J. Matrix Anal. Appl. 21(2), 2000.
@article{DBLP:journals/siammax/Demmel00,
  author    = {Demmel, James},
  title     = {Accurate Singular Value Decompositions of Structured Matrices},
  journal   = {{SIAM} J. Matrix Anal. Appl.},
  volume    = {21},
  number    = {2},
  pages     = {562--580},
  year      = {2000},
  url       = {https://doi.org/10.1137/S0895479897328716},
  doi       = {10.1137/S0895479897328716},
  timestamp = {Tue, 26 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/siammax/Demmel00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Demmel, Dieci, Friedman -- journal article, SIAM J. Sci. Comput. 22(1), 2000.
@article{DBLP:journals/siamsc/DemmelDF00,
  author    = {Demmel, James Weldon and Dieci, Luca and Friedman, Mark J.},
  title     = {Computing Connecting Orbits via an Improved Algorithm for
               Continuing Invariant Subspaces},
  journal   = {{SIAM} J. Sci. Comput.},
  volume    = {22},
  number    = {1},
  pages     = {81--94},
  year      = {2000},
  url       = {https://doi.org/10.1137/S1064827598344868},
  doi       = {10.1137/S1064827598344868},
  timestamp = {Thu, 30 Jul 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/siamsc/DemmelDF00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Mizutani, Demmel -- conference paper, NIPS 2000.
% Krylov is a proper noun and is braced so sentence-casing styles keep it capitalised.
@inproceedings{DBLP:conf/nips/MizutaniD00,
  author       = {Eiji Mizutani and
                  James Demmel},
  editor       = {Todd K. Leen and
                  Thomas G. Dietterich and
                  Volker Tresp},
  title        = {On Iterative {Krylov}-Dogleg Trust-Region Steps for Solving Neural Networks
                  Nonlinear Least Squares Problems},
  booktitle    = {Advances in Neural Information Processing Systems 13, Papers from
                  Neural Information Processing Systems {(NIPS)} 2000, Denver, CO, {USA}},
  pages        = {605--611},
  publisher    = {{MIT} Press},
  year         = {2000},
  url          = {https://proceedings.neurips.cc/paper/2000/hash/7ffd85d93a3e4de5c490d304ccd9f864-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/MizutaniD00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Vuduc, Demmel -- workshop paper, SAIG 2000 (LNCS 1924).
@inproceedings{DBLP:conf/saig/VuducD00,
  author    = {Vuduc, Rich and Demmel, James},
  editor    = {Taha, Walid},
  title     = {Code Generators for Automatic Tuning of Numerical Kernels:
               Experiences with {FFTW}},
  booktitle = {Semantics, Applications, and Implementation of Program
               Generation, International Workshop {SAIG} 2000, Montreal,
               Canada, September 20, 2000, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {1924},
  pages     = {190--211},
  publisher = {Springer},
  year      = {2000},
  url       = {https://doi.org/10.1007/3-540-45350-4\_14},
  doi       = {10.1007/3-540-45350-4\_14},
  timestamp = {Tue, 14 May 2019 10:00:40 +0200},
  biburl    = {https://dblp.org/rec/conf/saig/VuducD00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Demmel -- chapter 2 of the SIAM Templates book on algebraic eigenvalue problems, 2000.
% The series field carries the full SIAM series name, so entries from this series can share one spelling.
@incollection{DBLP:books/siam/00/Demmel00,
  author       = {James Demmel},
  editor       = {Zhaojun Bai and
                  James Demmel and
                  Jack J. Dongarra and
                  Axel Ruhe and
                  Henk A. van der Vorst},
  title        = {A Brief Tour of Eigenproblems},
  booktitle    = {Templates for the Solution of Algebraic Eigenvalue Problems},
  series       = {Software, Environments, and Tools},
  volume       = {11},
  pages        = {7--36},
  publisher    = {{SIAM}},
  year         = {2000},
  url          = {https://doi.org/10.1137/1.9780898719581.ch2},
  doi          = {10.1137/1.9780898719581.CH2},
  timestamp    = {Wed, 31 Jul 2019 12:12:21 +0200},
  biburl       = {https://dblp.org/rec/books/siam/00/Demmel00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Demmel -- chapter 6 of the SIAM Templates book on algebraic eigenvalue problems, 2000.
% The series field carries the full SIAM series name, so entries from this series can share one spelling.
@incollection{DBLP:books/siam/00/Demmel00a,
  author       = {James Demmel},
  editor       = {Zhaojun Bai and
                  James Demmel and
                  Jack J. Dongarra and
                  Axel Ruhe and
                  Henk A. van der Vorst},
  title        = {Singular Value Decomposition},
  booktitle    = {Templates for the Solution of Algebraic Eigenvalue Problems},
  series       = {Software, Environments, and Tools},
  volume       = {11},
  pages        = {135--147},
  publisher    = {{SIAM}},
  year         = {2000},
  url          = {https://doi.org/10.1137/1.9780898719581.ch6},
  doi          = {10.1137/1.9780898719581.CH6},
  timestamp    = {Wed, 31 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/books/siam/00/Demmel00a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Chen, Demmel, et al. (13 authors) -- chapter 7 of the SIAM Templates book on algebraic eigenvalue problems, 2000.
% Hermitian is braced so sentence-casing styles keep the capital; the series field carries the full SIAM series name.
@incollection{DBLP:books/siam/00/ChenDGSLSMBDFSVL00,
  author       = {T. Chen and
                  James Demmel and
                  Ming Gu and
                  Yousef Saad and
                  Richard B. Lehoucq and
                  Danny C. Sorensen and
                  Kristyn J. Maschhoff and
                  Zhaojun Bai and
                  David Day and
                  Roland W. Freund and
                  Gerard L. G. Sleijpen and
                  Henk A. van der Vorst and
                  Ruipeng Li},
  editor       = {Zhaojun Bai and
                  James Demmel and
                  Jack J. Dongarra and
                  Axel Ruhe and
                  Henk A. van der Vorst},
  title        = {Non-{Hermitian} Eigenvalue Problems},
  booktitle    = {Templates for the Solution of Algebraic Eigenvalue Problems},
  series       = {Software, Environments, and Tools},
  volume       = {11},
  pages        = {149--231},
  publisher    = {{SIAM}},
  year         = {2000},
  url          = {https://doi.org/10.1137/1.9780898719581.ch7},
  doi          = {10.1137/1.9780898719581.CH7},
  timestamp    = {Fri, 03 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/books/siam/00/ChenDGSLSMBDFSVL00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Dongarra, Koev, Li, Demmel, van der Vorst -- chapter 10 of the SIAM Templates book on algebraic eigenvalue problems, 2000.
% The series field carries the full SIAM series name, so entries from this series can share one spelling.
@incollection{DBLP:books/siam/00/DongarraKLDV00,
  author       = {Jack J. Dongarra and
                  Plamen Koev and
                  Xiaoye S. Li and
                  James Demmel and
                  Henk A. van der Vorst},
  editor       = {Zhaojun Bai and
                  James Demmel and
                  Jack J. Dongarra and
                  Axel Ruhe and
                  Henk A. van der Vorst},
  title        = {Common Issues},
  booktitle    = {Templates for the Solution of Algebraic Eigenvalue Problems},
  series       = {Software, Environments, and Tools},
  volume       = {11},
  pages        = {315--336},
  publisher    = {{SIAM}},
  year         = {2000},
  url          = {https://doi.org/10.1137/1.9780898719581.ch10},
  doi          = {10.1137/1.9780898719581.CH10},
  timestamp    = {Wed, 31 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/books/siam/00/DongarraKLDV00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Bai, Demmel, Dongarra, Ruhe, van der Vorst (editors) -- edited book, SIAM, 2000.
% The series field carries the full SIAM series name, so entries from this series can share one spelling.
@book{DBLP:books/siam/00/BDDRV2000,
  editor       = {Zhaojun Bai and
                  James Demmel and
                  Jack J. Dongarra and
                  Axel Ruhe and
                  Henk A. van der Vorst},
  title        = {Templates for the Solution of Algebraic Eigenvalue Problems},
  series       = {Software, Environments, and Tools},
  volume       = {11},
  publisher    = {{SIAM}},
  year         = {2000},
  url          = {https://doi.org/10.1137/1.9780898719581},
  doi          = {10.1137/1.9780898719581},
  isbn         = {978-0-89871-471-5},
  timestamp    = {Wed, 31 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/books/siam/00/BDDRV2000.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Anderson et al. (11 authors) -- LAPACK Users' Guide, third edition, SIAM, 1999.
% Names use the comma form so the two-word surname Du Croz is parsed as one surname
% rather than given names "Jeremy Du" plus surname "Croz". The series field carries the full SIAM series name.
@book{DBLP:books/siam/AndersonBCBDDCGHMS99,
  author       = {Anderson, Edward C. and
                  Bai, Zhaojun and
                  Bischof, Christian H. and
                  Blackford, L. Susan and
                  Demmel, James and
                  Dongarra, Jack J. and
                  Du Croz, Jeremy and
                  Greenbaum, Anne and
                  Hammarling, Sven and
                  McKenney, A. and
                  Sorensen, Danny C.},
  title        = {{LAPACK} Users' Guide, Third Edition},
  series       = {Software, Environments, and Tools},
  publisher    = {{SIAM}},
  year         = {1999},
  url          = {https://doi.org/10.1137/1.9780898719604},
  doi          = {10.1137/1.9780898719604},
  isbn         = {978-0-89871-447-0},
  timestamp    = {Mon, 13 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/books/siam/AndersonBCBDDCGHMS99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Demmel, Eisenstat, Gilbert, Li, Liu -- journal article, SIAM J. Matrix Anal. Appl. 20(3), 1999.
@article{DBLP:journals/siammax/DemmelEGLL99,
  author    = {Demmel, James Weldon and Eisenstat, Stanley C. and
               Gilbert, John R. and Li, Xiaoye S. and Liu, Joseph W. H.},
  title     = {A Supernodal Approach to Sparse Partial Pivoting},
  journal   = {{SIAM} J. Matrix Anal. Appl.},
  volume    = {20},
  number    = {3},
  pages     = {720--755},
  year      = {1999},
  url       = {https://doi.org/10.1137/S0895479895291765},
  doi       = {10.1137/S0895479895291765},
  timestamp = {Tue, 26 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/siammax/DemmelEGLL99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Demmel, Gilbert, Li -- journal article, SIAM J. Matrix Anal. Appl. 20(4), 1999.
% Gaussian is braced so sentence-casing styles keep the capital.
@article{DBLP:journals/siammax/DemmelGL99,
  author       = {James Weldon Demmel and
                  John R. Gilbert and
                  Xiaoye S. Li},
  title        = {An Asynchronous Parallel Supernodal Algorithm for Sparse {Gaussian}
                  Elimination},
  journal      = {{SIAM} J. Matrix Anal. Appl.},
  volume       = {20},
  number       = {4},
  pages        = {915--952},
  year         = {1999},
  url          = {https://doi.org/10.1137/S0895479897317685},
  doi          = {10.1137/S0895479897317685},
  timestamp    = {Tue, 26 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siammax/DemmelGL99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Li, Demmel -- conference paper, PPSC 1999 (the record carries no pages, URL or DOI).
@inproceedings{DBLP:conf/ppsc/LiD99,
  author    = {Li, Xiaoye S. and Demmel, James},
  title     = {A Scalable Sparse Direct Solver Using Static Pivoting},
  booktitle = {Proceedings of the Ninth {SIAM} Conference on Parallel
               Processing for Scientific Computing, {PPSC} 1999, San Antonio,
               Texas, USA, March 22-24, 1999},
  publisher = {{SIAM}},
  year      = {1999},
  timestamp = {Mon, 20 Mar 2017 14:21:45 +0100},
  biburl    = {https://dblp.org/rec/conf/ppsc/LiD99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Adams, Demmel -- conference paper, SC 1999.
% The abbreviation 3D is braced so sentence-casing styles do not turn it into "3d".
@inproceedings{DBLP:conf/sc/AdamsD99,
  author       = {Mark Adams and
                  Jim Demmel},
  title        = {Parallel Multigrid Solver for {3D} Unstructured Finite Element Problems},
  booktitle    = {Proceedings of the {ACM/IEEE} Conference on Supercomputing, {SC} 1999,
                  November 13-19, 1999, Portland, Oregon, {USA}},
  pages        = {27},
  publisher    = {{ACM}},
  year         = {1999},
  url          = {https://doi.org/10.1145/331532.331559},
  doi          = {10.1145/331532.331559},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/AdamsD99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Demmel -- invited talk abstract, SPAA 1999.
@inproceedings{DBLP:conf/spaa/Demmel99,
  author    = {Demmel, James},
  editor    = {Miller, Gary L. and Ramachandran, Vijaya},
  title     = {Making Sparse Matrix Computations Scalable (Invited Talk Abstract)},
  booktitle = {Proceedings of the Eleventh Annual {ACM} Symposium on Parallel
               Algorithms and Architectures, {SPAA} '99, Saint-Malo, France,
               June 27-30, 1999},
  pages     = {43},
  publisher = {{ACM}},
  year      = {1999},
  url       = {https://doi.org/10.1145/305619.305624},
  doi       = {10.1145/305619.305624},
  timestamp = {Wed, 21 Nov 2018 12:27:44 +0100},
  biburl    = {https://dblp.org/rec/conf/spaa/Demmel99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Saltz, Sussman, Graham, Demmel, Baden, Dongarra -- journal article, Commun. ACM 41(11), 1998.
@article{DBLP:journals/cacm/SaltzSGDBD98,
  author    = {Saltz, Joel H. and Sussman, Alan and Graham, Susan L. and
               Demmel, James and Baden, Scott B. and Dongarra, Jack J.},
  title     = {Programming Tools and Environments},
  journal   = {Commun. {ACM}},
  volume    = {41},
  number    = {11},
  pages     = {64--73},
  year      = {1998},
  url       = {https://doi.org/10.1145/287831.287841},
  doi       = {10.1145/287831.287841},
  timestamp = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/cacm/SaltzSGDBD98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Bai, Demmel -- journal article, SIAM J. Matrix Anal. Appl. 19(1), 1998.
@article{DBLP:journals/siammax/BaiD98,
  author    = {Bai, Zhaojun and Demmel, James},
  title     = {Using the Matrix Sign Function to Compute Invariant Subspaces},
  journal   = {{SIAM} J. Matrix Anal. Appl.},
  volume    = {19},
  number    = {1},
  pages     = {205--225},
  year      = {1998},
  url       = {https://doi.org/10.1137/s0895479896297719},
  doi       = {10.1137/S0895479896297719},
  timestamp = {Sun, 13 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/siammax/BaiD98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Li, Demmel -- conference paper, SC 1998.
% Gaussian is braced so sentence-casing styles keep the capital.
@inproceedings{DBLP:conf/sc/LiD98,
  author       = {Xiaoye S. Li and
                  James Demmel},
  title        = {Making Sparse {Gaussian} Elimination Scalable by Static Pivoting},
  booktitle    = {Proceedings of the {ACM/IEEE} Conference on Supercomputing, {SC} 1998,
                  November 7-13, 1998, Orlando, FL, {USA}},
  pages        = {34},
  publisher    = {{IEEE} Computer Society},
  year         = {1998},
  url          = {https://doi.org/10.1109/SC.1998.10030},
  doi          = {10.1109/SC.1998.10030},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/LiD98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Demmel -- textbook, SIAM, 1997.
@book{DBLP:books/daglib/0041378,
  author    = {Demmel, James},
  title     = {Applied Numerical Linear Algebra},
  publisher = {{SIAM}},
  year      = {1997},
  url       = {https://doi.org/10.1137/1.9781611971446},
  doi       = {10.1137/1.9781611971446},
  isbn      = {978-0-898713-89-3},
  timestamp = {Wed, 24 Jul 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/books/daglib/0041378.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Chakrabarti, Demmel, Yelick -- journal article, J. Parallel Distributed Comput. 47(2), 1997.
@article{DBLP:journals/jpdc/ChakrabartiDY97,
  author    = {Chakrabarti, Soumen and Demmel, James and Yelick, Katherine A.},
  title     = {Models and Scheduling Algorithms for Mixed Data and Task
               Parallel Programs},
  journal   = {J. Parallel Distributed Comput.},
  volume    = {47},
  number    = {2},
  pages     = {168--184},
  year      = {1997},
  url       = {https://doi.org/10.1006/jpdc.1997.1413},
  doi       = {10.1006/JPDC.1997.1413},
  timestamp = {Sat, 22 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/jpdc/ChakrabartiDY97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Bai, Demmel, Dongarra, Petitet, Robinson, Stanley -- journal article, SIAM J. Sci. Comput. 18(5), 1997.
@article{DBLP:journals/siamsc/BaiDDPRS97,
  author    = {Bai, Zhaojun and Demmel, James and Dongarra, Jack J. and
               Petitet, Antoine and Robinson, Howard and Stanley, Ken},
  title     = {The Spectral Decomposition of Nonsymmetric Matrices on
               Distributed Memory Parallel Computers},
  journal   = {{SIAM} J. Sci. Comput.},
  volume    = {18},
  number    = {5},
  pages     = {1446--1461},
  year      = {1997},
  url       = {https://doi.org/10.1137/S1064827595281368},
  doi       = {10.1137/S1064827595281368},
  timestamp = {Thu, 30 Jul 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/siamsc/BaiDDPRS97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Blackford et al. (10 authors) -- journal article, ACM Trans. Math. Softw. 23(2), 1997.
@article{DBLP:journals/toms/BlackfordCPWDDRSDH97,
  author    = {Blackford, L. Susan and Cleary, Andrew J. and
               Petitet, Antoine and Whaley, R. Clinton and
               Demmel, James and Dhillon, Inderjit S. and
               Ren, H. and Stanley, Ken and
               Dongarra, Jack J. and Hammarling, Sven},
  title     = {Practical Experience in the Numerical Dangers of Heterogeneous Computing},
  journal   = {{ACM} Trans. Math. Softw.},
  volume    = {23},
  number    = {2},
  pages     = {133--147},
  year      = {1997},
  url       = {https://doi.org/10.1145/264029.264030},
  doi       = {10.1145/264029.264030},
  timestamp = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/toms/BlackfordCPWDDRSDH97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Bilmes, Asanovic, Chin, Demmel -- conference paper, ICASSP 1997.
% The mixed-case name PHiPAC is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/icassp/BilmesACD97,
  author       = {Jeff A. Bilmes and
                  Krste Asanovic and
                  Chee{-}Whye Chin and
                  James Demmel},
  title        = {Using {PHiPAC} to speed error back-propagation learning},
  booktitle    = {1997 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} '97, Munich, Germany, April 21-24, 1997},
  pages        = {4153--4156},
  publisher    = {{IEEE} Computer Society},
  year         = {1997},
  url          = {https://doi.org/10.1109/ICASSP.1997.604861},
  doi          = {10.1109/ICASSP.1997.604861},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/BilmesACD97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Bilmes, Asanovic, Chin, Demmel -- conference paper, ICS 1997.
% The mixed-case name PHiPAC is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/ics/BilmesACD97,
  author       = {Jeff A. Bilmes and
                  Krste Asanovic and
                  Chee{-}Whye Chin and
                  James Demmel},
  editor       = {Steven J. Wallach and
                  Hans P. Zima},
  title        = {Optimizing Matrix Multiply Using {PHiPAC}: {A} Portable, High-Performance,
                  {ANSI} {C} Coding Methodology},
  booktitle    = {Proceedings of the 11th international conference on Supercomputing,
                  {ICS} 1997, Vienna, Austria, July 7-11, 1997},
  pages        = {340--347},
  publisher    = {{ACM}},
  year         = {1997},
  url          = {https://doi.org/10.1145/263580.263662},
  doi          = {10.1145/263580.263662},
  timestamp    = {Tue, 06 Nov 2018 11:07:03 +0100},
  biburl       = {https://dblp.org/rec/conf/ics/BilmesACD97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ppsc/BlackfordCCDDDDHHPSWW97,
  author       = {Blackford, L. Susan and
                  Choi, Jaeyoung and
                  Cleary, Andrew J. and
                  D'Azevedo, Eduardo F. and
                  Demmel, James and
                  Dhillon, Inderjit S. and
                  Dongarra, Jack J. and
                  Hammarling, Sven and
                  Henry, Greg and
                  Petitet, Antoine and
                  Stanley, Ken and
                  Walker, David W. and
                  Whaley, R. Clinton},
  title        = {{ScaLAPACK}: {A} Linear Algebra Library for Message-Passing Computers},
  booktitle    = {Proceedings of the Eighth {SIAM} Conference on Parallel Processing
                  for Scientific Computing, {PPSC} 1997, Hyatt Regency Minneapolis on
                  Nicollet Mall Hotel, Minneapolis, Minnesota, USA, March 14-17, 1997},
  publisher    = {{SIAM}},
  year         = {1997},
  timestamp    = {Mon, 21 Aug 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ppsc/BlackfordCCDDDDHHPSWW97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/para/ClearyDDDHPRSW96,
  author       = {Cleary, Andrew J. and
                  Demmel, James and
                  Dhillon, Inderjit S. and
                  Dongarra, Jack J. and
                  Hammarling, Sven and
                  Petitet, Antoine and
                  Ren, H. and
                  Stanley, Ken and
                  Whaley, R. Clinton},
  editor       = {Wasniewski, Jerzy and
                  Dongarra, Jack J. and
                  Madsen, Kaj and
                  Olesen, Dorte},
  title        = {Practical Experience in the Dangers of Heterogeneous Computing},
  booktitle    = {Applied Parallel Computing, Industrial Computation and Optimization,
                  Third International Workshop, {PARA} 96, Lyngby, Denmark, August 18-21,
                  1996, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {1184},
  pages        = {57--64},
  publisher    = {Springer},
  year         = {1996},
  url          = {https://doi.org/10.1007/3-540-62095-8\_7},
  doi          = {10.1007/3-540-62095-8\_7},
  timestamp    = {Tue, 14 May 2019 10:00:40 +0200},
  biburl       = {https://dblp.org/rec/conf/para/ClearyDDDHPRSW96.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sc/BlackfordCCDDDHHPSWW96,
  author       = {Blackford, L. Susan and
                  Choi, Jaeyoung and
                  Cleary, Andrew J. and
                  Demmel, James and
                  Dhillon, Inderjit S. and
                  Dongarra, Jack J. and
                  Hammarling, Sven and
                  Henry, Greg and
                  Petitet, Antoine and
                  Stanley, Ken and
                  Walker, David W. and
                  Whaley, R. Clinton},
  title        = {{ScaLAPACK}: {A} Portable Linear Algebra Library for Distributed Memory
                  Computers - Design Issues and Performance},
  booktitle    = {Proceedings of the 1996 {ACM/IEEE} Conference on Supercomputing, November
                  17-22, 1996, Pittsburgh, PA, {USA}},
  pages        = {5},
  publisher    = {{IEEE} Computer Society},
  year         = {1996},
  url          = {https://doi.ieeecomputersociety.org/10.1109/SC.1996.41},
  doi          = {10.1109/SC.1996.41},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/BlackfordCCDDDHHPSWW96.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cvgip/ManochaD95,
  author       = {Manocha, Dinesh and
                  Demmel, James},
  title        = {Algorithms for Intersecting Parametric and Algebraic Curves {II:}
                  Multiple Intersections},
  journal      = {{CVGIP} Graph. Model. Image Process.},
  volume       = {57},
  number       = {2},
  pages        = {81--100},
  year         = {1995},
  url          = {https://doi.org/10.1006/gmip.1995.1010},
  doi          = {10.1006/GMIP.1995.1010},
  timestamp    = {Thu, 14 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/cvgip/ManochaD95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nla/DemmelHS95,
  author       = {Demmel, James Weldon and
                  Higham, Nicholas J. and
                  Schreiber, Robert S.},
  title        = {Stability of block \emph{LU} factorization},
  journal      = {Numer. Linear Algebra Appl.},
  volume       = {2},
  number       = {2},
  pages        = {173--190},
  year         = {1995},
  url          = {https://doi.org/10.1002/nla.1680020208},
  doi          = {10.1002/NLA.1680020208},
  timestamp    = {Mon, 11 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/nla/DemmelHS95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/para/ChoiDDDOPSWW95,
  author       = {Choi, Jaeyoung and
                  Demmel, James and
                  Dhillon, Inderjit S. and
                  Dongarra, Jack J. and
                  Ostrouchov, Susan and
                  Petitet, Antoine and
                  Stanley, Ken and
                  Walker, David W. and
                  Whaley, R. Clinton},
  editor       = {Dongarra, Jack J. and
                  Madsen, Kaj and
                  Wasniewski, Jerzy},
  title        = {{ScaLAPACK}: {A} Portable Linear Algebra Library for Distributed Memory
                  Computers - Design Issues and Performance},
  booktitle    = {Applied Parallel Computing, Computations in Physics, Chemistry and
                  Engineering Science, Second International Workshop, {PARA} '95, Lyngby,
                  Denmark, August 21-24, 1995, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {1041},
  pages        = {95--106},
  publisher    = {Springer},
  year         = {1995},
  url          = {https://doi.org/10.1007/3-540-60902-4\_12},
  doi          = {10.1007/3-540-60902-4\_12},
  timestamp    = {Tue, 14 May 2019 10:00:40 +0200},
  biburl       = {https://dblp.org/rec/conf/para/ChoiDDDOPSWW95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ppsc/DemmelS95,
  author       = {Demmel, James and
                  Stanley, Ken},
  editor       = {Bailey, David H. and
                  Bj{\o}rstad, Petter E. and
                  Gilbert, John R. and
                  Mascagni, Michael and
                  Schreiber, Robert S. and
                  Simon, Horst D. and
                  Torczon, Virginia and
                  Watson, Layne T.},
  title        = {The Performance of Finding Eigenvalues and Eigenvectors of Dense
                  Symmetric Matrices on Distributed Memory Computers},
  booktitle    = {Proceedings of the Seventh {SIAM} Conference on Parallel Processing
                  for Scientific Computing, {PPSC} 1995, San Francisco, California,
                  USA, February 15-17, 1995},
  pages        = {528--533},
  publisher    = {{SIAM}},
  year         = {1995},
  timestamp    = {Mon, 20 Mar 2017 14:21:45 +0100},
  biburl       = {https://dblp.org/rec/conf/ppsc/DemmelS95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sc/DemmelS95,
  author       = {Demmel, James and
                  Smith, Sharon},
  editor       = {Karin, Sidney},
  title        = {Performance of a Parallel Global Atmospheric Chemical Tracer Model},
  booktitle    = {Proceedings Supercomputing '95, San Diego, CA, USA, December 4-8,
                  1995},
  pages        = {80},
  publisher    = {{ACM}},
  year         = {1995},
  url          = {https://doi.org/10.1145/224170.224504},
  doi          = {10.1145/224170.224504},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/DemmelS95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/spaa/ChakrabartiDY95,
  author       = {Chakrabarti, Soumen and
                  Demmel, James and
                  Yelick, Katherine A.},
  editor       = {Leiserson, Charles E.},
  title        = {Modeling the Benefits of Mixed Data and Task Parallelism},
  booktitle    = {7th Annual {ACM} Symposium on Parallel Algorithms and Architectures,
                  {SPAA} '95, Santa Barbara, California, USA, July 17-19, 1995},
  pages        = {74--83},
  publisher    = {{ACM}},
  year         = {1995},
  url          = {https://doi.org/10.1145/215399.215423},
  doi          = {10.1145/215399.215423},
  timestamp    = {Wed, 21 Nov 2018 12:27:44 +0100},
  biburl       = {https://dblp.org/rec/conf/spaa/ChakrabartiDY95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:books/sp/cstoday95/BaiDDDGRV95,
  author       = {Bai, Zhaojun and
                  Day, David and
                  Demmel, James and
                  Dongarra, Jack J. and
                  Gu, Ming and
                  Ruhe, Axel and
                  van der Vorst, Henk A.},
  editor       = {van Leeuwen, Jan},
  title        = {Templates for Linear Algebra Problems},
  booktitle    = {Computer Science Today: Recent Trends and Developments},
  series       = {Lecture Notes in Computer Science},
  volume       = {1000},
  pages        = {115--140},
  publisher    = {Springer},
  year         = {1995},
  url          = {https://doi.org/10.1007/BFb0015240},
  doi          = {10.1007/BFB0015240},
  timestamp    = {Tue, 14 May 2019 10:00:35 +0200},
  biburl       = {https://dblp.org/rec/books/sp/cstoday95/BaiDDDGRV95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@book{DBLP:books/siam/BarrettBCDDDEPRV94,
  author       = {Barrett, Richard F. and
                  Berry, Michael W. and
                  Chan, Tony F. and
                  Demmel, James and
                  Donato, June M. and
                  Dongarra, Jack J. and
                  Eijkhout, Victor and
                  Pozo, Roldan and
                  Romine, Charles H. and
                  van der Vorst, Henk A.},
  title        = {Templates for the Solution of Linear Systems: Building Blocks for
                  Iterative Methods},
  series       = {Other Titles in Applied Mathematics},
  publisher    = {{SIAM}},
  year         = {1994},
  url          = {https://doi.org/10.1137/1.9781611971538},
  doi          = {10.1137/1.9781611971538},
  isbn         = {978-0-89871-328-2},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/books/siam/BarrettBCDDDEPRV94.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tc/DemmelL94,
  author       = {Demmel, James and
                  Li, Xiaoye S.},
  title        = {Faster Numerical Algorithms via Exception Handling},
  journal      = {{IEEE} Trans. Computers},
  volume       = {43},
  number       = {8},
  pages        = {983--992},
  year         = {1994},
  url          = {https://doi.org/10.1109/12.295860},
  doi          = {10.1109/12.295860},
  timestamp    = {Sat, 20 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tc/DemmelL94.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tog/ManochaD94,
  author       = {Manocha, Dinesh and
                  Demmel, James},
  title        = {Algorithms for intersecting parametric and algebraic curves {I:} simple
                  intersections},
  journal      = {{ACM} Trans. Graph.},
  volume       = {13},
  number       = {1},
  pages        = {73--100},
  year         = {1994},
  url          = {https://doi.org/10.1145/174462.174617},
  doi          = {10.1145/174462.174617},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tog/ManochaD94.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jc/PanD93,
  author       = {Pan, Victor Y. and
                  Demmel, James},
  title        = {A New Algorithm for the Symmetric Tridiagonal Eigenvalue Problem},
  journal      = {J. Complex.},
  volume       = {9},
  number       = {3},
  pages        = {387--405},
  year         = {1993},
  url          = {https://doi.org/10.1006/jcom.1993.1025},
  doi          = {10.1006/JCOM.1993.1025},
  timestamp    = {Mon, 03 Apr 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jc/PanD93.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siammax/DemmelH93,
  author       = {Demmel, James Weldon and
                  Higham, Nicholas J.},
  title        = {Improved Error Bounds for Underdetermined System Solvers},
  journal      = {{SIAM} J. Matrix Anal. Appl.},
  volume       = {14},
  number       = {1},
  pages        = {1--14},
  year         = {1993},
  url          = {https://doi.org/10.1137/0614001},
  doi          = {10.1137/0614001},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siammax/DemmelH93.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siamsc/BaiD93,
  author       = {Bai, Zhaojun and
                  Demmel, James Weldon},
  title        = {Computing the Generalized Singular Value Decomposition},
  journal      = {{SIAM} J. Sci. Comput.},
  volume       = {14},
  number       = {6},
  pages        = {1464--1486},
  year         = {1993},
  url          = {https://doi.org/10.1137/0914085},
  doi          = {10.1137/0914085},
  timestamp    = {Thu, 30 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siamsc/BaiD93.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/toms/DemmelK93,
  author       = {Demmel, James and
                  K{\aa}gstr{\"{o}}m, Bo},
  title        = {The generalized {Schur} decomposition of an arbitrary pencil {\(A-\lambda B\)}
                  - robust software with error bounds and applications. Part {I:} theory
                  and algorithms},
  journal      = {{ACM} Trans. Math. Softw.},
  volume       = {19},
  number       = {2},
  pages        = {160--174},
  year         = {1993},
  url          = {https://doi.org/10.1145/152613.152615},
  doi          = {10.1145/152613.152615},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/toms/DemmelK93.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/toms/DemmelK93a,
  author       = {Demmel, James and
                  K{\aa}gstr{\"{o}}m, Bo},
  title        = {The generalized {Schur} decomposition of an arbitrary pencil {\(A-\lambda B\)}
                  - robust software with error bounds and applications. Part {II:} software
                  and applications},
  journal      = {{ACM} Trans. Math. Softw.},
  volume       = {19},
  number       = {2},
  pages        = {175--201},
  year         = {1993},
  url          = {https://doi.org/10.1145/152613.152616},
  doi          = {10.1145/152613.152616},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/toms/DemmelK93a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/toms/BaiDM93,
  author       = {Bai, Zhaojun and
                  Demmel, James and
                  McKenney, A.},
  title        = {On computing condition numbers for the nonsymmetric eigenproblem},
  journal      = {{ACM} Trans. Math. Softw.},
  volume       = {19},
  number       = {2},
  pages        = {202--223},
  year         = {1993},
  url          = {https://doi.org/10.1145/152613.152617},
  doi          = {10.1145/152613.152617},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/toms/BaiDM93.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/arith/DemmelL93,
  author       = {Demmel, James and
                  Li, Xiaoye S.},
  editor       = {Swartzlander, Jr., Earl E. and
                  Irwin, Mary Jane and
                  Jullien, Graham A.},
  title        = {Faster numerical algorithms via exception handling},
  booktitle    = {11th Symposium on Computer Arithmetic, 29 June - 2 July 1993, Windsor,
                  Canada, Proceedings},
  pages        = {234--241},
  publisher    = {{IEEE} Computer Society},
  year         = {1993},
  url          = {https://doi.org/10.1109/ARITH.1993.378087},
  doi          = {10.1109/ARITH.1993.378087},
  timestamp    = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl       = {https://dblp.org/rec/conf/arith/DemmelL93.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ppsc/DemmelDGW93,
  author       = {Demmel, James and
                  Dongarra, Jack J. and
                  van de Geijn, Robert A. and
                  Walker, David W.},
  editor       = {Sincovec, Richard F. and
                  Keyes, David E. and
                  Leuze, Michael R. and
                  Petzold, Linda R. and
                  Reed, Daniel A.},
  title        = {{LAPACK} for Distributed Memory Architectures: The Next Generation},
  booktitle    = {Proceedings of the Sixth {SIAM} Conference on Parallel Processing
                  for Scientific Computing, {PPSC} 1993, Norfolk, Virginia, USA, March
                  22-24, 1993},
  pages        = {323--329},
  publisher    = {{SIAM}},
  year         = {1993},
  timestamp    = {Mon, 21 Aug 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ppsc/DemmelDGW93.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ppsc/BaiD93,
  author       = {Bai, Zhaojun and
                  Demmel, James},
  editor       = {Sincovec, Richard F. and
                  Keyes, David E. and
                  Leuze, Michael R. and
                  Petzold, Linda R. and
                  Reed, Daniel A.},
  title        = {Design of a Parallel Nonsymmetric Eigenroutine Toolbox, Part {I}},
  booktitle    = {Proceedings of the Sixth {SIAM} Conference on Parallel Processing
                  for Scientific Computing, {PPSC} 1993, Norfolk, Virginia, USA, March
                  22-24, 1993},
  pages        = {391--398},
  publisher    = {{SIAM}},
  year         = {1993},
  timestamp    = {Mon, 20 Mar 2017 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ppsc/BaiD93.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siammax/Demmel92,
  author       = {Demmel, James},
  title        = {The Componentwise Distance to the Nearest Singular Matrix},
  journal      = {{SIAM} J. Matrix Anal. Appl.},
  volume       = {13},
  number       = {1},
  pages        = {10--19},
  year         = {1992},
  url          = {https://doi.org/10.1137/0613003},
  doi          = {10.1137/0613003},
  timestamp    = {Tue, 26 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siammax/Demmel92.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siammax/DemmelV92,
  author       = {Demmel, James and
                  Veselic, Kresimir},
  title        = {Jacobi's Method is More Accurate than {QR}},
  journal      = {{SIAM} J. Matrix Anal. Appl.},
  volume       = {13},
  number       = {4},
  pages        = {1204--1245},
  year         = {1992},
  url          = {https://doi.org/10.1137/0613074},
  doi          = {10.1137/0613074},
  timestamp    = {Tue, 26 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siammax/DemmelV92.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/toms/DemmelH92,
  author       = {Demmel, James and
                  Higham, Nicholas J.},
  title        = {Stability of block algorithms with fast level-3 {BLAS}},
  journal      = {{ACM} Trans. Math. Softw.},
  volume       = {18},
  number       = {3},
  pages        = {274--291},
  year         = {1992},
  url          = {https://doi.org/10.1145/131766.131769},
  doi          = {10.1145/131766.131769},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/toms/DemmelH92.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/concurrency/Demmel91,
  author       = {Demmel, James},
  title        = {{LAPACK:} {A} portable linear algebra library for high-performance
                  computers},
  journal      = {Concurr. Pract. Exp.},
  volume       = {3},
  number       = {6},
  pages        = {655--666},
  year         = {1991},
  url          = {https://doi.org/10.1002/cpe.4330030610},
  doi          = {10.1002/CPE.4330030610},
  timestamp    = {Thu, 21 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/concurrency/Demmel91.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siamrev/Demmel90,
  author       = {Demmel, James Weldon},
  title        = {Matrix Computations; Second Edition ({Gene Golub} and {Charles F. Van
                  Loan})},
  journal      = {{SIAM} Rev.},
  volume       = {32},
  number       = {4},
  pages        = {690--691},
  year         = {1990},
  url          = {https://doi.org/10.1137/1032141},
  doi          = {10.1137/1032141},
  timestamp    = {Tue, 29 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siamrev/Demmel90.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/siamsc/DemmelK90,
  author       = {Demmel, James and
                  Kahan, William},
  title        = {Accurate Singular Values of Bidiagonal Matrices},
  journal      = {{SIAM} J. Sci. Comput.},
  volume       = {11},
  number       = {5},
  pages        = {873--912},
  year         = {1990},
  url          = {https://doi.org/10.1137/0911052},
  doi          = {10.1137/0911052},
  timestamp    = {Thu, 30 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/siamsc/DemmelK90.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sc/AndersonBDGMCHDBS90,
  author       = {Anderson, Edward C. and
                  Bai, Zhaojun and
                  Dongarra, Jack J. and
                  Greenbaum, Anne and
                  McKenney, A. and
                  Du Croz, Jeremy and
                  Hammarling, Sven and
                  Demmel, James and
                  Bischof, Christian H. and
                  Sorensen, Danny C.},
  editor       = {Martin, Joanne L. and
                  Pryor, Daniel V. and
                  Montry, Gary R.},
  title        = {{LAPACK:} a portable linear algebra library for high-performance computers},
  booktitle    = {Proceedings Supercomputing '90, New York, NY, USA, November 12-16,
                  1990},
  pages        = {2--11},
  publisher    = {{IEEE} Computer Society},
  year         = {1990},
  url          = {https://doi.org/10.1109/SUPERC.1990.129995},
  doi          = {10.1109/SUPERC.1990.129995},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/AndersonBDGMCHDBS90.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijhsc/BaiD89,
  author       = {Bai, Zhaojun and
                  Demmel, James},
  title        = {On a Block Implementation of {Hessenberg} Multishift {QR} Iteration},
  journal      = {Int. J. High Speed Comput.},
  volume       = {1},
  number       = {1},
  pages        = {97--112},
  year         = {1989},
  url          = {https://doi.org/10.1142/S0129053389000068},
  doi          = {10.1142/S0129053389000068},
  timestamp    = {Tue, 08 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijhsc/BaiD89.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/DemmelL89,
  author       = {Demmel, James and
                  Lafferriere, Gerardo},
  title        = {Optimal three finger grasps},
  booktitle    = {Proceedings of the 1989 {IEEE} International Conference on Robotics
                  and Automation, Scottsdale, Arizona, USA, May 14-19, 1989},
  pages        = {936--942},
  publisher    = {{IEEE} Computer Society},
  year         = {1989},
  url          = {https://doi.org/10.1109/ROBOT.1989.100101},
  doi          = {10.1109/ROBOT.1989.100101},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icra/DemmelL89.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/DemmelLSS88,
  author       = {Demmel, James and
                  Lafferriere, Gerardo and
                  Schwartz, Jacob T. and
                  Sharir, Micha},
  title        = {Theoretical and experimental studies using a multifinger planar manipulator},
  booktitle    = {Proceedings of the 1988 {IEEE} International Conference on Robotics
                  and Automation, Philadelphia, Pennsylvania, USA, April 24-29, 1988},
  pages        = {390--395},
  publisher    = {{IEEE} Computer Society},
  year         = {1988},
  url          = {https://doi.org/10.1109/ROBOT.1988.12079},
  doi          = {10.1109/ROBOT.1988.12079},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/DemmelLSS88.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/computing/Demmel87,
  author       = {Demmel, James Weldon},
  title        = {Three methods for refining estimates of invariant subspaces},
  journal      = {Computing},
  volume       = {38},
  number       = {1},
  pages        = {43--57},
  year         = {1987},
  url          = {https://doi.org/10.1007/BF02253743},
  doi          = {10.1007/BF02253743},
  timestamp    = {Thu, 06 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/computing/Demmel87.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jc/Demmel87,
  author       = {Demmel, James},
  title        = {The geometry of ill-conditioning},
  journal      = {J. Complex.},
  volume       = {3},
  number       = {2},
  pages        = {201--229},
  year         = {1987},
  url          = {https://doi.org/10.1016/0885-064X(87)90027-6},
  doi          = {10.1016/0885-064X(87)90027-6},
  timestamp    = {Tue, 16 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jc/Demmel87.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/arith/Demmel87,
  author       = {Demmel, James},
  editor       = {Irwin, Mary Jane and
                  Stefanelli, Renato},
  title        = {On error analysis in arithmetic with varying relative precision},
  booktitle    = {8th {IEEE} Symposium on Computer Arithmetic, {ARITH} 1987, Como, Italy,
                  May 18-21, 1987},
  pages        = {148--152},
  publisher    = {{IEEE} Computer Society},
  year         = {1987},
  url          = {https://doi.org/10.1109/ARITH.1987.6158694},
  doi          = {10.1109/ARITH.1987.6158694},
  timestamp    = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl       = {https://dblp.org/rec/conf/arith/Demmel87.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/computing/DemmelK85,
  author       = {Demmel, James Weldon and
                  Kr{\"{u}}ckeberg, Fritz},
  title        = {An interval algorithm for solving systems of linear equations to prespecified
                  accuracy},
  journal      = {Computing},
  volume       = {34},
  number       = {2},
  pages        = {117--129},
  year         = {1985},
  url          = {https://doi.org/10.1007/BF02259840},
  doi          = {10.1007/BF02259840},
  timestamp    = {Thu, 06 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/computing/DemmelK85.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics