BibTeX records: Jimmy Ba

download as .bib file

% arXiv preprint 2403.03218 (CoRR): the WMDP benchmark paper. Names are in "Last, First" form.
@article{DBLP:journals/corr/abs-2403-03218,
  author       = {Li, Nathaniel and
                  Pan, Alexander and
                  Gopal, Anjali and
                  Yue, Summer and
                  Berrios, Daniel and
                  Gatti, Alice and
                  Li, Justin D. and
                  Dombrowski, Ann{-}Kathrin and
                  Goel, Shashwat and
                  Phan, Long and
                  Mukobi, Gabriel and
                  Helm{-}Burger, Nathan and
                  Lababidi, Rassin and
                  Justen, Lennart and
                  Liu, Andrew B. and
                  Chen, Michael and
                  Barrass, Isabelle and
                  Zhang, Oliver and
                  Zhu, Xiaoyuan and
                  Tamirisa, Rishub and
                  Bharathi, Bhrugu and
                  Khoja, Adam and
                  Zhao, Zhenqi and
                  Herbert{-}Voss, Ariel and
                  Breuer, Cort B. and
                  Zou, Andy and
                  Mazeika, Mantas and
                  Wang, Zifan and
                  Oswal, Palash and
                  Liu, Weiran and
                  Hunt, Adam A. and
                  Tienken{-}Harder, Justin and
                  Shih, Kevin Y. and
                  Talley, Kemper and
                  Guan, John and
                  Kaplan, Russell and
                  Steneker, Ian and
                  Campbell, David and
                  Jokubaitis, Brad and
                  Levinson, Alex and
                  Wang, Jean and
                  Qian, William and
                  Karmakar, Kallol Krishna and
                  Basart, Steven and
                  Fitz, Stephen and
                  Levine, Mindy and
                  Kumaraguru, Ponnurangam and
                  Tupakula, Uday Kiran and
                  Varadharajan, Vijay and
                  Shoshitaishvili, Yan and
                  Ba, Jimmy and
                  Esvelt, Kevin M. and
                  Wang, Alexandr and
                  Hendrycks, Dan},
  title        = {The {WMDP} Benchmark: Measuring and Reducing Malicious Use With Unlearning},
  journal      = {CoRR},
  volume       = {abs/2403.03218},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2403.03218},
  doi          = {10.48550/ARXIV.2403.03218},
  eprinttype   = {arXiv},
  eprint       = {2403.03218},
  timestamp    = {Tue, 07 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2403-03218.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL 2023 paper; the arXiv preprint in this file is DBLP:journals/corr/abs-2305-03937.
% The title is stored in Title Case (as in the preprint record): styles can downcase it but cannot restore lost capitals.
@inproceedings{DBLP:conf/acl/RazdaibiedinaMK23,
  author       = {Anastasia Razdaibiedina and
                  Yuning Mao and
                  Madian Khabsa and
                  Mike Lewis and
                  Rui Hou and
                  Jimmy Ba and
                  Amjad Almahairi},
  editor       = {Anna Rogers and
                  Jordan L. Boyd{-}Graber and
                  Naoaki Okazaki},
  title        = {Residual Prompt Tuning: Improving Prompt Tuning with Residual Reparameterization},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL} 2023,
                  Toronto, Canada, July 9-14, 2023},
  pages        = {6740--6757},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-acl.421},
  doi          = {10.18653/V1/2023.FINDINGS-ACL.421},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/RazdaibiedinaMK23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AIED 2023 (Springer CCIS 1831) short paper.
% The doi field holds the bare identifier with a plain underscore: DOI/URL-aware macros and biblatex treat it verbatim,
% so a LaTeX-escaped underscore would end up inside the resolved link. The url field keeps the escaping used by the other url fields in this file.
@inproceedings{DBLP:conf/aied/JaipersaudZBPZZ23,
  author       = {Brandon Jaipersaud and
                  Paul Zhang and
                  Jimmy Ba and
                  Andrew Petersen and
                  Lisa Zhang and
                  Michael R. Zhang},
  editor       = {Ning Wang and
                  Genaro Rebolledo{-}Mendez and
                  Vania Dimitrova and
                  Noboru Matsuda and
                  Olga C. Santos},
  title        = {Decomposed Prompting to Answer Questions on a Course Discussion Board},
  booktitle    = {Artificial Intelligence in Education. Posters and Late Breaking Results,
                  Workshops and Tutorials, Industry and Innovation Tracks, Practitioners,
                  Doctoral Consortium and Blue Sky - 24th International Conference,
                  {AIED} 2023, Tokyo, Japan, July 3-7, 2023, Proceedings},
  series       = {Communications in Computer and Information Science},
  volume       = {1831},
  pages        = {218--223},
  publisher    = {Springer},
  year         = {2023},
  url          = {https://doi.org/10.1007/978-3-031-36336-8\_33},
  doi          = {10.1007/978-3-031-36336-8_33},
  timestamp    = {Fri, 04 Aug 2023 15:27:47 +0200},
  biburl       = {https://dblp.org/rec/conf/aied/JaipersaudZBPZZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2023 paper; the arXiv preprint in this file is DBLP:journals/corr/abs-2212-03905.
% The colon sits outside the braces: BibTeX keeps the capital after a colon only when the colon is at brace level 0.
@inproceedings{DBLP:conf/iclr/BaeZRWHBG23,
  author       = {Juhan Bae and
                  Michael R. Zhang and
                  Michael Ruan and
                  Eric Wang and
                  So Hasegawa and
                  Jimmy Ba and
                  Roger Baker Grosse},
  title        = {Multi-Rate {VAE}: Train Once, Get the Full Rate-Distortion Curve},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=OJ8aSjCaMNK},
  timestamp    = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/BaeZRWHBG23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2023 paper; the arXiv preprint in this file is DBLP:journals/corr/abs-2211-01910. Names are in "Last, First" form.
@inproceedings{DBLP:conf/iclr/ZhouMHPPCB23,
  author       = {Zhou, Yongchao and
                  Muresanu, Andrei Ioan and
                  Han, Ziwen and
                  Paster, Keiran and
                  Pitis, Silviu and
                  Chan, Harris and
                  Ba, Jimmy},
  title        = {Large Language Models are Human-Level Prompt Engineers},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=92gvk82DE-},
  timestamp    = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ZhouMHPPCB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2023 (PMLR 202) paper; the arXiv preprint in this file is DBLP:journals/corr/abs-2304-13742.
% The colon sits outside the braces so sentence-casing styles keep the capital on the first subtitle word.
@inproceedings{DBLP:conf/icml/LiuVGBL23,
  author       = {Zhaoyan Liu and
                  No{\"{e}}l Vouitsis and
                  Satya Krishna Gorti and
                  Jimmy Ba and
                  Gabriel Loaiza{-}Ganem},
  editor       = {Andreas Krause and
                  Emma Brunskill and
                  Kyunghyun Cho and
                  Barbara Engelhardt and
                  Sivan Sabato and
                  Jonathan Scarlett},
  title        = {{TR0N}: Translator Networks for 0-Shot Plug-and-Play Conditional Generation},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {22092--22112},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/liu23ak.html},
  timestamp    = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/LiuVGBL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ITiCSE 2023 (vol. 2) single-page paper.
% The acronym in the title is braced so sentence-casing styles do not print it as "llms".
@inproceedings{DBLP:conf/iticse/ZhangJB0ZZ23,
  author       = {Paul Zhang and
                  Brandon Jaipersaud and
                  Jimmy Ba and
                  Andrew Petersen and
                  Lisa Zhang and
                  Michael R. Zhang},
  editor       = {Mikko{-}Jussi Laakso and
                  Mattia Monga and
                  Simon and
                  Judithe Sheard},
  title        = {Classifying Course Discussion Board Questions using {LLMs}},
  booktitle    = {Proceedings of the 2023 Conference on Innovation and Technology in
                  Computer Science Education V. 2, ITiCSE 2023, Turku, Finland, July
                  7-12, 2023},
  pages        = {658},
  publisher    = {{ACM}},
  year         = {2023},
  url          = {https://doi.org/10.1145/3587103.3594202},
  doi          = {10.1145/3587103.3594202},
  timestamp    = {Fri, 07 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iticse/ZhangJB0ZZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 paper. Author and editor names are in "Last, First" form.
@inproceedings{DBLP:conf/nips/BaESWW23,
  author       = {Ba, Jimmy and
                  Erdogdu, Murat A. and
                  Suzuki, Taiji and
                  Wang, Zhichao and
                  Wu, Denny},
  editor       = {Oh, Alice and
                  Naumann, Tristan and
                  Globerson, Amir and
                  Saenko, Kate and
                  Hardt, Moritz and
                  Levine, Sergey},
  title        = {Learning in the Presence of Low-dimensional Structure: {A} Spiked
                  Random Matrix Perspective},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/38a1671ab0747b6ffe4d1c6ef117a3a9-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BaESWW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 paper; the arXiv preprint in this file is DBLP:journals/corr/abs-2305-14387.
% The camelCase system name is braced: sentence-casing styles would otherwise print "Alpacafarm".
@inproceedings{DBLP:conf/nips/DuboisLTZGBGLH23,
  author       = {Yann Dubois and
                  Chen Xuechen Li and
                  Rohan Taori and
                  Tianyi Zhang and
                  Ishaan Gulrajani and
                  Jimmy Ba and
                  Carlos Guestrin and
                  Percy Liang and
                  Tatsunori B. Hashimoto},
  editor       = {Alice Oh and
                  Tristan Naumann and
                  Amir Globerson and
                  Kate Saenko and
                  Moritz Hardt and
                  Sergey Levine},
  title        = {{AlpacaFarm}: {A} Simulation Framework for Methods that Learn from Human
                  Feedback},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/5fc47800ee5b30b8777fdd30abcaaf3b-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/DuboisLTZGBGLH23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 paper; the arXiv preprint in this file is DBLP:journals/corr/abs-2306-00937.
% The colon sits outside the braces, and the proper noun "Minecraft" is protected from sentence-casing.
@inproceedings{DBLP:conf/nips/LifshitzPCBM23,
  author       = {Shalev Lifshitz and
                  Keiran Paster and
                  Harris Chan and
                  Jimmy Ba and
                  Sheila A. McIlraith},
  editor       = {Alice Oh and
                  Tristan Naumann and
                  Amir Globerson and
                  Kate Saenko and
                  Moritz Hardt and
                  Sergey Levine},
  title        = {{STEVE-1}: {A} Generative Model for Text-to-Behavior in {Minecraft}},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/dd03f856fc7f2efeec8b1c796284561d-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/LifshitzPCBM23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2301.04104 (CoRR). Names are in "Last, First" form.
@article{DBLP:journals/corr/abs-2301-04104,
  author       = {Hafner, Danijar and
                  Pasukonis, Jurgis and
                  Ba, Jimmy and
                  Lillicrap, Timothy P.},
  title        = {Mastering Diverse Domains through World Models},
  journal      = {CoRR},
  volume       = {abs/2301.04104},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2301.04104},
  doi          = {10.48550/ARXIV.2301.04104},
  eprinttype   = {arXiv},
  eprint       = {2301.04104},
  timestamp    = {Thu, 19 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2301-04104.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2304.05970 (CoRR). Names are in "Last, First" form.
@article{DBLP:journals/corr/abs-2304-05970,
  author       = {Pitis, Silviu and
                  Zhang, Michael R. and
                  Wang, Andrew and
                  Ba, Jimmy},
  title        = {Boosted Prompt Ensembles for Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2304.05970},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2304.05970},
  doi          = {10.48550/ARXIV.2304.05970},
  eprinttype   = {arXiv},
  eprint       = {2304.05970},
  timestamp    = {Wed, 19 Apr 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2304-05970.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2304.13742 (CoRR); the ICML 2023 version in this file is DBLP:conf/icml/LiuVGBL23.
% The colon sits outside the braces so sentence-casing styles keep the capital on the first subtitle word.
@article{DBLP:journals/corr/abs-2304-13742,
  author       = {Zhaoyan Liu and
                  No{\"{e}}l Vouitsis and
                  Satya Krishna Gorti and
                  Jimmy Ba and
                  Gabriel Loaiza{-}Ganem},
  title        = {{TR0N}: Translator Networks for 0-Shot Plug-and-Play Conditional Generation},
  journal      = {CoRR},
  volume       = {abs/2304.13742},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2304.13742},
  doi          = {10.48550/ARXIV.2304.13742},
  eprinttype   = {arXiv},
  eprint       = {2304.13742},
  timestamp    = {Wed, 03 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2304-13742.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2305.03937 (CoRR); the Findings of ACL 2023 version in this file is DBLP:conf/acl/RazdaibiedinaMK23.
@article{DBLP:journals/corr/abs-2305-03937,
  author       = {Razdaibiedina, Anastasia and
                  Mao, Yuning and
                  Hou, Rui and
                  Khabsa, Madian and
                  Lewis, Mike and
                  Ba, Jimmy and
                  Almahairi, Amjad},
  title        = {Residual Prompt Tuning: Improving Prompt Tuning with Residual Reparameterization},
  journal      = {CoRR},
  volume       = {abs/2305.03937},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.03937},
  doi          = {10.48550/ARXIV.2305.03937},
  eprinttype   = {arXiv},
  eprint       = {2305.03937},
  timestamp    = {Thu, 11 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-03937.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2305.12031 (CoRR).
% "Clinical Camel" is the name of the model, so it is braced to stop sentence-casing styles printing "Clinical camel".
@article{DBLP:journals/corr/abs-2305-12031,
  author       = {Augustin Toma and
                  Patrick R. Lawler and
                  Jimmy Ba and
                  Rahul G. Krishnan and
                  Barry B. Rubin and
                  Bo Wang},
  title        = {{Clinical Camel}: An Open-Source Expert-Level Medical Language Model
                  with Dialogue-Based Knowledge Encoding},
  journal      = {CoRR},
  volume       = {abs/2305.12031},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.12031},
  doi          = {10.48550/ARXIV.2305.12031},
  eprinttype   = {arXiv},
  eprint       = {2305.12031},
  timestamp    = {Fri, 26 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-12031.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2305.14387 (CoRR); the NeurIPS 2023 version in this file is DBLP:conf/nips/DuboisLTZGBGLH23.
% The camelCase system name is braced: sentence-casing styles would otherwise print "Alpacafarm".
@article{DBLP:journals/corr/abs-2305-14387,
  author       = {Yann Dubois and
                  Xuechen Li and
                  Rohan Taori and
                  Tianyi Zhang and
                  Ishaan Gulrajani and
                  Jimmy Ba and
                  Carlos Guestrin and
                  Percy Liang and
                  Tatsunori B. Hashimoto},
  title        = {{AlpacaFarm}: {A} Simulation Framework for Methods that Learn from Human
                  Feedback},
  journal      = {CoRR},
  volume       = {abs/2305.14387},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.14387},
  doi          = {10.48550/ARXIV.2305.14387},
  eprinttype   = {arXiv},
  eprint       = {2305.14387},
  timestamp    = {Tue, 06 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-14387.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2305.15316 (CoRR). Names are in "Last, First" form.
@article{DBLP:journals/corr/abs-2305-15316,
  author       = {Zhou, Yongchao and
                  Sahak, Hshmat and
                  Ba, Jimmy},
  title        = {Training on Thin Air: Improve Image Classification with Generated
                  Data},
  journal      = {CoRR},
  volume       = {abs/2305.15316},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.15316},
  doi          = {10.48550/ARXIV.2305.15316},
  eprinttype   = {arXiv},
  eprint       = {2305.15316},
  timestamp    = {Tue, 06 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-15316.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2306.00937 (CoRR); the NeurIPS 2023 version in this file is DBLP:conf/nips/LifshitzPCBM23.
% The colon sits outside the braces, and the proper noun "Minecraft" is protected from sentence-casing.
@article{DBLP:journals/corr/abs-2306-00937,
  author       = {Shalev Lifshitz and
                  Keiran Paster and
                  Harris Chan and
                  Jimmy Ba and
                  Sheila A. McIlraith},
  title        = {{STEVE-1}: {A} Generative Model for Text-to-Behavior in {Minecraft}},
  journal      = {CoRR},
  volume       = {abs/2306.00937},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.00937},
  doi          = {10.48550/ARXIV.2306.00937},
  eprinttype   = {arXiv},
  eprint       = {2306.00937},
  timestamp    = {Mon, 12 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-00937.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2309.15817 (CoRR).
% Both occurrences of the acronym LM are braced; the second one was previously lowercased by sentence-casing styles.
@article{DBLP:journals/corr/abs-2309-15817,
  author       = {Yangjun Ruan and
                  Honghua Dong and
                  Andrew Wang and
                  Silviu Pitis and
                  Yongchao Zhou and
                  Jimmy Ba and
                  Yann Dubois and
                  Chris J. Maddison and
                  Tatsunori Hashimoto},
  title        = {Identifying the Risks of {LM} Agents with an {LM}-Emulated Sandbox},
  journal      = {CoRR},
  volume       = {abs/2309.15817},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.15817},
  doi          = {10.48550/ARXIV.2309.15817},
  eprinttype   = {arXiv},
  eprint       = {2309.15817},
  timestamp    = {Tue, 17 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-15817.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2310.06786 (CoRR).
% The camelCase dataset name is braced: sentence-casing styles would otherwise print "Openwebmath".
% NOTE(review): "Marco Dos Santos" parses as first "Marco Dos", last "Santos"; if the surname is "Dos Santos",
% write "Dos Santos, Marco". Confirm against the paper before changing.
@article{DBLP:journals/corr/abs-2310-06786,
  author       = {Keiran Paster and
                  Marco Dos Santos and
                  Zhangir Azerbayev and
                  Jimmy Ba},
  title        = {{OpenWebMath}: An Open Dataset of High-Quality Mathematical Web Text},
  journal      = {CoRR},
  volume       = {abs/2310.06786},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.06786},
  doi          = {10.48550/ARXIV.2310.06786},
  eprinttype   = {arXiv},
  eprint       = {2310.06786},
  timestamp    = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-06786.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2312.04528 (CoRR). Names are in "Last, First" form.
@article{DBLP:journals/corr/abs-2312-04528,
  author       = {Zhang, Michael R. and
                  Desai, Nishkrit and
                  Bae, Juhan and
                  Lorraine, Jonathan and
                  Ba, Jimmy},
  title        = {Using Large Language Models for Hyperparameter Optimization},
  journal      = {CoRR},
  volume       = {abs/2312.04528},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.04528},
  doi          = {10.48550/ARXIV.2312.04528},
  eprinttype   = {arXiv},
  eprint       = {2312.04528},
  timestamp    = {Tue, 02 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-04528.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2022 paper. Names are in "Last, First" form.
@inproceedings{DBLP:conf/iclr/BaEGSSWZ22,
  author       = {Ba, Jimmy and
                  Erdogdu, Murat A. and
                  Ghassemi, Marzyeh and
                  Sun, Shengyang and
                  Suzuki, Taiji and
                  Wu, Denny and
                  Zhang, Tianzong},
  title        = {Understanding the Variance Collapse of {SVGD} in High Dimensions},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=Qycd9j5Qp9J},
  timestamp    = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/BaEGSSWZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 paper; the arXiv preprint in this file is DBLP:journals/corr/abs-2205-01445.
% Editor given names are stored in full (the style abbreviates if needed), matching the spelling of
% Kyunghyun Cho and Alice Oh used in the 2023 records of this file.
@inproceedings{DBLP:conf/nips/BaESWWY22,
  author       = {Jimmy Ba and
                  Murat A. Erdogdu and
                  Taiji Suzuki and
                  Zhichao Wang and
                  Denny Wu and
                  Greg Yang},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {High-dimensional Asymptotics of Feature Learning: How One Gradient
                  Step Improves the Representation},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/f7e7fabd73b3df96c54a320862afcb78-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BaESWWY22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 paper; DBLP:journals/corr/abs-2205-15967 in this file appears to be its preprint (same authors, near-identical title).
% The mixed-case acronym RvS is braced against sentence-casing, and editor given names are stored in full.
@inproceedings{DBLP:conf/nips/PasterMB22,
  author       = {Keiran Paster and
                  Sheila A. McIlraith and
                  Jimmy Ba},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {You Can't Count on Luck: Why Decision Transformers and {RvS} Fail in
                  Stochastic Environments},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/fe90657b12193c7b52a3418bdc351807-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/PasterMB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 paper; the arXiv preprint in this file is DBLP:journals/corr/abs-2206-00719.
% Editor given names are stored in full (the style abbreviates if needed), matching the spelling of
% Kyunghyun Cho and Alice Oh used in the 2023 records of this file.
@inproceedings{DBLP:conf/nips/ZhouNB22,
  author       = {Yongchao Zhou and
                  Ehsan Nezhadarya and
                  Jimmy Ba},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {Dataset Distillation using Neural Feature Regression},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/3fe2a777282299ecb4f9e7ebb531f0ab-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ZhouNB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2205.01445 (CoRR); the NeurIPS 2022 version in this file is DBLP:conf/nips/BaESWWY22.
@article{DBLP:journals/corr/abs-2205-01445,
  author       = {Ba, Jimmy and
                  Erdogdu, Murat A. and
                  Suzuki, Taiji and
                  Wang, Zhichao and
                  Wu, Denny and
                  Yang, Greg},
  title        = {High-dimensional Asymptotics of Feature Learning: How One Gradient
                  Step Improves the Representation},
  journal      = {CoRR},
  volume       = {abs/2205.01445},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2205.01445},
  doi          = {10.48550/ARXIV.2205.01445},
  eprinttype   = {arXiv},
  eprint       = {2205.01445},
  timestamp    = {Thu, 05 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2205-01445.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2205.15967 (CoRR); appears to be the preprint of DBLP:conf/nips/PasterMB22 (same authors, near-identical title).
@article{DBLP:journals/corr/abs-2205-15967,
  author       = {Paster, Keiran and
                  McIlraith, Sheila A. and
                  Ba, Jimmy},
  title        = {You Can't Count on Luck: Why Decision Transformers Fail in Stochastic
                  Environments},
  journal      = {CoRR},
  volume       = {abs/2205.15967},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2205.15967},
  doi          = {10.48550/ARXIV.2205.15967},
  eprinttype   = {arXiv},
  eprint       = {2205.15967},
  timestamp    = {Wed, 01 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2205-15967.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.00719 (CoRR); the NeurIPS 2022 version in this file is DBLP:conf/nips/ZhouNB22.
@article{DBLP:journals/corr/abs-2206-00719,
  author       = {Zhou, Yongchao and
                  Nezhadarya, Ehsan and
                  Ba, Jimmy},
  title        = {Dataset Distillation using Neural Feature Regression},
  journal      = {CoRR},
  volume       = {abs/2206.00719},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.00719},
  doi          = {10.48550/ARXIV.2206.00719},
  eprinttype   = {arXiv},
  eprint       = {2206.00719},
  timestamp    = {Mon, 13 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-00719.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2209.13569 (CoRR). Names are in "Last, First" form.
@article{DBLP:journals/corr/abs-2209-13569,
  author       = {Kamalakara, Siddhartha Rao and
                  Locatelli, Acyr and
                  Venkitesh, Bharat and
                  Ba, Jimmy and
                  Gal, Yarin and
                  Gomez, Aidan N.},
  title        = {Exploring Low Rank Training of Deep Neural Networks},
  journal      = {CoRR},
  volume       = {abs/2209.13569},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2209.13569},
  doi          = {10.48550/ARXIV.2209.13569},
  eprinttype   = {arXiv},
  eprint       = {2209.13569},
  timestamp    = {Thu, 06 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2209-13569.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.01910 (CoRR); the ICLR 2023 version in this file is DBLP:conf/iclr/ZhouMHPPCB23.
@article{DBLP:journals/corr/abs-2211-01910,
  author       = {Zhou, Yongchao and
                  Muresanu, Andrei Ioan and
                  Han, Ziwen and
                  Paster, Keiran and
                  Pitis, Silviu and
                  Chan, Harris and
                  Ba, Jimmy},
  title        = {Large Language Models Are Human-Level Prompt Engineers},
  journal      = {CoRR},
  volume       = {abs/2211.01910},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.01910},
  doi          = {10.48550/ARXIV.2211.01910},
  eprinttype   = {arXiv},
  eprint       = {2211.01910},
  timestamp    = {Fri, 04 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-01910.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2212.03905 (CoRR); the ICLR 2023 version in this file is DBLP:conf/iclr/BaeZRWHBG23.
% The colon sits outside the braces: BibTeX keeps the capital after a colon only when the colon is at brace level 0.
@article{DBLP:journals/corr/abs-2212-03905,
  author       = {Juhan Bae and
                  Michael R. Zhang and
                  Michael Ruan and
                  Eric Wang and
                  So Hasegawa and
                  Jimmy Ba and
                  Roger B. Grosse},
  title        = {Multi-Rate {VAE}: Train Once, Get the Full Rate-Distortion Curve},
  journal      = {CoRR},
  volume       = {abs/2212.03905},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2212.03905},
  doi          = {10.48550/ARXIV.2212.03905},
  eprinttype   = {arXiv},
  eprint       = {2212.03905},
  timestamp    = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-03905.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 paper.
% The title is stored in Title Case like the other records in this file: styles can downcase it but cannot restore lost capitals.
@inproceedings{DBLP:conf/iclr/AmariBGLNSWX21,
  author       = {Shun{-}ichi Amari and
                  Jimmy Ba and
                  Roger Baker Grosse and
                  Xuechen Li and
                  Atsushi Nitanda and
                  Taiji Suzuki and
                  Denny Wu and
                  Ji Xu},
  title        = {When Does Preconditioning Help or Hurt Generalization?},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=S724o4\_WB3},
  timestamp    = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/AmariBGLNSWX21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 paper.
% The proper noun "Atari" is braced so sentence-casing styles do not print it as "atari".
@inproceedings{DBLP:conf/iclr/HafnerL0B21,
  author       = {Danijar Hafner and
                  Timothy P. Lillicrap and
                  Mohammad Norouzi and
                  Jimmy Ba},
  title        = {Mastering {Atari} with Discrete World Models},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=0oabwyZbOu},
  timestamp    = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/HafnerL0B21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 paper. Names are in "Last, First" form.
@inproceedings{DBLP:conf/iclr/PasterMB21,
  author       = {Paster, Keiran and
                  McIlraith, Sheila A. and
                  Ba, Jimmy},
  title        = {Planning from Pixels using Inverse Dynamics Models},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=V6BjBgku7Ro},
  timestamp    = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/PasterMB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/WuJBG21,
  author     = {Wu, Yuhuai and
                Jiang, Albert Q. and
                Ba, Jimmy and
                Grosse, Roger B.},
  title      = {{INT:} An Inequality Benchmark for Evaluating Generalization in Theorem
                Proving},
  booktitle  = {9th International Conference on Learning Representations, {ICLR} 2021,
                Virtual Event, Austria, May 3-7, 2021},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=O6LPudowNQm},
  timestamp  = {Mon, 30 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WuJBG21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/JiaNWB21,
  author     = {Jia, Sheng and
                Nezhadarya, Ehsan and
                Wu, Yuhuai and
                Ba, Jimmy},
  editor     = {Meila, Marina and
                Zhang, Tong},
  title      = {Efficient Statistical Tests: {A} Neural Tangent Kernel Approach},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning,
                {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {4893--4903},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/jia21a.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/JiaNWB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/WuRLBGS21,
  author     = {Wu, Yuhuai and
                Rabe, Markus N. and
                Li, Wenda and
                Ba, Jimmy and
                Grosse, Roger B. and
                Szegedy, Christian},
  editor     = {Meila, Marina and
                Zhang, Tong},
  title      = {{LIME:} Learning Inductive Bias for Primitives of Mathematical Reasoning},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning,
                {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {11251--11262},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/wu21c.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/WuRLBGS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/HanZCPZB21,
  author     = {Han, Beining and
                Zheng, Chongyi and
                Chan, Harris and
                Paster, Keiran and
                Zhang, Michael R. and
                Ba, Jimmy},
  editor     = {Ranzato, Marc'Aurelio and
                Beygelzimer, Alina and
                Dauphin, Yann N. and
                Liang, Percy and
                Vaughan, Jennifer Wortman},
  title      = {Learning Domain Invariant Representations in Goal-conditioned Block
                {MDPs}},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference
                on Neural Information Processing Systems 2021, NeurIPS 2021, December
                6-14, 2021, virtual},
  pages      = {764--776},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/06d172404821f7d01060cc9629171b2e-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/HanZCPZB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LiZXDB21,
  author     = {Li, Jingling and
                Zhang, Mozhi and
                Xu, Keyulu and
                Dickerson, John P. and
                Ba, Jimmy},
  editor     = {Ranzato, Marc'Aurelio and
                Beygelzimer, Alina and
                Dauphin, Yann N. and
                Liang, Percy and
                Vaughan, Jennifer Wortman},
  title      = {How does a Neural Network's Architecture Impact its Robustness to
                Noisy Labels?},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference
                on Neural Information Processing Systems 2021, NeurIPS 2021, December
                6-14, 2021, virtual},
  pages      = {9788--9803},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/51311013e51adebc3c34d2cc591fefee-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/LiZXDB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SaxenaBH21,
  author     = {Saxena, Vaibhav and
                Ba, Jimmy and
                Hafner, Danijar},
  editor     = {Ranzato, Marc'Aurelio and
                Beygelzimer, Alina and
                Dauphin, Yann N. and
                Liang, Percy and
                Vaughan, Jennifer Wortman},
  title      = {Clockwork Variational Autoencoders},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference
                on Neural Information Processing Systems 2021, NeurIPS 2021, December
                6-14, 2021, virtual},
  pages      = {29246--29257},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/f490d0af974fedf90cb0f1edce8e3dd5-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/SaxenaBH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2101-06223,
  author     = {Wu, Yuhuai and
                Rabe, Markus N. and
                Li, Wenda and
                Ba, Jimmy and
                Grosse, Roger B. and
                Szegedy, Christian},
  title      = {{LIME:} Learning Inductive Bias for Primitives of Mathematical Reasoning},
  journal    = {CoRR},
  volume     = {abs/2101.06223},
  year       = {2021},
  url        = {https://arxiv.org/abs/2101.06223},
  eprinttype = {arXiv},
  eprint     = {2101.06223},
  timestamp  = {Fri, 22 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-06223.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2102-09532,
  author     = {Saxena, Vaibhav and
                Ba, Jimmy and
                Hafner, Danijar},
  title      = {Clockwork Variational Autoencoders},
  journal    = {CoRR},
  volume     = {abs/2102.09532},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.09532},
  eprinttype = {arXiv},
  eprint     = {2102.09532},
  timestamp  = {Wed, 24 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-09532.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2110-14248,
  author     = {Han, Beining and
                Zheng, Chongyi and
                Chan, Harris and
                Paster, Keiran and
                Zhang, Michael R. and
                Ba, Jimmy},
  title      = {Learning Domain Invariant Representations in Goal-conditioned Block
                {MDPs}},
  journal    = {CoRR},
  volume     = {abs/2110.14248},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.14248},
  eprinttype = {arXiv},
  eprint     = {2110.14248},
  timestamp  = {Fri, 29 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-14248.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aistats/WenLGZCB20,
  author     = {Wen, Yeming and
                Luk, Kevin and
                Gazeau, Maxime and
                Zhang, Guodong and
                Chan, Harris and
                Ba, Jimmy},
  editor     = {Chiappa, Silvia and
                Calandra, Roberto},
  title      = {An Empirical Study of Stochastic Gradient Descent with Structured
                Covariance Noise},
  booktitle  = {The 23rd International Conference on Artificial Intelligence and Statistics,
                {AISTATS} 2020, 26-28 August 2020, Online [Palermo, Sicily, Italy]},
  series     = {Proceedings of Machine Learning Research},
  volume     = {108},
  pages      = {3621--3631},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v108/wen20a.html},
  timestamp  = {Mon, 29 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/WenLGZCB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/BaESWZ20,
  author     = {Ba, Jimmy and
                Erdogdu, Murat A. and
                Suzuki, Taiji and
                Wu, Denny and
                Zhang, Tianzong},
  title      = {Generalization of Two-layer Neural Networks: An Asymptotic Viewpoint},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020,
                Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=H1gBsgBYwH},
  timestamp  = {Thu, 07 May 2020 17:11:47 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/BaESWZ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/HafnerLB020,
  author     = {Hafner, Danijar and
                Lillicrap, Timothy P. and
                Ba, Jimmy and
                Norouzi, Mohammad},
  title      = {Dream to Control: Learning Behaviors by Latent Imagination},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020,
                Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=S1lOTC4tDS},
  timestamp  = {Thu, 07 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/HafnerLB020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/PitisCJB20,
  author     = {Pitis, Silviu and
                Chan, Harris and
                Jamali, Kiarash and
                Ba, Jimmy},
  title      = {An Inductive Bias for Distances: Neural Nets that Respect the Triangle
                Inequality},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020,
                Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=HJeiDpVFPr},
  timestamp  = {Thu, 07 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/PitisCJB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/WangB20,
  author     = {Wang, Tingwu and
                Ba, Jimmy},
  title      = {Exploring Model-based Planning with Policy Networks},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020,
                Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=H1exf64KwH},
  timestamp  = {Thu, 07 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WangB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/WangZB20,
  author     = {Wang, Yuanhao and
                Zhang, Guodong and
                Ba, Jimmy},
  title      = {On Solving Minimax Optimization Locally: {A} Follow-the-Ridge Approach},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020,
                Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=Hkx7\_1rKwS},
  timestamp  = {Fri, 12 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WangZB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/WenTB20,
  author     = {Wen, Yeming and
                Tran, Dustin and
                Ba, Jimmy},
  title      = {{BatchEnsemble}: An Alternative Approach to Efficient Ensemble and Lifelong
                Learning},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020,
                Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=Sklf1yrYDr},
  timestamp  = {Thu, 07 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WenTB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/HuangPBV20,
  author     = {Huang, Xiao Shi and
                P{\'{e}}rez, Felipe and
                Ba, Jimmy and
                Volkovs, Maksims},
  title      = {Improving Transformer Optimization Through Better Initialization},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning,
                {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {4475--4483},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/huang20f.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/HuangPBV20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/PitisCZSB20,
  author     = {Pitis, Silviu and
                Chan, Harris and
                Zhao, Stephen and
                Stadie, Bradly C. and
                Ba, Jimmy},
  title      = {Maximum Entropy Gain Exploration for Long Horizon Multi-goal Reinforcement
                Learning},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning,
                {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {7750--7761},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/pitis20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/PitisCZSB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/uai/StadieZB20,
  author     = {Stadie, Bradly C. and
                Zhang, Lunjun and
                Ba, Jimmy},
  editor     = {Adams, Ryan P. and
                Gogate, Vibhav},
  title      = {Learning Intrinsic Rewards as a Bi-Level Optimization Problem},
  booktitle  = {Proceedings of the Thirty-Sixth Conference on Uncertainty in Artificial
                Intelligence, {UAI} 2020, virtual online, August 3-6, 2020},
  series     = {Proceedings of Machine Learning Research},
  volume     = {124},
  pages      = {111--120},
  publisher  = {{AUAI} Press},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v124/stadie20a.html},
  timestamp  = {Tue, 07 May 2024 20:09:01 +0200},
  biburl     = {https://dblp.org/rec/conf/uai/StadieZB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-05825,
  author     = {Pitis, Silviu and
                Chan, Harris and
                Jamali, Kiarash and
                Ba, Jimmy},
  title      = {An Inductive Bias for Distances: Neural Nets that Respect the Triangle
                Inequality},
  journal    = {CoRR},
  volume     = {abs/2002.05825},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.05825},
  eprinttype = {arXiv},
  eprint     = {2002.05825},
  timestamp  = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-05825.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-06715,
  author     = {Wen, Yeming and
                Tran, Dustin and
                Ba, Jimmy},
  title      = {{BatchEnsemble}: An Alternative Approach to Efficient Ensemble and Lifelong
                Learning},
  journal    = {CoRR},
  volume     = {abs/2002.06715},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.06715},
  eprinttype = {arXiv},
  eprint     = {2002.06715},
  timestamp  = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-06715.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-10732,
  author     = {Amari, Shun{-}ichi and
                Ba, Jimmy and
                Grosse, Roger B. and
                Li, Xuechen and
                Nitanda, Atsushi and
                Suzuki, Taiji and
                Wu, Denny and
                Xu, Ji},
  title      = {When Does Preconditioning Help or Hurt Generalization?},
  journal    = {CoRR},
  volume     = {abs/2006.10732},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.10732},
  eprinttype = {arXiv},
  eprint     = {2006.10732},
  timestamp  = {Wed, 24 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-10732.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-02832,
  author     = {Pitis, Silviu and
                Chan, Harris and
                Zhao, Stephen and
                Stadie, Bradly C. and
                Ba, Jimmy},
  title      = {Maximum Entropy Gain Exploration for Long Horizon Multi-goal Reinforcement
                Learning},
  journal    = {CoRR},
  volume     = {abs/2007.02832},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.02832},
  eprinttype = {arXiv},
  eprint     = {2007.02832},
  timestamp  = {Wed, 02 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-02832.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-02924,
  author     = {Wu, Yuhuai and
                Jiang, Albert Q. and
                Ba, Jimmy and
                Grosse, Roger B.},
  title      = {{INT:} An Inequality Benchmark for Evaluating Generalization in Theorem
                Proving},
  journal    = {CoRR},
  volume     = {abs/2007.02924},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.02924},
  eprinttype = {arXiv},
  eprint     = {2007.02924},
  timestamp  = {Mon, 30 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-02924.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-04212,
  author     = {Wu, Yuhuai and
                Dong, Honghua and
                Grosse, Roger B. and
                Ba, Jimmy},
  title      = {The Scattering Compositional Learner: Discovering Objects, Attributes,
                Relationships in Analogical Reasoning},
  journal    = {CoRR},
  volume     = {abs/2007.04212},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.04212},
  eprinttype = {arXiv},
  eprint     = {2007.04212},
  timestamp  = {Mon, 20 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-04212.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-04532,
  author     = {Faghri, Fartash and
                Duvenaud, David and
                Fleet, David J. and
                Ba, Jimmy},
  title      = {A Study of Gradient Variance in Deep Learning},
  journal    = {CoRR},
  volume     = {abs/2007.04532},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.04532},
  eprinttype = {arXiv},
  eprint     = {2007.04532},
  timestamp  = {Mon, 20 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-04532.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2009-01791,
  author     = {Hafner, Danijar and
                Ortega, Pedro A. and
                Ba, Jimmy and
                Parr, Thomas and
                Friston, Karl J. and
                Heess, Nicolas},
  title      = {Action and Perception as Divergence Minimization},
  journal    = {CoRR},
  volume     = {abs/2009.01791},
  year       = {2020},
  url        = {https://arxiv.org/abs/2009.01791},
  eprinttype = {arXiv},
  eprint     = {2009.01791},
  timestamp  = {Wed, 16 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-01791.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-02193,
  author     = {Hafner, Danijar and
                Lillicrap, Timothy P. and
                Norouzi, Mohammad and
                Ba, Jimmy},
  title      = {Mastering {Atari} with Discrete World Models},
  journal    = {CoRR},
  volume     = {abs/2010.02193},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.02193},
  eprinttype = {arXiv},
  eprint     = {2010.02193},
  timestamp  = {Mon, 12 Oct 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-02193.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2012-02419,
  author     = {Paster, Keiran and
                McIlraith, Sheila A. and
                Ba, Jimmy},
  title      = {Planning from Pixels using Inverse Dynamics Models},
  journal    = {CoRR},
  volume     = {abs/2012.02419},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.02419},
  eprinttype = {arXiv},
  eprint     = {2012.02419},
  timestamp  = {Wed, 09 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-02419.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2012-11538,
  author     = {Matusch, Brendon and
                Ba, Jimmy and
                Hafner, Danijar},
  title      = {Evaluating Agents without Rewards},
  journal    = {CoRR},
  volume     = {abs/2012.11538},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.11538},
  eprinttype = {arXiv},
  eprint     = {2012.11538},
  timestamp  = {Mon, 04 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-11538.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2012-12896,
  author     = {Li, Jingling and
                Zhang, Mozhi and
                Xu, Keyulu and
                Dickerson, John P. and
                Ba, Jimmy},
  title      = {Noisy Labels Can Induce Good Representations},
  journal    = {CoRR},
  volume     = {abs/2012.12896},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.12896},
  eprinttype = {arXiv},
  eprint     = {2012.12896},
  timestamp  = {Tue, 05 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-12896.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/JiaKB19,
  author     = {Jia, Sheng and
                Kiros, Jamie and
                Ba, Jimmy},
  title      = {{DOM-Q-NET:} Grounded {RL} on Structured Language},
  booktitle  = {7th International Conference on Learning Representations, {ICLR} 2019,
                New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=HJgd1nAqFX},
  timestamp  = {Thu, 25 Jul 2019 13:03:15 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/JiaKB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/WangZFB19,
  author     = {Wang, Tingwu and
                Zhou, Yuhao and
                Fidler, Sanja and
                Ba, Jimmy},
  title      = {Neural Graph Evolution: Towards Efficient Automatic Robot Design},
  booktitle  = {7th International Conference on Learning Representations, {ICLR} 2019,
                New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=BkgWHnR5tm},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WangZFB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ZhangLBH19,
  author     = {Zhang, Michael R. and
                Lucas, James and
                Ba, Jimmy and
                Hinton, Geoffrey E.},
  editor     = {Wallach, Hanna M. and
                Larochelle, Hugo and
                Beygelzimer, Alina and
                d'Alch{\'{e}}{-}Buc, Florence and
                Fox, Emily B. and
                Garnett, Roman},
  title      = {Lookahead Optimizer: k steps forward, 1 step back},
  booktitle  = {Advances in Neural Information Processing Systems 32: Annual Conference
                on Neural Information Processing Systems 2019, NeurIPS 2019, December
                8-14, 2019, Vancouver, BC, Canada},
  pages      = {9593--9604},
  year       = {2019},
  url        = {https://proceedings.neurips.cc/paper/2019/hash/90fd4f88f588ae64038134f1eeaa023f-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/ZhangLBH19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LiuKBKS19,
  author     = {Liu, Jenny and
                Kumar, Aviral and
                Ba, Jimmy and
                Kiros, Jamie and
                Swersky, Kevin},
  editor     = {Wallach, Hanna M. and
                Larochelle, Hugo and
                Beygelzimer, Alina and
                d'Alch{\'{e}}{-}Buc, Florence and
                Fox, Emily B. and
                Garnett, Roman},
  title      = {Graph Normalizing Flows},
  booktitle  = {Advances in Neural Information Processing Systems 32: Annual Conference
                on Neural Information Processing Systems 2019, NeurIPS 2019, December
                8-14, 2019, Vancouver, BC, Canada},
  pages      = {13556--13566},
  year       = {2019},
  url        = {https://proceedings.neurips.cc/paper/2019/hash/1e44fdf9c44d7328fecc02d677ed704d-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/LiuKBKS19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1902-04546,
  author     = {Chan, Harris and
                Wu, Yuhuai and
                Kiros, Jamie and
                Fidler, Sanja and
                Ba, Jimmy},
  title      = {{ACTRCE:} Augmenting Experience via Teacher's Advice For Multi-Goal
                Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1902.04546},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.04546},
  eprinttype = {arXiv},
  eprint     = {1902.04546},
  timestamp  = {Tue, 21 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-04546.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1902-07257,
  author     = {Jia, Sheng and
                Kiros, Jamie and
                Ba, Jimmy},
  title      = {{DOM-Q-NET:} Grounded {RL} on Structured Language},
  journal    = {CoRR},
  volume     = {abs/1902.07257},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.07257},
  eprinttype = {arXiv},
  eprint     = {1902.07257},
  timestamp  = {Tue, 21 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-07257.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1902-08234,
  author     = {Wen, Yeming and
                Luk, Kevin and
                Gazeau, Maxime and
                Zhang, Guodong and
                Chan, Harris and
                Ba, Jimmy},
  title      = {Interplay Between Optimization and Generalization of Stochastic Gradient
                Descent with Covariance Noise},
  journal    = {CoRR},
  volume     = {abs/1902.08234},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.08234},
  eprinttype = {arXiv},
  eprint     = {1902.08234},
  timestamp  = {Tue, 21 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-08234.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-13177,
  author     = {Liu, Jenny and
                Kumar, Aviral and
                Ba, Jimmy and
                Kiros, Jamie and
                Swersky, Kevin},
  title      = {Graph Normalizing Flows},
  journal    = {CoRR},
  volume     = {abs/1905.13177},
  year       = {2019},
  url        = {https://arxiv.org/abs/1905.13177},
  eprinttype = {arXiv},
  eprint     = {1905.13177},
  timestamp  = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-13177.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-05370,
  author     = {Wang, Tingwu and
                Zhou, Yuhao and
                Fidler, Sanja and
                Ba, Jimmy},
  title      = {Neural Graph Evolution: Towards Efficient Automatic Robot Design},
  journal    = {CoRR},
  volume     = {abs/1906.05370},
  year       = {2019},
  url        = {https://arxiv.org/abs/1906.05370},
  eprinttype = {arXiv},
  eprint     = {1906.05370},
  timestamp  = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-05370.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-08649,
  author     = {Wang, Tingwu and
                Ba, Jimmy},
  title      = {Exploring Model-based Planning with Policy Networks},
  journal    = {CoRR},
  volume     = {abs/1906.08649},
  year       = {2019},
  url        = {https://arxiv.org/abs/1906.08649},
  eprinttype = {arXiv},
  eprint     = {1906.08649},
  timestamp  = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-08649.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1907.02057, dated 2019.
@article{DBLP:journals/corr/abs-1907-02057,
  author       = {Wang, Tingwu and
                  Bao, Xuchan and
                  Clavera, Ignasi and
                  Hoang, Jerrick and
                  Wen, Yeming and
                  Langlois, Eric D. and
                  Zhang, Shunshi and
                  Zhang, Guodong and
                  Abbeel, Pieter and
                  Ba, Jimmy},
  title        = {Benchmarking Model-Based Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1907.02057},
  year         = {2019},
  url          = {http://arxiv.org/abs/1907.02057},
  eprinttype   = {arXiv},
  eprint       = {1907.02057},
  timestamp    = {Fri, 20 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-02057.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1907.08610, dated 2019.
@article{DBLP:journals/corr/abs-1907-08610,
  author       = {Zhang, Michael R. and
                  Lucas, James and
                  Hinton, Geoffrey E. and
                  Ba, Jimmy},
  title        = {Lookahead Optimizer: k steps forward, 1 step back},
  journal      = {CoRR},
  volume       = {abs/1907.08610},
  year         = {2019},
  url          = {http://arxiv.org/abs/1907.08610},
  eprinttype   = {arXiv},
  eprint       = {1907.08610},
  timestamp    = {Tue, 23 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-08610.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1910.07512, dated 2019.
@article{DBLP:journals/corr/abs-1910-07512,
  author       = {Wang, Yuanhao and
                  Zhang, Guodong and
                  Ba, Jimmy},
  title        = {On Solving Minimax Optimization Locally: {A} Follow-the-Ridge Approach},
  journal      = {CoRR},
  volume       = {abs/1910.07512},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.07512},
  eprinttype   = {arXiv},
  eprint       = {1910.07512},
  timestamp    = {Fri, 12 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-07512.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1912.01603, dated 2019.
@article{DBLP:journals/corr/abs-1912-01603,
  author       = {Hafner, Danijar and
                  Lillicrap, Timothy P. and
                  Ba, Jimmy and
                  Norouzi, Mohammad},
  title        = {Dream to Control: Learning Behaviors by Latent Imagination},
  journal      = {CoRR},
  volume       = {abs/1912.01603},
  year         = {2019},
  url          = {http://arxiv.org/abs/1912.01603},
  eprinttype   = {arXiv},
  eprint       = {1912.01603},
  timestamp    = {Tue, 07 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-01603.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper (OpenReview).
@inproceedings{DBLP:conf/iclr/MartensBJ18,
  author       = {Martens, James and
                  Ba, Jimmy and
                  Johnson, Matt},
  title        = {Kronecker-factored Curvature Approximations for Recurrent Neural Networks},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=HyMTkQZAb},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/MartensBJ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper (OpenReview).
% The braces around NerveNet keep its internal capital when a style sentence-cases the title.
@inproceedings{DBLP:conf/iclr/WangLBF18,
  author       = {Wang, Tingwu and
                  Liao, Renjie and
                  Ba, Jimmy and
                  Fidler, Sanja},
  title        = {{NerveNet}: Learning Structured Policy with Graph Neural Networks},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=S1sqHMZCb},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/WangLBF18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper (OpenReview).
% NOTE(review): DBLP:journals/corr/abs-1803-04386 has the same title and authors
% (arXiv record) -- presumably the same work; avoid citing both.
@inproceedings{DBLP:conf/iclr/WenVBTG18,
  author       = {Wen, Yeming and
                  Vicol, Paul and
                  Ba, Jimmy and
                  Tran, Dustin and
                  Grosse, Roger B.},
  title        = {Flipout: Efficient Pseudo-Independent Weight Perturbations on Mini-Batches},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=rJNpifWAb},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/WenVBTG18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2018 conference paper.
% The braces around GANs keep the acronym's capitals when a style sentence-cases the title.
@inproceedings{DBLP:conf/nips/SanjabiBRL18,
  author       = {Sanjabi, Maziar and
                  Ba, Jimmy and
                  Razaviyayn, Meisam and
                  Lee, Jason D.},
  editor       = {Bengio, Samy and
                  Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Grauman, Kristen and
                  Cesa{-}Bianchi, Nicol{\`{o}} and
                  Garnett, Roman},
  title        = {On the Convergence and Robustness of Training {GANs} with Regularized
                  Optimal Transport},
  booktitle    = {Advances in Neural Information Processing Systems 31: Annual Conference
                  on Neural Information Processing Systems 2018, NeurIPS 2018, December
                  3-8, 2018, Montr{\'{e}}al, Canada},
  pages        = {7091--7101},
  year         = {2018},
  url          = {https://proceedings.neurips.cc/paper/2018/hash/5a9d8bf5b7a4b35f3110dde8673bdda2-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/SanjabiBRL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2018 conference paper.
% NOTE(review): DBLP:journals/corr/abs-1810-10999 has the same title and authors
% (arXiv record) -- presumably the same work; avoid citing both.
@inproceedings{DBLP:conf/nips/MacKayVBG18,
  author       = {MacKay, Matthew and
                  Vicol, Paul and
                  Ba, Jimmy and
                  Grosse, Roger B.},
  editor       = {Bengio, Samy and
                  Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Grauman, Kristen and
                  Cesa{-}Bianchi, Nicol{\`{o}} and
                  Garnett, Roman},
  title        = {Reversible Recurrent Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 31: Annual Conference
                  on Neural Information Processing Systems 2018, NeurIPS 2018, December
                  3-8, 2018, Montr{\'{e}}al, Canada},
  pages        = {9043--9054},
  year         = {2018},
  url          = {https://proceedings.neurips.cc/paper/2018/hash/4ff6fa96179cdc2838e8d8ce64cd10a7-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/MacKayVBG18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1802.08249, dated 2018.
% The braces around Wasserstein and GANs keep the proper noun and the acronym
% capitalised when a style sentence-cases the title.
@article{DBLP:journals/corr/abs-1802-08249,
  author       = {Sanjabi, Maziar and
                  Ba, Jimmy and
                  Razaviyayn, Meisam and
                  Lee, Jason D.},
  title        = {Solving Approximate {Wasserstein} {GANs} to Stationarity},
  journal      = {CoRR},
  volume       = {abs/1802.08249},
  year         = {2018},
  url          = {http://arxiv.org/abs/1802.08249},
  eprinttype   = {arXiv},
  eprint       = {1802.08249},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-08249.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1803.04386, dated 2018.
% NOTE(review): DBLP:conf/iclr/WenVBTG18 has the same title and authors
% (ICLR 2018) -- presumably the same work; avoid citing both.
@article{DBLP:journals/corr/abs-1803-04386,
  author       = {Wen, Yeming and
                  Vicol, Paul and
                  Ba, Jimmy and
                  Tran, Dustin and
                  Grosse, Roger B.},
  title        = {Flipout: Efficient Pseudo-Independent Weight Perturbations on Mini-Batches},
  journal      = {CoRR},
  volume       = {abs/1803.04386},
  year         = {2018},
  url          = {http://arxiv.org/abs/1803.04386},
  eprinttype   = {arXiv},
  eprint       = {1803.04386},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1803-04386.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1810.10999, dated 2018.
% NOTE(review): DBLP:conf/nips/MacKayVBG18 has the same title and authors
% (NeurIPS 2018) -- presumably the same work; avoid citing both.
@article{DBLP:journals/corr/abs-1810-10999,
  author       = {MacKay, Matthew and
                  Vicol, Paul and
                  Ba, Jimmy and
                  Grosse, Roger B.},
  title        = {Reversible Recurrent Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1810.10999},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.10999},
  eprinttype   = {arXiv},
  eprint       = {1810.10999},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-10999.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 conference-track paper (OpenReview).
% The braces around Kronecker keep the proper noun capitalised when a style sentence-cases the title.
@inproceedings{DBLP:conf/iclr/BaGM17,
  author       = {Ba, Jimmy and
                  Grosse, Roger B. and
                  Martens, James},
  title        = {Distributed Second-Order Optimization using {Kronecker}-Factored Approximations},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=SkkTMpjex},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/BaGM17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2017 conference paper.
% The braces around Kronecker keep the proper noun capitalised when a style sentence-cases the title.
% NOTE(review): DBLP:journals/corr/abs-1708-05144 has the same title (arXiv record,
% author order differs) -- presumably the same work; avoid citing both.
@inproceedings{DBLP:conf/nips/WuMGLB17,
  author       = {Wu, Yuhuai and
                  Mansimov, Elman and
                  Grosse, Roger B. and
                  Liao, Shun and
                  Ba, Jimmy},
  editor       = {Guyon, Isabelle and
                  von Luxburg, Ulrike and
                  Bengio, Samy and
                  Wallach, Hanna M. and
                  Fergus, Rob and
                  Vishwanathan, S. V. N. and
                  Garnett, Roman},
  title        = {Scalable trust-region method for deep reinforcement learning using
                  {Kronecker}-factored approximation},
  booktitle    = {Advances in Neural Information Processing Systems 30: Annual Conference
                  on Neural Information Processing Systems 2017, December 4-9, 2017,
                  Long Beach, CA, {USA}},
  pages        = {5279--5288},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/361440528766bbaaaa1901845cf4152b-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 13:58:27 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/WuMGLB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1708.05144, dated 2017.
% The braces around Kronecker keep the proper noun capitalised when a style sentence-cases the title.
% NOTE(review): DBLP:conf/nips/WuMGLB17 has the same title (NeurIPS 2017,
% author order differs) -- presumably the same work; avoid citing both.
@article{DBLP:journals/corr/abs-1708-05144,
  author       = {Wu, Yuhuai and
                  Mansimov, Elman and
                  Liao, Shun and
                  Grosse, Roger B. and
                  Ba, Jimmy},
  title        = {Scalable trust-region method for deep reinforcement learning using
                  {Kronecker}-factored approximation},
  journal      = {CoRR},
  volume       = {abs/1708.05144},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.05144},
  eprinttype   = {arXiv},
  eprint       = {1708.05144},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-05144.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Bioinformatics 32(12), 2016.
% NOTE(review): page range written with the journal's "i" prefix (i52--i59) instead of
% the bare 52--59 from the export; confirm against the DOI landing page.
@article{DBLP:journals/bioinformatics/KrausBF16,
  author       = {Kraus, Oren Z. and
                  Ba, Lei Jimmy and
                  Frey, Brendan J.},
  title        = {Classifying and segmenting microscopy images with deep multiple instance
                  learning},
  journal      = {Bioinform.},
  volume       = {32},
  number       = {12},
  pages        = {i52--i59},
  year         = {2016},
  url          = {https://doi.org/10.1093/bioinformatics/btw252},
  doi          = {10.1093/BIOINFORMATICS/BTW252},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/bioinformatics/KrausBF16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2016 conference paper.
% NOTE(review): DBLP:journals/corr/BaHMLI16 has the same title and authors
% (arXiv record) -- presumably the same work; avoid citing both.
@inproceedings{DBLP:conf/nips/BaHMLI16,
  author       = {Ba, Jimmy and
                  Hinton, Geoffrey E. and
                  Mnih, Volodymyr and
                  Leibo, Joel Z. and
                  Ionescu, Catalin},
  editor       = {Lee, Daniel D. and
                  Sugiyama, Masashi and
                  von Luxburg, Ulrike and
                  Guyon, Isabelle and
                  Garnett, Roman},
  title        = {Using Fast Weights to Attend to the Recent Past},
  booktitle    = {Advances in Neural Information Processing Systems 29: Annual Conference
                  on Neural Information Processing Systems 2016, December 5-10, 2016,
                  Barcelona, Spain},
  pages        = {4331--4339},
  year         = {2016},
  url          = {https://proceedings.neurips.cc/paper/2016/hash/9f44e956e3a2b7b5598c625fcc802c36-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BaHMLI16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2016 conference-track paper whose url points at arXiv.
% eprinttype/eprint repeat the identifier from url so eprint-aware styles treat
% this record like the file's other arXiv-hosted entries.
@inproceedings{DBLP:journals/corr/MansimovPBS15,
  author       = {Mansimov, Elman and
                  Parisotto, Emilio and
                  Ba, Lei Jimmy and
                  Salakhutdinov, Ruslan},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Generating Images from Captions with Attention},
  booktitle    = {4th International Conference on Learning Representations, {ICLR} 2016,
                  San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year         = {2016},
  url          = {http://arxiv.org/abs/1511.02793},
  eprinttype   = {arXiv},
  eprint       = {1511.02793},
  timestamp    = {Wed, 17 Jul 2019 10:40:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/MansimovPBS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2016 conference-track paper whose url points at arXiv.
% The braces around Actor-Mimic keep the method name's capitals under sentence-casing styles.
% eprinttype/eprint repeat the identifier from url so eprint-aware styles treat
% this record like the file's other arXiv-hosted entries.
@inproceedings{DBLP:journals/corr/ParisottoBS15,
  author       = {Parisotto, Emilio and
                  Ba, Lei Jimmy and
                  Salakhutdinov, Ruslan},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {{Actor-Mimic}: Deep Multitask and Transfer Reinforcement Learning},
  booktitle    = {4th International Conference on Learning Representations, {ICLR} 2016,
                  San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year         = {2016},
  url          = {http://arxiv.org/abs/1511.06342},
  eprinttype   = {arXiv},
  eprint       = {1511.06342},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ParisottoBS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1607.06450, dated 2016.
@article{DBLP:journals/corr/BaKH16,
  author       = {Ba, Lei Jimmy and
                  Kiros, Jamie Ryan and
                  Hinton, Geoffrey E.},
  title        = {Layer Normalization},
  journal      = {CoRR},
  volume       = {abs/1607.06450},
  year         = {2016},
  url          = {http://arxiv.org/abs/1607.06450},
  eprinttype   = {arXiv},
  eprint       = {1607.06450},
  timestamp    = {Tue, 23 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BaKH16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1610.06258, dated 2016.
% NOTE(review): DBLP:conf/nips/BaHMLI16 has the same title and authors
% (NeurIPS 2016) -- presumably the same work; avoid citing both.
@article{DBLP:journals/corr/BaHMLI16,
  author       = {Ba, Jimmy and
                  Hinton, Geoffrey E. and
                  Mnih, Volodymyr and
                  Leibo, Joel Z. and
                  Ionescu, Catalin},
  title        = {Using Fast Weights to Attend to the Recent Past},
  journal      = {CoRR},
  volume       = {abs/1610.06258},
  year         = {2016},
  url          = {http://arxiv.org/abs/1610.06258},
  eprinttype   = {arXiv},
  eprint       = {1610.06258},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BaHMLI16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IEEE GEM 2015 conference paper.
% The title uses TeX opening/closing quotes instead of straight ASCII quotes, and the
% brace group keeps the capitals of SQUEAKeys under sentence-casing styles.
@inproceedings{DBLP:conf/gamesem/MannJRHB15,
  author       = {Mann, Steve and
                  Janzen, Ryan E. and
                  Rampersad, Valmiki and
                  Huang, Jason and
                  Ba, Lei Jimmy},
  editor       = {Bertozzi, Elena G. and
                  Kapralos, Bill and
                  Gershon, Nahum D. and
                  Parker, Jim R.},
  title        = {{``SQUEAKeys''}: {A} friction idiophone, for physical interaction
                  with mobile devices},
  booktitle    = {2015 {IEEE} Games Entertainment Media Conference, {GEM} 2015, Toronto,
                  ON, Canada, October 14-16, 2015},
  pages        = {1--4},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/GEM.2015.7377235},
  doi          = {10.1109/GEM.2015.7377235},
  timestamp    = {Mon, 18 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/gamesem/MannJRHB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2015 conference paper.
% NOTE(review): DBLP:journals/corr/BaSFS15 (arXiv record) has the same title up to
% capitalisation -- presumably the same work; avoid citing both.
@inproceedings{DBLP:conf/iccv/BaSFS15,
  author       = {Ba, Lei Jimmy and
                  Swersky, Kevin and
                  Fidler, Sanja and
                  Salakhutdinov, Ruslan},
  title        = {Predicting Deep Zero-Shot Convolutional Neural Networks Using Textual
                  Descriptions},
  booktitle    = {2015 {IEEE} International Conference on Computer Vision, {ICCV} 2015,
                  Santiago, Chile, December 7-13, 2015},
  pages        = {4247--4255},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/ICCV.2015.483},
  doi          = {10.1109/ICCV.2015.483},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccv/BaSFS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2015 conference paper (JMLR W&CP volume 37).
% NOTE(review): DBLP:journals/corr/XuBKCCSZB15 has the same title and authors
% (arXiv record) -- presumably the same work; avoid citing both.
@inproceedings{DBLP:conf/icml/XuBKCCSZB15,
  author       = {Xu, Kelvin and
                  Ba, Jimmy and
                  Kiros, Ryan and
                  Cho, Kyunghyun and
                  Courville, Aaron C. and
                  Salakhutdinov, Ruslan and
                  Zemel, Richard S. and
                  Bengio, Yoshua},
  editor       = {Bach, Francis R. and
                  Blei, David M.},
  title        = {Show, Attend and Tell: Neural Image Caption Generation with Visual
                  Attention},
  booktitle    = {Proceedings of the 32nd International Conference on Machine Learning,
                  {ICML} 2015, Lille, France, 6-11 July 2015},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {37},
  pages        = {2048--2057},
  publisher    = {JMLR.org},
  year         = {2015},
  url          = {http://proceedings.mlr.press/v37/xuc15.html},
  timestamp    = {Wed, 29 May 2019 08:41:45 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/XuBKCCSZB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2015 conference paper.
% NOTE(review): DBLP:journals/corr/BaGSF15 has the same title (arXiv record,
% author order differs) -- presumably the same work; avoid citing both.
@inproceedings{DBLP:conf/nips/BaSGF15,
  author       = {Ba, Jimmy and
                  Salakhutdinov, Ruslan and
                  Grosse, Roger B. and
                  Frey, Brendan J.},
  editor       = {Cortes, Corinna and
                  Lawrence, Neil D. and
                  Lee, Daniel D. and
                  Sugiyama, Masashi and
                  Garnett, Roman},
  title        = {Learning Wake-Sleep Recurrent Attention Models},
  booktitle    = {Advances in Neural Information Processing Systems 28: Annual Conference
                  on Neural Information Processing Systems 2015, December 7-12, 2015,
                  Montreal, Quebec, Canada},
  pages        = {2593--2601},
  year         = {2015},
  url          = {https://proceedings.neurips.cc/paper/2015/hash/db1915052d15f7815c8b88e879465a1e-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BaSGF15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2015 conference-track paper whose url points at arXiv.
% eprinttype/eprint repeat the identifier from url so eprint-aware styles treat
% this record like the file's other arXiv-hosted entries.
@inproceedings{DBLP:journals/corr/BaMK14,
  author       = {Ba, Jimmy and
                  Mnih, Volodymyr and
                  Kavukcuoglu, Koray},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Multiple Object Recognition with Visual Attention},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
  year         = {2015},
  url          = {http://arxiv.org/abs/1412.7755},
  eprinttype   = {arXiv},
  eprint       = {1412.7755},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BaMK14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2015 conference-track paper whose url points at arXiv.
% eprinttype/eprint repeat the identifier from url so eprint-aware styles treat
% this record like the file's other arXiv-hosted entries.
@inproceedings{DBLP:journals/corr/KingmaB14,
  author       = {Kingma, Diederik P. and
                  Ba, Jimmy},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Adam: {A} Method for Stochastic Optimization},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
  year         = {2015},
  url          = {http://arxiv.org/abs/1412.6980},
  eprinttype   = {arXiv},
  eprint       = {1412.6980},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/KingmaB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1502.03044, dated 2015.
% NOTE(review): DBLP:conf/icml/XuBKCCSZB15 has the same title and authors
% (ICML 2015) -- presumably the same work; avoid citing both.
@article{DBLP:journals/corr/XuBKCCSZB15,
  author       = {Xu, Kelvin and
                  Ba, Jimmy and
                  Kiros, Ryan and
                  Cho, Kyunghyun and
                  Courville, Aaron C. and
                  Salakhutdinov, Ruslan and
                  Zemel, Richard S. and
                  Bengio, Yoshua},
  title        = {Show, Attend and Tell: Neural Image Caption Generation with Visual
                  Attention},
  journal      = {CoRR},
  volume       = {abs/1502.03044},
  year         = {2015},
  url          = {http://arxiv.org/abs/1502.03044},
  eprinttype   = {arXiv},
  eprint       = {1502.03044},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/XuBKCCSZB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1506.00511, dated 2015.
% NOTE(review): DBLP:conf/iccv/BaSFS15 (ICCV 2015) has the same title up to
% capitalisation -- presumably the same work; avoid citing both.
@article{DBLP:journals/corr/BaSFS15,
  author       = {Ba, Jimmy and
                  Swersky, Kevin and
                  Fidler, Sanja and
                  Salakhutdinov, Ruslan},
  title        = {Predicting Deep Zero-Shot Convolutional Neural Networks using Textual
                  Descriptions},
  journal      = {CoRR},
  volume       = {abs/1506.00511},
  year         = {2015},
  url          = {http://arxiv.org/abs/1506.00511},
  eprinttype   = {arXiv},
  eprint       = {1506.00511},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BaSFS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1509.06812, dated 2015.
% NOTE(review): DBLP:conf/nips/BaSGF15 has the same title (NeurIPS 2015,
% author order differs) -- presumably the same work; avoid citing both.
@article{DBLP:journals/corr/BaGSF15,
  author       = {Ba, Jimmy and
                  Grosse, Roger B. and
                  Salakhutdinov, Ruslan and
                  Frey, Brendan J.},
  title        = {Learning Wake-Sleep Recurrent Attention Models},
  journal      = {CoRR},
  volume       = {abs/1509.06812},
  year         = {2015},
  url          = {http://arxiv.org/abs/1509.06812},
  eprinttype   = {arXiv},
  eprint       = {1509.06812},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BaGSF15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1511.05286, dated 2015.
@article{DBLP:journals/corr/KrausBF15,
  author       = {Kraus, Oren Z. and
                  Ba, Lei Jimmy and
                  Frey, Brendan J.},
  title        = {Classifying and Segmenting Microscopy Images Using Convolutional Multiple
                  Instance Learning},
  journal      = {CoRR},
  volume       = {abs/1511.05286},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.05286},
  eprinttype   = {arXiv},
  eprint       = {1511.05286},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/KrausBF15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2014 conference paper.
% The booktitle date now has a comma before the year ("December 8-13, 2014"),
% matching the other NeurIPS booktitles in this file.
% NOTE(review): DBLP:journals/corr/BaC13 has the same title (arXiv record) --
% presumably the same work; avoid citing both.
@inproceedings{DBLP:conf/nips/BaC14,
  author       = {Ba, Jimmy and
                  Caruana, Rich},
  editor       = {Ghahramani, Zoubin and
                  Welling, Max and
                  Cortes, Corinna and
                  Lawrence, Neil D. and
                  Weinberger, Kilian Q.},
  title        = {Do Deep Nets Really Need to be Deep?},
  booktitle    = {Advances in Neural Information Processing Systems 27: Annual Conference
                  on Neural Information Processing Systems 2014, December 8-13, 2014,
                  Montreal, Quebec, Canada},
  pages        = {2654--2662},
  year         = {2014},
  url          = {https://proceedings.neurips.cc/paper/2014/hash/ea8fcd92d59581717e06eb187f10666d-Abstract.html},
  timestamp    = {Fri, 10 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BaC14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2013 conference paper.
@inproceedings{DBLP:conf/nips/BaF13,
  author       = {Ba, Lei Jimmy and
                  Frey, Brendan J.},
  editor       = {Burges, Christopher J. C. and
                  Bottou, L{\'{e}}on and
                  Ghahramani, Zoubin and
                  Weinberger, Kilian Q.},
  title        = {Adaptive dropout for training deep neural networks},
  booktitle    = {Advances in Neural Information Processing Systems 26: 27th Annual
                  Conference on Neural Information Processing Systems 2013. Proceedings
                  of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages        = {3084--3092},
  year         = {2013},
  url          = {https://proceedings.neurips.cc/paper/2013/hash/7b5b23f4aadf9513306bcd59afb6e4c9-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BaF13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1312.6184, dated 2013.
% NOTE(review): DBLP:conf/nips/BaC14 has the same title (NeurIPS 2014) --
% presumably the same work; avoid citing both.
@article{DBLP:journals/corr/BaC13,
  author       = {Ba, Lei Jimmy and
                  Caruana, Rich},
  title        = {Do Deep Nets Really Need to be Deep?},
  journal      = {CoRR},
  volume       = {abs/1312.6184},
  year         = {2013},
  url          = {http://arxiv.org/abs/1312.6184},
  eprinttype   = {arXiv},
  eprint       = {1312.6184},
  timestamp    = {Fri, 10 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/BaC13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% TEI 2011 conference paper (ACM).
@inproceedings{DBLP:conf/tei/MannJHKBC11,
  author       = {Mann, Steve and
                  Janzen, Ryan E. and
                  Huang, Jason and
                  Kelly, Matthew B. and
                  Ba, Lei Jimmy and
                  Chen, Alexander},
  editor       = {Gross, Mark D. and
                  Nunes, Nuno Jardim and
                  Do, Ellen Yi{-}Luen and
                  Brewster, Stephen A. and
                  Oakley, Ian},
  title        = {User-interfaces based on the water-hammer effect: water-hammer piano
                  as an interactive percussion surface},
  booktitle    = {Proceedings of the 5th International Conference on Tangible and Embedded
                  Interaction 2011, Funchal, Madeira, Portugal, January 22-26, 2011},
  pages        = {1--8},
  publisher    = {{ACM}},
  year         = {2011},
  url          = {https://doi.org/10.1145/1935701.1935703},
  doi          = {10.1145/1935701.1935703},
  timestamp    = {Mon, 18 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/tei/MannJHKBC11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics