<?xml version="1.0"?>
<dblpperson name="George E. Dahl" pid="10/7998" n="55">
<person key="homepages/10/7998" mdate="2025-07-10">
<author pid="10/7998">George E. Dahl</author>
<author pid="10/7998">George Edward Dahl</author>
<url>https://www.cs.toronto.edu/~gdahl/</url>
<url>https://scholar.google.com/citations?user=ghbWy-0AAAAJ</url>
<url>https://openreview.net/profile?id=~George_E._Dahl1</url>
</person>
<r><article key="journals/tmlr/KasimbegRAMPAD25" mdate="2025-06-24">
<author pid="251/9611">Priya Kasimbeg</author>
<author pid="164/6165">Vincent Roulet</author>
<author pid="72/3910">Naman Agarwal</author>
<author pid="325/5349">Sourabh Medapati</author>
<author pid="11/9764">Fabian Pedregosa</author>
<author pid="265/6410">Atish Agarwala</author>
<author pid="10/7998">George E. Dahl</author>
<title>How far away are truly hyperparameter-free learning algorithms?</title>
<year>2025</year>
<volume>2025</volume>
<journal>Trans. Mach. Learn. Res.</journal>
<ee type="oa">https://openreview.net/forum?id=6BlOCx5c5T</ee>
<url>db/journals/tmlr/tmlr2025.html#KasimbegRAMPAD25</url>
</article>
</r>
<r><inproceedings key="conf/iclr/Kasimbeg0EBSSFW25" mdate="2025-05-15">
<author pid="251/9611">Priya Kasimbeg</author>
<author pid="41/328-1">Frank Schneider 0001</author>
<author pid="242/9235">Runa Eschenhagen</author>
<author pid="158/9492">Juhan Bae</author>
<author pid="223/6317">Chandramouli Shama Sastry</author>
<author pid="118/5750">Mark Saroufim</author>
<author pid="227/2946">Boyuan Feng</author>
<author pid="295/9883">Less Wright</author>
<author pid="118/9819">Edward Z. Yang</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="325/5349">Sourabh Medapati</author>
<author pid="08/9077">Philipp Hennig</author>
<author pid="47/1744">Michael Rabbat</author>
<author pid="10/7998">George E. Dahl</author>
<title>Accelerating neural network training: An analysis of the AlgoPerf competition.</title>
<year>2025</year>
<booktitle>ICLR</booktitle>
<ee type="oa">https://openreview.net/forum?id=CtM5xjRSfm</ee>
<crossref>conf/iclr/2025</crossref>
<url>db/conf/iclr/iclr2025.html#Kasimbeg0EBSSFW25</url>
</inproceedings>
</r>
<r><article publtype="informal" key="journals/corr/abs-2502-15015" mdate="2025-03-20">
<author pid="251/9611">Priya Kasimbeg</author>
<author pid="41/328-1">Frank Schneider 0001</author>
<author pid="242/9235">Runa Eschenhagen</author>
<author pid="158/9492">Juhan Bae</author>
<author pid="223/6317">Chandramouli Shama Sastry</author>
<author pid="118/5750">Mark Saroufim</author>
<author pid="227/2946">Boyuan Feng</author>
<author pid="295/9883">Less Wright</author>
<author pid="118/9819">Edward Z. Yang</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="325/5349">Sourabh Medapati</author>
<author pid="08/9077">Philipp Hennig</author>
<author pid="47/1744">Michael Rabbat</author>
<author pid="10/7998">George E. Dahl</author>
<title>Accelerating Neural Network Training: An Analysis of the AlgoPerf Competition.</title>
<year>2025</year>
<month>February</month>
<volume>abs/2502.15015</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2502.15015</ee>
<url>db/journals/corr/corr2502.html#abs-2502-15015</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2503-03986" mdate="2025-04-11">
<author pid="325/5349">Sourabh Medapati</author>
<author pid="251/9611">Priya Kasimbeg</author>
<author pid="38/5647">Shankar Krishnan</author>
<author pid="72/3910">Naman Agarwal</author>
<author pid="10/7998">George E. Dahl</author>
<title>Training neural networks faster with minimal tuning using pre-computed lists of hyperparameters for NAdamW.</title>
<year>2025</year>
<month>March</month>
<volume>abs/2503.03986</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2503.03986</ee>
<url>db/journals/corr/corr2503.html#abs-2503-03986</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2505-24005" mdate="2025-06-29">
<author pid="251/9611">Priya Kasimbeg</author>
<author pid="164/6165">Vincent Roulet</author>
<author pid="72/3910">Naman Agarwal</author>
<author pid="325/5349">Sourabh Medapati</author>
<author pid="11/9764">Fabian Pedregosa</author>
<author pid="265/6410">Atish Agarwala</author>
<author pid="10/7998">George E. Dahl</author>
<title>How far away are truly hyperparameter-free learning algorithms?</title>
<year>2025</year>
<month>May</month>
<volume>abs/2505.24005</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2505.24005</ee>
<url>db/journals/corr/corr2505.html#abs-2505-24005</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article key="journals/jmlr/WangDSLNGSG24" mdate="2024-09-16">
<author pid="78/8711">Zi Wang</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="35/9381">Kevin Swersky</author>
<author pid="137/3219">Chansoo Lee</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="131/6545">Justin Gilmer</author>
<author pid="95/6097">Jasper Snoek</author>
<author pid="g/ZoubinGhahramani">Zoubin Ghahramani</author>
<title>Pre-trained Gaussian Processes for Bayesian Optimization.</title>
<pages>212:1-212:83</pages>
<year>2024</year>
<volume>25</volume>
<journal>J. Mach. Learn. Res.</journal>
<ee type="oa">https://jmlr.org/papers/v25/23-0269.html</ee>
<url>db/journals/jmlr/jmlr25.html#WangDSLNGSG24</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2306-07179" mdate="2023-06-16">
<author pid="10/7998">George E. Dahl</author>
<author pid="41/328-1">Frank Schneider 0001</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="72/3910">Naman Agarwal</author>
<author pid="223/6317">Chandramouli Shama Sastry</author>
<author pid="08/9077">Philipp Hennig</author>
<author pid="325/5349">Sourabh Medapati</author>
<author pid="242/9235">Runa Eschenhagen</author>
<author pid="251/9611">Priya Kasimbeg</author>
<author pid="186/8419">Daniel Suo</author>
<author pid="158/9492">Juhan Bae</author>
<author pid="131/6545">Justin Gilmer</author>
<author pid="349/3715">Abel L. Peirson</author>
<author pid="71/2824">Bilal Khan</author>
<author pid="182/1833">Rohan Anil</author>
<author pid="47/1744">Mike Rabbat</author>
<author pid="38/5647">Shankar Krishnan</author>
<author pid="324/5277">Daniel Snider</author>
<author pid="142/5754">Ehsan Amid</author>
<author pid="297/3463">Kongtao Chen</author>
<author pid="139/1388">Chris J. Maddison</author>
<author pid="349/2430">Rakshith Vasudev</author>
<author pid="325/5394">Michal Badura</author>
<author pid="86/7221">Ankush Garg</author>
<author pid="47/739">Peter Mattson</author>
<title>Benchmarking Neural Network Training Algorithms.</title>
<year>2023</year>
<volume>abs/2306.07179</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2306.07179</ee>
<url>db/journals/corr/corr2306.html#abs-2306-07179</url>
</article>
</r>
<r><inproceedings key="conf/aistats/AriafarGNSJD22" mdate="2022-05-20">
<author pid="169/2463">Setareh Ariafar</author>
<author pid="131/6545">Justin Gilmer</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="95/6097">Jasper Snoek</author>
<author pid="68/8398">Rodolphe Jenatton</author>
<author pid="10/7998">George E. Dahl</author>
<title>Predicting the utility of search spaces for black-box optimization: a simple, budget-aware approach.</title>
<pages>11056-11071</pages>
<year>2022</year>
<booktitle>AISTATS</booktitle>
<ee type="oa">https://proceedings.mlr.press/v151/ariafar22a.html</ee>
<crossref>conf/aistats/2022</crossref>
<url>db/conf/aistats/aistats2022.html#AriafarGNSJD22</url>
</inproceedings>
</r>
<r><inproceedings key="conf/iclr/GilmerGGKNCDNF22" mdate="2022-08-20">
<author pid="131/6545">Justin Gilmer</author>
<author pid="162/0166">Behrooz Ghorbani</author>
<author pid="86/7221">Ankush Garg</author>
<author pid="248/7500">Sneha Kudugunta</author>
<author pid="131/9898">Behnam Neyshabur</author>
<author pid="304/2067">David Cardoze</author>
<author pid="10/7998">George Edward Dahl</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="120/2225">Orhan Firat</author>
<title>A Loss Curvature Perspective on Training Instabilities of Deep Learning Models.</title>
<year>2022</year>
<booktitle>ICLR</booktitle>
<ee type="oa">https://openreview.net/forum?id=OcKMT-36vUs</ee>
<crossref>conf/iclr/2022</crossref>
<url>db/conf/iclr/iclr2022.html#GilmerGGKNCDNF22</url>
</inproceedings>
</r>
<r><article publtype="informal" key="journals/corr/abs-2203-10139" mdate="2022-03-30">
<author pid="317/0391">Ryan G. Gomes</author>
<author pid="317/0293">Bellington Vwalika</author>
<author pid="317/0270">Chace Lee</author>
<author pid="180/1370">Angelica Willis</author>
<author pid="48/8770">Marcin Sieniek</author>
<author pid="317/0179">Joan T. Price</author>
<author pid="278/2847">Christina Chen</author>
<author pid="317/0237">Margaret P. Kasaro</author>
<author pid="316/9899">James A. Taylor 0003</author>
<author pid="317/0406">Elizabeth M. Stringer</author>
<author pid="284/0700">Scott Mayer McKinney</author>
<author pid="316/9859">Ntazana Sindano</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="317/0204">William Goodnight III</author>
<author pid="131/6545">Justin Gilmer</author>
<author pid="317/0233">Benjamin H. Chi</author>
<author pid="277/1204">Charles Lau</author>
<author pid="317/0325">Terry Spitz</author>
<author pid="317/0264">T. Saensuksopa</author>
<author pid="133/2109">Kris Liu</author>
<author pid="317/0382">Jonny Wong</author>
<author pid="292/7059">Rory Pilgrim</author>
<author pid="317/0324">Akib Uddin</author>
<author pid="05/8414">Greg Corrado</author>
<author pid="198/1261">Lily Peng</author>
<author pid="210/1097">Katherine Chou</author>
<author pid="63/9281">Daniel Tse</author>
<author pid="316/9959">Jeffrey S. A. Stringer</author>
<author pid="49/1617">Shravya Shetty</author>
<title>AI system for fetal ultrasound in low-resource settings.</title>
<year>2022</year>
<volume>abs/2203.10139</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2203.10139</ee>
<url>db/journals/corr/corr2203.html#abs-2203-10139</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2207-03084" mdate="2022-07-13">
<author pid="78/8711">Zi Wang</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="35/9381">Kevin Swersky</author>
<author pid="137/3219">Chansoo Lee</author>
<author pid="164/7319">Zelda Mariet</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="131/6545">Justin Gilmer</author>
<author pid="95/6097">Jasper Snoek</author>
<author pid="g/ZoubinGhahramani">Zoubin Ghahramani</author>
<title>Pre-training helps Bayesian optimization too.</title>
<year>2022</year>
<volume>abs/2207.03084</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2207.03084</ee>
<url>db/journals/corr/corr2207.html#abs-2207-03084</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2207-14484" mdate="2023-08-07">
<author pid="25/3538-1">Jeremy Cohen 0001</author>
<author pid="162/0166">Behrooz Ghorbani</author>
<author pid="38/5647">Shankar Krishnan</author>
<author pid="72/3910">Naman Agarwal</author>
<author pid="325/5349">Sourabh Medapati</author>
<author pid="325/5394">Michal Badura</author>
<author pid="186/8419">Daniel Suo</author>
<author pid="304/2067">David Cardoze</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="131/6545">Justin Gilmer</author>
<title>Adaptive Gradient Methods at the Edge of Stability.</title>
<year>2022</year>
<volume>abs/2207.14484</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2207.14484</ee>
<url>db/journals/corr/corr2207.html#abs-2207-14484</url>
</article>
</r>
<r><inproceedings key="conf/naacl/BowmanD21" mdate="2021-08-06">
<author pid="116/0502">Samuel R. Bowman</author>
<author pid="10/7998">George E. Dahl</author>
<title>What Will it Take to Fix Benchmarking in Natural Language Understanding?</title>
<pages>4843-4855</pages>
<year>2021</year>
<booktitle>NAACL-HLT</booktitle>
<ee type="oa">https://doi.org/10.18653/v1/2021.naacl-main.385</ee>
<ee type="oa">https://aclanthology.org/2021.naacl-main.385/</ee>
<crossref>conf/naacl/2021</crossref>
<url>db/conf/naacl/naacl2021.html#BowmanD21</url>
</inproceedings>
</r>
<r><article publtype="informal" key="journals/corr/abs-2102-06356" mdate="2021-02-18">
<author pid="228/7785">Zachary Nado</author>
<author pid="131/6545">Justin Gilmer</author>
<author pid="126/6014">Christopher J. Shallue</author>
<author pid="182/1833">Rohan Anil</author>
<author pid="10/7998">George E. Dahl</author>
<title>A Large Batch Optimizer Reality Check: Traditional, Generic Optimizers Suffice Across Batch Sizes.</title>
<year>2021</year>
<volume>abs/2102.06356</volume>
<journal>CoRR</journal>
<ee type="oa">https://arxiv.org/abs/2102.06356</ee>
<url>db/journals/corr/corr2102.html#abs-2102-06356</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2104-02145" mdate="2021-04-12">
<author pid="116/0502">Samuel R. Bowman</author>
<author pid="10/7998">George E. Dahl</author>
<title>What Will it Take to Fix Benchmarking in Natural Language Understanding?</title>
<year>2021</year>
<volume>abs/2104.02145</volume>
<journal>CoRR</journal>
<ee type="oa">https://arxiv.org/abs/2104.02145</ee>
<url>db/journals/corr/corr2104.html#abs-2104-02145</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2109-08215" mdate="2021-09-22">
<author pid="78/8711">Zi Wang</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="35/9381">Kevin Swersky</author>
<author pid="137/3219">Chansoo Lee</author>
<author pid="164/7319">Zelda Mariet</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="131/6545">Justin Gilmer</author>
<author pid="95/6097">Jasper Snoek</author>
<author pid="g/ZoubinGhahramani">Zoubin Ghahramani</author>
<title>Automatic prior selection for meta Bayesian optimization with a case study on tuning deep neural network optimizers.</title>
<year>2021</year>
<volume>abs/2109.08215</volume>
<journal>CoRR</journal>
<ee type="oa">https://arxiv.org/abs/2109.08215</ee>
<url>db/journals/corr/corr2109.html#abs-2109-08215</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2110-04369" mdate="2021-11-17">
<author pid="131/6545">Justin Gilmer</author>
<author pid="162/0166">Behrooz Ghorbani</author>
<author pid="86/7221">Ankush Garg</author>
<author pid="248/7500">Sneha Kudugunta</author>
<author pid="131/9898">Behnam Neyshabur</author>
<author pid="304/2067">David Cardoze</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="120/2225">Orhan Firat</author>
<title>A Loss Curvature Perspective on Training Instability in Deep Learning.</title>
<year>2021</year>
<volume>abs/2110.04369</volume>
<journal>CoRR</journal>
<ee type="oa">https://arxiv.org/abs/2110.04369</ee>
<url>db/journals/corr/corr2110.html#abs-2110-04369</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2112-08250" mdate="2022-01-03">
<author pid="169/2463">Setareh Ariafar</author>
<author pid="131/6545">Justin Gilmer</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="95/6097">Jasper Snoek</author>
<author pid="68/8398">Rodolphe Jenatton</author>
<author pid="10/7998">George E. Dahl</author>
<title>Predicting the utility of search spaces for black-box optimization: a simple, budget-aware approach.</title>
<year>2021</year>
<volume>abs/2112.08250</volume>
<journal>CoRR</journal>
<ee type="oa">https://arxiv.org/abs/2112.08250</ee>
<url>db/journals/corr/corr2112.html#abs-2112-08250</url>
</article>
</r>
<r><article key="journals/jmlr/ShallueLASFD19" mdate="2024-09-11">
<author pid="126/6014">Christopher J. Shallue</author>
<author pid="95/386-1">Jaehoon Lee 0001</author>
<author pid="222/3147">Joseph M. Antognini</author>
<author pid="51/7117">Jascha Sohl-Dickstein</author>
<author pid="136/9091">Roy Frostig</author>
<author pid="10/7998">George E. Dahl</author>
<title>Measuring the Effects of Data Parallelism on Neural Network Training.</title>
<pages>112:1-112:49</pages>
<year>2019</year>
<volume>20</volume>
<journal>J. Mach. Learn. Res.</journal>
<ee type="oa">https://jmlr.org/papers/v20/18-789.html</ee>
<url>db/journals/jmlr/jmlr20.html#ShallueLASFD19</url>
</article>
</r>
<r><inproceedings key="conf/nips/ZhangLNMSDSG19" mdate="2024-11-13">
<author pid="28/4937-6">Guodong Zhang 0006</author>
<author pid="49/7563">Lala Li</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="12/8412">James Martens</author>
<author pid="25/9221">Sushant Sachdeva</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="126/6014">Christopher J. Shallue</author>
<author pid="26/7058">Roger B. Grosse</author>
<title>Which Algorithmic Choices Matter at Which Batch Sizes? Insights From a Noisy Quadratic Model.</title>
<pages>8194-8205</pages>
<year>2019</year>
<booktitle>NeurIPS</booktitle>
<ee type="oa">https://proceedings.neurips.cc/paper/2019/hash/e0eacd983971634327ae1819ea8b6214-Abstract.html</ee>
<ee type="oa">http://papers.nips.cc/paper/9030-which-algorithmic-choices-matter-at-which-batch-sizes-insights-from-a-noisy-quadratic-model</ee>
<crossref>conf/nips/2019</crossref>
<url>db/conf/nips/nips2019.html#ZhangLNMSDSG19</url>
</inproceedings>
</r>
<r><article publtype="informal" key="journals/corr/abs-1907-04164" mdate="2024-11-13">
<author pid="28/4937-6">Guodong Zhang 0006</author>
<author pid="49/7563">Lala Li</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="12/8412">James Martens</author>
<author pid="25/9221">Sushant Sachdeva</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="126/6014">Christopher J. Shallue</author>
<author pid="26/7058">Roger B. Grosse</author>
<title>Which Algorithmic Choices Matter at Which Batch Sizes? Insights From a Noisy Quadratic Model.</title>
<year>2019</year>
<volume>abs/1907.04164</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1907.04164</ee>
<url>db/journals/corr/corr1907.html#abs-1907-04164</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-1907-05550" mdate="2019-07-17">
<author pid="209/9687">Dami Choi</author>
<author pid="47/10827">Alexandre Passos</author>
<author pid="126/6014">Christopher J. Shallue</author>
<author pid="10/7998">George E. Dahl</author>
<title>Faster Neural Network Training with Data Echoing.</title>
<year>2019</year>
<volume>abs/1907.05550</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1907.05550</ee>
<url>db/journals/corr/corr1907.html#abs-1907-05550</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-1910-05446" mdate="2024-07-17">
<author pid="209/9687">Dami Choi</author>
<author pid="126/6014">Christopher J. Shallue</author>
<author pid="228/7785">Zachary Nado</author>
<author pid="95/386-1">Jaehoon Lee 0001</author>
<author pid="139/1388">Chris J. Maddison</author>
<author pid="10/7998">George E. Dahl</author>
<title>On Empirical Comparisons of Optimizers for Deep Learning.</title>
<year>2019</year>
<volume>abs/1910.05446</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1910.05446</ee>
<url>db/journals/corr/corr1910.html#abs-1910-05446</url>
</article>
</r>
<r><inproceedings key="conf/emnlp/FordD0D18" mdate="2021-08-06">
<author pid="223/9765">Nicolas Ford</author>
<author pid="10/8371">Daniel Duckworth</author>
<author pid="12/7659-2">Mohammad Norouzi 0002</author>
<author pid="10/7998">George E. Dahl</author>
<title>The Importance of Generation Order in Language Modeling.</title>
<pages>2942-2946</pages>
<year>2018</year>
<booktitle>EMNLP</booktitle>
<ee type="oa">https://doi.org/10.18653/v1/d18-1324</ee>
<ee type="oa">https://aclanthology.org/D18-1324/</ee>
<crossref>conf/emnlp/2018</crossref>
<url>db/conf/emnlp/emnlp2018.html#FordD0D18</url>
</inproceedings>
</r>
<r><inproceedings key="conf/iclr/AnilPPODH18" mdate="2019-07-25">
<author pid="182/1833">Rohan Anil</author>
<author pid="170/0034">Gabriel Pereyra</author>
<author pid="47/10827">Alexandre Passos</author>
<author pid="35/4647">R&#243;bert Orm&#225;ndi</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="10/3248">Geoffrey E. Hinton</author>
<title>Large scale distributed neural network training through online distillation.</title>
<year>2018</year>
<booktitle>ICLR (Poster)</booktitle>
<ee type="oa">https://openreview.net/forum?id=rkr1UDeC-</ee>
<crossref>conf/iclr/2018</crossref>
<url>db/conf/iclr/iclr2018.html#AnilPPODH18</url>
</inproceedings>
</r>
<r><inproceedings key="conf/textgraphs/DhingraSNDD18" mdate="2021-08-06">
<author pid="180/5692">Bhuwan Dhingra</author>
<author pid="126/6014">Christopher J. Shallue</author>
<author pid="12/7659-2">Mohammad Norouzi 0002</author>
<author pid="59/9736">Andrew M. Dai</author>
<author pid="10/7998">George E. Dahl</author>
<title>Embedding Text in Hyperbolic Spaces.</title>
<pages>59-69</pages>
<year>2018</year>
<booktitle>TextGraphs@NAACL-HLT</booktitle>
<ee type="oa">https://doi.org/10.18653/v1/w18-1708</ee>
<ee type="oa">https://aclanthology.org/W18-1708/</ee>
<crossref>conf/textgraphs/2018</crossref>
<url>db/conf/textgraphs/textgraphs2018.html#DhingraSNDD18</url>
</inproceedings>
</r>
<r><article publtype="informal" key="journals/corr/abs-1804-03235" mdate="2019-02-22">
<author pid="182/1833">Rohan Anil</author>
<author pid="170/0034">Gabriel Pereyra</author>
<author pid="47/10827">Alexandre Passos</author>
<author pid="35/4647">R&#243;bert Orm&#225;ndi</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="10/3248">Geoffrey E. Hinton</author>
<title>Large scale distributed neural network training through online distillation.</title>
<year>2018</year>
<volume>abs/1804.03235</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1804.03235</ee>
<url>db/journals/corr/corr1804.html#abs-1804-03235</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-1805-10255" mdate="2025-09-22">
<author orcid="0000-0003-1373-9296" pid="58/1076-19">Manoj Kumar 0019</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="08/2793">Vijay Vasudevan</author>
<author pid="12/7659-2">Mohammad Norouzi 0002</author>
<title>Parallel Architecture and Hyperparameter Search via Successive Halving and Classification.</title>
<year>2018</year>
<volume>abs/1805.10255</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1805.10255</ee>
<url>db/journals/corr/corr1805.html#abs-1805-10255</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-1806-01261" mdate="2024-06-18">
<author pid="41/3400">Peter W. Battaglia</author>
<author pid="155/1885">Jessica B. Hamrick</author>
<author pid="120/7601">Victor Bapst</author>
<author pid="222/1889">Alvaro Sanchez-Gonzalez</author>
<author pid="146/6224">Vin&#237;cius Flores Zambaldi</author>
<author pid="10/3451">Mateusz Malinowski</author>
<author pid="127/6624">Andrea Tacchetti</author>
<author pid="52/11138">David Raposo</author>
<author pid="180/5951">Adam Santoro</author>
<author pid="159/6155">Ryan Faulkner 0001</author>
<author pid="125/2132">&#199;aglar G&#252;l&#231;ehre</author>
<author pid="150/6469">H. Francis Song</author>
<author pid="190/7271">Andrew J. Ballard</author>
<author pid="131/6545">Justin Gilmer</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="26/9012">Ashish Vaswani</author>
<author pid="153/9528">Kelsey R. Allen</author>
<author pid="16/6892">Charles Nash</author>
<author pid="222/1565">Victoria Langston</author>
<author pid="41/6895">Chris Dyer</author>
<author pid="76/9181">Nicolas Heess</author>
<author pid="65/6056">Daan Wierstra</author>
<author pid="94/248">Pushmeet Kohli</author>
<author pid="98/5712">Matthew M. Botvinick</author>
<author pid="05/726">Oriol Vinyals</author>
<author pid="67/3069-1">Yujia Li 0001</author>
<author pid="65/8368">Razvan Pascanu</author>
<title>Relational inductive biases, deep learning, and graph networks.</title>
<year>2018</year>
<volume>abs/1806.01261</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1806.01261</ee>
<url>db/journals/corr/corr1806.html#abs-1806-01261</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-1806-04313" mdate="2018-08-13">
<author pid="180/5692">Bhuwan Dhingra</author>
<author pid="126/6014">Christopher J. Shallue</author>
<author pid="12/7659-2">Mohammad Norouzi 0002</author>
<author pid="59/9736">Andrew M. Dai</author>
<author pid="10/7998">George E. Dahl</author>
<title>Embedding Text in Hyperbolic Spaces.</title>
<year>2018</year>
<volume>abs/1806.04313</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1806.04313</ee>
<url>db/journals/corr/corr1806.html#abs-1806-04313</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-1807-06732" mdate="2020-10-07">
<author pid="131/6545">Justin Gilmer</author>
<author pid="32/909">Ryan P. Adams</author>
<author pid="43/7940">Ian J. Goodfellow</author>
<author pid="a/DavidGAndersen">David G. Andersen</author>
<author pid="10/7998">George E. Dahl</author>
<title>Motivating the Rules of the Game for Adversarial Example Research.</title>
<year>2018</year>
<volume>abs/1807.06732</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1807.06732</ee>
<url>db/journals/corr/corr1807.html#abs-1807-06732</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-1808-07910" mdate="2018-09-02">
<author pid="223/9765">Nicolas Ford</author>
<author pid="10/8371">Daniel Duckworth</author>
<author pid="12/7659-2">Mohammad Norouzi 0002</author>
<author pid="10/7998">George E. Dahl</author>
<title>The Importance of Generation Order in Language Modeling.</title>
<year>2018</year>
<volume>abs/1808.07910</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1808.07910</ee>
<url>db/journals/corr/corr1808.html#abs-1808-07910</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-1811-03600" mdate="2022-01-18">
<author pid="126/6014">Christopher J. Shallue</author>
<author pid="95/386-1">Jaehoon Lee 0001</author>
<author pid="222/3147">Joseph M. Antognini</author>
<author pid="51/7117">Jascha Sohl-Dickstein</author>
<author pid="136/9091">Roy Frostig</author>
<author pid="10/7998">George E. Dahl</author>
<title>Measuring the Effects of Data Parallelism on Neural Network Training.</title>
<year>2018</year>
<volume>abs/1811.03600</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1811.03600</ee>
<url>db/journals/corr/corr1811.html#abs-1811-03600</url>
</article>
</r>
<r><inproceedings key="conf/icml/GilmerSRVD17" mdate="2019-04-03">
<author pid="131/6545">Justin Gilmer</author>
<author pid="190/7108">Samuel S. Schoenholz</author>
<author pid="r/PatrickRiley">Patrick F. Riley</author>
<author pid="05/726">Oriol Vinyals</author>
<author pid="10/7998">George E. Dahl</author>
<title>Neural Message Passing for Quantum Chemistry.</title>
<pages>1263-1272</pages>
<year>2017</year>
<booktitle>ICML</booktitle>
<ee type="oa">http://proceedings.mlr.press/v70/gilmer17a.html</ee>
<crossref>conf/icml/2017</crossref>
<url>db/conf/icml/icml2017.html#GilmerSRVD17</url>
</inproceedings>
</r>
<r><article publtype="informal" key="journals/corr/LiuGNDKBVTNCHPS17" mdate="2021-01-23">
<author orcid="0000-0003-4079-8275" pid="50/2482-13">Yun Liu 0013</author>
<author pid="198/1178">Krishna Gadepalli</author>
<author pid="12/7659-2">Mohammad Norouzi 0002</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="42/895">Timo Kohlberger</author>
<author pid="151/6713">Aleksey Boyko</author>
<author pid="21/11044">Subhashini Venugopalan</author>
<author pid="198/1268">Aleksei Timofeev</author>
<author pid="198/0706">Philip Q. Nelson</author>
<author pid="05/8414">Gregory S. Corrado</author>
<author pid="198/0949">Jason D. Hipp</author>
<author pid="198/1261">Lily Peng</author>
<author pid="13/11026">Martin C. Stumpe</author>
<title>Detecting Cancer Metastases on Gigapixel Pathology Images.</title>
<year>2017</year>
<volume>abs/1703.02442</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1703.02442</ee>
<url>db/journals/corr/corr1703.html#LiuGNDKBVTNCHPS17</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/GilmerSRVD17" mdate="2018-08-13">
<author pid="131/6545">Justin Gilmer</author>
<author pid="190/7108">Samuel S. Schoenholz</author>
<author pid="r/PatrickRiley">Patrick F. Riley</author>
<author pid="05/726">Oriol Vinyals</author>
<author pid="10/7998">George E. Dahl</author>
<title>Neural Message Passing for Quantum Chemistry.</title>
<year>2017</year>
<volume>abs/1704.01212</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1704.01212</ee>
<url>db/journals/corr/corr1704.html#GilmerSRVD17</url>
</article>
</r>
<r><phdthesis key="phd/ca/Dahl15" mdate="2022-07-29">
<author pid="10/7998">George E. Dahl</author>
<title>Deep Learning Approaches to Problems in Speech Recognition, Computational Chemistry, and Natural Language Text Processing.</title>
<school>University of Toronto, Canada</school>
<year>2015</year>
<ee>http://hdl.handle.net/1807/69304</ee>
</phdthesis>
</r>
<r><article key="journals/jcisd/MaSLDS15" mdate="2020-03-06">
<author pid="78/288">Junshui Ma</author>
<author pid="60/5415">Robert P. Sheridan</author>
<author pid="67/731">Andy Liaw</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="55/3190">Vladimir Svetnik</author>
<title>Deep Neural Nets as a Method for Quantitative Structure-Activity Relationships.</title>
<pages>263-274</pages>
<year>2015</year>
<volume>55</volume>
<journal>J. Chem. Inf. Model.</journal>
<number>2</number>
<ee>https://doi.org/10.1021/ci500747n</ee>
<ee>https://www.wikidata.org/entity/Q41506565</ee>
<url>db/journals/jcisd/jcisd55.html#MaSLDS15</url>
</article>
</r>
<r><article key="journals/nn/SainathKSSMDR15" mdate="2024-10-06">
<author pid="28/7825">Tara N. Sainath</author>
<author pid="98/4359">Brian Kingsbury</author>
<author orcid="0009-0004-6837-5009" pid="52/6787">George Saon</author>
<author pid="07/2072">Hagen Soltau</author>
<author pid="28/8759">Abdel-rahman Mohamed</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="39/1849">Bhuvana Ramabhadran</author>
<title>Deep Convolutional Neural Networks for Large-scale Speech Tasks.</title>
<pages>39-48</pages>
<year>2015</year>
<volume>64</volume>
<journal>Neural Networks</journal>
<ee>https://doi.org/10.1016/j.neunet.2014.08.005</ee>
<ee>https://www.wikidata.org/entity/Q50620670</ee>
<url>db/journals/nn/nn64.html#SainathKSSMDR15</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/DahlJS14" mdate="2018-08-13">
<author pid="10/7998">George E. Dahl</author>
<author pid="04/6137">Navdeep Jaitly</author>
<author pid="62/5884">Ruslan Salakhutdinov</author>
<title>Multi-task Neural Networks for QSAR Predictions.</title>
<year>2014</year>
<volume>abs/1406.1231</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1406.1231</ee>
<url>db/journals/corr/corr1406.html#DahlJS14</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/AdamsDM14" mdate="2018-08-13">
<author pid="32/909">Ryan Prescott Adams</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="82/384">Iain Murray 0001</author>
<title>Incorporating Side Information in Probabilistic Matrix Factorization with Gaussian Processes.</title>
<year>2014</year>
<volume>abs/1408.2039</volume>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1408.2039</ee>
<url>db/journals/corr/corr1408.html#AdamsDM14</url>
</article>
</r>
<r><inproceedings key="conf/asru/SainathKMDSSBAR13" mdate="2024-10-06">
<author pid="28/7825">Tara N. Sainath</author>
<author pid="98/4359">Brian Kingsbury</author>
<author pid="28/8759">Abdel-rahman Mohamed</author>
<author pid="10/7998">George E. Dahl</author>
<author orcid="0009-0004-6837-5009" pid="52/6787">George Saon</author>
<author pid="07/2072">Hagen Soltau</author>
<author pid="95/4892">Tom&#225;s Beran</author>
<author pid="85/10541">Aleksandr Y. Aravkin</author>
<author pid="39/1849">Bhuvana Ramabhadran</author>
<title>Improvements to Deep Convolutional Neural Networks for LVCSR.</title>
<pages>315-320</pages>
<year>2013</year>
<booktitle>ASRU</booktitle>
<ee>https://doi.org/10.1109/ASRU.2013.6707749</ee>
<crossref>conf/asru/2013</crossref>
<url>db/conf/asru/asru2013.html#SainathKMDSSBAR13</url>
</inproceedings>
</r>
<r><inproceedings key="conf/icassp/DahlSDY13" mdate="2018-07-12">
<author pid="10/7998">George E. Dahl</author>
<author pid="24/6478">Jack W. Stokes</author>
<author pid="31/1974-1">Li Deng 0001</author>
<author pid="71/4598-1">Dong Yu 0001</author>
<title>Large-scale malware classification using random projections and neural networks.</title>
<pages>3422-3426</pages>
<year>2013</year>
<booktitle>ICASSP</booktitle>
<ee>https://doi.org/10.1109/ICASSP.2013.6638293</ee>
<crossref>conf/icassp/2013</crossref>
<url>db/conf/icassp/icassp2013.html#DahlSDY13</url>
</inproceedings>
</r>
<r><inproceedings key="conf/icassp/DahlSH13" mdate="2017-05-19">
<author pid="10/7998">George E. Dahl</author>
<author pid="28/7825">Tara N. Sainath</author>
<author pid="10/3248">Geoffrey E. Hinton</author>
<title>Improving deep neural networks for LVCSR using rectified linear units and dropout.</title>
<pages>8609-8613</pages>
<year>2013</year>
<booktitle>ICASSP</booktitle>
<ee>https://doi.org/10.1109/ICASSP.2013.6639346</ee>
<crossref>conf/icassp/2013</crossref>
<url>db/conf/icassp/icassp2013.html#DahlSH13</url>
</inproceedings>
</r>
<r><inproceedings key="conf/icml/SutskeverMDH13" mdate="2019-05-29">
<author pid="60/5276">Ilya Sutskever</author>
<author pid="12/8412">James Martens</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="10/3248">Geoffrey E. Hinton</author>
<title>On the importance of initialization and momentum in deep learning.</title>
<pages>1139-1147</pages>
<year>2013</year>
<booktitle>ICML (3)</booktitle>
<ee type="oa">http://proceedings.mlr.press/v28/sutskever13.html</ee>
<crossref>conf/icml/2013</crossref>
<url>db/conf/icml/icml2013.html#SutskeverMDH13</url>
</inproceedings>
</r>
<r><article publtype="informal" key="journals/corr/SainathKMDSSBAR13" mdate="2018-08-13">
<author pid="28/7825">Tara N. Sainath</author>
<author pid="98/4359">Brian Kingsbury</author>
<author pid="28/8759">Abdel-rahman Mohamed</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="52/6787">George Saon</author>
<author pid="07/2072">Hagen Soltau</author>
<author pid="95/4892">Tom&#225;s Beran</author>
<author pid="85/10541">Aleksandr Y. Aravkin</author>
<author pid="39/1849">Bhuvana Ramabhadran</author>
<title>Improvements to deep convolutional neural networks for LVCSR.</title>
<year>2013</year>
<journal>CoRR</journal>
<ee type="oa">http://arxiv.org/abs/1309.1501</ee>
<volume>abs/1309.1501</volume>
<url>db/journals/corr/corr1309.html#SainathKMDSSBAR13</url>
</article>
</r>
<r><article key="journals/taslp/MohamedDH12" mdate="2020-05-17">
<author pid="28/8759">Abdel-rahman Mohamed</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="10/3248">Geoffrey E. Hinton</author>
<title>Acoustic Modeling Using Deep Belief Networks.</title>
<pages>14-22</pages>
<year>2012</year>
<volume>20</volume>
<journal>IEEE Trans. Speech Audio Process.</journal>
<number>1</number>
<ee>https://doi.org/10.1109/TASL.2011.2109382</ee>
<ee>https://www.wikidata.org/entity/Q56058041</ee>
<url>db/journals/taslp/taslp20.html#MohamedDH12</url>
</article>
</r>
<r><article key="journals/taslp/DahlYDA12" mdate="2025-03-03">
<author pid="10/7998">George E. Dahl</author>
<author pid="71/4598-1">Dong Yu 0001</author>
<author pid="31/1974-1">Li Deng 0001</author>
<author orcid="0009-0009-0299-6642" pid="a/AlexAcero">Alex Acero</author>
<title>Context-Dependent Pre-Trained Deep Neural Networks for Large-Vocabulary Speech Recognition.</title>
<pages>30-42</pages>
<year>2012</year>
<volume>20</volume>
<journal>IEEE Trans. Speech Audio Process.</journal>
<number>1</number>
<ee>https://doi.org/10.1109/TASL.2011.2134090</ee>
<ee>https://www.wikidata.org/entity/Q55897737</ee>
<url>db/journals/taslp/taslp20.html#DahlYDA12</url>
</article>
</r>
<r><inproceedings key="conf/icml/DahlAL12" mdate="2019-04-03">
<author pid="10/7998">George E. Dahl</author>
<author pid="32/909">Ryan Prescott Adams</author>
<author pid="86/3862">Hugo Larochelle</author>
<title>Training Restricted Boltzmann Machines on Word Observations.</title>
<year>2012</year>
<booktitle>ICML</booktitle>
<ee type="oa">http://icml.cc/2012/papers/364.pdf</ee>
<crossref>conf/icml/2012</crossref>
<url>db/conf/icml/icml2012.html#DahlAL12</url>
</inproceedings>
</r>
<r><article publtype="informal" key="journals/corr/abs-1202-5695" mdate="2018-08-13">
<author pid="10/7998">George E. Dahl</author>
<author pid="32/909">Ryan Prescott Adams</author>
<author pid="86/3862">Hugo Larochelle</author>
<title>Training Restricted Boltzmann Machines on Word Observations</title>
<ee type="oa">http://arxiv.org/abs/1202.5695</ee>
<year>2012</year>
<journal>CoRR</journal>
<volume>abs/1202.5695</volume>
<url>db/journals/corr/corr1202.html#abs-1202-5695</url>
</article>
</r>
<r><inproceedings key="conf/icassp/DahlYDA11" mdate="2025-03-03">
<author pid="10/7998">George E. Dahl</author>
<author pid="71/4598-1">Dong Yu 0001</author>
<author pid="31/1974-1">Li Deng 0001</author>
<author orcid="0009-0009-0299-6642" pid="a/AlexAcero">Alex Acero</author>
<title>Large vocabulary continuous speech recognition with context-dependent DBN-HMMS.</title>
<pages>4688-4691</pages>
<year>2011</year>
<booktitle>ICASSP</booktitle>
<ee>https://doi.org/10.1109/ICASSP.2011.5947401</ee>
<crossref>conf/icassp/2011</crossref>
<url>db/conf/icassp/icassp2011.html#DahlYDA11</url>
</inproceedings>
</r>
<r><inproceedings key="conf/icassp/MohamedSDRHP11" mdate="2017-05-19">
<author pid="28/8759">Abdel-rahman Mohamed</author>
<author pid="28/7825">Tara N. Sainath</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="39/1849">Bhuvana Ramabhadran</author>
<author pid="10/3248">Geoffrey E. Hinton</author>
<author pid="73/4588">Michael A. Picheny</author>
<title>Deep Belief Networks using discriminative features for phone recognition.</title>
<pages>5060-5063</pages>
<year>2011</year>
<booktitle>ICASSP</booktitle>
<ee>https://doi.org/10.1109/ICASSP.2011.5947494</ee>
<crossref>conf/icassp/2011</crossref>
<url>db/conf/icassp/icassp2011.html#MohamedSDRHP11</url>
</inproceedings>
</r>
<r><inproceedings key="conf/nips/DahlRMH10" mdate="2021-01-21">
<author pid="10/7998">George E. Dahl</author>
<author pid="28/1732">Marc'Aurelio Ranzato</author>
<author pid="28/8759">Abdel-rahman Mohamed</author>
<author pid="10/3248">Geoffrey E. Hinton</author>
<title>Phone Recognition with the Mean-Covariance Restricted Boltzmann Machine.</title>
<pages>469-477</pages>
<year>2010</year>
<booktitle>NIPS</booktitle>
<ee type="oa">https://proceedings.neurips.cc/paper/2010/hash/b73ce398c39f506af761d2277d853a92-Abstract.html</ee>
<ee type="oa">http://papers.nips.cc/paper/4169-phone-recognition-with-the-mean-covariance-restricted-boltzmann-machine</ee>
<crossref>conf/nips/2010</crossref>
<url>db/conf/nips/nips2010.html#DahlRMH10</url>
</inproceedings>
</r>
<r><inproceedings key="conf/uai/AdamsDM10" mdate="2021-02-03">
<author pid="32/909">Ryan Prescott Adams</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="82/384">Iain Murray 0001</author>
<title>Incorporating Side Information in Probabilistic Matrix Factorization with Gaussian Processes.</title>
<pages>1-9</pages>
<year>2010</year>
<booktitle>UAI</booktitle>
<ee type="archive">https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1&#38;smnu=2&#38;article_id=2085&#38;proceeding_id=26</ee>
<crossref>conf/uai/2010</crossref>
<url>db/conf/uai/uai2010.html#AdamsDM10</url>
</inproceedings>
</r>
<r><article publtype="informal" key="journals/corr/abs-1003-4944" mdate="2018-08-13">
<author pid="32/909">Ryan Prescott Adams</author>
<author pid="10/7998">George E. Dahl</author>
<author pid="82/384">Iain Murray 0001</author>
<title>Incorporating Side Information in Probabilistic Matrix Factorization with Gaussian Processes</title>
<ee type="oa">http://arxiv.org/abs/1003.4944</ee>
<year>2010</year>
<journal>CoRR</journal>
<volume>abs/1003.4944</volume>
<url>db/journals/corr/corr1003.html#abs-1003-4944</url>
</article>
</r>
<coauthors n="157" nc="2">
<co c="0"><na f="a/Acero:Alex" pid="a/AlexAcero">Alex Acero</na></co>
<co c="0" n="2"><na f="a/Adams:Ryan_P=" pid="32/909">Ryan P. Adams</na><na>Ryan Prescott Adams</na></co>
<co c="0"><na f="a/Agarwal:Naman" pid="72/3910">Naman Agarwal</na></co>
<co c="0"><na f="a/Agarwala:Atish" pid="265/6410">Atish Agarwala</na></co>
<co c="0"><na f="a/Allen:Kelsey_R=" pid="153/9528">Kelsey R. Allen</na></co>
<co c="0"><na f="a/Amid:Ehsan" pid="142/5754">Ehsan Amid</na></co>
<co c="0"><na f="a/Andersen:David_G=" pid="a/DavidGAndersen">David G. Andersen</na></co>
<co c="0"><na f="a/Anil:Rohan" pid="182/1833">Rohan Anil</na></co>
<co c="0"><na f="a/Antognini:Joseph_M=" pid="222/3147">Joseph M. Antognini</na></co>
<co c="0"><na f="a/Aravkin:Aleksandr_Y=" pid="85/10541">Aleksandr Y. Aravkin</na></co>
<co c="0"><na f="a/Ariafar:Setareh" pid="169/2463">Setareh Ariafar</na></co>
<co c="0"><na f="b/Badura:Michal" pid="325/5394">Michal Badura</na></co>
<co c="0"><na f="b/Bae:Juhan" pid="158/9492">Juhan Bae</na></co>
<co c="0"><na f="b/Ballard:Andrew_J=" pid="190/7271">Andrew J. Ballard</na></co>
<co c="0"><na f="b/Bapst:Victor" pid="120/7601">Victor Bapst</na></co>
<co c="0"><na f="b/Battaglia:Peter_W=" pid="41/3400">Peter W. Battaglia</na></co>
<co c="0"><na f="b/Beran:Tom=aacute=s" pid="95/4892">Tom&#225;s Beran</na></co>
<co c="0" n="2"><na f="b/Botvinick:Matt_M=" pid="98/5712">Matt M. Botvinick</na><na>Matthew M. Botvinick</na></co>
<co c="0"><na f="b/Bowman:Samuel_R=" pid="116/0502">Samuel R. Bowman</na></co>
<co c="0"><na f="b/Boyko:Aleksey" pid="151/6713">Aleksey Boyko</na></co>
<co c="0"><na f="c/Cardoze:David" pid="304/2067">David Cardoze</na></co>
<co c="0"><na f="c/Chen:Christina" pid="278/2847">Christina Chen</na></co>
<co c="0"><na f="c/Chen:Kongtao" pid="297/3463">Kongtao Chen</na></co>
<co c="0"><na f="c/Chi:Benjamin_H=" pid="317/0233">Benjamin H. Chi</na></co>
<co c="0"><na f="c/Choi:Dami" pid="209/9687">Dami Choi</na></co>
<co c="0"><na f="c/Chou:Katherine" pid="210/1097">Katherine Chou</na></co>
<co c="0"><na f="c/Cohen_0001:Jeremy" pid="25/3538-1">Jeremy Cohen 0001</na></co>
<co c="0" n="2"><na f="c/Corrado:Gregory_S=" pid="05/8414">Gregory S. Corrado</na><na>Greg Corrado</na></co>
<co c="0"><na f="d/Dai:Andrew_M=" pid="59/9736">Andrew M. Dai</na></co>
<co c="0"><na f="d/Deng_0001:Li" pid="31/1974-1">Li Deng 0001</na></co>
<co c="0"><na f="d/Dhingra:Bhuwan" pid="180/5692">Bhuwan Dhingra</na></co>
<co c="0"><na f="d/Duckworth:Daniel" pid="10/8371">Daniel Duckworth</na></co>
<co c="0"><na f="d/Dyer:Chris" pid="41/6895">Chris Dyer</na></co>
<co c="0"><na f="e/Eschenhagen:Runa" pid="242/9235">Runa Eschenhagen</na></co>
<co c="0"><na f="f/Faulkner_0001:Ryan" pid="159/6155">Ryan Faulkner 0001</na></co>
<co c="0"><na f="f/Feng:Boyuan" pid="227/2946">Boyuan Feng</na></co>
<co c="0"><na f="f/Firat:Orhan" pid="120/2225">Orhan Firat</na></co>
<co c="0"><na f="f/Ford:Nicolas" pid="223/9765">Nicolas Ford</na></co>
<co c="0"><na f="f/Frostig:Roy" pid="136/9091">Roy Frostig</na></co>
<co c="0"><na f="g/Gadepalli:Krishna" pid="198/1178">Krishna Gadepalli</na></co>
<co c="0"><na f="g/Garg:Ankush" pid="86/7221">Ankush Garg</na></co>
<co c="0"><na f="g/Ghahramani:Zoubin" pid="g/ZoubinGhahramani">Zoubin Ghahramani</na></co>
<co c="0"><na f="g/Ghorbani:Behrooz" pid="162/0166">Behrooz Ghorbani</na></co>
<co c="0"><na f="g/Gilmer:Justin" pid="131/6545">Justin Gilmer</na></co>
<co c="0"><na f="g/Gomes:Ryan_G=" pid="317/0391">Ryan G. Gomes</na></co>
<co c="0"><na f="g/Goodfellow:Ian_J=" pid="43/7940">Ian J. Goodfellow</na></co>
<co c="0"><na f="g/Goodnight_III:William" pid="317/0204">William Goodnight III</na></co>
<co c="0"><na f="g/Grosse:Roger_B=" pid="26/7058">Roger B. Grosse</na></co>
<co c="0" n="2"><na f="g/Gulcehre:Caglar" pid="125/2132">Caglar Gulcehre</na><na>&#199;aglar G&#252;l&#231;ehre</na></co>
<co c="0"><na f="h/Hamrick:Jessica_B=" pid="155/1885">Jessica B. Hamrick</na></co>
<co c="0"><na f="h/Heess:Nicolas" pid="76/9181">Nicolas Heess</na></co>
<co c="0"><na f="h/Hennig:Philipp" pid="08/9077">Philipp Hennig</na></co>
<co c="0"><na f="h/Hinton:Geoffrey_E=" pid="10/3248">Geoffrey E. Hinton</na></co>
<co c="0"><na f="h/Hipp:Jason_D=" pid="198/0949">Jason D. Hipp</na></co>
<co c="0"><na f="j/Jaitly:Navdeep" pid="04/6137">Navdeep Jaitly</na></co>
<co c="0"><na f="j/Jenatton:Rodolphe" pid="68/8398">Rodolphe Jenatton</na></co>
<co c="0"><na f="k/Kasaro:Margaret_P=" pid="317/0237">Margaret P. Kasaro</na></co>
<co c="0"><na f="k/Kasimbeg:Priya" pid="251/9611">Priya Kasimbeg</na></co>
<co c="0"><na f="k/Khan:Bilal" pid="71/2824">Bilal Khan</na></co>
<co c="0"><na f="k/Kingsbury:Brian" pid="98/4359">Brian Kingsbury</na></co>
<co c="0"><na f="k/Kohlberger:Timo" pid="42/895">Timo Kohlberger</na></co>
<co c="0"><na f="k/Kohli:Pushmeet" pid="94/248">Pushmeet Kohli</na></co>
<co c="0"><na f="k/Krishnan:Shankar" pid="38/5647">Shankar Krishnan</na></co>
<co c="0" n="2"><na f="k/Kudugunta:Sneha_Reddy" pid="248/7500">Sneha Reddy Kudugunta</na><na>Sneha Kudugunta</na></co>
<co c="0"><na f="k/Kumar_0019:Manoj" pid="58/1076-19">Manoj Kumar 0019</na></co>
<co c="0"><na f="l/Langston:Victoria" pid="222/1565">Victoria Langston</na></co>
<co c="0"><na f="l/Larochelle:Hugo" pid="86/3862">Hugo Larochelle</na></co>
<co c="0"><na f="l/Lau:Charles" pid="277/1204">Charles Lau</na></co>
<co c="0"><na f="l/Lee:Chace" pid="317/0270">Chace Lee</na></co>
<co c="0"><na f="l/Lee:Chansoo" pid="137/3219">Chansoo Lee</na></co>
<co c="0"><na f="l/Lee_0001:Jaehoon" pid="95/386-1">Jaehoon Lee 0001</na></co>
<co c="0"><na f="l/Li:Lala" pid="49/7563">Lala Li</na></co>
<co c="0"><na f="l/Li_0001:Yujia" pid="67/3069-1">Yujia Li 0001</na></co>
<co c="1"><na f="l/Liaw:Andy" pid="67/731">Andy Liaw</na></co>
<co c="0"><na f="l/Liu:Kris" pid="133/2109">Kris Liu</na></co>
<co c="0"><na f="l/Liu_0013:Yun" pid="50/2482-13">Yun Liu 0013</na></co>
<co c="1"><na f="m/Ma:Junshui" pid="78/288">Junshui Ma</na></co>
<co c="0"><na f="m/Maddison:Chris_J=" pid="139/1388">Chris J. Maddison</na></co>
<co c="0"><na f="m/Malinowski:Mateusz" pid="10/3451">Mateusz Malinowski</na></co>
<co c="0"><na f="m/Mariet:Zelda" pid="164/7319">Zelda Mariet</na></co>
<co c="0"><na f="m/Martens:James" pid="12/8412">James Martens</na></co>
<co c="0"><na f="m/Mattson:Peter" pid="47/739">Peter Mattson</na></co>
<co c="0"><na f="m/McKinney:Scott_Mayer" pid="284/0700">Scott Mayer McKinney</na></co>
<co c="0"><na f="m/Medapati:Sourabh" pid="325/5349">Sourabh Medapati</na></co>
<co c="0"><na f="m/Mohamed:Abdel=rahman" pid="28/8759">Abdel-rahman Mohamed</na></co>
<co c="0"><na f="m/Murray_0001:Iain" pid="82/384">Iain Murray 0001</na></co>
<co c="0"><na f="n/Nado:Zachary" pid="228/7785">Zachary Nado</na></co>
<co c="0"><na f="n/Nash:Charles" pid="16/6892">Charles Nash</na></co>
<co c="0"><na f="n/Nelson:Philip_Q=" pid="198/0706">Philip Q. Nelson</na></co>
<co c="0"><na f="n/Neyshabur:Behnam" pid="131/9898">Behnam Neyshabur</na></co>
<co c="0"><na f="n/Norouzi_0002:Mohammad" pid="12/7659-2">Mohammad Norouzi 0002</na></co>
<co c="0"><na f="o/Orm=aacute=ndi:R=oacute=bert" pid="35/4647">R&#243;bert Orm&#225;ndi</na></co>
<co c="0"><na f="p/Pascanu:Razvan" pid="65/8368">Razvan Pascanu</na></co>
<co c="0" n="2"><na f="p/Passos:Alexandre_Tachard" pid="47/10827">Alexandre Tachard Passos</na><na>Alexandre Passos</na></co>
<co c="0"><na f="p/Pedregosa:Fabian" pid="11/9764">Fabian Pedregosa</na></co>
<co c="0"><na f="p/Peirson:Abel_L=" pid="349/3715">Abel L. Peirson</na></co>
<co c="0"><na f="p/Peng:Lily" pid="198/1261">Lily Peng</na></co>
<co c="0"><na f="p/Pereyra:Gabriel" pid="170/0034">Gabriel Pereyra</na></co>
<co c="0" n="2"><na f="p/Picheny:Michael" pid="73/4588">Michael Picheny</na><na>Michael A. Picheny</na></co>
<co c="0"><na f="p/Pilgrim:Rory" pid="292/7059">Rory Pilgrim</na></co>
<co c="0"><na f="p/Price:Joan_T=" pid="317/0179">Joan T. Price</na></co>
<co c="0" n="3"><na f="r/Rabbat:Michael_G=" pid="47/1744">Michael G. Rabbat</na><na>Michael Rabbat</na><na>Mike Rabbat</na></co>
<co c="0"><na f="r/Ramabhadran:Bhuvana" pid="39/1849">Bhuvana Ramabhadran</na></co>
<co c="0"><na f="r/Ranzato:Marc=Aurelio" pid="28/1732">Marc'Aurelio Ranzato</na></co>
<co c="0"><na f="r/Raposo:David" pid="52/11138">David Raposo</na></co>
<co c="0"><na f="r/Riley:Patrick_F=" pid="r/PatrickRiley">Patrick F. Riley</na></co>
<co c="0"><na f="r/Roulet:Vincent" pid="164/6165">Vincent Roulet</na></co>
<co c="0"><na f="s/Sachdeva:Sushant" pid="25/9221">Sushant Sachdeva</na></co>
<co c="0"><na f="s/Saensuksopa:T=" pid="317/0264">T. Saensuksopa</na></co>
<co c="0"><na f="s/Sainath:Tara_N=" pid="28/7825">Tara N. Sainath</na></co>
<co c="0"><na f="s/Salakhutdinov:Ruslan" pid="62/5884">Ruslan Salakhutdinov</na></co>
<co c="0"><na f="s/Sanchez=Gonzalez:Alvaro" pid="222/1889">Alvaro Sanchez-Gonzalez</na></co>
<co c="0"><na f="s/Santoro:Adam" pid="180/5951">Adam Santoro</na></co>
<co c="0"><na f="s/Saon:George" pid="52/6787">George Saon</na></co>
<co c="0"><na f="s/Saroufim:Mark" pid="118/5750">Mark Saroufim</na></co>
<co c="0"><na f="s/Sastry:Chandramouli_Shama" pid="223/6317">Chandramouli Shama Sastry</na></co>
<co c="0"><na f="s/Schneider_0001:Frank" pid="41/328-1">Frank Schneider 0001</na></co>
<co c="0"><na f="s/Schoenholz:Samuel_S=" pid="190/7108">Samuel S. Schoenholz</na></co>
<co c="0"><na f="s/Shallue:Christopher_J=" pid="126/6014">Christopher J. Shallue</na></co>
<co c="1"><na f="s/Sheridan:Robert_P=" pid="60/5415">Robert P. Sheridan</na></co>
<co c="0"><na f="s/Shetty:Shravya" pid="49/1617">Shravya Shetty</na></co>
<co c="0"><na f="s/Sieniek:Marcin" pid="48/8770">Marcin Sieniek</na></co>
<co c="0"><na f="s/Sindano:Ntazana" pid="316/9859">Ntazana Sindano</na></co>
<co c="0"><na f="s/Snider:Daniel" pid="324/5277">Daniel Snider</na></co>
<co c="0"><na f="s/Snoek:Jasper" pid="95/6097">Jasper Snoek</na></co>
<co c="0"><na f="s/Sohl=Dickstein:Jascha" pid="51/7117">Jascha Sohl-Dickstein</na></co>
<co c="0"><na f="s/Soltau:Hagen" pid="07/2072">Hagen Soltau</na></co>
<co c="0"><na f="s/Song:H=_Francis" pid="150/6469">H. Francis Song</na></co>
<co c="0"><na f="s/Spitz:Terry" pid="317/0325">Terry Spitz</na></co>
<co c="0"><na f="s/Stokes:Jack_W=" pid="24/6478">Jack W. Stokes</na></co>
<co c="0"><na f="s/Stringer:Elizabeth_M=" pid="317/0406">Elizabeth M. Stringer</na></co>
<co c="0"><na f="s/Stringer:Jeffrey_S=_A=" pid="316/9959">Jeffrey S. A. Stringer</na></co>
<co c="0"><na f="s/Stumpe:Martin_C=" pid="13/11026">Martin C. Stumpe</na></co>
<co c="0"><na f="s/Suo:Daniel" pid="186/8419">Daniel Suo</na></co>
<co c="0"><na f="s/Sutskever:Ilya" pid="60/5276">Ilya Sutskever</na></co>
<co c="1"><na f="s/Svetnik:Vladimir" pid="55/3190">Vladimir Svetnik</na></co>
<co c="0"><na f="s/Swersky:Kevin" pid="35/9381">Kevin Swersky</na></co>
<co c="0"><na f="t/Tacchetti:Andrea" pid="127/6624">Andrea Tacchetti</na></co>
<co c="0"><na f="t/Taylor_0003:James_A=" pid="316/9899">James A. Taylor 0003</na></co>
<co c="0"><na f="t/Timofeev:Aleksei" pid="198/1268">Aleksei Timofeev</na></co>
<co c="0"><na f="t/Tse:Daniel" pid="63/9281">Daniel Tse</na></co>
<co c="0"><na f="u/Uddin:Akib" pid="317/0324">Akib Uddin</na></co>
<co c="0"><na f="v/Vasudev:Rakshith" pid="349/2430">Rakshith Vasudev</na></co>
<co c="0"><na f="v/Vasudevan:Vijay" pid="08/2793">Vijay Vasudevan</na></co>
<co c="0"><na f="v/Vaswani:Ashish" pid="26/9012">Ashish Vaswani</na></co>
<co c="0"><na f="v/Venugopalan:Subhashini" pid="21/11044">Subhashini Venugopalan</na></co>
<co c="0"><na f="v/Vinyals:Oriol" pid="05/726">Oriol Vinyals</na></co>
<co c="0"><na f="v/Vwalika:Bellington" pid="317/0293">Bellington Vwalika</na></co>
<co c="0"><na f="w/Wang:Zi" pid="78/8711">Zi Wang</na></co>
<co c="0"><na f="w/Wierstra:Daan" pid="65/6056">Daan Wierstra</na></co>
<co c="0"><na f="w/Willis:Angelica" pid="180/1370">Angelica Willis</na></co>
<co c="0"><na f="w/Wong:Jonny" pid="317/0382">Jonny Wong</na></co>
<co c="0"><na f="w/Wright:Less" pid="295/9883">Less Wright</na></co>
<co c="0"><na f="y/Yang:Edward_Z=" pid="118/9819">Edward Z. Yang</na></co>
<co c="0"><na f="y/Yu_0001:Dong" pid="71/4598-1">Dong Yu 0001</na></co>
<co c="0"><na f="z/Zambaldi:Vin=iacute=cius_Flores" pid="146/6224">Vin&#237;cius Flores Zambaldi</na></co>
<co c="0"><na f="z/Zhang_0006:Guodong" pid="28/4937-6">Guodong Zhang 0006</na></co>
</coauthors>
</dblpperson>

