%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% This file is automatically generated. Do not modify this
% file directly, or else your changes will be overwritten.
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@inproceedings{bastani2016measuring,
  author    = {Osbert Bastani and Yani Ioannou and Leonidas Lampropoulos and Dimitrios Vytiniotis and Aditya Nori and Antonio Criminisi},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {2613--2621},
  title     = {Measuring neural net robustness with constraints},
  year      = {2016},
}

@inproceedings{wong2018provable,
  author    = {Eric Wong and J. Zico Kolter},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Provable defenses against adversarial examples via the convex outer adversarial polytope},
  year      = {2018},
}

@article{dvijotham2018dual,
  author  = {Krishnamurthy Dvijotham and Robert Stanforth and Sven Gowal and Timothy Mann and Pushmeet Kohli},
  journal = {arXiv preprint arXiv:1803.06567},
  title   = {A Dual Approach to Scalable Verification of Deep Networks},
  year    = {2018},
}

@inproceedings{hein2017formal,
  author    = {Matthias Hein and Maksym Andriushchenko},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {2263--2273},
  title     = {Formal guarantees on the robustness of a classifier against adversarial manipulation},
  year      = {2017},
}

@article{ahmadi2017dsos,
  author  = {Amir Ali Ahmadi and Anirudha Majumdar},
  journal = {arXiv preprint arXiv:1706.02586},
  title   = {{DSOS} and {SDSOS} optimization: more tractable alternatives to sum of squares and semidefinite optimization},
  year    = {2017},
}

@article{dvijotham2018training,
  author  = {Krishnamurthy Dvijotham and Sven Gowal and Robert Stanforth and Relja Arandjelovic and Brendan O'Donoghue and Jonathan Uesato and Pushmeet Kohli},
  journal = {arXiv preprint arXiv:1805.10265},
  title   = {Training verified learners with learned verifiers},
  year    = {2018},
}
@inproceedings{wong2018scaling,
  author    = {Eric Wong and Frank Schmidt and Jan Hendrik Metzen and J Zico Kolter},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Scaling provable adversarial defenses},
  year      = {2018},
}

@article{gowal2018effectiveness,
  author  = {Sven Gowal and Krishnamurthy Dvijotham and Robert Stanforth and Rudy Bunel and Chongli Qin and Jonathan Uesato and Timothy Mann and Pushmeet Kohli},
  journal = {arXiv preprint arXiv:1810.12715},
  title   = {On the Effectiveness of Interval Bound Propagation for Training Verifiably Robust Models},
  year    = {2018},
}

@inproceedings{belinkov2018synthetic,
  author    = {Yonatan Belinkov and Yonatan Bisk},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Synthetic and natural noise both break neural machine translation},
  year      = {2018},
}

@inproceedings{ebrahimi2018hotflip,
  author    = {Javid Ebrahimi and Anyi Rao and Daniel Lowd and Dejing Dou},
  booktitle = {Association for Computational Linguistics (ACL)},
  title     = {{HotFlip}: White-box adversarial examples for text classification},
  year      = {2018},
}

% NOTE(review): same author list as tsipras2019robustness further down; this may
% be the preprint of that paper. Confirm before citing both.
@article{tsipras2018there,
  author  = {Dimitris Tsipras and Shibani Santurkar and Logan Engstrom and Alexander Turner and Aleksander Madry},
  journal = {arXiv preprint arXiv:1805.12152},
  title   = {There is no free lunch in adversarial robustness (but there are unexpected benefits)},
  year    = {2018},
}

@inproceedings{schmidt2018adversarially,
  author    = {Ludwig Schmidt and Shibani Santurkar and Dimitris Tsipras and Kunal Talwar and Aleksander Madry},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {5014--5026},
  title     = {Adversarially robust generalization requires more data},
  year      = {2018},
}

% The two-word surname is written in "Last, First" form so that it is not
% split into given name "Laurent El" and family name "Ghaoui".
@inproceedings{zhang2019theoretically,
  author    = {Hongyang Zhang and Yaodong Yu and Jiantao Jiao and Eric P Xing and El Ghaoui, Laurent and Michael I Jordan},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Theoretically principled trade-off between robustness and accuracy},
  year      = {2019},
}

@inproceedings{zheng2016improving,
  author    = {Stephan Zheng and Yang Song and Thomas Leung and Ian Goodfellow},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages     = {4480--4488},
  title     = {Improving the robustness of deep neural networks via stability training},
  year      = {2016},
}

@inproceedings{cohen2019certified,
  author    = {Jeremy M Cohen and Elan Rosenfeld and J Zico Kolter},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Certified adversarial robustness via randomized smoothing},
  year      = {2019},
}

@inproceedings{rosenberg2005semi,
  author    = {Chuck Rosenberg and Martial Hebert and Henry Schneiderman},
  booktitle = {Proceedings of the Seventh IEEE Workshops on Application of Computer Vision},
  title     = {Semi-supervised self-training of object detection models},
  year      = {2005},
}

@article{miyato2018virtual,
  author  = {Takeru Miyato and Shin-ichi Maeda and Shin Ishii and Masanori Koyama},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  title   = {Virtual adversarial training: a regularization method for supervised and semi-supervised learning},
  year    = {2018},
}

@inproceedings{cubuk2019autoaugment,
  author    = {Ekin D Cubuk and Barret Zoph and Dandelion Mane and Vijay Vasudevan and Quoc V Le},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title     = {{AutoAugment}: Learning augmentation policies from data},
  year      = {2019},
}

@article{devries2017improved,
  author  = {Terrance DeVries and Graham W Taylor},
  journal = {arXiv preprint arXiv:1708.04552},
  title   = {Improved regularization of convolutional neural networks with cutout},
  year    = {2017},
}

@article{torralba2008million,
  author  = {Antonio Torralba and Rob Fergus and William T Freeman},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  number  = {11},
  pages   = {1958--1970},
  title   = {80 million tiny images: A large data set for nonparametric object and scene recognition},
  volume  = {30},
  year    = {2008},
}

@inproceedings{lecuyer2019certified,
  author    = {Mathias Lecuyer and Vaggelis Atlidakis and Roxana Geambasu and Daniel Hsu and Suman Jana},
  booktitle = {IEEE Symposium on Security and Privacy (SP)},
  title     = {Certified robustness to adversarial examples with differential privacy},
  year      = {2019},
}

@article{li2018second,
  author  = {Bai Li and Changyou Chen and Wenlin Wang and Lawrence Carin},
  journal = {arXiv preprint arXiv:1809.03113},
  title   = {Second-Order Adversarial Attack and Certifiable Robustness},
  year    = {2018},
}

@inproceedings{zagoruyko2016wide,
  author    = {Sergey Zagoruyko and Nikos Komodakis},
  booktitle = {British Machine Vision Conference},
  title     = {Wide residual networks},
  year      = {2016},
}

@inproceedings{oliver2018realistic,
  author    = {Avital Oliver and Augustus Odena and Colin A Raffel and Ekin Dogus Cubuk and Ian Goodfellow},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {3235--3246},
  title     = {Realistic evaluation of deep semi-supervised learning algorithms},
  year      = {2018},
}

@article{xie2019unsupervised,
  author  = {Qizhe Xie and Zihang Dai and Eduard Hovy and Minh-Thang Luong and Quoc V Le},
  journal = {arXiv preprint arXiv:1904.12848},
  title   = {Unsupervised data augmentation},
  year    = {2019},
}

@inproceedings{laine2017temporal,
  author    = {Samuli Laine and Timo Aila},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Temporal ensembling for semi-supervised learning},
  year      = {2017},
}

@inproceedings{sajjadi2016regularization,
  author    = {Mehdi Sajjadi and Mehran Javanmardi and Tolga Tasdizen},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {1163--1171},
  title     = {Regularization with stochastic transformations and perturbations for deep semi-supervised learning},
  year      = {2016},
}

@inproceedings{tarvainen2017mean,
  author    = {Antti Tarvainen and Harri Valpola},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {1195--1204},
  title     = {Mean teachers are better role models: Weight-averaged consistency targets improve semi-supervised deep learning results},
  year      = {2017},
}

@inproceedings{zhu2003semi,
  author    = {Xiaojin Zhu and Zoubin Ghahramani and John D Lafferty},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {912--919},
  title     = {Semi-supervised learning using {Gaussian} fields and harmonic functions},
  year      = {2003},
}

@inproceedings{lee2013pseudo,
  author    = {Dong-Hyun Lee},
  booktitle = {ICML Workshop on Challenges in Representation Learning},
  title     = {Pseudo-label: The simple and efficient semi-supervised learning method for deep neural networks},
  year      = {2013},
}

@article{montasser2019vc,
  author  = {Omar Montasser and Steve Hanneke and Nathan Srebro},
  journal = {arXiv preprint arXiv:1902.04217},
  title   = {{VC} Classes are Adversarially Robustly Learnable, but Only Improperly},
  year    = {2019},
}

@inproceedings{bubeck2019adversarial,
  author    = {Sebastien Bubeck and Eric Price and Ilya Razenshteyn},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Adversarial examples from computational constraints},
  year      = {2019},
}

@article{gilmer2018adversarial,
  author  = {Justin Gilmer and Luke Metz and Fartash Faghri and Samuel S Schoenholz and Maithra Raghu and Martin Wattenberg and Ian Goodfellow},
  journal = {arXiv preprint arXiv:1801.02774},
  title   = {Adversarial spheres},
  year    = {2018},
}

@inproceedings{tsipras2019robustness,
  author    = {Dimitris Tsipras and Shibani Santurkar and Logan Engstrom and Alexander Turner and Aleksander Madry},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Robustness may be at odds with accuracy},
  year      = {2019},
}

@article{fawzi2018analysis,
  author  = {Alhussein Fawzi and Omar Fawzi and Pascal Frossard},
  journal = {Machine Learning},
  number  = {3},
  pages   = {481--508},
  title   = {Analysis of classifiers' robustness to adversarial perturbations},
  volume  = {107},
  year    = {2018},
}

@article{kannan2018adversarial,
  author  = {Harini Kannan and Alexey Kurakin and Ian Goodfellow},
  journal = {arXiv preprint arXiv:1803.06373},
  title   = {Adversarial logit pairing},
  year    = {2018},
}

@article{engstrom2018evaluating,
  author  = {Logan Engstrom and Andrew Ilyas and Anish Athalye},
  journal = {arXiv preprint arXiv:1807.10272},
  title   = {Evaluating and understanding the robustness of adversarial logit pairing},
  year    = {2018},
}

@article{papernot2018cleverhans,
  author  = {Nicolas Papernot and Fartash Faghri and Nicholas Carlini and Ian Goodfellow and Reuben Feinman and Alexey Kurakin and Cihang Xie and Yash Sharma and Tom Brown and Aurko Roy and Alexander Matyasko and Vahid Behzadan and Karen Hambardzumyan and Zhishuai Zhang and Yi-Lin Juang and Zhi Li and Ryan Sheatsley and Abhibhav Garg and Jonathan Uesato and Willi Gierke and Yinpeng Dong and David Berthelot and Paul Hendricks and Jonas Rauber and Rujun Long},
  journal = {arXiv preprint arXiv:1610.00768},
  title   = {Technical Report on the {CleverHans} v2.1.0 Adversarial Examples Library},
  year    = {2018},
}

@inproceedings{netzer2011reading,
  author    = {Netzer, Yuval and Wang, Tao and Coates, Adam and Bissacco, Alessandro and Wu, Bo and Ng, Andrew Y},
  booktitle = {NIPS Workshop on Deep Learning and Unsupervised Feature Learning},
  title     = {Reading Digits in Natural Images with Unsupervised Feature Learning},
  year      = {2011},
}

@inproceedings{loshchilov2017sgdr,
  author    = {Ilya Loshchilov and Frank Hutter},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {{SGDR}: Stochastic gradient descent with warm restarts},
  year      = {2017},
}

@inproceedings{uesato2019are,
  author    = {Jonathan Uesato and Jean-Baptiste Alayrac and Po-Sen Huang and Robert Stanforth and Alhussein Fawzi and Pushmeet Kohli},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Are Labels Required for Improving Adversarial Robustness?},
  year      = {2019},
}

@article{nakkiran2019adversarial,
  author  = {Preetum Nakkiran},
  journal = {arXiv preprint arXiv:1901.00532},
  title   = {Adversarial robustness may be at odds with simplicity},
  year    = {2019},
}

@article{stutz2018disentangling,
  author  = {David Stutz and Matthias Hein and Bernt Schiele},
  journal = {arXiv preprint arXiv:1812.00740},
  title   = {Disentangling adversarial robustness and generalization},
  year    = {2018},
}

@article{khim2018adversarial,
  author  = {Justin Khim and Po-Ling Loh},
  journal = {arXiv preprint arXiv:1810.09519},
  title   = {Adversarial risk bounds for binary classification via function transformation},
  year    = {2018},
}

@inproceedings{najafi2019robustness,
  author    = {Amir Najafi and Shin-ichi Maeda and Masanori Koyama and Takeru Miyato},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Robustness to Adversarial Perturbations in Learning from Incomplete Data},
  year      = {2019},
}

@article{zhai2019adversarially,
  author  = {Runtian Zhai and Tianle Cai and Di He and Chen Dan and Kun He and John Hopcroft and Liwei Wang},
  journal = {arXiv preprint arXiv:1906.00555},
  title   = {Adversarially Robust Generalization Just Requires More Unlabeled Data},
  year    = {2019},
}

@article{tibshirani1996regression,
  author  = {Robert Tibshirani},
  journal = {Journal of the Royal Statistical Society: Series B (Methodological)},
  number  = {1},
  pages   = {267--288},
  title   = {Regression shrinkage and selection via the lasso},
  volume  = {58},
  year    = {1996},
}

@article{nagarajan2019uniform,
  author  = {Vaishnavh Nagarajan and J Zico Kolter},
  journal = {arXiv preprint arXiv:1902.04742},
  title   = {Uniform convergence may be unable to explain generalization in deep learning},
  year    = {2019},
}

@article{ilyas2019adversarial,
  author  = {Andrew Ilyas and Shibani Santurkar and Dimitris Tsipras and Logan Engstrom and Brandon Tran and Aleksander Madry},
  journal = {arXiv preprint arXiv:1905.02175},
  title   = {Adversarial examples are not bugs, they are features},
  year    = {2019},
}
@article{hastie2019surprises,
  author  = {Trevor Hastie and Andrea Montanari and Saharon Rosset and Ryan J Tibshirani},
  journal = {arXiv preprint arXiv:1903.08560},
  title   = {Surprises in high-dimensional ridgeless least squares interpolation},
  year    = {2019},
}

@article{chen2019invariance,
  author  = {Shuxiao Chen and Edgar Dobriban and Jane H Lee},
  journal = {arXiv preprint arXiv:1907.10905},
  title   = {Invariance reduces Variance: Understanding Data Augmentation in Deep Learning and Beyond},
  year    = {2019},
}

@inproceedings{engstrom2019exploring,
  author    = {Logan Engstrom and Brandon Tran and Dimitris Tsipras and Ludwig Schmidt and Aleksander Madry},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {1802--1811},
  title     = {Exploring the Landscape of Spatial Robustness},
  year      = {2019},
}

@inproceedings{yang2019invariance,
  author    = {Fanny Yang and Zuowen Wang and Christina Heinze-Deml},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Invariance-inducing regularization using worst-case transformations suffices to boost accuracy and spatial robustness},
  year      = {2019},
}

@inproceedings{ma2018power,
  author    = {Siyuan Ma and Raef Bassily and Mikhail Belkin},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {The power of interpolation: Understanding the effectiveness of {SGD} in modern over-parametrized learning},
  year      = {2018},
}

@inproceedings{belkin2018understand,
  author    = {Mikhail Belkin and Siyuan Ma and Soumik Mandal},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {To understand deep learning we need to understand kernel learning},
  year      = {2018},
}

@article{liang2018just,
  author  = {Tengyuan Liang and Alexander Rakhlin},
  journal = {arXiv preprint arXiv:1808.00387},
  title   = {Just interpolate: Kernel ``ridgeless'' regression can generalize},
  year    = {2018},
}

@article{zoph2016neural,
  author  = {Barret Zoph and Quoc V Le},
  journal = {arXiv preprint arXiv:1611.01578},
  title   = {Neural architecture search with reinforcement learning},
  year    = {2016},
}

@article{cubuk2017intriguing,
  author  = {Ekin D Cubuk and Barret Zoph and Samuel S Schoenholz and Quoc V Le},
  journal = {arXiv preprint arXiv:1711.02846},
  title   = {Intriguing properties of adversarial examples},
  year    = {2017},
}

@article{scudder1965probability,
  author  = {H Scudder},
  journal = {IEEE Transactions on Information Theory},
  number  = {3},
  pages   = {363--371},
  title   = {Probability of error of some adaptive pattern-recognition machines},
  volume  = {11},
  year    = {1965},
}

@inproceedings{zou2018unsupervised,
  author    = {Yang Zou and Zhiding Yu and BVK Vijaya Kumar and Jinsong Wang},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages     = {289--305},
  title     = {Unsupervised domain adaptation for semantic segmentation via class-balanced self-training},
  year      = {2018},
}

@inproceedings{inoue2018cross,
  author    = {Naoto Inoue and Ryosuke Furuta and Toshihiko Yamasaki and Kiyoharu Aizawa},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages     = {5001--5009},
  title     = {Cross-domain weakly-supervised object detection through progressive domain adaptation},
  year      = {2018},
}

@inproceedings{saito2017asymmetric,
  author    = {Kuniaki Saito and Yoshitaka Ushiku and Tatsuya Harada},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {2988--2997},
  title     = {Asymmetric tri-training for unsupervised domain adaptation},
  year      = {2017},
}

@inproceedings{zhang2018collaborative,
  author    = {Weichen Zhang and Wanli Ouyang and Wen Li and Dong Xu},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages     = {3801--3809},
  title     = {Collaborative and adversarial network for unsupervised domain adaptation},
  year      = {2018},
}

@inproceedings{chen2017no,
  author    = {Yi-Hsin Chen and Wei-Yu Chen and Yu-Ting Chen and Bo-Cheng Tsai and Yu-Chiang Frank Wang and Min Sun},
  booktitle = {International Conference on Computer Vision (ICCV)},
  pages     = {1992--2001},
  title     = {No more discrimination: Cross city adaptation of road scene segmenters},
  year      = {2017},
}

@inproceedings{long2013transfer,
  author    = {Mingsheng Long and Jianmin Wang and Guiguang Ding and Jiaguang Sun and Philip S Yu},
  booktitle = {International Conference on Computer Vision (ICCV)},
  pages     = {2200--2207},
  title     = {Transfer feature learning with joint distribution adaptation},
  year      = {2013},
}

% The fourth author is spelled as in zou2018unsupervised so the same person
% is not listed under two different names.
@article{zou2019confidence,
  author  = {Yang Zou and Zhiding Yu and Xiaofeng Liu and BVK Vijaya Kumar and Jinsong Wang},
  journal = {arXiv preprint arXiv:1908.09822},
  title   = {Confidence regularized self-training},
  year    = {2019},
}

@inproceedings{attias2019improved,
  author    = {Idan Attias and Aryeh Kontorovich and Yishay Mansour},
  booktitle = {Algorithmic Learning Theory},
  pages     = {162--183},
  title     = {Improved Generalization Bounds for Robust Learning},
  year      = {2019},
}

@inproceedings{yin2019rademacher,
  author    = {Dong Yin and Kannan Ramchandran and Peter Bartlett},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {7085--7094},
  title     = {Rademacher Complexity for Adversarially Robust Generalization},
  year      = {2019},
}

@inproceedings{biggio2013evasion,
  author    = {Battista Biggio and Igino Corona and Davide Maiorca and Blaine Nelson and Nedim {\v{S}}rndi{\'c} and Pavel Laskov and Giorgio Giacinto and Fabio Roli},
  booktitle = {Joint European Conference on Machine Learning and Knowledge Discovery in Databases},
  pages     = {387--402},
  title     = {Evasion attacks against machine learning at test time},
  year      = {2013},
}

@article{biggio2018wild,
  author  = {Battista Biggio and Fabio Roli},
  journal = {Pattern Recognition},
  pages   = {317--331},
  title   = {Wild patterns: Ten years after the rise of adversarial machine learning},
  volume  = {84},
  year    = {2018},
}

% The two-word surname is written in "Last, First" form so that it is not
% split into given name "Raphael Gontijo" and family name "Lopes".
@inproceedings{yin2019fourier,
  author    = {Dong Yin and Gontijo Lopes, Raphael and Jonathon Shlens and Ekin D Cubuk and Justin Gilmer},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {A {Fourier} perspective on model robustness in computer vision},
  year      = {2019},
}

@inproceedings{degwekar2019computational,
  author    = {Akshay Degwekar and Preetum Nakkiran and Vinod Vaikuntanathan},
  booktitle = {Conference on Learning Theory (COLT)},
  title     = {Computational Limitations in Robust Classification and Win-Win Results},
  year      = {2019},
}

@article{advani2017high,
  author  = {Madhu S Advani and Andrew M Saxe},
  journal = {arXiv preprint arXiv:1710.03667},
  title   = {High-dimensional dynamics of generalization error in neural networks},
  year    = {2017},
}

@article{nakkiran2019deep,
  author  = {Preetum Nakkiran and Gal Kaplun and Yamini Bansal and Tristan Yang and Boaz Barak and Ilya Sutskever},
  journal = {arXiv preprint arXiv:1912.02292},
  title   = {Deep double descent: Where bigger models and more data hurt},
  year    = {2019},
}

% NOTE(review): the venue reads like a book title, so this may belong under
% the incollection type with a booktitle field. Confirm before changing.
@article{opper1995statistical,
  author  = {Manfred Opper},
  journal = {The Handbook of Brain Theory and Neural Networks},
  pages   = {922--925},
  title   = {Statistical mechanics of learning: Generalization},
  year    = {1995},
}

@article{belkin2019reconciling,
  author  = {Mikhail Belkin and Daniel Hsu and Siyuan Ma and Soumik Mandal},
  journal = {Proceedings of the National Academy of Sciences},
  number  = {32},
  pages   = {15849--15854},
  title   = {Reconciling modern machine-learning practice and the classical bias--variance trade-off},
  volume  = {116},
  year    = {2019},
}

@article{mei2019generalization,
  author  = {Song Mei and Andrea Montanari},
  journal = {arXiv preprint arXiv:1908.05355},
  title   = {The generalization error of random features regression: Precise asymptotics and double descent curve},
  year    = {2019},
}

@article{du2018power,
  author  = {Simon S Du and Jason D Lee},
  journal = {arXiv preprint arXiv:1803.01206},
  title   = {On the power of over-parametrization in neural networks with quadratic activation},
  year    = {2018},
}

@inproceedings{nguyen2017loss,
  author    = {Quynh Nguyen and Matthias Hein},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {2603--2612},
  title     = {The loss surface of deep and wide neural networks},
  year      = {2017},
}

@inproceedings{arora2018optimization,
  author    = {Sanjeev Arora and Nadav Cohen and Elad Hazan},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {244--253},
  title     = {On the Optimization of Deep Networks: Implicit Acceleration by Overparameterization},
  year      = {2018},
}

@article{soudry2018implicit,
  author  = {Daniel Soudry and Elad Hoffer and Mor Shpigel Nacson and Suriya Gunasekar and Nathan Srebro},
  journal = {Journal of Machine Learning Research (JMLR)},
  number  = {1},
  pages   = {2822--2878},
  title   = {The implicit bias of gradient descent on separable data},
  volume  = {19},
  year    = {2018},
}

@article{min2020curious,
  author  = {Yifei Min and Lin Chen and Amin Karbasi},
  journal = {arXiv preprint arXiv:2002.11080},
  title   = {The curious case of adversarially robust models: More data can help, double descend, or hurt generalization},
  year    = {2020},
}

@inproceedings{xie2020adversarial,
  author    = {Cihang Xie and Mingxing Tan and Boqing Gong and Jiang Wang and Alan L Yuille and Quoc V Le},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages     = {819--828},
  title     = {Adversarial examples improve image recognition},
  year      = {2020},
}

@inproceedings{stallkamp2011german,
  author    = {Johannes Stallkamp and Marc Schlipsing and Jan Salmen and Christian Igel},
  booktitle = {The 2011 international joint conference on neural networks},
  pages     = {1453--1460},
  title     = {The {German} traffic sign recognition benchmark: a multi-class classification competition},
  year      = {2011},
}

@article{shankar2019image,
  author  = {Vaishaal Shankar and Achal Dave and Rebecca Roelofs and Deva Ramanan and Benjamin Recht and Ludwig Schmidt},
  journal = {arXiv preprint arXiv:1906.02168},
  title   = {Do Image Classifiers Generalize Across Time?},
  year    = {2019},
}

@article{muthukumar2020harmless,
  author  = {Vidya Muthukumar and Kailas Vodrahalli and Vignesh Subramanian and Anant Sahai},
  journal = {IEEE Journal on Selected Areas in Information Theory},
  number  = {1},
  pages   = {67--83},
  title   = {Harmless interpolation of noisy data in regression},
  volume  = {1},
  year    = {2020},
}

@inproceedings{bibas2019new,
  author    = {Koby Bibas and Yaniv Fogel and Meir Feder},
  booktitle = {2019 IEEE International Symposium on Information Theory (ISIT)},
  pages     = {2304--2308},
  title     = {A new look at an old problem: A universal learning approach to linear regression},
  year      = {2019},
}

@inproceedings{ji2019implicit,
  author    = {Ziwei Ji and Matus Telgarsky},
  booktitle = {Conference on Learning Theory (COLT)},
  pages     = {1772--1798},
  title     = {The implicit bias of gradient descent on nonseparable data},
  year      = {2019},
}

@inproceedings{zhang2020crown,
  author    = {Huan Zhang and Hongge Chen and Chaowei Xiao and Sven Gowal and Robert Stanforth and Bo Li and Duane Boning and Cho-Jui Hsieh},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Towards stable and efficient training of verifiably robust neural networks},
  year      = {2020},
}

@inproceedings{yang2020randomized,
  author    = {Greg Yang and Tony Duan and J Edward Hu and Hadi Salman and Ilya Razenshteyn and Jerry Li},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Randomized smoothing of all shapes and sizes},
  year      = {2020},
}

@article{fazlyab2019safety,
  author  = {Mahyar Fazlyab and Manfred Morari and George J Pappas},
  journal = {arXiv preprint arXiv:1903.01287},
  title   = {Safety Verification and Robustness Analysis of Neural Networks via Quadratic Constraints and Semidefinite Programming},
  year    = {2019},
}

@article{monteiro2003first,
  author  = {Renato DC Monteiro},
  journal = {Mathematical Programming},
  number  = {1},
  pages   = {209--244},
  title   = {First- and second-order methods for semidefinite programming},
  volume  = {97},
  year    = {2003},
}

@techreport{tu2014practical,
  author      = {Stephen Tu and Jingyan Wang},
  institution = {University of California, Berkeley},
  title       = {Practical first order methods for large scale semidefinite programming},
  year        = {2014},
}

@techreport{wen2009first,
  author      = {Zaiwen Wen},
  institution = {Columbia University},
  title       = {First-order methods for semidefinite programming},
  year        = {2009},
}

@article{renegar2014efficient,
  author  = {James Renegar},
  journal = {arXiv preprint arXiv:1409.5832},
  title   = {Efficient first-order methods for linear programming and semidefinite programming},
  year    = {2014},
}

% NOTE(review): the key says helmberg, but the listed author is Yurii Nesterov.
% The key is left unchanged so existing citations keep resolving; confirm
% which work the citing text actually intends.
@article{helmberg2007spectral,
  author  = {Yurii Nesterov},
  journal = {Mathematical Programming},
  number  = {2},
  pages   = {245--259},
  title   = {Smoothing technique and its applications in semidefinite optimization},
  volume  = {110},
  year    = {2007},
}

@article{danskin1966theory,
  author  = {John M Danskin},
  journal = {SIAM Journal on Applied Mathematics},
  title   = {The theory of max-min with applications},
  year    = {1966},
}

@inproceedings{agrawal2014analyzing,
  author    = {Pulkit Agrawal and Ross Girshick and Jitendra Malik},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages     = {329--344},
  title     = {Analyzing the performance of multilayer neural networks for object recognition},
  year      = {2014},
}

@article{chatfield2014return,
  author  = {Ken Chatfield and Karen Simonyan and Andrea Vedaldi and Andrew Zisserman},
  journal = {arXiv preprint arXiv:1405.3531},
  title   = {Return of the devil in the details: Delving deep into convolutional nets},
  year    = {2014},
}

@inproceedings{girshick2014rich,
  author    = {Ross Girshick and Jeff Donahue and Trevor Darrell and Jitendra Malik},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages     = {580--587},
  title     = {Rich feature hierarchies for accurate object detection and semantic segmentation},
  year      = {2014},
}

@inproceedings{yosinski2014transferable,
  author    = {Jason Yosinski and Jeff Clune and Yoshua Bengio and Hod Lipson},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {How transferable are features in deep neural networks?},
  year      = {2014},
}
@inproceedings{chu2016best,
  author = {Brian Chu and Vashisht Madhavan and Oscar Beijbom and Judy Hoffman and Trevor Darrell},
  booktitle = {European conference on computer vision},
  pages = {435--442},
  title = {Best practices for fine-tuning visual classifiers to new domains},
  year = {2016},
}

@article{chen2021empirical,
  author = {Xinlei Chen and Saining Xie and Kaiming He},
  journal = {arXiv preprint arXiv:2104.02057},
  title = {An empirical study of training self-supervised vision transformers},
  year = {2021},
}

@inproceedings{belinkov2017neural,
  author = {Yonatan Belinkov and Nadir Durrani and Fahim Dalvi and Hassan Sajjad and James Glass},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {861--872},
  title = {What do Neural Machine Translation Models Learn about Morphology?},
  year = {2017},
}

@inproceedings{peters2019tune,
  author = {Matthew E Peters and Sebastian Ruder and Noah A Smith},
  booktitle = {Proceedings of the 4th Workshop on Representation Learning for NLP (RepL4NLP-2019)},
  pages = {7--14},
  title = {To Tune or Not to Tune? Adapting Pretrained Representations to Diverse Tasks},
  year = {2019},
}

@article{lester2021power,
  author = {Brian Lester and Rami Al-Rfou and Noah Constant},
  journal = {arXiv preprint arXiv:2104.08691},
  title = {The power of scale for parameter-efficient prompt tuning},
  year = {2021},
}

@article{utama2021avoiding,
  author = {Prasetya Ajie Utama and Nafise Sadat Moosavi and Victor Sanh and Iryna Gurevych},
  journal = {arXiv preprint arXiv:2109.04144},
  title = {Avoiding Inference Heuristics in Few-shot Prompt-based Finetuning},
  year = {2021},
}

@article{zhou2021learning,
  author = {Kaiyang Zhou and Jingkang Yang and Chen Change Loy and Ziwei Liu},
  journal = {arXiv preprint arXiv:2109.01134},
  title = {Learning to Prompt for Vision-Language Models},
  year = {2021},
}

@article{wortsman2021robust,
  author = {Mitchell Wortsman and Gabriel Ilharco and Mike Li and Jong Wook Kim and Hannaneh Hajishirzi and Ali Farhadi and Hongseok Namkoong and Ludwig Schmidt},
  journal = {arXiv preprint arXiv:2109.01903},
  title = {Robust fine-tuning of zero-shot models},
  year = {2021},
}

@article{chua2021fine,
  author = {Kurtland Chua and Qi Lei and Jason D Lee},
  journal = {arXiv preprint arXiv:2105.02221},
  title = {How fine-tuning allows for effective meta-learning},
  year = {2021},
}

@inproceedings{guo2017calibration,
  author = {Chuan Guo and Geoff Pleiss and Yu Sun and Kilian Q. Weinberger},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1321--1330},
  title = {On Calibration of Modern Neural Networks},
  year = {2017},
}

@inproceedings{zadrozny2001calibrated,
  author = {Bianca Zadrozny and Charles Elkan},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {609--616},
  title = {Obtaining calibrated probability estimates from decision trees and naive Bayesian classifiers},
  year = {2001},
}

@article{naeini2014binary,
  author = {Mahdi Pakdaman Naeini and Gregory F. Cooper and Milos Hauskrecht},
  journal = {arXiv},
  title = {Binary Classifier Calibration: Non-parametric approach},
  year = {2014},
}

@inproceedings{hendrycks2019anomaly,
  author = {Dan Hendrycks and Mantas Mazeika and Thomas Dietterich},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Deep Anomaly Detection with Outlier Exposure},
  year = {2019},
}

@inproceedings{hendrycks2019pretraining,
  author = {Dan Hendrycks and Kimin Lee and Mantas Mazeika},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Using Pre-Training Can Improve Model Robustness and Uncertainty},
  year = {2019},
}

@article{degroot1983forecasters,
  author = {Morris H. DeGroot and Stephen E. Fienberg},
  journal = {Journal of the Royal Statistical Society. Series D (The Statistician)},
  pages = {12--22},
  title = {The Comparison and Evaluation of Forecasters},
  volume = {32},
  year = {1983},
}

@article{kull2017sigmoids,
  author = {Meelis Kull and Telmo M. Silva Filho and Peter Flach},
  journal = {Electronic Journal of Statistics},
  pages = {5052--5080},
  title = {Beyond sigmoids: How to obtain well-calibrated probabilities from binary classifiers with beta calibration},
  volume = {11},
  year = {2017},
}

@article{ferro2012bias,
  author = {C. A. T. Ferro and Thomas E. Fricker},
  journal = {Quarterly Journal of the Royal Meteorological Society},
  number = {668},
  pages = {1954--1960},
  title = {A bias-corrected decomposition of the Brier score},
  volume = {138},
  year = {2012},
}

@article{crowson2017calibration,
  author = {Cynthia S. Crowson and Elizabeth J. Atkinson and Terry M. Therneau},
  journal = {Statistical Methods in Medical Research},
  pages = {1692--1706},
  title = {Assessing Calibration of Prognostic Risk Scores},
  volume = {25},
  year = {2017},
}

@inproceedings{malik2019calibrated,
  author = {Ali Malik and Volodymyr Kuleshov and Jiaming Song and Danny Nemer and Harlan Seymour and Stefano Ermon},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Calibrated Model-Based Deep Reinforcement Learning},
  year = {2019},
}

@inproceedings{kuleshov2018accurate,
  author = {Volodymyr Kuleshov and Nathan Fenner and Stefano Ermon},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Accurate Uncertainties for Deep Learning Using Calibrated Regression},
  year = {2018},
}

@article{hosmer1980goodness,
  author = {David W. Hosmer and Stanley Lemeshow},
  journal = {Communications in Statistics - Theory and Methods},
  pages = {1043--1069},
  title = {Goodness of fit tests for the multiple logistic regression model},
  volume = {9},
  year = {1980},
}

@article{brocker2007reliability,
  author = {Jochen Bröcker and Leonard A. Smith},
  journal = {Weather and Forecasting},
  number = {3},
  pages = {651--661},
  title = {Increasing the Reliability of Reliability Diagrams},
  volume = {22},
  year = {2007},
}

@article{harrell1996prognostic,
  author = {Frank E. Harrell and Kerry Lamont Lee and Daniel B. Mark},
  journal = {Statistics in medicine},
  number = {4},
  pages = {361--387},
  title = {Multivariable prognostic models: issues in developing models, evaluating assumptions and adequacy, and measuring and reducing errors},
  volume = {15},
  year = {1996},
}

@article{paninski2003entropy,
  author = {Liam Paninski},
  journal = {Neural Computation},
  pages = {1191--1253},
  title = {Estimation of Entropy and Mutual Information},
  volume = {15},
  year = {2003},
}

@article{gneiting2005weather,
  author = {Tilmann Gneiting and Adrian E. Raftery},
  journal = {Science},
  title = {Weather Forecasting with Ensemble Methods},
  volume = {310},
  year = {2005},
}

@inproceedings{naeini2015obtaining,
  author = {Mahdi Pakdaman Naeini and Gregory F. Cooper and Milos Hauskrecht},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Obtaining Well Calibrated Probabilities Using Bayesian Binning},
  year = {2015},
}

@article{nixon2019calibration,
  author = {Jeremy V. Nixon and Michael W. Dusenberry and Linchuan Zhang and Ghassen Jerfel and Dustin Tran},
  journal = {arXiv},
  title = {Measuring Calibration in Deep Learning},
  year = {2019},
}

@inproceedings{card2018calibration,
  author = {Dallas Card and Noah A. Smith},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {The Importance of Calibration for Estimating Proportions from Annotations},
  year = {2018},
}

@article{murphy1977reliability,
  author = {Allan H. Murphy and Robert L. Winkler},
  journal = {Journal of the Royal Statistical Society. Series C (Applied Statistics)},
  pages = {41--47},
  title = {Reliability of Subjective Probability Forecasts of Precipitation and Temperature},
  volume = {26},
  year = {1977},
}

% The key keeps the preprint year; the year field matches the journal volume cited here.
@article{lei2016distribution,
  author = {Jing Lei and Max G'Sell and Alessandro Rinaldo and Ryan J. Tibshirani and Larry Wasserman},
  journal = {Journal of the American Statistical Association},
  pages = {1094--1111},
  title = {Distribution-Free Predictive Inference For Regression},
  volume = {113},
  year = {2018},
}

@book{hubbard1998vector,
  author = {John H. Hubbard and Barbara B. Hubbard},
  publisher = {Prentice Hall},
  title = {Vector Calculus, Linear Algebra, And Differential Forms},
  year = {1998},
}

@inproceedings{liu2019implicit,
  author = {Lydia T. Liu and Max Simchowitz and Moritz Hardt},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {The Implicit Fairness Criterion of Unconstrained Learning},
  year = {2019},
}

@inproceedings{johnson2018multicalibration,
  author = {Ursula Hebert-Johnson and Michael P. Kim and Omer Reingold and Guy N. Rothblum},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Multicalibration: Calibration for the (Computationally-Identifiable) Masses},
  year = {2018},
}

@article{yadlowsky2019calibration,
  author = {Steve Yadlowsky and Sanjay Basu and Lu Tian},
  journal = {Machine Learning for Healthcare},
  title = {A Calibration Metric for Risk Scores with Survival Data},
  year = {2019},
}

@inproceedings{kull2019temperature,
  author = {Meelis Kull and Miquel Perello Nieto and Markus Kängsepp and Telmo Silva Filho and Hao Song and Peter Flach},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Beyond temperature scaling: Obtaining well-calibrated multi-class probabilities with Dirichlet calibration},
  year = {2019},
}

@article{efron1979bootstrap,
  author = {Brad Efron},
  journal = {Annals of Statistics},
  title = {Bootstrap Methods: Another Look at the Jackknife},
  volume = {7},
  year = {1979},
}

@inproceedings{widmann2019calibration,
  author = {David Widmann and Fredrik Lindsten and Dave Zachariah},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Calibration tests in multi-class classification: A unifying framework},
  year = {2019},
}

@inproceedings{vaicenavicius2019calibration,
  author = {Juozas Vaicenavicius and David Widmann and Carl Andersson and Fredrik Lindsten and Jacob Roll and Thomas B. Schön},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  title = {Evaluating model calibration in classification},
  year = {2019},
}

% Appeared in a combined journal volume, hence the volume range.
@article{vergara2012Chemical,
  author = {Alexander Vergara and Shankar Vembu and Tuba Ayhan and Margaret A. Ryan and Margie L. Homer and Ramón Huerta},
  journal = {Sensors and Actuators B: Chemical},
  pages = {320--329},
  title = {Chemical gas sensor drift compensation using classifier ensembles},
  volume = {166--167},
  year = {2012},
}

@inproceedings{bobu2018adapting,
  author = {Andreea Bobu and Eric Tzeng and Judy Hoffman and Trevor Darrell},
  booktitle = {International Conference on Learning Representations Workshop (ICLR)},
  title = {Adapting to Continuously Shifting Domains},
  year = {2018},
}

@inproceedings{farshchian2019adversarial,
  author = {Ali Farshchian and Juan A. Gallego and Joseph P. Cohen and Yoshua Bengio and Lee E. Miller and Sara A. Solla},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Adversarial Domain Adaptation for Stable Brain-Machine Interfaces},
  year = {2019},
}

@inproceedings{amini2003semisupervised,
  author = {Massih-Reza Amini and Patrick Gallinari},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {Semi-Supervised Learning with Explicit Misclassification Modeling},
  year = {2003},
}

@inproceedings{hoffman2014continuous,
  author = {Judy Hoffman and Trevor Darrell and Kate Saenko},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Continuous Manifold Based Adaptation for Evolving Visual Domains},
  year = {2014},
}

@article{sethi2017reliable,
  author = {Tegjyot Singh Sethi and Mehmed Kantardzic},
  journal = {Expert Systems with Applications},
  pages = {77--99},
  title = {On the reliable detection of concept drift from streaming unlabeled data},
  volume = {82},
  year = {2017},
}

@article{gama2014survey,
  author = {Gama, João and Žliobaitė, Indrė and Bifet, Albert and Pechenizkiy, Mykola and Bouchachia, Hamid},
  journal = {ACM Computing Surveys (CSUR)},
  title = {A Survey on Concept Drift Adaptation},
  volume = {46},
  year = {2014},
}

@article{xie2020selftraining,
  author = {Qizhe Xie and Minh-Thang Luong and Eduard Hovy and Quoc V. Le},
  journal = {arXiv},
  title = {Self-training with Noisy Student improves ImageNet classification},
  year = {2020},
}

@inproceedings{huang2006correcting,
  author = {Huang, Jiayuan and Smola, Alexander J. and Gretton, Arthur and Borgwardt, Karsten M. and Scholkopf, Bernhard},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Correcting Sample Selection Bias by Unlabeled Data},
  year = {2006},
}

@article{sugiyama2007covariate,
  author = {Masashi Sugiyama and Matthias Krauledat and Klaus-Robert Muller},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {985--1005},
  title = {Covariate Shift Adaptation by Importance Weighted Cross Validation},
  volume = {8},
  year = {2007},
}

@inproceedings{shu2018dirtt,
  author = {Rui Shu and Hung H. Bui and Hirokazu Narui and Stefano Ermon},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {A {DIRT}-{T} Approach to Unsupervised Domain Adaptation},
  year = {2018},
}

@inproceedings{zhao2019zhao,
  author = {Han Zhao and Remi Tachet des Combes and Kun Zhang and Geoffrey J. Gordon},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {On Learning Invariant Representations for Domain Adaptation},
  year = {2019},
}

@article{ginosar2017portraits,
  author = {Shiry Ginosar and Kate Rakelly and Sarah M. Sachs and Brian Yin and Crystal Lee and Philipp Krähenbühl and Alexei A. Efros},
  journal = {IEEE Transactions on Computational Imaging},
  title = {A Century of Portraits: A Visual Historical Record of American High School Yearbooks},
  volume = {3},
  year = {2017},
}

@inproceedings{luo2019towards,
  author = {Ping Luo and Xinjiang Wang and Wenqi Shao and Zhanglin Peng},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Towards Understanding Regularization in Batch Normalization},
  year = {2019},
}

@article{fralick1967learning,
  author = {Stanley C. Fralick},
  journal = {IEEE Transactions on Information Theory},
  title = {Learning to recognize patterns without a teacher},
  volume = {13},
  year = {1967},
}

@article{agrawala1970learning,
  author = {Ashok K. Agrawala},
  journal = {IEEE Transactions on Information Theory},
  pages = {373--379},
  title = {Learning with a probabilistic teacher},
  volume = {16},
  year = {1970},
}

% The ampersand is escaped because a bare one is a LaTeX alignment character.
@article{celeux1992classification,
  author = {Gilles Celeux and Gérard Govaert},
  journal = {Computational Statistics \& Data Analysis},
  pages = {315--332},
  title = {A classification {EM} algorithm for clustering and two stochastic versions},
  volume = {14},
  year = {1992},
}

@article{sohn2020fixmatch,
  author = {Kihyuk Sohn and David Berthelot and Chun-Liang Li and Zizhao Zhang and Nicholas Carlini and Ekin D. Cubuk and Alex Kurakin and Han Zhang and Colin Raffel},
  journal = {arXiv},
  title = {FixMatch: Simplifying Semi-Supervised Learning with Consistency and Confidence},
  year = {2020},
}

@article{rigollet2007generalization,
  author = {Philippe Rigollet},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {1369--1392},
  title = {Generalization Error Bounds in Semi-supervised Classification Under the Cluster Assumption},
  volume = {8},
  year = {2007},
}

@inproceedings{singh2008unlabeled,
  author = {Aarti Singh and Robert Nowak and Jerry Zhu},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Unlabeled data: Now it helps, now it doesn't},
  year = {2008},
}

@inproceedings{shai2008unlabeled,
  author = {Shai Ben-David and Tyler Lu and David Pal},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Does Unlabeled Data Provably Help? Worst-case Analysis of the Sample Complexity of Semi-Supervised Learning},
  year = {2008},
}

@inproceedings{hoffman2018cycada,
  author = {Judy Hoffman and Eric Tzeng and Taesung Park and Jun-Yan Zhu and Phillip Isola and Kate Saenko and Alexei A. Efros and Trevor Darrell},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {CyCADA: Cycle Consistent Adversarial Domain Adaptation},
  year = {2018},
}

@inproceedings{peng2019moment,
  author = {Xingchao Peng and Qinxun Bai and Xide Xia and Zijun Huang and Kate Saenko and Bo Wang},
  booktitle = {International Conference on Computer Vision (ICCV)},
  title = {Moment Matching for Multi-Source Domain Adaptation},
  year = {2019},
}

@inproceedings{bartlett1992learning,
  author = {Peter L. Bartlett},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Learning with a slowly changing distribution},
  year = {1992},
}

@inproceedings{gadermayr2018gradual,
  author = {Gadermayr, Michael and Eschweiler, Dennis and Klinkhammer, Barbara Mara and Boor, Peter and Merhof, Dorit},
  booktitle = {Image and Signal Processing},
  title = {Gradual Domain Adaptation for Segmenting Whole Slide Images Showing Pathological Variability},
  year = {2018},
}

@inproceedings{wulfmeier2018incremental,
  author = {Wulfmeier, Markus and Bewley, Alex and Posner, Ingmar},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  title = {Incremental Adversarial Domain Adaptation for Continually Changing Environments},
  year = {2018},
}

@inproceedings{hinton2015distilling,
  author = {Geoffrey Hinton and Oriol Vinyals and Jeffrey Dean},
  booktitle = {NIPS Deep Learning and Representation Learning Workshop},
  title = {Distilling the Knowledge in a Neural Network},
  year = {2015},
}

@inproceedings{sun2017revisiting,
  author = {Chen Sun and Abhinav Shrivastava and Saurabh Singh and Abhinav Gupta},
  booktitle = {International Conference on Computer Vision (ICCV)},
  title = {Revisiting Unreasonable Effectiveness of Data in Deep Learning Era},
  year = {2017},
}

@article{hendrycks2019natural,
  author = {Dan Hendrycks and Kevin Zhao and Steven Basart and Jacob Steinhardt and Dawn Song},
  journal = {arXiv preprint arXiv:1907.07174},
  title = {Natural adversarial examples},
  year = {2019},
}
@inproceedings{uesato2019rigorous, author = {Jonathan Uesato and Ananya Kumar and Csaba Szepesvari and Tom Erez and Avraham Ruderman and Keith Anderson and Krishmamurthy (Dj) Dvijotham and Nicolas Heess and Pushmeet Kohli}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Rigorous Agent Evaluation: An Adversarial Approach to Uncover Catastrophic Failures}, year = {2019}, } @article{bartlett1996learning, author = {Peter L. Bartlett and Shai Ben-David and Sanjeev R. Kulkarni}, journal = {Machine Learning}, title = {Learning Changing Concepts by Exploiting the Structure of Change}, volume = {41}, year = {1996}, } @inproceedings{kramer1988learning, author = {Alan H. Kramer}, booktitle = {Connectionist Models Summer School}, title = {Learning despite distribution shift}, year = {1988}, } @inproceedings{mey2016softlabeled, author = {Alexander Mey and Marco Loog}, booktitle = {d International Conference on Pattern Recognition}, title = {A Soft-Labeled Self-Training Approach}, year = {2016}, } @inproceedings{blackard1999comparative, author = {Jock A. Blackard and Denis J. Dean}, booktitle = {Computers and Electronics in Agriculture}, title = {Comparative accuracies of artificial neural networks and discriminant analysis in predicting forest cover types from cartographic variables}, year = {1999}, } @inproceedings{kornblith2019better, author = {Simon Kornblith and Jonathon Shlens and Quoc V. Le}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, title = {Do Better ImageNet Models Transfer Better?}, year = {2019}, } @book{tao2012random, author = {Terrence Tao}, publisher = {American Mathematical Society}, title = {Topics in random matrix theory}, year = {2012}, } @inproceedings{hsu2012random, author = {Daniel Hsu and Sham M. 
Kakade and Tong Zhang}, booktitle = {Conference on Learning Theory (COLT)}, title = {Random Design Analysis of Ridge Regression}, year = {2012}, } @article{chen2020improved, author = {Xinlei Chen and Haoqi Fan and Ross B. Girshick and Kaiming He}, journal = {arXiv}, title = {Improved Baselines with Momentum Contrastive Learning}, year = {2020}, } @inproceedings{yu2020bdd, author = {Fisher Yu and Haofeng Chen and Xin Wang and Wenqi Xian and Yingying Chen and Fangchen Liu and Vashisht Madhavan and Trevor Darrell}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, title = {BDD100K: A Diverse Driving Dataset for Heterogeneous Multitask Learning}, year = {2020}, } @article{andreassen2021evolution, author = {Anders Andreassen and Yasaman Bahri and Behnam Neyshabur and Rebecca Roelofs}, journal = {arXiv}, title = {The Evolution of Out-of-Distribution Robustness Throughout Fine-Tuning}, year = {2021}, } @article{zhai2020largescale, author = {Xiaohua Zhai and Joan Puigcerver and Alexander Kolesnikov and Pierre Ruyssen and Carlos Riquelme and Mario Lucic and Josip Djolonga and Andre Susano Pinto and Maxim Neumann and Alexey Dosovitskiy and Lucas Beyer and Olivier Bachem and Michael Tschannen and Marcin Michalski and Olivier Bousquet and Sylvain Gelly and Neil Houlsby}, journal = {arXiv}, title = {A Large-scale Study of Representation Learning with the Visual Task Adaptation Benchmark}, year = {2020}, } @inproceedings{kamath2021invariant, author = {Pritish Kamath and Akilesh Tangella and Danica J. 
Sutherland and Nathan Srebro}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, title = {Does Invariant Risk Minimization Capture Invariance?}, year = {2021}, } @article{chen2021iterative, author = {Yining Chen and Elan Rosenfeld and Mark Sellke and Tengyu Ma and Andrej Risteski}, journal = {arXiv}, title = {Iterative Feature Matching: Toward Provable Domain Generalization with Logarithmic Environments}, year = {2021}, } @inproceedings{rosenfeld2021risks, author = {Elan Rosenfeld and Pradeep Ravikumar and Andrej Risteski}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {The Risks of Invariant Risk Minimization}, year = {2021}, } @article{ayush2020geography, author = {Kumar Ayush and Burak Uzkent and Chenlin Meng and Kumar Tanmay and M. Burke and D. Lobell and Stefano Ermon}, journal = {arXiv}, title = {Geography-Aware Self-Supervised Learning}, year = {2020}, } @article{saxe2014exact, author = {Andrew M. Saxe and James L. McClelland and Surya Ganguli}, journal = {arXiv}, title = {Exact solutions to the nonlinear dynamics of learning in deep linear neural networks}, year = {2014}, } @inproceedings{gidel2019implicit, author = {Gauthier Gidel and Francis R. Bach and Simon Lacoste-Julien}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Implicit Regularization of Discrete Gradient Dynamics in Deep Linear Neural Networks}, year = {2019}, } @inproceedings{du2018algorithmic, author = {Simon Shaolei Du and Wei Hu and Jason Lee}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Algorithmic Regularization in Learning Deep Homogeneous Models: Layers are Automatically Balanced}, year = {2018}, } @inproceedings{cai2021theory, author = {Tianle Cai and Ruiqi Gao and J. 
Lee and Qi Lei}, booktitle = {International Conference on Machine Learning (ICML)}, title = {A Theory of Label Propagation for Subpopulation Shift}, year = {2021}, } @inproceedings{laurent2018deep, author = {Thomas Laurent and James H. von Brecht}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Deep linear neural networks with arbitrary loss: All local minima are global}, year = {2018}, } @article{absil2006largest, author = {Pierre Antoine Absil and Alan Edelman and Plamen Koev}, journal = {Linear Algebra and its Applications}, number = {1}, pages = {288--294}, title = {On the largest principal angle between random subspaces}, volume = {414}, year = {2006}, } @article{wu2021ensemble, author = {Xixin Wu and M. Gales}, journal = {arXiv}, title = {Should Ensemble Members Be Calibrated?}, year = {2021}, } @article{stickland2020diverse, author = {Asa Cooper Stickland and Iain Murray}, journal = {arXiv}, title = {Diverse Ensembles Improve Calibration}, year = {2020}, } @inproceedings{li2018explicit, author = {Xuhong Li and Yves Grandvalet and Franck Davoine}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Explicit Inductive Bias for Transfer Learning with Convolutional Networks}, year = {2018}, } @inproceedings{kanavati2021transfusion, author = {Fahdi Kanavati and Masayuki Tsuneki}, booktitle = {Medical Imaging with Deep Learning}, title = {Partial transfusion: on the expressive influence of trainable batch norm parameters for transfer learning}, year = {2021}, } @inproceedings{aghajanyan2021finetuning, author = {Armen Aghajanyan and Akshat Shrivastava and Anchit Gupta and Naman Goyal and Luke Zettlemoyer and Sonal Gupta}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Better Fine-Tuning by Reducing Representational Collapse}, year = {2021}, } @inproceedings{jiang2021smart, author = {Haoming Jiang and Pengcheng He and Weizhu Chen and Xiaodong Liu and Jianfeng Gao and Tuo Zhao}, 
booktitle = {International Conference on Learning Representations (ICLR)}, title = {SMART: Robust and Efficient Fine-Tuning for Pre-trained Natural Language Models through Principled Regularized Optimization}, year = {2021}, } @inproceedings{guo2019spottune, author = {Yunhui Guo and Honghui Shi and Abhishek Kumar and Kristen Grauman and Tajana Rosing and Rogerio Feris}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, title = {SpotTune: Transfer Learning through Adaptive Fine-tuning}, year = {2019}, } @inproceedings{zhang2020sidetuning, author = {Jeffrey O Zhang and Alexander Sax and Amir Zamir and Leonidas Guibas and Jitendra Malik}, booktitle = {European Conference on Computer Vision (ECCV)}, title = {Side-Tuning: A Baseline for Network Adaptation via Additive Side Networks}, year = {2020}, } @inproceedings{ge2017borrowing, author = {Weifeng Ge and Yizhou Yu}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, title = {Borrowing Treasures from the Wealthy: Deep Transfer Learning through Selective Joint Fine-tuning}, year = {2017}, } @article{rudelson2009smallest, author = {Mark Rudelson and Roman Vershynin}, journal = {Communications on Pure and Applied Mathematics}, pages = {1707--1739}, title = {Smallest Singular Value of a Random Rectangular Matrix}, volume = {62}, year = {2009}, } @book{golub2013matrix, author = {Gene H. Golub and Charles F. Van Loan}, publisher = {The Johns Hopkins University Press}, title = {Matrix Computations}, year = {2013}, } @inproceedings{minderer2021revisiting, author = {Matthias Minderer and Josip Djolonga and Rob Romijnders and Frances Hubis and Xiaohua Zhai and Neil Houlsby and Dustin Tran and Mario Lucic}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Revisiting the Calibration of Modern Neural Networks}, year = {2021}, } @inproceedings{mukhoti2020calibrating, author = {Jishnu Mukhoti and Viveka Kulharia and Amartya Sanyal and Stuart Golodetz and Philip H.S. 
Torr and Puneet K. Dokania}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Calibrating Deep Neural Networks using Focal Loss}, year = {2020}, } @article{bai2021dont, author = {Yu Bai and Song Mei and Huan Wang and Caiming Xiong}, journal = {arXiv}, title = {Don't Just Blame Over-parametrization for Over-confidence: Theoretical Analysis of Calibration in Binary Classification}, year = {2021}, } @article{desai2020calibration, author = {Shrey Desai and Greg Durrett}, journal = {arXiv}, title = {Calibration of Pre-trained Transformers}, year = {2020}, } @article{sill2009feature, author = {Joseph Sill and Gabor Takacs and Lester Mackey and David Lin}, journal = {arXiv}, title = {Feature-Weighted Linear Stacking}, year = {2009}, } @inproceedings{shachaf2021theoretical, author = {Gal Shachaf and Alon Brutzkus and Amir Globerson}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {A Theoretical Analysis of Fine-tuning with Linear Teachers}, year = {2021}, } @inproceedings{wald2021calibration, author = {Yoav Wald and Amir Feder and Daniel Greenfeld and Uri Shalit}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {On Calibration and Out-of-domain Generalization}, year = {2021}, } @article{luo2020privacy, author = {Rachel Luo and Shengjia Zhao and Jiaming Song and Jonathan Kuck and Stefano Ermon and Silvio Savarese}, journal = {arXiv}, title = {Privacy Preserving Recalibration under Domain Shift}, year = {2020}, } @article{kumar2022sgd, author = {Ananya Kumar and Ruoqi Shen and Sébastien Bubeck and Suriya Gunasekar}, journal = {arXiv}, title = {How to Fine-Tune Vision Models with {SGD}}, year = {2022}, } @inproceedings{wortsman2022modelsoups, author = {Mitchell Wortsman and Gabriel Ilharco and Samir Yitzhak Gadre and Rebecca Roelofs and Raphael Gontijo-Lopes and Ari S. 
Morcos and Hongseok Namkoong and Ali Farhadi and Yair Carmon and Simon Kornblith and Ludwig Schmidt}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Model soups: averaging weights of multiple fine-tuned models improves accuracy without increasing inference time}, year = {2022}, } @article{goyal2022finetune, author = {Sachin Goyal and Ananya Kumar and Sankalp Garg and Zico Kolter and Aditi Raghunathan}, journal = {arXiv}, title = {Finetune like you pretrain: Improved finetuning of zero-shot vision models}, year = {2022}, } @inproceedings{sanchez2011cvpr, author = {Jorge Sanchez and Florent Perronnin}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, title = {High-dimensional signature compression for large-scale image classification}, year = {2011}, } @inproceedings{pham2021meta, author = {Hieu Pham and Zihang Dai and Qizhe Xie and Quoc V. Le}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, title = {Meta Pseudo Labels}, year = {2021}, } @article{ramesh2022hierarchical, author = {Aditya Ramesh and Prafulla Dhariwal and Alex Nichol and Casey Chu and Mark Chen}, journal = {arXiv}, title = {Hierarchical Text-Conditional Image Generation with {CLIP} Latents}, year = {2022}, } @article{touvron2023llama, author = {Hugo Touvron and Thibaut Lavril and Gautier Izacard and Xavier Martinet and Marie-Anne Lachaux and Timothée Lacroix and Baptiste Rozière and Naman Goyal and Eric Hambro and Faisal Azhar and Aurelien Rodriguez and Armand Joulin and Edouard Grave and Guillaume Lample}, journal = {arXiv}, title = {LLaMA: Open and Efficient Foundation Language Models}, year = {2023}, } @article{rosenfeld2022domain, author = {Elan Rosenfeld and Pradeep Ravikumar and Andrej Risteski}, journal = {arXiv}, title = {Domain-Adjusted Regression or: {ERM} May Already Learn Features Sufficient for Out-of-Distribution Generalization}, year = {2022}, } @inproceedings{goodfellow2014empirical, author = {Ian J. 
Goodfellow and Mehdi Mirza and Xia Da and Aaron C. Courville and Yoshua Bengio}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {An Empirical Investigation of Catastrophic Forgeting in Gradient-Based Neural Networks}, year = {2014}, } @article{baxter2000model, author = {Jonathan Baxter}, journal = {Journal of Artificial Intelligence Research (JAIR)}, title = {A model of inductive bias learning}, volume = {12}, year = {2000}, } @article{maurer2016benefit, author = {Andreas Maurer and Massimiliano Pontil and Bernardino Romera-Paredes}, journal = {Journal of Machine Learning Research (JMLR)}, title = {The Benefit of Multitask Representation Learning}, volume = {7}, year = {2016}, } @inproceedings{lee2021predicting, author = {Jason D. Lee and Qi Lei and Nikunj Saunshi and Jiacheng Zhuo}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Predicting What You Already Know Helps: Provable Self-Supervised Learning}, year = {2021}, } @inproceedings{hu2022lora, author = {Edward J. 
Hu and Yelong Shen and Phillip Wallis and Zeyuan Allen-Zhu and Yuanzhi Li and Shean Wang and Lu Wang and Weizhu Chen}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {LoRA: Low-Rank Adaptation of Large Language Models}, year = {2022}, } @article{balestriero2023cookbook, author = {Randall Balestriero and Mark Ibrahim and Vlad Sobal and Ari Morcos and Shashank Shekhar and Tom Goldstein and Florian Bordes and Adrien Bardes and Gregoire Mialon and Yuandong Tian and Avi Schwarzschild and Andrew Gordon Wilson and Jonas Geiping and Quentin Garrido and Pierre Fernandez and Amir Bar and Hamed Pirsiavash and Yann LeCun and Micah Goldblum}, journal = {arXiv}, title = {A Cookbook of Self-Supervised Learning}, year = {2023}, } @inproceedings{wei2021theoretical, author = {Colin Wei and Kendrick Shen and Yining Chen and Tengyu Ma}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Theoretical Analysis of Self-Training with Deep Networks on Unlabeled Data}, year = {2021}, } @inproceedings{wang2023selfinstruct, author = {Yizhong Wang and Yeganeh Kordi and Swaroop Mishra and Alisa Liu and Noah A. 
Smith and Daniel Khashabi and Hannaneh Hajishirzi},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Self-Instruct: Aligning Language Models with Self-Generated Instructions},
  year = {2023},
}

@article{bai2023constitutional,
  author = {Yuntao Bai and Saurav Kadavath and Sandipan Kundu and Amanda Askell
    and Jackson Kernion and Andy Jones and Anna Chen and Anna Goldie
    and Azalia Mirhoseini and Cameron McKinnon and Carol Chen and Catherine Olsson
    and Christopher Olah and Danny Hernandez and Dawn Drain and Deep Ganguli
    and Dustin Li and Eli Tran-Johnson and Ethan Perez and Jamie Kerr
    and Jared Mueller and Jeffrey Ladish and Joshua Landau and Kamal Ndousse
    and Kamile Lukosuite and Liane Lovitt and Michael Sellitto and Nelson Elhage
    and Nicholas Schiefer and Noemi Mercado and Nova DasSarma and Robert Lasenby
    and Robin Larson and Sam Ringer and Scott Johnston and Shauna Kravec
    and Sheer El Showk and Stanislav Fort and Tamera Lanham and Timothy Telleen-Lawton
    and Tom Conerly and Tom Henighan and Tristan Hume and Samuel R.
Bowman and Zac Hatfield-Dodds and Ben Mann and Dario Amodei and Nicholas Joseph and Sam McCandlish and Tom Brown and Jared Kaplan},
  journal = {arXiv},
  title = {Constitutional {AI}: Harmlessness from {AI} Feedback},
  year = {2023},
}

@inproceedings{dalvi2013aggregating,
  author = {Nilesh Dalvi and Anirban Dasgupta and Ravi Kumar and Vibhor Rastogi},
  booktitle = {World Wide Web (WWW)},
  pages = {285--294},
  title = {Aggregating crowdsourced binary ratings},
  year = {2013},
}

% Booktitle un-inverted from the exporter form "Data Engineering (ICDE), 2015 IEEE 31st International Conference on".
@inproceedings{joglekar2015comprehensive,
  author = {Manas Joglekar and Hector Garcia-Molina and Aditya Parameswaran},
  booktitle = {International Conference on Data Engineering (ICDE)},
  pages = {195--206},
  title = {Comprehensive and reliable crowd assessment algorithms},
  year = {2015},
}

@article{zhang2016spectral,
  author = {Yuchen Zhang and Xi Chen and Dengyong Zhou and Michael I Jordan},
  journal = {Journal of Machine Learning Research (JMLR)},
  number = {102},
  pages = {1--44},
  title = {Spectral methods meet {EM}: A provably optimal algorithm for crowdsourcing},
  volume = {17},
  year = {2016},
}

@inproceedings{balsubramani2015scalable,
  author = {Akshay Balsubramani and Yoav Freund},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1351--1359},
  title = {Scalable semi-supervised aggregation of classifiers},
  year = {2015},
}

% The paper has exactly two authors; the exporter's trailing "and others" was removed.
@inproceedings{craven1999constructing,
  author = {Mark Craven and Johan Kumlien},
  booktitle = {ISMB},
  pages = {77--86},
  title = {Constructing biological knowledge bases by extracting information from text sources},
  year = {1999},
}

% "De Sa" is written surname-first so BibTeX does not parse the surname as just "Sa".
@article{varma2017socratic,
  author = {Paroma Varma and Bryan He and Dan Iter and Peng Xu and Rose Yu and De Sa, Christopher and Christopher R{\'e}},
  journal = {arXiv preprint arXiv:1610.08123},
  title = {Socratic Learning: Augmenting Generative Models to Incorporate Latent Subsets in Training Data},
  year = {2017},
}

@inproceedings{shin2015incremental,
  author = {Jaeho Shin and Sen Wu and Feiran Wang and De Sa, Christopher
and Ce Zhang and Christopher R{\'e}},
  booktitle = {Very Large Data Bases (VLDB)},
  number = {11},
  pages = {1310--1321},
  title = {Incremental knowledge base construction using {DeepDive}},
  year = {2015},
}

@inproceedings{roth2013combining,
  author = {Benjamin Roth and Dietrich Klakow},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {24--29},
  title = {Combining Generative and Discriminative Model Scores for Distant Supervision},
  year = {2013},
}

@inproceedings{takamatsu2012reducing,
  author = {Shingo Takamatsu and Issei Sato and Hiroshi Nakagawa},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {721--729},
  title = {Reducing wrong labels in distant supervision for relation extraction},
  year = {2012},
}

% "De Sa" is written surname-first so BibTeX does not parse the surname as just "Sa".
@article{de2016deepdive,
  author = {De Sa, Christopher and Alex Ratner and Christopher R{\'e} and Jaeho Shin and Feiran Wang and Sen Wu and Ce Zhang},
  journal = {ACM SIGMOD Record},
  number = {1},
  pages = {60--67},
  title = {{DeepDive}: declarative knowledge base construction},
  volume = {45},
  year = {2016},
}

@inproceedings{wu2018fonduer,
  author = {Sen Wu and Luke Hsiao and Xiao Cheng and Braden Hancock and Theodoros Rekatsinas and Philip Levis and Christopher R{\'e}},
  booktitle = {Proceedings of SIGMOD 2018},
  title = {{Fonduer}: Knowledge Base Construction from Richly Formatted Data},
  year = {2018},
}

@inproceedings{alfonseca2012pattern,
  author = {Enrique Alfonseca and Katja Filippova and Jean-Yves Delort and Guillermo Garrido},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {54--59},
  title = {Pattern learning for relation extraction with a hierarchical topic model},
  year = {2012},
}

@inproceedings{bunescu2007learning,
  author = {Razvan Bunescu and Raymond Mooney},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Learning to extract relations from the web using minimal supervision},
  year = {2007},
}

@inproceedings{parkash2012attributes,
  author = {Amar Parkash and Devi Parikh},
booktitle = {European Conference on Computer Vision (ECCV)}, pages = {354--368}, title = {Attributes for classifier feedback}, year = {2012}, } @inproceedings{druck2009active, author = {Gregory Druck and Burr Settles and Andrew McCallum}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, pages = {81--90}, title = {Active learning by labeling features}, year = {2009}, } @inproceedings{raghavan2005interactive, author = {Hema Raghavan and Omid Madani and Rosie Jones}, booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)}, pages = {841--846}, title = {InterActive Feature Selection}, volume = {5}, year = {2005}, } @article{mann2010generalized, author = {Gideon S Mann and Andrew McCallum}, journal = {Journal of machine learning research}, number = {0}, pages = {955--984}, title = {Generalized expectation criteria for semi-supervised learning with weakly labeled data}, volume = {11}, year = {2010}, } @manual{maccartney2015sippy, author = {Bill MacCartney}, howpublished = {\url{https://github.com/wcmac/sippycup}}, title = {SippyCup}, year = {2015}, } @article{younger1967recognition, author = {Daniel H Younger}, journal = {Information and control}, number = {2}, pages = {189--208}, title = {Recognition and parsing of context-free languages in time n3}, volume = {10}, year = {1967}, } @inproceedings{ratner2016data, author = {Alexander J Ratner and Christopher M De Sa and Sen Wu and Daniel Selsam and Christopher R\'{e}}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {3567--3575}, title = {Data programming: Creating large training sets, quickly}, year = {2016}, } @inproceedings{bach17structure, author = {Bach, Stephen H. 
and He, Bryan and Ratner, Alexander and R{\'e}, Christopher},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Learning the Structure of Generative Models without Labeled Data},
  year = {2017},
}

@inproceedings{corney2016million,
  author = {David Corney and Dyaa Albakour and Miguel Martinez-Alvarez and Samir Moussa},
  booktitle = {NewsIR@ECIR},
  pages = {42--47},
  title = {What do a million news articles look like?},
  year = {2016},
}

@inproceedings{wei2015overview,
  author = {Chih-Hsuan Wei and Yifan Peng and Robert Leaman and Allan Peter Davis and Carolyn J Mattingly and Jiao Li and Thomas C Wiegers and Zhiyong Lu},
  booktitle = {Proceedings of the Fifth BioCreative Challenge Evaluation Workshop},
  pages = {154--166},
  title = {Overview of the {BioCreative} {V} chemical disease relation ({CDR}) task},
  year = {2015},
}

@inproceedings{srivastava2017joint,
  author = {Shashank Srivastava and Igor Labutov and Tom Mitchell},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1528--1537},
  title = {Joint concept learning and semantic parsing from natural language explanations},
  year = {2017},
}

@inproceedings{ling2017teaching,
  author = {Huan Ling and Sanja Fidler},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Teaching Machines to Describe Images via Natural Language Feedback},
  year = {2017},
}

@article{li2016learning,
  author = {Jiwei Li and Alexander H Miller and Sumit Chopra and Marc'Aurelio Ranzato and Jason Weston},
  journal = {arXiv preprint arXiv:1612.04936},
  title = {Learning Through Dialogue Interactions},
  year = {2016},
}

@article{andreas2017learning,
  author = {Jacob Andreas and Dan Klein and Sergey Levine},
  journal = {arXiv preprint arXiv:1711.00482},
  title = {Learning with Latent Language},
  year = {2017},
}

@inproceedings{weston2016dialog,
  author = {Jason E Weston},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {829--837},
  title = {Dialog-based
language learning},
  year = {2016},
}

% Lowercase particle, surname first: "Luis Von Ahn" is parsed with surname "Ahn".
@inproceedings{von2006peekaboom,
  author = {von Ahn, Luis and Ruoran Liu and Manuel Blum},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  pages = {55--64},
  title = {{Peekaboom}: a game for locating objects in images},
  year = {2006},
}

@article{krening2017learning,
  author = {Samantha Krening and Brent Harrison and Karen M Feigh and Charles Lee Isbell and Mark Riedl and Andrea Thomaz},
  journal = {IEEE Transactions on Cognitive and Developmental Systems},
  number = {1},
  pages = {44--55},
  title = {Learning from explanations using sentiment and advice in {RL}},
  volume = {9},
  year = {2017},
}

@article{guidotti2018survey,
  author = {Riccardo Guidotti and Anna Monreale and Franco Turini and Dino Pedreschi and Fosca Giannotti},
  journal = {arXiv preprint arXiv:1802.01933},
  title = {A Survey Of Methods For Explaining Black Box Models},
  year = {2018},
}

@inproceedings{yessenalina2010automatically,
  author = {Ainur Yessenalina and Yejin Choi and Claire Cardie},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {336--341},
  title = {Automatically generating annotator rationales to improve sentiment classification},
  year = {2010},
}

@inproceedings{arora2009interactive,
  author = {Shilpa Arora and Eric Nyberg},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {55--60},
  title = {Interactive annotation learning with indirect feature voting},
  year = {2009},
}

@article{grechkin2017ezlearn,
  author = {Maxim Grechkin and Hoifung Poon and Bill Howe},
  journal = {arXiv preprint arXiv:1709.08600},
  title = {{EZLearn}: Exploiting Organic Supervision in Large-Scale Data Annotation},
  year = {2017},
}

@inproceedings{bothe2017dialogue,
  author = {Chandrakant Bothe and Sven Magg and Cornelius Weber and Stefan Wermter},
  booktitle = {International Conference on Artificial Neural Networks (ICANN)},
  pages = {477--485},
  title = {Dialogue-Based Neural Learning to Estimate the Sentiment of a Next Upcoming
Utterance},
  year = {2017},
}

@inproceedings{hashimoto2018detecting,
  author = {Chikara Hashimoto and Manabu Sassano},
  booktitle = {World Wide Web (WWW)},
  pages = {147--156},
  title = {Detecting absurd conversations from intelligent assistant logs by exploiting user feedback utterances},
  year = {2018},
}

@article{zhang2018personalizing,
  author = {Saizheng Zhang and Emily Dinan and Jack Urbanek and Arthur Szlam and Douwe Kiela and Jason Weston},
  journal = {arXiv preprint arXiv:1801.07243},
  title = {Personalizing Dialogue Agents: {I} have a dog, do you have pets too?},
  year = {2018},
}

@article{zhang2017listen,
  author = {Haichao Zhang and Haonan Yu and Wei Xu},
  journal = {arXiv preprint arXiv:1705.09906},
  title = {Listen, Interact and Talk: Learning to Speak via Interaction},
  year = {2017},
}

@article{shuster2018engaging,
  author = {Kurt Shuster and Samuel Humeau and Hexiang Hu and Antoine Bordes and Jason Weston},
  journal = {arXiv preprint arXiv:1810.10665},
  title = {Engaging Image Captioning Via Personality},
  year = {2018},
}

@article{shuster2018imagechat,
  author = {Kurt Shuster and Samuel Humeau and Antoine Bordes and Jason Weston},
  journal = {arXiv preprint arXiv:1811.00945},
  title = {Engaging Image Chat: Modeling Personality in Grounded Dialogue},
  year = {2018},
}

@article{luo2018learning,
  author = {Liangchen Luo and Wenhao Huang and Qi Zeng and Zaiqing Nie and Xu Sun},
  journal = {arXiv preprint arXiv:1811.04604},
  title = {Learning Personalized End-to-End Goal-Oriented Dialog},
  year = {2018},
}

@article{rashkin2018know,
  author = {Hannah Rashkin and Eric Michael Smith and Margaret Li and Y-Lan Boureau},
  journal = {arXiv preprint arXiv:1811.00207},
  title = {{I} Know the Feeling: Learning to Converse with Empathy},
  year = {2018},
}

% Lowercase particle, surname first: "Harm De Vries" is parsed with surname "Vries".
@article{strub2017end,
  author = {Florian Strub and de Vries, Harm and Jeremie Mary and Bilal Piot and Aaron Courville and Olivier Pietquin},
  journal = {arXiv preprint arXiv:1703.05423},
  title = {End-to-end optimization of goal-driven and
visually grounded dialogue systems},
  year = {2017},
}

@article{wang2018questions,
  author = {Yansen Wang and Chenyi Liu and Minlie Huang and Liqiang Nie},
  journal = {arXiv preprint arXiv:1805.04843},
  title = {Learning to Ask Questions in Open-domain Conversational Systems with Typed Decoders},
  year = {2018},
}

% Surname-first form keeps "III" with the surname; "Hal Daume III" is parsed with surname "III".
@article{rao2018learning,
  author = {Sudha Rao and Daum{\'e} III, Hal},
  journal = {arXiv preprint arXiv:1805.04655},
  title = {Learning to Ask Good Questions: Ranking Clarification Questions using Neural Expected Value of Perfect Information},
  year = {2018},
}

@inproceedings{liu2018end,
  author = {Bing Liu and Ian Lane},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {67--73},
  title = {End-to-End Learning of Task-Oriented Dialogs},
  year = {2018},
}

@article{zhang2018interactive,
  author = {Haichao Zhang and Haonan Yu and Wei Xu},
  journal = {arXiv preprint arXiv:1805.00462},
  title = {Interactive Language Acquisition with One-shot Visual Concept Learning through a Conversational Game},
  year = {2018},
}

% Author spelling corrected: Amanpreet Singh.
@inproceedings{wang2019glue,
  author = {Alex Wang and Amanpreet Singh and Julian Michael and Felix Hill and Omer Levy and Samuel R Bowman},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {{GLUE}: A Multi-Task Benchmark and Analysis Platform for Natural Language Understanding},
  year = {2019},
}

@article{mccann2018natural,
  author = {Bryan McCann and Nitish Shirish Keskar and Caiming Xiong and Richard Socher},
  journal = {arXiv preprint arXiv:1806.08730},
  title = {The natural language decathlon: Multitask learning as question answering},
  year = {2018},
}

@article{conneau2018senteval,
  author = {Alexis Conneau and Douwe Kiela},
  journal = {arXiv preprint arXiv:1803.05449},
  title = {{SentEval}: An Evaluation Toolkit for Universal Sentence Representations},
  year = {2018},
}

@article{sanh2018hierarchical,
  author = {Victor Sanh and Thomas Wolf and Sebastian Ruder},
  journal = {arXiv preprint arXiv:1811.06031},
  title = {A
Hierarchical Multi-task Approach for Learning Embeddings from Semantic Tasks},
  year = {2018},
}

@article{werts1995instructive,
  author = {Margaret G Werts and Mark Wolery and Ariane Holcombe and David L Gast},
  journal = {Journal of Behavioral Education},
  number = {1},
  pages = {55--75},
  title = {Instructive feedback: Review of parameters and effects},
  volume = {5},
  year = {1995},
}

% The placeholder issue number 0 was dropped; journal name matches the other JMLR entries.
@article{tong2001support,
  author = {Simon Tong and Daphne Koller},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {45--66},
  title = {Support vector machine active learning with applications to text classification},
  volume = {2},
  year = {2001},
}

@article{schmidhuber1991learning,
  author = {Juergen Schmidhuber and Rudolf Huber},
  journal = {International Journal of Neural Systems},
  number = {1},
  pages = {125--134},
  title = {Learning to generate artificial fovea trajectories for target detection},
  volume = {2},
  year = {1991},
}

@inproceedings{pappu2013predicting,
  author = {Aasish Pappu and Alexander Rudnicky},
  booktitle = {Proceedings of the SIGDIAL 2013 Conference},
  pages = {242--250},
  title = {Predicting tasks in goal-oriented spoken dialog systems using semantic knowledge bases},
  year = {2013},
}

@article{schatzmann2006survey,
  author = {Jost Schatzmann and Karl Weilhammer and Matt Stuttle and Steve Young},
  journal = {The Knowledge Engineering Review},
  number = {2},
  pages = {97--126},
  title = {A survey of statistical user simulation techniques for reinforcement-learning of dialogue management strategies},
  volume = {21},
  year = {2006},
}

@article{serban2017deep,
  author = {Iulian V Serban and Chinnadhurai Sankar and Mathieu Germain and Saizheng Zhang and Zhouhan Lin and Sandeep Subramanian and Taesup Kim and Michael Pieper and Sarath Chandar and Nan Rosemary Ke and others},
  journal = {arXiv preprint arXiv:1709.02349},
  title = {A deep reinforcement learning chatbot},
  year = {2017},
}

@inproceedings{ratner2017snorkel,
  author = {Alexander Ratner and Stephen H Bach and
Henry Ehrenberg and Jason Fries and Sen Wu and Christopher R{\'e}},
  booktitle = {Very Large Data Bases (VLDB)},
  number = {3},
  pages = {269--282},
  title = {{Snorkel}: Rapid training data creation with weak supervision},
  year = {2017},
}

@article{dinan2018wizard,
  author = {Emily Dinan and Stephen Roller and Kurt Shuster and Angela Fan and Michael Auli and Jason Weston},
  journal = {arXiv preprint arXiv:1811.01241},
  title = {Wizard of {Wikipedia}: Knowledge-Powered Conversational agents},
  year = {2018},
}

@article{bassiri2011interactional,
  author = {Mohammad Amin Bassiri},
  journal = {English Language and Literature Studies},
  number = {2},
  pages = {61--73},
  title = {Interactional feedback and the impact of attitude and motivation on noticing {L2} form},
  volume = {1},
  year = {2011},
}

@misc{burtsev2018convai2,
  author = {Mikhail Burtsev and Varvara Logacheva and Valentin Malykh and Ryan Lowe and Iulian Serban and Shrimai Prabhumoye and Emily Dinan and Douwe Kiela and Alexander Miller and Kurt Shuster and Arthur Szlam and Jack Urbanek and Jason Weston},
  title = {The Conversational Intelligence Challenge 2 ({ConvAI2})},
  year = {2018},
}

@article{kruger1999unskilled,
  author = {Justin Kruger and David Dunning},
  journal = {Journal of Personality and Social Psychology},
  number = {6},
  pages = {1121--1134},
  title = {Unskilled and unaware of it: how difficulties in recognizing one's own incompetence lead to inflated self-assessments},
  volume = {77},
  year = {1999},
}

@misc{paszke2017automatic,
  author = {Adam Paszke and Sam Gross and Soumith Chintala and Gregory Chanan and Edward Yang and Zachary DeVito and Zeming Lin and Alban Desmaison and Luca Antiga and Adam Lerer},
  title = {Automatic differentiation in {PyTorch}},
  year = {2017},
}

@techreport{radford2018improving,
author = {Alec Radford and Karthik Narasimhan and Tim Salimans and Ilya Sutskever}, institution = {OpenAI}, title = {Improving language understanding by generative pre-training}, year = {2018}, } @article{rieser2011reinforcement, author = {Verena Rieser and Oliver Lemon}, journal = {Springer Science \& Business Media}, title = {Reinforcement learning for adaptive dialogue systems: a data-driven methodology for dialogue management and natural language generation}, year = {2011}, } @techreport{ross2009turkers, author = {Joel Ross and Andrew Zaldivar and Lilly Irani and Bill Tomlinson}, institution = {Department of Informatics, University of California, Irvine}, title = {Who are the turkers? worker demographics in amazon mechanical turk}, year = {2009}, } @inproceedings{silver2013lifelong, author = {Daniel L Silver and Qiang Yang and Lianghao Li}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {Lifelong Machine Learning Systems: Beyond Learning Algorithms}, volume = {13}, year = {2013}, } @article{bojanowski2017enriching, author = {Piotr Bojanowski and Edouard Grave and Armand Joulin and Tomas Mikolov}, journal = {Transactions of the Association for Computational Linguistics (TACL)}, pages = {135--146}, title = {Enriching word vectors with subword information}, volume = {5}, year = {2017}, } @inproceedings{kinga2015method, author = {Diederik P. 
Kingma and Jimmy Ba},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {{Adam}: A method for stochastic optimization},
  year = {2015},
}

% Plain apostrophe in Marc'Aurelio: a backslash-apostrophe is the acute-accent command and puts an accent on the A.
@inproceedings{li2017dialogue,
  author = {Jiwei Li and Alexander H Miller and Sumit Chopra and Marc'Aurelio Ranzato and Jason Weston},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Dialogue learning with human-in-the-loop},
  year = {2017},
}

@inproceedings{li2017learning,
  author = {Jiwei Li and Alexander H Miller and Sumit Chopra and Marc'Aurelio Ranzato and Jason Weston},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Learning through dialogue interactions by asking questions},
  year = {2017},
}

@inproceedings{luan2017multi,
  author = {Yi Luan and Chris Brockett and Bill Dolan and Jianfeng Gao and Michel Galley},
  booktitle = {Association for Computational Linguistics and International Joint Conference on Natural Language Processing (ACL-IJCNLP)},
  pages = {605--614},
  title = {Multi-Task Learning for Speaker-Role Adaptation in Neural Conversation Models},
  volume = {1},
  year = {2017},
}

@inproceedings{mazare2018training,
  author = {Pierre-Emmanuel Mazar{\'e} and Samuel Humeau and Martin Raison and Antoine Bordes},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {2775--2779},
  title = {Training Millions of Personalized Dialogue Agents},
  year = {2018},
}

@inproceedings{miller2017parlai,
  author = {Alexander H Miller and Will Feng and Adam Fisch and Jiasen Lu and Dhruv Batra and Antoine Bordes and Devi Parikh and Jason Weston},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {79--84},
  title = {{ParlAI}: A Dialog Research Software Platform},
  year = {2017},
}

% First author is Lev (not Lee) Ratinov; given names spelled out.
@inproceedings{ratinov2011local,
  author = {Lev Ratinov and Dan Roth and Doug Downey and Mike
Anderson},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Local and Global Algorithms for Disambiguation to {Wikipedia}},
  year = {2011},
}

@article{kalyanpur2012structured,
  author = {Aditya Kalyanpur and Branimir K. Boguraev and Siddharth Patwardhan and J. William Murdock and Adam Lally and Christopher A. Welty and John M. Prager and Bonaventura Coppola and Achille Fokoue-Nkoutche and Lei Zhang and Yue Pan and Zhao Ming Qiu},
  journal = {{IBM} Journal of Research and Development},
  pages = {351--364},
  title = {Structured data and inference in {DeepQA}},
  volume = {56},
  year = {2012},
}

% Conference papers: the meeting name belongs in booktitle of an inproceedings entry.
@inproceedings{lee2015conversational,
  author = {Kyusong Lee and Paul Hongsuck Seo and Junhwi Choi and Sangjun Koo and Gary Geunbae Lee},
  booktitle = {16th Annual Meeting of the Special Interest Group on Discourse and Dialogue},
  pages = {139--143},
  title = {Conversational knowledge teaching agent that uses a knowledge base},
  year = {2015},
}

@inproceedings{han2015exploiting,
  author = {Sangdo Han and Jeesoo Bang and Seonghan Ryu and Gary Geunbae Lee},
  booktitle = {16th Annual Meeting of the Special Interest Group on Discourse and Dialogue},
  pages = {129--133},
  title = {Exploiting knowledge base to generate responses for natural language dialog listening agents},
  year = {2015},
}

% A consortium document, not a journal article: the issuing body goes in institution.
@techreport{ellis2015tackbp,
  author = {Joe Ellis and Jeremy Getman and Heather Simpson and Kira Griffitt and Hoa Trang Dang and Ralph Grishman and Heng Ji and Catherine DePrince and Thomas Riese and Neil Kuster},
  institution = {Linguistic Data Consortium},
  title = {{TAC} {KBP} 2015 Slot Descriptions},
  year = {2015},
}

@inproceedings{aslam2006statistical,
  author = {Javed A.
Aslam and Virgil Pavlu and Emine Yilmaz},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  pages = {541--548},
  title = {A statistical method for system evaluation using incomplete judgments},
  year = {2006},
}

@inproceedings{buckley2007bias,
  author = {Chris Buckley and Darrin Dimmick and Ian Soboroff and Ellen Voorhees},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {Bias and the limits of pooling for large collections},
  year = {2007},
}

@inproceedings{buckley2004incomplete,
  author = {Chris Buckley and Ellen M. Voorhees},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  pages = {25--32},
  title = {Retrieval evaluation with incomplete information},
  year = {2004},
}

% Journal article (Information Retrieval 11(5)), not a SIGIR paper; the page range 447--470 is the journal's.
@article{sakai2008information,
  author = {Tetsuya Sakai and Noriko Kando},
  journal = {Information Retrieval},
  number = {5},
  pages = {447--470},
  title = {On information retrieval metrics designed for evaluation with incomplete relevance assessments},
  volume = {11},
  year = {2008},
}

@inproceedings{cormack1998efficient,
  author = {Gordon V Cormack and Christopher R Palmer and Charles L A Clarke},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {Efficient Construction of Large Test Collections},
  year = {1998},
}

@inproceedings{yilmaz2008simple,
  author = {Emine Yilmaz and Evangelos Kanoulas and Javed A Aslam},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  pages = {603--610},
  title = {A simple and efficient sampling method for estimating {AP} and {NDCG}},
  year = {2008},
}

@inproceedings{vannella2014validating,
  author = {Daniele Vannella and David Jurgens and Daniele Scarfini and Domenico Toscani and Roberto Navigli},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {1294--1304},
  title = {Validating and Extending Semantic Knowledge Bases using Video Games with a Purpose},
  year = {2014},
}

@inproceedings{pavlick2016gun,
  author =
{Ellie Pavlick and Heng Ji and Xiaoman Pan and Chris Callison-Burch},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1018--1024},
  title = {The Gun Violence Database: A new task and data set for {NLP}},
  year = {2016},
}

@phdthesis{webber2010measurement,
  author = {William Edward Webber},
  school = {University of Melbourne},
  title = {Measurement in Information Retrieval Evaluation},
  year = {2010},
}

@inproceedings{zobel1998reliable,
  author = {Justin Zobel},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {How reliable are the results of large-scale information retrieval experiments?},
  year = {1998},
}

@inproceedings{voorhees1999overview,
  author = {Ellen M. Voorhees and Donna Harman},
  booktitle = {{TREC-8}},
  title = {Overview of the Eighth Text {REtrieval} Conference ({TREC-8})},
  year = {1999},
}

@inproceedings{adel2016comparing,
  author = {Heike Adel and Benjamin Roth and Hinrich Sch{\"u}tze},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  title = {Comparing Convolutional Neural Networks to Traditional Models for Slot Filling},
  year = {2016},
}

% Self-published online book: typed as misc with its URL instead of a book with an empty publisher.
% NOTE(review): confirm the URL is the author's current location for the text.
@misc{owen2013monte,
  author = {Art B. Owen},
  howpublished = {\url{https://artowen.su.domains/mc/}},
  title = {{Monte Carlo} theory, methods and examples},
  year = {2013},
}

% Technical report: the exporter had split the title into the journal field and left the quotation unclosed.
% NOTE(review): confirm institution against the original report (British Library R and D Report 5266).
@techreport{sparck1975report,
  author = {Sp{\"a}rck Jones, Karen and van Rijsbergen, C. J.},
  institution = {Computer Laboratory, University of Cambridge},
  title = {Report on the Need for and Provision of an ``Ideal'' Information Retrieval Test Collection},
  year = {1975},
}

@article{harman1993trec,
  author = {Donna K.
Harman},
  journal = {Information Processing and Management},
  pages = {411--414},
  title = {The first text retrieval conference ({TREC-1}) {Rockville, MD, U.S.A.}, 4--6 {November}, 1992},
  volume = {29},
  year = {1993},
}

% TAC is the Text Analysis Conference; the author is written as in the other entries citing Hoa Trang Dang.
@inproceedings{ji2011kbp,
  author = {Heng Ji and Ralph Grishman and Hoa Trang Dang},
  booktitle = {Text Analysis Conference (TAC)},
  title = {Overview of the {TAC} 2011 Knowledge Base Population Track},
  year = {2011},
}

% Edition moved out of the title into its own field.
@book{burden1985bisection,
  author = {Richard L. Burden and J. Douglas Faires},
  edition = {Third},
  publisher = {PWS Publishers},
  title = {Numerical Analysis},
  year = {1985},
}

@inproceedings{liu2016effective,
  author = {Angli Liu and Stephen Soderland and Jonathan Bragg and Christopher H Lin and Xiao Ling and Daniel S Weld},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {897--906},
  title = {Effective Crowd Annotation for Relation Extraction},
  year = {2016},
}

% Workshop papers: the meeting name belongs in booktitle of an inproceedings entry.
@inproceedings{dang2016kbp,
  author = {Hoa Trang Dang},
  booktitle = {Text Analysis Conference (TAC)},
  title = {Cold Start Knowledge Base Population at {TAC} {KBP} 2016},
  year = {2016},
}

@inproceedings{ellis2016overview,
  author = {Joe Ellis and Jeremy Getman and Dana Fore and Neil Kuster and Zhiyi Song and Ann Bies and Stephanie Strassel},
  booktitle = {Text Analysis Conference (TAC)},
  title = {Overview of linguistic resources for the {TAC} {KBP} 2016 evaluations: Methodologies and results},
  year = {2016},
}

@article{ellis2012kbp,
  author = {Joe Ellis and Xuansong Li and Kira Griffitt and Stephanie M.
Strassel},
  journal = {Text Analysis Conference (TAC)},
  title = {Linguistic Resources for 2012 Knowledge Base Population Evaluations},
  year = {2012},
}

@article{plank16nonstandard,
  author = {Barbara Plank},
  journal = {arXiv},
  title = {What to do about non-standard (or non-canonical) language in {NLP}},
  year = {2016},
}

@inproceedings{novikova2017why,
  author = {Jekaterina Novikova and Ond{\v{r}}ej Du{\v{s}}ek and Amanda Cercas Curry and Verena Rieser},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Why We Need New Evaluation Metrics for {NLG}},
  year = {2017},
}

% Single-author paper: "Marina Rey" was the affiliation city (Marina del Rey) mis-read as a co-author.
@inproceedings{lin2004rouge,
  author = {Chin-Yew Lin},
  booktitle = {NTCIR Workshop},
  title = {Looking for a Few Good Metrics: {ROUGE} and its Evaluation},
  year = {2004},
}

@inproceedings{cohan2016revisiting,
  author = {Arman Cohan and Nazli Goharian},
  booktitle = {Language Resources and Evaluation Conference (LREC)},
  title = {Revisiting Summarization Evaluation for Scientific Articles},
  year = {2016},
}

@article{lavie2009meteor,
  author = {Alon Lavie and Michael Denkowski},
  journal = {Machine Translation},
  title = {The {Meteor} Metric for Automatic Evaluation of Machine Translation},
  volume = {23},
  year = {2009},
}

@inproceedings{denkowski2014meteor,
  author = {Michael Denkowski and Alon Lavie},
  booktitle = {Workshop on Statistical Machine Translation},
  title = {{Meteor} {Universal}: Language Specific Translation Evaluation for Any Target Language},
  year = {2014},
}

@inproceedings{vedantam2015cider,
  author = {Ramakrishna Vedantam and C. Lawrence Zitnick and Devi Parikh},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {4566--4575},
  title = {{CIDEr}: Consensus-based image description evaluation},
  year = {2015},
}

@article{miller1956psychological,
  author = {George A. Miller and J. G.
Beebe-Center},
  journal = {Mechanical Translation},
  pages = {73--80},
  title = {Some Psychological Methods for Evaluating the Quality of Translations},
  volume = {3},
  year = {1956},
}

@article{lau2017grammaticality,
  author = {Jey Han Lau and Alexander Clark and Shalom Lappin},
  journal = {Cognitive Science},
  pages = {1202--1241},
  title = {Grammaticality, Acceptability, and Probability: A Probabilistic View of Linguistic Knowledge},
  volume = {41},
  year = {2017},
}

@inproceedings{see2017point,
  author = {Abigail See and Peter J. Liu and Christopher D. Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Get To The Point: Summarization with Pointer-Generator Networks},
  year = {2017},
}

@inproceedings{paulus2018deep,
  author = {Romain Paulus and Caiming Xiong and Richard Socher},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {A Deep Reinforced Model for Abstractive Summarization},
  year = {2018},
}

@inproceedings{lin2014microsoft,
  author = {Tsung-Yi Lin and Michael Maire and Serge Belongie and James Hays
    and Pietro Perona and Deva Ramanan and Piotr Doll{\'a}r and C.
Lawrence Zitnick},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages = {740--755},
  title = {{Microsoft} {COCO}: Common objects in context},
  year = {2014},
}

@inproceedings{conroy2008mind,
  author = {John M Conroy and Hoa Trang Dang},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages = {145--152},
  title = {Mind the Gap: Dangers of Divorcing Evaluations of Summary Content from Linguistic Quality},
  year = {2008},
}

@inproceedings{snover2006ter,
  author = {Matthew Snover and Bonnie Dorr and Richard Schwartz and Linnea Micciulla and John Makhoul},
  booktitle = {Association for Machine Translation in the Americas},
  pages = {223--231},
  title = {A Study of Translation Edit Rate with Targeted Human Annotation},
  year = {2006},
}

% The pages field was dropped: its value 223--231 duplicated the preceding entry (snover2006ter).
% NOTE(review): restore the correct range from the EMNLP 2017 proceedings.
@inproceedings{chang2017affordable,
  author = {Cheng Chang and Runzhe Yang and Lu Chen and Xiang Zhou and Kai Yu},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Affordable On-Line Dialogue Policy Learning},
  year = {2017},
}

@inproceedings{dang2006overview,
  author = {Hoa Trang Dang},
  booktitle = {Document Understanding Conference},
  title = {Overview of {DUC} 2006},
  year = {2006},
}

@inproceedings{tan2018s,
  author = {Chuanqi Tan and Furu Wei and Nan Yang and Weifeng Lv and Ming Zhou},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {{S-Net}: From answer extraction to answer generation for machine reading comprehension},
  year = {2018},
}

@article{pagliardini2017unsupervised,
  author = {Matteo Pagliardini and Prakhar Gupta and Martin Jaggi},
  journal = {arXiv},
  title = {Unsupervised learning of sentence embeddings using compositional n-gram features},
  year = {2017},
}

@inproceedings{passonneau2014benefits,
  author = {Rebecca J.
Passonneau and Bob Carpenter},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {The Benefits of a Model of Annotation},
  year = {2014},
}

@inproceedings{lowe2017towards,
  author = {Ryan Lowe and Michael Noseworthy and Iulian V. Serban and Nicolas Angelard-Gontier and Yoshua Bengio and Joelle Pineau},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Towards an Automatic Turing Test: Learning to Evaluate Dialogue Responses},
  year = {2017},
}

@article{dusek2017referenceless,
  author = {Ondrej Dusek and Jekaterina Novikova and Verena Rieser},
  journal = {arXiv},
  title = {Referenceless Quality Estimation for Natural Language Generation},
  year = {2017},
}

@article{novikova2016crowd,
  author = {Jekaterina Novikova and Oliver Lemon and Verena Rieser},
  journal = {arXiv},
  title = {Crowd-sourcing {NLG} data: Pictures elicit better data},
  year = {2016},
}

@inproceedings{mnih2008empirical,
  author = {Volodymyr Mnih and Csaba Szepesv{\'a}ri and Jean-Yves Audibert},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Empirical {Bernstein} stopping},
  year = {2008},
}

@article{luhn1958automatic,
  author = {Henry P. Luhn},
  journal = {{IBM} Journal of Research and Development},
  pages = {159--165},
  title = {The Automatic Creation of Literature Abstracts},
  volume = {2},
  year = {1958},
}

@inproceedings{passonneau2005applying,
  author = {Rebecca J. Passonneau and Ani Nenkova and Kathleen McKeown and Sergey Sigelman},
  booktitle = {Document Understanding Conference},
  title = {Applying the pyramid method in {DUC} 2005},
  year = {2005},
}

@article{brandow1995automatic,
  author = {Ronald Brandow and Karl Mitze and Lisa F.
Rau},
  journal = {Information Processing and Management},
  pages = {675--685},
  title = {Automatic condensation of electronic publications by sentence selection},
  volume = {31},
  year = {1995},
}

@inproceedings{mani1999tipster,
  author = {Inderjeet Mani and Gary Klein and Lynette Hirschman and Therese Firmin and David House and Beth Sundheim},
  booktitle = {European Association for Computational Linguistics (EACL)},
  title = {The {TIPSTER} {SUMMAC} text summarization evaluation},
  year = {1999},
}

@inproceedings{mckeown2005summaries,
  author = {Kathleen McKeown and Rebecca J Passonneau and David K Elson and Julia Hirschberg},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {Do Summaries Help? A Task-Based Evaluation of Multi-Document Summarization},
  year = {2005},
}

@inproceedings{white1994arpa,
  author = {John White and Theresa O'Connell and Francis O'Mara},
  booktitle = {First Conference of the Association for Machine Translation in the Americas},
  title = {The {ARPA} {MT} evaluation methodologies: evaluation, lessons, and future approaches},
  year = {1994},
}

@inproceedings{toutanova2016dataset,
  author = {Kristina Toutanova and Chris Brockett},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {340--350},
  title = {A Dataset and Evaluation Metrics for Abstractive Compression of Sentences and Short Paragraphs},
  year = {2016},
}

@inproceedings{culy2003limits,
  author = {Christopher Culy and Susanne Z Riehemann},
  booktitle = {MT Summit IX},
  pages = {71--78},
  title = {The Limits of n-gram Translation Evaluation Metrics},
  year = {2003},
}

@inproceedings{vanhalteren2003factoid,
  author = {Hans Van Halteren and Simone Teufel},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages = {57--64},
  title = {Examining the consensus between human summaries: initial experiments with factoid analysis},
  year = {2003},
}

@inproceedings{kumar2009attribute,
  author =
{Neeraj Kumar and Alexander C Berg and Peter N Belhumeur and Shree K Nayar},
  booktitle = {International Conference on Computer Vision (ICCV)},
  pages = {365--372},
  title = {Attribute and simile classifiers for face verification},
  year = {2009},
}

@book{casella1990statistical,
  author = {George Casella and Roger L. Berger},
  publisher = {Wadsworth and Brooks},
  title = {Statistical Inference},
  year = {1990},
}

@article{recht2018cifar,
  author = {Benjamin Recht and Rebecca Roelofs and Ludwig Schmidt and Vaishaal Shankar},
  journal = {arXiv},
  title = {Do {CIFAR}-10 Classifiers Generalize to {CIFAR}-10?},
  year = {2018},
}

@phdthesis{mcclosky2010any,
  author = {David McClosky},
  school = {Brown University},
  title = {Any domain parsing: automatic domain adaptation for natural language parsing},
  year = {2010},
}

@inproceedings{foster2011news,
  author = {Jennifer Foster and Ozlem Cetinoglu and Joachim Wagner and Joseph Le Roux and Joakim Nivre and Deirdre Hogan and Josef van Genabith},
  booktitle = {Association for Computational Linguistics and International Joint Conference on Natural Language Processing (ACL-IJCNLP)},
  title = {From news to comment: Resources and benchmarks for parsing the language of {Web} 2.0},
  year = {2011},
}

@inproceedings{branson2017lean,
  author = {Steve Branson and Grant Van Horn and Pietro Perona},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {7474--7483},
  title = {Lean Crowdsourcing: Combining Humans and Machines in an Online System},
  year = {2017},
}

@inproceedings{ahn2004labeling,
  author = {Luis von Ahn and Laura A.
Dabbish},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Labeling images with a computer game},
  year = {2004},
}

@inproceedings{poesio2013phrase,
  author = {Massimo Poesio and Jon Chamberlain and Udo Kruschwitz and Livio Robaldo and Luca Ducceschi},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {Phrase {D}etectives: Utilizing collective intelligence for internet-scale language resource creation},
  year = {2013},
}

@inproceedings{krishna2016embracing,
  author = {Ranjay Krishna and Kenji Hata and Stephanie Chen and Joshua Kravitz and David A. Shamma and Li Fei-Fei and Michael S. Bernstein},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Embracing Error to Enable Rapid Crowdsourcing},
  year = {2016},
}

@inproceedings{christiano2017deep,
  author = {Paul Christiano and Jan Leike and Tom B. Brown and Miljan Martic and Shane Legg and Dario Amodei},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Deep Reinforcement Learning from Human Preferences},
  year = {2017},
}

@inproceedings{stanford2017kbp,
  author = {Arun Tejasvi Chaganty and Ashwin Paranjape and Jason Bolton and Matthew Lamm and Jinhao Lei and Abigail See and Kevin Clark and Yuhao Zhang and Peng Qi and Christopher D Manning},
  booktitle = {Text Analysis Conference},
  title = {Stanford at {TAC} {KBP} 2017: Building a Trilingual Relational Knowledge Graph},
  year = {2017},
}

@inproceedings{mayfield2012evaluating,
  author = {James Mayfield and Tim Finin},
  booktitle = {Joint Workshop on Automatic Knowledge Base Construction and Web-scale Knowledge Extraction},
  title = {Evaluating the quality of a knowledge base populated from text},
  year = {2012},
}

@inproceedings{paek2007toward,
  author = {Tim Paek},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Toward evaluation that leads to best practices: reconciling dialog evaluation in research and
industry},
  year = {2007},
}

@phdthesis{plank2011domain,
  author = {Barbara Plank},
  school = {University of Groningen},
  title = {Domain adaptation for parsing},
  year = {2011},
}

@article{weiss2016survey,
  author = {Karl Weiss and Taghi M Khoshgoftaar and DingDing Wang},
  journal = {Journal of Big Data},
  title = {A survey of transfer learning},
  volume = {3},
  year = {2016},
}

@article{pierce1970whither,
  author = {J. R. Pierce},
  journal = {Journal of the Acoustical Society of America},
  pages = {1616--1617},
  title = {Whither Speech Recognition?},
  volume = {47},
  year = {1970},
}

@article{salton1965smart,
  author = {Gerard Salton and Michael E. Lesk},
  journal = {Communications of the ACM},
  number = {6},
  pages = {391--398},
  title = {The {SMART} automatic document retrieval systems---an illustration},
  volume = {8},
  year = {1965},
}

@inproceedings{cleverdon1962report,
  author = {Cyril W. Cleverdon},
  booktitle = {{ASLIB}},
  title = {Report on the testing and analysis of an investigation into the comparative efficiency of indexing systems},
  year = {1962},
}

@inproceedings{cleverdon1967cranfield,
  author = {Cyril W. Cleverdon},
  booktitle = {{ASLIB}},
  title = {The Cranfield tests on index language devices},
  year = {1967},
}

@inproceedings{harman1992overview,
  author = {D. K. Harman},
  booktitle = {Text Retrieval Conference},
  title = {Overview of the first {TREC} Text Retrieval Conference},
  year = {1992},
}

@article{voorhees2007trec,
  author = {Ellen M.
Voorhees},
  journal = {Communications of the ACM},
  number = {11},
  pages = {51--54},
  title = {{TREC}: Continuing Information Retrieval's Tradition of Experimentation},
  volume = {50},
  year = {2007},
}

@article{lane2016genome,
  author = {Jacqueline M Lane and Irma Vlasac and Simon G Anderson and Simon D Kyle and William G Dixon and David A Bechtold and Shubhroz Gill and Max A Little and Annemarie Luik and Andrew Loudon and others},
  journal = {Nature Communications},
  title = {Genome-wide association analysis identifies novel loci for chronotype in 100,420 individuals from the {UK} Biobank},
  volume = {7},
  year = {2016},
}

@article{wain2015novel,
  author = {Louise V Wain and Nick Shrine and Suzanne Miller and Victoria E Jackson and Ioanna Ntalla and Maria Soler Artigas and Charlotte K Billington and Abdul Kader Kheirallah and Richard Allen and James P Cook and others},
  journal = {The Lancet Respiratory Medicine},
  number = {10},
  pages = {769--781},
  title = {Novel insights into the genetics of smoking behaviour, lung function, and chronic obstructive pulmonary disease ({UK} {B}iLEVE): a genetic association study in {UK} {B}iobank},
  volume = {3},
  year = {2015},
}

@article{o2012multiphen,
  author = {Paul F O'Reilly and Clive J Hoggart and Yotsawat Pomyen and Federico CF Calboli and Paul Elliott and Marjo-Riitta Jarvelin and Lachlan JM Coin},
  journal = {PloS One},
  number = {5},
  title = {Multi{P}hen: joint model of multiple phenotypes can increase discovery in {GWAS}},
  volume = {7},
  year = {2012},
}

@article{rossol2012cd14brightcd16,
  author = {Manuela Rossol and Stephan Kraus and Matthias Pierer and Christoph Baerwald and Ulf Wagner},
  journal = {Arthritis \& Rheumatology},
  number = {3},
  pages = {671--677},
  title = {The {CD}14bright{CD}16+ monocyte subset is expanded in rheumatoid arthritis and promotes expansion of the {T}h17 cell population},
  volume = {64},
  year = {2012},
}

@article{milovanovic2004relationships,
  author = {Micha Milovanovic and E Nilsson and Petter J{\"a}remo},
journal = {Clinica {C}himica {A}cta},
  number = {1},
  pages = {237--240},
  title = {Relationships between platelets and inflammatory markers in rheumatoid arthritis},
  volume = {343},
  year = {2004},
}

@article{maddison2016concrete,
  author = {Chris J Maddison and Andriy Mnih and Yee Whye Teh},
  journal = {arXiv preprint arXiv:1611.00712},
  title = {The concrete distribution: A continuous relaxation of discrete random variables},
  year = {2016},
}

@article{abid2018exploring,
  author = {Abubakar Abid and Martin J Zhang and Vivek K Bagaria and James Zou},
  journal = {Nature Communications},
  number = {1},
  title = {Exploring patterns enriched in a dataset with contrastive principal component analysis},
  volume = {9},
  year = {2018},
}

@article{perez2022red,
  author = {Ethan Perez and Saffron Huang and Francis Song and Trevor Cai and Roman Ring and John Aslanides and Amelia Glaese and Nat McAleese and Geoffrey Irving},
  journal = {arXiv preprint arXiv:2202.03286},
  title = {Red Teaming Language Models with Language Models},
  year = {2022},
}

@article{hemmatian2022debiased,
  author = {Babak Hemmatian and Lav R.
Varshney},
  journal = {arXiv preprint arXiv:2208.04417},
  title = {Debiased Large Language Models Still Associate Muslims with Uniquely Violent Acts},
  year = {2022},
}

@article{lewkowycz2022solving,
  author = {Aitor Lewkowycz and Anders Andreassen and David Dohan and Ethan Dyer and Henryk Michalewski and Vinay Ramasesh and Ambrose Slone and Cem Anil and Imanol Schlag and Theo Gutman-Solo and Yuhuai Wu and Behnam Neyshabur and Guy Gur-Ari and Vedant Misra},
  journal = {arXiv preprint arXiv:2206.14858},
  title = {Solving Quantitative Reasoning Problems with Language Models},
  year = {2022},
}

@article{li2022alphacode,
  author = {Yujia Li and David Choi and Junyoung Chung and Nate Kushman and Julian Schrittwieser and R{\'e}mi Leblond and Tom Eccles and James Keeling and Felix Gimeno and Agustin Dal Lago and Thomas Hubert and Peter Choy and Cyprien de Masson d'Autume and Igor Babuschkin and Xinyun Chen and Po-Sen Huang and Johannes Welbl and Sven Gowal and Alexey Cherepanov and James Molloy and Daniel J. Mankowitz and Esme Sutherland Robson and Pushmeet Kohli and Nando de Freitas and Koray Kavukcuoglu and Oriol Vinyals},
  journal = {arXiv preprint arXiv:2203.07814},
  title = {Competition-Level Code Generation with {AlphaCode}},
  year = {2022},
}

@inproceedings{hoffmann2022chinchilla,
  author = {Jordan Hoffmann and Sebastian Borgeaud and Arthur Mensch and Elena Buchatskaya and Trevor Cai and Eliza Rutherford and Diego de Las Casas and Lisa Anne Hendricks and Johannes Welbl and Aidan Clark and Tom Hennigan and Eric Noland and Katie Millican and George van den Driessche and Bogdan Damoc and Aurelia Guy and Simon Osindero and Karen Simonyan and Erich Elsen and Jack W.
Rae and Oriol Vinyals and Laurent Sifre},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {An Empirical Analysis of Compute-Optimal Large Language Model Training},
  year = {2022},
}

@inproceedings{yang2021fudge,
  author = {Kevin Yang and Dan Klein},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {{FUDGE}: Controlled Text Generation With Future Discriminators},
  year = {2021},
}

@inproceedings{liu2021dexperts,
  author = {Alisa Liu and Maarten Sap and Ximing Lu and Swabha Swayamdipta and Chandra Bhagavatula and Noah A. Smith and Yejin Choi},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {{DExperts}: Decoding-Time Controlled Text Generation with Experts and Anti-Experts},
  year = {2021},
}

@inproceedings{krause2021gedi,
  author = {Ben Krause and Akhilesh Deepak Gotmare and Bryan McCann and Nitish Shirish Keskar and Shafiq Joty and Richard Socher and Nazneen Fatema Rajani},
  booktitle = {Findings of Empirical Methods in Natural Language Processing (Findings of EMNLP)},
  title = {{GeDi}: Generative Discriminator Guided Sequence Generation},
  year = {2021},
}

@inproceedings{sheng2020towards,
  author = {Emily Sheng and Kai-Wei Chang and Premkumar Natarajan and Nanyun Peng},
  booktitle = {Findings of Empirical Methods in Natural Language Processing (Findings of EMNLP)},
  title = {Towards Controllable Biases in Language Generation},
  year = {2020},
}

@inproceedings{dathathri2020plug,
  author = {Sumanth Dathathri and Andrea Madotto and Janice Lan and Jane Hung and Eric Frank and Piero Molino and Jason Yosinski and Rosanne Liu},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Plug and Play Language Models: A Simple Approach to Controlled Text Generation},
  year = {2020},
}

@inproceedings{qin2022cold,
  author = {Lianhui Qin and Sean Welleck and Daniel Khashabi and Yejin Choi},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title =
{{COLD} Decoding: Energy-based Constrained Text Generation with Langevin Dynamics},
  year = {2022},
}

@inproceedings{kumar2021controlled,
  author = {Sachin Kumar and Eric Malmi and Aliaksei Severyn and Yulia Tsvetkov},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Controlled Text Generation as Continuous Optimization with Multiple Constraints},
  year = {2021},
}

@inproceedings{shin2020autoprompt,
  author = {Taylor Shin and Yasaman Razeghi and Robert L. Logan IV and Eric Wallace and Sameer Singh},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{AutoPrompt}: Eliciting Knowledge from Language Models with Automatically Generated Prompts},
  year = {2020},
}

@inproceedings{guo2021gradient,
  author = {Chuan Guo and Alexandre Sablayrolles and Herv{\'e} J{\'e}gou and Douwe Kiela},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Gradient-based Adversarial Attacks against Text Transformers},
  year = {2021},
}

@article{nijkamp2022codegen,
  author = {Erik Nijkamp and Bo Pang and Hiroaki Hayashi and Lifu Tu and Huan Wang and Yingbo Zhou and Silvio Savarese and Caiming Xiong},
  journal = {arXiv preprint arXiv:2203.13474},
  title = {A Conversational Paradigm for Program Synthesis},
  year = {2022},
}

@article{steinhardt2022anchor,
  author = {Jacob Steinhardt},
  journal = {Bounded Regret},
  title = {Anchor Weights for {ML}},
  year = {2022},
}

@article{herrmann2011effect,
  author = {Andreas Herrmann and Daniel G. Goldstein and Rupert Stadler and Jan R.
Landwehr and Mark Heitmann and Reto Hofstetter and Frank Huber},
  journal = {Journal of Retailing and Consumer Services},
  number = {6},
  pages = {483--491},
  title = {The effect of default options on choice---Evidence from online product configurators},
  volume = {18},
  year = {2011},
}

@article{thoppilan2022lambda,
  author = {Romal Thoppilan and Daniel De Freitas and Jamie Hall and Noam Shazeer and Apoorv Kulshreshtha and Heng-Tze Cheng and Alicia Jin and Taylor Bos and Leslie Baker and Yu Du and YaGuang Li and Hongrae Lee and Huaixiu Steven Zheng and Amin Ghafouri and Marcelo Menegali and Yanping Huang and Maxim Krikun and Dmitry Lepikhin and James Qin and Dehao Chen and Yuanzhong Xu and Zhifeng Chen and Adam Roberts and Maarten Bosma and Yanqi Zhou and Chung-Ching Chang and Igor Krivokon and Will Rusch and Marc Pickett and Kathleen Meier-Hellstern and Meredith Ringel Morris and Tulsee Doshi and Renelito Delos Santos and Toju Duke and Johnny Soraker and Ben Zevenbergen and Vinodkumar Prabhakaran and Mark Diaz and Ben Hutchinson and Kristen Olson and Alejandra Molina and Erin Hoffman-John and Josh Lee and Lora Aroyo and Ravi Rajakumar and Alena Butryna and Matthew Lamm and Viktoriya Kuzmina and Joe Fenton and Aaron Cohen and Rachel Bernstein and Ray Kurzweil and Blaise Aguera-Arcas and Claire Cui and Marian Croak and Ed Chi and Quoc Le},
  journal = {arXiv preprint arXiv:2201.08239},
  title = {{LaMDA}: Language Models for Dialog Applications},
  year = {2022},
}

@article{liu2021what,
  author = {Jiachang Liu and Dinghan Shen and Yizhe Zhang and Bill Dolan and Lawrence Carin and Weizhu Chen},
  journal = {arXiv preprint arXiv:2101.06804},
  title = {What Makes Good In-Context Examples for {GPT}-3?},
  year = {2021},
}

@article{meyer2014semantic,
  author = {David E.
Meyer},
  journal = {Science},
  number = {6196},
  pages = {523--523},
  title = {Semantic priming well established},
  volume = {345},
  year = {2014},
}

@article{weidinger2021ethical,
  author = {Laura Weidinger and John Mellor and Maribeth Rauh and Conor Griffin and Jonathan Uesato and Po-Sen Huang and Myra Cheng and Mia Glaese and Borja Balle and Atoosa Kasirzadeh and Zac Kenton and Sasha Brown and Will Hawkins and Tom Stepleton and Courtney Biles and Abeba Birhane and Julia Haas and Laura Rimell and Lisa Anne Hendricks and William Isaac and Sean Legassick and Geoffrey Irving and Iason Gabriel},
  journal = {arXiv preprint arXiv:2112.04359},
  title = {Ethical and social risks of harm from Language Models},
  year = {2021},
}

@inproceedings{bender2021stochastic,
  author = {Emily M. Bender and Timnit Gebru and Angelina McMillan-Major and Shmargaret Shmitchell},
  booktitle = {ACM Conference on Fairness, Accountability, and Transparency (FAccT)},
  title = {On the Dangers of Stochastic Parrots: Can Language Models Be Too Big?},
  year = {2021},
}

@article{carlini2020extracting,
  author = {Nicholas Carlini and Florian Tramer and Eric Wallace and Matthew Jagielski and Ariel Herbert-Voss and Katherine Lee and Adam Roberts and Tom Brown and Dawn Song and Ulfar Erlingsson and Alina Oprea and Colin Raffel},
  journal = {arXiv preprint arXiv:2012.07805},
  title = {Extracting Training Data from Large Language Models},
  year = {2020},
}

@article{li2021hidden,
  author = {Shaofeng Li and Hui Liu and Tian Dong and Benjamin Zi Hao Zhao and Minhui Xue and Haojin Zhu and Jialiang Lu},
  journal = {arXiv preprint arXiv:2105.00164},
  title = {Hidden Backdoors in Human-Centric Language Models},
  year = {2021},
}

@inproceedings{jacobs2021measurement,
  author = {Abigail Z.
Jacobs and Hanna Wallach},
  booktitle = {ACM Conference on Fairness, Accountability, and Transparency (FAccT)},
  title = {Measurement and Fairness},
  year = {2021},
}

@inproceedings{groenwold2020investigating,
  author = {Sophie Groenwold and Lily Ou and Aesha Parekh and Samhita Honnavalli and Sharon Levy and Diba Mirza and William Yang Wang},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Investigating African-American Vernacular English in Transformer-Based Text Generation},
  year = {2020},
}

@inproceedings{blodgett2021stereotyping,
  author = {Su Lin Blodgett and Gilsinia Lopez and Alexandra Olteanu and Robert Sim and Hanna Wallach},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Stereotyping Norwegian Salmon: An Inventory of Pitfalls in Fairness Benchmark Datasets},
  year = {2021},
}

@inproceedings{sheng2019woman,
  author = {Emily Sheng and Kai-Wei Chang and Premkumar Natarajan and Nanyun Peng},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {The Woman Worked as a Babysitter: On Biases in Language Generation},
  year = {2019},
}

@inproceedings{hendrycks2021coding,
  author = {Dan Hendrycks and Steven Basart and Saurav Kadavath and Mantas Mazeika and Akul Arora and Ethan Guo and Collin Burns and Samir Puranik and Horace He and Dawn Song and Jacob Steinhardt},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Measuring Coding Challenge Competence With {APPS}},
  year = {2021},
}

@inproceedings{krishna2021hurdles,
  author = {Kalpesh Krishna and Aurko Roy and Mohit Iyyer},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Hurdles to Progress in Long-form Question Answering},
  year = {2021},
}

@article{shuster2021retrieval,
  author = {Kurt Shuster and Spencer Poff and Moya Chen and Douwe Kiela and Jason Weston},
  journal = {arXiv preprint arXiv:2104.07567},
  title = {Retrieval Augmentation Reduces Hallucination in
Conversation},
  year = {2021},
}

@inproceedings{gabriel2021go,
  author = {Saadia Gabriel and Asli Celikyilmaz and Rahul Jha and Yejin Choi and Jianfeng Gao},
  booktitle = {Findings of the Association for Computational Linguistics (Findings of ACL)},
  title = {{GO FIGURE}: A Meta Evaluation of Factuality in Summarization},
  year = {2021},
}

@article{lin2021truthful,
  author = {Stephanie Lin and Jacob Hilton and Owain Evans},
  journal = {arXiv preprint arXiv:2109.07958},
  title = {{TruthfulQA}: Measuring How Models Mimic Human Falsehoods},
  year = {2021},
}

@article{cobbe2021training,
  author = {Karl Cobbe and Vineet Kosaraju and Mohammad Bavarian and Mark Chen and Heewoo Jun and Lukasz Kaiser and Matthias Plappert and Jerry Tworek and Jacob Hilton and Reiichiro Nakano and Christopher Hesse and John Schulman},
  journal = {arXiv preprint arXiv:2110.14168},
  title = {Training Verifiers to Solve Math Word Problems},
  year = {2021},
}

@inproceedings{hendrycks2021math,
  author = {Dan Hendrycks and Collin Burns and Saurav Kadavath and Akul Arora and Steven Basart and Eric Tang and Dawn Song and Jacob Steinhardt},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Measuring Mathematical Problem Solving With the {MATH} Dataset},
  year = {2021},
}

@article{tang2021solving,
  author = {Leonard Tang and Elizabeth Ke and Nikhil Singh and Nakul Verma and Iddo Drori},
  journal = {arXiv preprint arXiv:2111.08276},
  title = {Solving Probability and Statistics Problems by Program Synthesis},
  year = {2021},
}

@inproceedings{fan2019eli5,
  author = {Angela Fan and Yacine Jernite and Ethan Perez and David Grangier and Jason Weston and Michael Auli},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {{ELI5}: Long Form Question Answering},
  year = {2019},
}

@inproceedings{zhou2020learning,
  author = {Wangchunshu Zhou and Ke Xu},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Learning to Compare for Better Training and
Evaluation of Open Domain Natural Language Generation Models},
  year = {2020},
}

@article{ram2018conversational,
  author = {Ashwin Ram and Rohit Prasad and Chandra Khatri and Anu Venkatesh and Raefer Gabriel and Qing Liu and Jeff Nunn and Behnam Hedayatnia and Ming Cheng and Ashish Nagar and Eric King and Kate Bland and Amanda Wartick and Yi Pan and Han Song and Sk Jayadevan and Gene Hwang and Art Pettigrue},
  journal = {arXiv preprint arXiv:1801.03604},
  title = {Conversational {AI}: The Science Behind the {Alexa Prize}},
  year = {2018},
}

@article{rothe2020leveraging,
  author = {Sascha Rothe and Shashi Narayan and Aliaksei Severyn},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  pages = {264--280},
  title = {Leveraging Pre-trained Checkpoints for Sequence Generation Tasks},
  volume = {8},
  year = {2020},
}

@article{ziegler2019fine,
  author = {Daniel M. Ziegler and Nisan Stiennon and Jeffrey Wu and Tom B. Brown and Alec Radford and Dario Amodei and Paul Christiano and Geoffrey Irving},
  journal = {arXiv preprint arXiv:1909.08593},
  title = {Fine-Tuning Language Models from Human Preferences},
  year = {2019},
}

@inproceedings{steinnon2020learning,
  author = {Nisan Stiennon and Long Ouyang and Jeff Wu and Daniel M. Ziegler and Ryan Lowe and Chelsea Voss and Alec Radford and Dario Amodei and Paul Christiano},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Learning to summarize from human feedback},
  year = {2020},
}

@article{strack1988priming,
  author = {Fritz Strack and Leonard L.
Martin and Norbert Schwarz},
  journal = {European Journal of Social Psychology},
  number = {5},
  pages = {429--442},
  title = {Priming and communication: Social determinants of information use in judgments of life satisfaction},
  volume = {18},
  year = {1988},
}

% publisher added: it is a required field for @incollection.
@incollection{kahneman2002representativeness,
  author = {Daniel Kahneman and Shane Frederick},
  booktitle = {Heuristics and Biases: The Psychology of Intuitive Judgment},
  pages = {49--81},
  publisher = {Cambridge University Press},
  title = {Representativeness Revisited: Attribute Substitution in Intuitive Judgment},
  year = {2002},
}

@article{tversky1973availability,
  author = {Amos Tversky and Daniel Kahneman},
  journal = {Cognitive Psychology},
  number = {2},
  pages = {207--232},
  title = {Availability: A heuristic for judging frequency and probability},
  volume = {5},
  year = {1973},
}

@article{windhager2010laying,
  author = {Sonja Windhager and Florian Hutzler and Claus-Christian Carbon and Elisabeth Oberzaucher and Katrin Schaefer and Truls Thorstensen and Helmut Leder and Karl Grammer},
  journal = {Collegium Antropologicum},
  number = {3},
  pages = {1075--1080},
  title = {Laying eyes on Headlights: Eye Movements Suggest Facial Features in Cars},
  volume = {34},
  year = {2010},
}

@article{tversky1974judgement,
  author = {Amos Tversky and Daniel Kahneman},
  journal = {Science},
  number = {4157},
  pages = {1124--1131},
  title = {Judgment under Uncertainty: Heuristics and Biases},
  volume = {185},
  year = {1974},
}

@article{jacowitz1995anchoring,
  author = {Karen E.
Jacowitz and Daniel Kahneman},
  journal = {Personality and Social Psychology Bulletin},
  number = {11},
  pages = {1161--1166},
  title = {Measures of Anchoring in Estimation Tasks},
  volume = {21},
  year = {1995},
}

@inproceedings{hendrycks2021measuring,
  author = {Dan Hendrycks and Collin Burns and Steven Basart and Andy Zou and Mantas Mazeika and Dawn Song and Jacob Steinhardt},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Measuring Massive Multitask Language Understanding},
  year = {2021},
}

@article{tversky1981framing,
  author = {Amos Tversky and Daniel Kahneman},
  journal = {Science},
  number = {4481},
  pages = {453--458},
  title = {The Framing of Decisions and the Psychology of Choice},
  volume = {211},
  year = {1981},
}

@article{rae2021gopher,
  author = {Jack W. Rae and Sebastian Borgeaud and Trevor Cai and Katie Millican and Jordan Hoffmann and Francis Song and John Aslanides and Sarah Henderson and Roman Ring and Susannah Young and Eliza Rutherford and Tom Hennigan and Jacob Menick and Albin Cassirer and Richard Powell and George van den Driessche and Lisa Anne Hendricks and Maribeth Rauh and Po-Sen Huang and Amelia Glaese and Johannes Welbl and Sumanth Dathathri and Saffron Huang and Jonathan Uesato and John Mellor and Irina Higgins and Antonia Creswell and Nat McAleese and Amy Wu and Erich Elsen and Siddhant Jayakumar and Elena Buchatskaya and David Budden and Esme Sutherland and Karen Simonyan and Michela Paganini and Laurent Sifre and Lena Martens and Xiang Lorraine Li and Adhiguna Kuncoro and Aida Nematzadeh and Elena Gribovskaya and Domenic Donato and Angeliki Lazaridou and Arthur Mensch and Jean-Baptiste Lespiau and Maria Tsimpoukelli and Nikolai Grigorev and Doug Fritz and Thibault Sottiaux and Mantas Pajarskas and Toby Pohlen and Zhitao Gong and Daniel Toyama and Cyprien de Masson d'Autume and Yujia Li and Tayfun Terzi and Vladimir Mikulik and Igor Babuschkin and Aidan Clark and Diego de Las Casas and Aurelia Guy and Chris
Jones and James Bradbury and Matthew Johnson and Blake Hechtman and Laura Weidinger and Iason Gabriel and William Isaac and Ed Lockhart and Simon Osindero and Laura Rimell and Chris Dyer and Oriol Vinyals and Kareem Ayoub and Jeff Stanway and Lorrayne Bennett and Demis Hassabis and Koray Kavukcuoglu and Geoffrey Irving},
  journal = {arXiv preprint arXiv:2112.11446},
  title = {Scaling Language Models: Methods, Analysis \& Insights from Training {Gopher}},
  year = {2021},
}

@article{chen2021codex,
  author = {Mark Chen and Jerry Tworek and Heewoo Jun and Qiming Yuan and Henrique Ponde de Oliveira Pinto and Jared Kaplan and Harri Edwards and Yuri Burda and Nicholas Joseph and Greg Brockman and Alex Ray and Raul Puri and Gretchen Krueger and Michael Petrov and Heidy Khlaaf and Girish Sastry and Pamela Mishkin and Brooke Chan and Scott Gray and Nick Ryder and Mikhail Pavlov and Alethea Power and Lukasz Kaiser and Mohammad Bavarian and Clemens Winter and Philippe Tillet and Felipe Petroski Such and Dave Cummings and Matthias Plappert and Fotios Chantzis and Elizabeth Barnes and Ariel Herbert-Voss and William Hebgen Guss and Alex Nichol and Alex Paino and Nikolas Tezak and Jie Tang and Igor Babuschkin and Suchir Balaji and Shantanu Jain and William Saunders and Christopher Hesse and Andrew N.
Carr and Jan Leike and Josh Achiam and Vedant Misra and Evan Morikawa and Alec Radford and Matthew Knight and Miles Brundage and Mira Murati and Katie Mayer and Peter Welinder and Bob McGrew and Dario Amodei and Sam McCandlish and Ilya Sutskever and Wojciech Zaremba},
  journal = {arXiv preprint arXiv:2107.03374},
  title = {Evaluating Large Language Models Trained on Code},
  year = {2021},
}

@inproceedings{zhou2016cams,
  author = {Bolei Zhou and Aditya Khosla and Agata Lapedriza and Aude Oliva and Antonio Torralba},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Learning Deep Features for Discriminative Localization},
  year = {2016},
}

@article{gebru2018datasheets,
  author = {Timnit Gebru and Jamie Morgenstern and Briana Vecchione and Jennifer Wortman Vaughan and Hanna Wallach and Daum{\'e} III, Hal and Kate Crawford},
  journal = {arXiv preprint arXiv:1803.09010},
  title = {Datasheets for Datasets},
  year = {2018},
}

@article{rajpurkar2020chexpedition,
  author = {Pranav Rajpurkar and Anirudh Joshi and Anuj Pareek and Phil Chen and Amirhossein Kiani and Jeremy Irvin and Andrew Ng and Matthew Lungren},
  journal = {arXiv preprint arXiv:2002.11379},
  title = {{CheXpedition}: Investigating Generalization Challenges for Translation of Chest X{-}ray Algorithms to the Clinical Setting},
  year = {2020},
}

@article{bagnoli2005logconcave,
  author = {Mark Bagnoli and Ted Bergstrom},
  journal = {Economic Theory},
  pages = {445--469},
  title = {Log-concave probability and its applications},
  volume = {26},
  year = {2005},
}

@article{cule2010logconcave,
  author = {Madeleine Cule and Richard Samworth and Michael Stewart},
  journal = {Journal of the Royal Statistical Society},
  pages = {545--603},
  title = {Maximum likelihood estimation of a multi-dimensional log-concave density},
  volume = {73},
  year = {2010},
}

@inproceedings{cheng2019robust,
  author = {Yong Cheng and Lu Jiang and Wolfgang Macherey},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Robust Neural
Machine Translation with Doubly Adversarial Inputs}, year = {2019}, }

@inproceedings{sakaguchi2017robsut,
  author = {Keisuke Sakaguchi and Kevin Duh and Matt Post and Benjamin Van Durme},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Robsut Wrod Reocginiton via Semi-Character Recurrent Neural Network},
  year = {2017},
}

@inproceedings{gong2019context,
  author = {Hongyu Gong and Yuchen Li and Suma Bhat and Pramod Viswanath},
  booktitle = {World Wide Web (WWW)},
  pages = {2771--2777},
  title = {Context-Sensitive Malicious Spelling Error Correction},
  year = {2019},
}

@inproceedings{edizel2019misspelling,
  author = {Bora Edizel and Aleksandra Piktus and Piotr Bojanowski and Rui Ferreira and Edouard Grave and Fabrizio Silvestri},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Misspelling Oblivious Word Embeddings},
  year = {2019},
}

@inproceedings{chen2019towards,
  author = {Jiefeng Chen and Xi Wu and Vaibhav Rastogi and Yingyu Liang and Somesh Jha},
  booktitle = {IEEE European Symposium on Security and Privacy (EuroS\&P)},
  title = {Towards Understanding Limitations of Pixel Discretization Against Adversarial Attacks},
  year = {2019},
}

@inproceedings{dolan2005mrpc,
  author = {William B Dolan and Chris Brockett},
  booktitle = {International Workshop on Paraphrasing (IWP)},
  title = {Automatically constructing a corpus of sentential paraphrases},
  year = {2005},
}

@misc{davies2008COCA,
  author = {Mark Davies},
  howpublished = {\url{https://www.english-corpora.org/coca/}},
  title = {The Corpus of Contemporary {American} {English} ({COCA}): One billion words, 1990--2019},
  year = {2008},
}

@phdthesis{rawlison1976letterpos,
  author = {Graham Ernest Rawlinson},
  school = {University of Nottingham},
  title = {The significance of letter position in word recognition},
  year = {1976},
}

@misc{davis2003psycholinguistic,
  author = {Matt Davis},
  howpublished = {\url{https://www.mrc-cbu.cam.ac.uk/}},
  title = {Psycholinguistic evidence on scrambled letters in reading},
  year = {2003},
}

@inproceedings{schaul2015prioritized,
  author = {T. Schaul and J. Quan and I. Antonoglou and D. Silver},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Prioritized experience replay},
  year = {2015},
}

@article{bellemare2013arcade,
  author = {M. G. Bellemare and Y. Naddaf and J. Veness and M. Bowling},
  journal = {Journal of Artificial Intelligence Research (JAIR)},
  pages = {253--279},
  title = {The Arcade Learning Environment: An evaluation platform for general agents},
  volume = {47},
  year = {2013},
}

@article{silver2016mastering,
  author = {D. Silver and A. Huang and C. J. Maddison and A. Guez and L. Sifre and G. Van Den Driessche and J. Schrittwieser and I. Antonoglou and V. Panneershelvam and M. Lanctot and others},
  journal = {Nature},
  number = {7587},
  pages = {484--489},
  title = {Mastering the game of {Go} with deep neural networks and tree search},
  volume = {529},
  year = {2016},
}

@article{silver2017mastering,
  author = {D. Silver and J. Schrittwieser and K. Simonyan and I. Antonoglou and A. Huang and A. Guez and T. Hubert and L. Baker and M. Lai and A. Bolton and others},
  journal = {Nature},
  number = {7676},
  pages = {354--359},
  title = {Mastering the game of {Go} without human knowledge},
  volume = {550},
  year = {2017},
}

@article{vecerik2017leveraging,
  author = {M. Vecerik and T. Hester and J. Scholz and F. Wang and O. Pietquin and B. Piot and N. Heess and T. Rothorl and T. Lampe and M. Riedmiller},
  journal = {arXiv preprint arXiv:1707.08817},
  title = {Leveraging Demonstrations for Deep Reinforcement Learning on Robotics Problems with Sparse Rewards},
  year = {2017},
}

@inproceedings{ross2010efficient, author = {S. Ross and D.
Bagnell}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, pages = {661--668}, title = {Efficient reductions for imitation learning}, year = {2010}, }

@article{nair2017overcoming,
  author = {A. Nair and B. McGrew and M. Andrychowicz and W. Zaremba and P. Abbeel},
  journal = {arXiv preprint arXiv:1709.10089},
  title = {Overcoming Exploration in Reinforcement Learning with Demonstrations},
  year = {2017},
}

@inproceedings{ho2016generative,
  author = {J. Ho and S. Ermon},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {4565--4573},
  title = {Generative adversarial imitation learning},
  year = {2016},
}

@article{stadie2017third,
  author = {B. C. Stadie and P. Abbeel and I. Sutskever},
  journal = {arXiv preprint arXiv:1703.01703},
  title = {Third-Person Imitation Learning},
  year = {2017},
}

@inproceedings{baram2017end,
  author = {N. Baram and O. Anschel and I. Caspi and S. Mannor},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {390--399},
  title = {End-to-end differentiable adversarial imitation learning},
  year = {2017},
}

@inproceedings{finn2016guided,
  author = {C. Finn and S. Levine and P. Abbeel},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {49--58},
  title = {Guided cost learning: Deep inverse optimal control via policy optimization},
  year = {2016},
}

@inproceedings{bacon2017option,
  author = {P. Bacon and J. Harb and D. Precup},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {1726--1734},
  title = {The Option-Critic Architecture},
  year = {2017},
}

@article{roderick2017deep,
  author = {M. Roderick and C. Grimm and S. Tellex},
  journal = {arXiv preprint arXiv:1710.00459},
  title = {Deep Abstract {Q}-Networks},
  year = {2017},
}

@article{sutton1999between, author = {R. S. Sutton and D. Precup and S.
Singh}, journal = {Artificial intelligence}, pages = {181--211}, title = {Between {MDPs} and {semi-MDPs}: A framework for temporal abstraction in reinforcement learning}, volume = {112}, year = {1999}, }

@inproceedings{parr1998reinforcement,
  author = {R. Parr and S. J. Russell},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1043--1049},
  title = {Reinforcement learning with hierarchies of machines},
  year = {1998},
}

@article{duan2017one,
  author = {Y. Duan and M. Andrychowicz and B. C. Stadie and J. Ho and J. Schneider and I. Sutskever and P. Abbeel and W. Zaremba},
  journal = {arXiv preprint arXiv:1703.07326},
  title = {One-Shot Imitation Learning},
  year = {2017},
}

@article{finn2017one,
  author = {C. Finn and T. Yu and T. Zhang and P. Abbeel and S. Levine},
  journal = {arXiv preprint arXiv:1709.04905},
  title = {One-Shot Visual Imitation Learning via Meta-Learning},
  year = {2017},
}

@inproceedings{konidaris2007building,
  author = {G. Konidaris and A. G. Barto},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {Building Portable Options: Skill Transfer in Reinforcement Learning},
  year = {2007},
}

@article{hauser2008using,
  author = {K. Hauser and T. Bretl and K. Harada and J. Latombe},
  journal = {Algorithmic foundation of robotics},
  pages = {507--522},
  title = {Using motion primitives in probabilistic sample-based planning for humanoid robots},
  volume = {7},
  year = {2008},
}

@inproceedings{dietterich1998maxq,
  author = {T. G. Dietterich},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {The {MAXQ} Method for Hierarchical Reinforcement Learning},
  year = {1998},
}

@inproceedings{li2006towards,
  author = {L. Li and T. J. Walsh and M. L. Littman},
  booktitle = {International Symposium on Artificial Intelligence and Mathematics (ISAIM)},
  title = {Towards a Unified Theory of State Abstraction for {MDPs}},
  year = {2006},
}

@article{daniel2016hierarchical, author = {C. Daniel and G.
Neumann and O. Kroemer and J. Peters}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {3190--3239}, title = {Hierarchical relative entropy policy search}, volume = {17}, year = {2016}, }

@article{wiering2012reinforcement,
  author = {Wiering, Marco and Van Otterlo, Martijn},
  journal = {Adaptation, Learning, and Optimization},
  title = {Reinforcement learning},
  volume = {12},
  year = {2012},
}

@inproceedings{chentanez2005intrinsically,
  author = {N. Chentanez and A. G. Barto and S. P. Singh},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1281--1288},
  title = {Intrinsically motivated reinforcement learning},
  year = {2005},
}

@article{weber2017imagination,
  author = {T. Weber and S. Racani{\`e}re and D. P. Reichert and L. Buesing and A. Guez and D. J. Rezende and A. P. Badia and O. Vinyals and N. Heess and Y. Li and others},
  journal = {arXiv preprint arXiv:1707.06203},
  title = {Imagination-Augmented Agents for Deep Reinforcement Learning},
  year = {2017},
}

@inproceedings{perez2017c,
  author = {C. Perez-D'Arpino and J. A. Shah},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages = {4058--4065},
  title = {{C-LEARN}: Learning geometric constraints from demonstrations for multi-step manipulation in shared autonomy},
  year = {2017},
}

@article{phillips2016learning,
  author = {M. Phillips and V. Hwang and S. Chitta and M. Likhachev},
  journal = {Autonomous Robots},
  number = {1},
  pages = {109--124},
  title = {Learning to plan for constrained manipulation from demonstrations},
  volume = {40},
  year = {2016},
}

@phdthesis{andre2003programmable,
  author = {D. Andre},
  school = {University of California, Berkeley},
  title = {Programmable reinforcement learning agents},
  year = {2003},
}

@inproceedings{marthi2005concurrent, author = {B. Marthi and C.
Guestrin}, booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)}, title = {Concurrent hierarchical reinforcement learning}, year = {2005}, }

@inproceedings{ostrovski2017count,
  author = {G. Ostrovski and M. G. Bellemare and A. van den Oord and R. Munos},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {2721--2730},
  title = {Count-based exploration with neural density models},
  year = {2017},
}

@inproceedings{martin2017count,
  author = {J. Martin and S. N. Sasikumar and T. Everitt and M. Hutter},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {Count-based exploration in feature space for reinforcement learning},
  year = {2017},
}

@inproceedings{tang2017exploration,
  author = {H. Tang and R. Houthooft and D. Foote and A. Stooke and X. Chen and Y. Duan and J. Schulman and F. De Turck and P. Abbeel},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2753--2762},
  title = {\#Exploration: A study of count-based exploration for deep reinforcement learning},
  year = {2017},
}

@inproceedings{abbeel2006using,
  author = {P. Abbeel and M. Quigley and A. Y. Ng},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1--8},
  title = {Using inaccurate models in reinforcement learning},
  year = {2006},
}

@article{sutton1990integrated,
  author = {R. S. Sutton},
  journal = {Machine Learning Proceedings},
  pages = {216--224},
  title = {Integrated architectures for learning, planning, and reacting based on approximating dynamic programming},
  year = {1990},
}

@article{zhang2018solar,
  author = {M. Zhang and S. Vikram and L. Smith and P. Abbeel and M. J. Johnson and S. Levine},
  journal = {arXiv preprint arXiv:1808.09105},
  title = {{SOLAR}: Deep Structured Latent Representations for Model-Based Reinforcement Learning},
  year = {2018},
}

@inproceedings{nagabandi2018neural, author = {A. Nagabandi and G. Kahn and R. S. Fearing and S.
Levine}, booktitle = {International Conference on Robotics and Automation (ICRA)}, pages = {7559--7566}, title = {Neural network dynamics for model-based deep reinforcement learning with model-free fine-tuning}, year = {2018}, }

@inproceedings{jong2008hierarchical,
  author = {N. K. Jong and P. Stone},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {432--439},
  title = {Hierarchical model-based reinforcement learning: {R-max} + {MAXQ}},
  year = {2008},
}

@article{henderson2017deep,
  author = {P. Henderson and R. Islam and P. Bachman and J. Pineau and D. Precup and D. Meger},
  journal = {arXiv preprint arXiv:1709.06560},
  title = {Deep reinforcement learning that matters},
  year = {2017},
}

@article{ha2018world,
  author = {David Ha and J{\"u}rgen Schmidhuber},
  journal = {arXiv preprint arXiv:1803.10122},
  title = {World Models},
  year = {2018},
}

@inproceedings{oh2015action,
  author = {Junhyuk Oh and Xiaoxiao Guo and Honglak Lee and Richard L Lewis and Satinder Singh},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2863--2871},
  title = {Action-conditional video prediction using deep networks in {Atari} games},
  year = {2015},
}

@inproceedings{schmidhuber1993planning,
  author = {J{\"u}rgen Schmidhuber},
  booktitle = {From Animals to Animats 2: Proceedings of the Second International Conference on Simulation of Adaptive Behavior},
  title = {Planning simple trajectories using neural subgoal generators},
  volume = {2},
  year = {1993},
}

@article{strehl2008analysis,
  author = {Alexander L Strehl and Michael L Littman},
  journal = {Journal of Computer and System Sciences},
  number = {8},
  pages = {1309--1331},
  title = {An analysis of model-based interval estimation for {Markov} decision processes},
  volume = {74},
  year = {2008},
}

@inproceedings{talvitie2015agnostic, author = {Erik Talvitie}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, pages = {2986--2992}, title = {Agnostic System Identification for Monte
Carlo Planning}, year = {2015}, }

@phdthesis{kakade2003sample,
  author = {Sham Machandranath Kakade},
  school = {University of London},
  title = {On the sample complexity of reinforcement learning},
  year = {2003},
}

@article{choi2018contingency,
  author = {Jongwook Choi and Yijie Guo and Marcin Moczulski and Junhyuk Oh and Neal Wu and Mohammad Norouzi and Honglak Lee},
  journal = {arXiv preprint arXiv:1811.01483},
  title = {Contingency-Aware Exploration in Reinforcement Learning},
  year = {2018},
}

@inproceedings{finn2016unsupervised,
  author = {Chelsea Finn and Ian Goodfellow and Sergey Levine},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {64--72},
  title = {Unsupervised learning for physical interaction through video prediction},
  year = {2016},
}

@article{chiappa2017recurrent,
  author = {Silvia Chiappa and S{\'e}bastien Racani{\`e}re and Daan Wierstra and Shakir Mohamed},
  journal = {arXiv preprint arXiv:1704.02254},
  title = {Recurrent environment simulators},
  year = {2017},
}

@article{burda2018exploration,
  author = {Yuri Burda and Harrison Edwards and Amos Storkey and Oleg Klimov},
  journal = {arXiv preprint arXiv:1810.12894},
  title = {Exploration by random network distillation},
  year = {2018},
}

@inproceedings{guo2014deep,
  author = {Xiaoxiao Guo and Satinder Singh and Honglak Lee and Richard L Lewis and Xiaoshi Wang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {3338--3346},
  title = {Deep learning for real-time {Atari} game play using offline {Monte-Carlo} tree search planning},
  year = {2014},
}

@inproceedings{laroche2017transfer,
  author = {Romain Laroche and Merwan Barlier},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {2147--2153},
  title = {Transfer Reinforcement Learning with Shared Dynamics},
  year = {2017},
}

@inproceedings{andre2002state, author = {David Andre and Stuart J Russell}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
pages = {119--125}, title = {State abstraction for programmable reinforcement learning agents}, year = {2002}, }

@inproceedings{dietterich2000state,
  author = {Thomas G Dietterich},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {994--1000},
  title = {State abstraction in {MAXQ} hierarchical reinforcement learning},
  year = {2000},
}

@inproceedings{martins2016softmax,
  author = {Andre Martins and Ramon Astudillo},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1614--1623},
  title = {From softmax to sparsemax: A sparse model of attention and multi-label classification},
  year = {2016},
}

@article{ecoffet2019go,
  author = {Adrien Ecoffet and Joost Huizinga and Joel Lehman and Kenneth O Stanley and Jeff Clune},
  journal = {arXiv preprint arXiv:1901.10995},
  title = {{Go-Explore}: a New Approach for Hard-Exploration Problems},
  year = {2019},
}

@article{stanton2018deep,
  author = {Christopher Stanton and Jeff Clune},
  journal = {arXiv preprint arXiv:1806.00553},
  title = {Deep curiosity search: Intra-life exploration improves performance on challenging deep reinforcement learning problems},
  year = {2018},
}

@article{krishnamurthy2018semiparametric,
  author = {Akshay Krishnamurthy and Zhiwei Steven Wu and Vasilis Syrgkanis},
  journal = {arXiv preprint arXiv:1803.04204},
  title = {Semiparametric contextual bandits},
  year = {2018},
}

@inproceedings{greenewald2017action,
  author = {Kristjan Greenewald and Ambuj Tewari and Susan Murphy and Predrag Klasnja},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {5977--5985},
  title = {Action centered contextual bandits},
  year = {2017},
}

@article{jin2019provably,
  author = {Chi Jin and Zhuoran Yang and Zhaoran Wang and Michael I Jordan},
  journal = {arXiv preprint arXiv:1907.05388},
  title = {Provably efficient reinforcement learning with linear function approximation},
  year = {2019},
}

@article{rakelly2019efficient, author = {Kate Rakelly and Aurick Zhou and
Deirdre Quillen and Chelsea Finn and Sergey Levine}, journal = {arXiv preprint arXiv:1903.08254}, title = {Efficient off-policy meta-reinforcement learning via probabilistic context variables}, year = {2019}, }

@inproceedings{mendonca2019guided,
  author = {Russell Mendonca and Abhishek Gupta and Rosen Kralev and Pieter Abbeel and Sergey Levine and Chelsea Finn},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {9653--9664},
  title = {Guided meta-policy search},
  year = {2019},
}

@article{nagabandi2018learning,
  author = {Anusha Nagabandi and Ignasi Clavera and Simin Liu and Ronald S Fearing and Pieter Abbeel and Sergey Levine and Chelsea Finn},
  journal = {arXiv preprint arXiv:1803.11347},
  title = {Learning to adapt in dynamic, real-world environments through meta-reinforcement learning},
  year = {2018},
}

@article{saemundsson2018meta,
  author = {Steind{\'o}r S{\ae}mundsson and Katja Hofmann and Marc Peter Deisenroth},
  journal = {arXiv preprint arXiv:1803.07551},
  title = {Meta reinforcement learning with latent variable {Gaussian} processes},
  year = {2018},
}

@article{rothfuss2018promp,
  author = {Jonas Rothfuss and Dennis Lee and Ignasi Clavera and Tamim Asfour and Pieter Abbeel},
  journal = {arXiv preprint arXiv:1810.06784},
  title = {{ProMP}: Proximal meta-policy search},
  year = {2018},
}

@inproceedings{yang2019norml,
  author = {Yuxiang Yang and Ken Caluwaerts and Atil Iscen and Jie Tan and Chelsea Finn},
  booktitle = {Proceedings of the 18th International Conference on Autonomous Agents and MultiAgent Systems},
  pages = {323--331},
  title = {{NoRML}: No-reward meta learning},
  year = {2019},
}

@article{mishra2017simple,
  author = {Nikhil Mishra and Mostafa Rohaninejad and Xi Chen and Pieter Abbeel},
  journal = {arXiv preprint arXiv:1707.03141},
  title = {A simple neural attentive meta-learner},
  year = {2017},
}

@article{wang2016learning, author = {Jane X Wang and Zeb Kurth-Nelson and Dhruva Tirumala and Hubert Soyer and Joel Z Leibo and Remi Munos and
Charles Blundell and Dharshan Kumaran and Matt Botvinick}, journal = {arXiv preprint arXiv:1611.05763}, title = {Learning to reinforcement learn}, year = {2016}, }

@article{duan2016rl,
  author = {Yan Duan and John Schulman and Xi Chen and Peter L Bartlett and Ilya Sutskever and Pieter Abbeel},
  journal = {arXiv preprint arXiv:1611.02779},
  title = {{RL$^2$}: Fast reinforcement learning via slow reinforcement learning},
  year = {2016},
}

@article{zintgraf2019varibad,
  author = {Luisa Zintgraf and Kyriacos Shiarlis and Maximilian Igl and Sebastian Schulze and Yarin Gal and Katja Hofmann and Shimon Whiteson},
  journal = {arXiv preprint arXiv:1910.08348},
  title = {{VariBAD}: A Very Good Method for {Bayes-Adaptive} Deep {RL} via Meta-Learning},
  year = {2019},
}

@article{humplik2019meta,
  author = {Jan Humplik and Alexandre Galashov and Leonard Hasenclever and Pedro A Ortega and Yee Whye Teh and Nicolas Heess},
  journal = {arXiv preprint arXiv:1905.06424},
  title = {Meta reinforcement learning as task inference},
  year = {2019},
}

@inproceedings{stadie2018importance,
  author = {Bradly Stadie and Ge Yang and Rein Houthooft and Peter Chen and Yan Duan and Yuhuai Wu and Pieter Abbeel and Ilya Sutskever},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {9280--9290},
  title = {The importance of sampling in meta-reinforcement learning},
  year = {2018},
}

@inproceedings{gupta2018meta,
  author = {Abhishek Gupta and Russell Mendonca and YuXuan Liu and Pieter Abbeel and Sergey Levine},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {5302--5311},
  title = {Meta-reinforcement learning of structured exploration strategies},
  year = {2018},
}

@article{fakoor2019meta,
  author = {Rasool Fakoor and Pratik Chaudhari and Stefano Soatto and Alexander J Smola},
  journal = {arXiv preprint arXiv:1910.00125},
  title = {Meta-{Q}-Learning},
  year = {2019},
}

@article{gurumurthy2019mame, author = {Swaminathan Gurumurthy and Sumit Kumar and Katia
Sycara}, journal = {arXiv preprint arXiv:1911.04024}, title = {MAME: Model-Agnostic Meta-Exploration}, year = {2019}, }

@article{zhou2019environment,
  author = {Wenxuan Zhou and Lerrel Pinto and Abhinav Gupta},
  journal = {arXiv preprint arXiv:1907.11740},
  title = {Environment probing interaction policies},
  year = {2019},
}

@phdthesis{schmidhuber1987evolutionary,
  author = {J{\"u}rgen Schmidhuber},
  school = {Technische Universit{\"a}t M{\"u}nchen},
  title = {Evolutionary principles in self-referential learning, or on learning how to learn: the meta-meta-... hook},
  year = {1987},
}

@article{kamienny2020learning,
  author = {Pierre-Alexandre Kamienny and Matteo Pirotta and Alessandro Lazaric and Thibault Lavril and Nicolas Usunier and Ludovic Denoyer},
  journal = {arXiv preprint arXiv:2005.02934},
  title = {Learning Adaptive Exploration Strategies in Dynamic Environments Through Informed Policy Regularization},
  year = {2020},
}

@inproceedings{barber2003algorithm,
  author = {David Barber and Felix V Agakov},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {The {IM} algorithm: a variational approach to information maximization},
  year = {2003},
}

@article{zhou2019watch,
  author = {Allan Zhou and Eric Jang and Daniel Kappler and Alex Herzog and Mohi Khansari and Paul Wohlhart and Yunfei Bai and Mrinal Kalakrishnan and Sergey Levine and Chelsea Finn},
  journal = {arXiv preprint arXiv:1906.03352},
  title = {Watch, try, learn: Meta-learning from demonstrations and reward},
  year = {2019},
}

@article{ritter2018been,
  author = {Samuel Ritter and Jane X Wang and Zeb Kurth-Nelson and Siddhant M Jayakumar and Charles Blundell and Razvan Pascanu and Matthew Botvinick},
  journal = {arXiv preprint arXiv:1805.09692},
  title = {Been there, done that: Meta-learning with episodic recall},
  year = {2018},
}

@article{kaelbling1998planning, author = {Leslie Pack Kaelbling and Michael L Littman and Anthony R Cassandra}, journal = {Artificial intelligence}, number = {1}, pages =
{99--134}, title = {Planning and acting in partially observable stochastic domains}, volume = {101}, year = {1998}, }

@article{eysenbach2018diversity,
  author = {Benjamin Eysenbach and Abhishek Gupta and Julian Ibarz and Sergey Levine},
  journal = {arXiv preprint arXiv:1802.06070},
  title = {Diversity is all you need: Learning skills without a reward function},
  year = {2018},
}

@inproceedings{houthooft2016vime,
  author = {Rein Houthooft and Xi Chen and Yan Duan and John Schulman and Filip De Turck and Pieter Abbeel},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1109--1117},
  title = {{VIME}: Variational information maximizing exploration},
  year = {2016},
}

@article{gregor2016variational,
  author = {Karol Gregor and Danilo Jimenez Rezende and Daan Wierstra},
  journal = {arXiv preprint arXiv:1611.07507},
  title = {Variational intrinsic control},
  year = {2016},
}

@article{warde2018unsupervised,
  author = {David Warde-Farley and Tom Van de Wiele and Tejas Kulkarni and Catalin Ionescu and Steven Hansen and Volodymyr Mnih},
  journal = {arXiv preprint arXiv:1811.11359},
  title = {Unsupervised control through non-parametric discriminative rewards},
  year = {2018},
}

@book{thrun2012learning,
  author = {Sebastian Thrun and Lorien Pratt},
  publisher = {Springer Science \& Business Media},
  title = {Learning to learn},
  year = {2012},
}

@inproceedings{naik1992meta,
  author = {Devang K Naik and Richard J Mammone},
  booktitle = {[Proceedings 1992] IJCNN International Joint Conference on Neural Networks},
  pages = {437--442},
  title = {Meta-neural networks that learn by learning},
  volume = {1},
  year = {1992},
}

@inproceedings{bengio1992optimization, author = {Samy Bengio and Yoshua Bengio and Jocelyn Cloutier and Jan Gecsei}, booktitle = {Preprints Conf.
Optimality in Artificial and Biological Neural Networks}, title = {On the optimization of a synaptic learning rule}, volume = {2}, year = {1992}, }

@inproceedings{hochreiter2001learning,
  author = {Sepp Hochreiter and A Steven Younger and Peter R Conwell},
  booktitle = {International Conference on Artificial Neural Networks (ICANN)},
  pages = {87--94},
  title = {Learning to learn using gradient descent},
  year = {2001},
}

@article{schmidhuber1992learning,
  author = {J{\"u}rgen Schmidhuber},
  journal = {Neural Computation},
  number = {1},
  pages = {131--139},
  title = {Learning to control fast-weight memories: An alternative to dynamic recurrent networks},
  volume = {4},
  year = {1992},
}

@inproceedings{andrychowicz2016learning,
  author = {Marcin Andrychowicz and Misha Denil and Sergio Gomez and Matthew W Hoffman and David Pfau and Tom Schaul and Brendan Shillingford and Nando de Freitas},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {3981--3989},
  title = {Learning to learn by gradient descent by gradient descent},
  year = {2016},
}

@inproceedings{younger2001meta, author = {A Steven Younger and Sepp Hochreiter and Peter R Conwell}, booktitle = {IJCNN'01. International Joint Conference on Neural Networks. Proceedings (Cat. No.
01CH37222)}, title = {Meta-learning with backpropagation}, volume = {3}, year = {2001}, }

@article{santoro2016one,
  author = {Adam Santoro and Sergey Bartunov and Matthew Botvinick and Daan Wierstra and Timothy Lillicrap},
  journal = {arXiv preprint arXiv:1605.06065},
  title = {One-shot learning with memory-augmented neural networks},
  year = {2016},
}

@inproceedings{vinyals2016matching,
  author = {Oriol Vinyals and Charles Blundell and Timothy Lillicrap and Daan Wierstra and others},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {3630--3638},
  title = {Matching networks for one shot learning},
  year = {2016},
}

@inproceedings{bengio1991learning,
  author = {Y Bengio and S Bengio and J Cloutier},
  booktitle = {IJCNN-91-Seattle International Joint Conference on Neural Networks},
  pages = {969},
  title = {Learning a synaptic learning rule},
  volume = {2},
  year = {1991},
}

@article{parisotto2015actor,
  author = {Emilio Parisotto and Jimmy Lei Ba and Ruslan Salakhutdinov},
  journal = {arXiv preprint arXiv:1511.06342},
  title = {Actor-mimic: Deep multitask and transfer reinforcement learning},
  year = {2015},
}

@article{rusu2015policy,
  author = {Andrei A Rusu and Sergio Gomez Colmenarejo and Caglar Gulcehre and Guillaume Desjardins and James Kirkpatrick and Razvan Pascanu and Volodymyr Mnih and Koray Kavukcuoglu and Raia Hadsell},
  journal = {arXiv preprint arXiv:1511.06295},
  title = {Policy distillation},
  year = {2015},
}

@article{alemi2016deep,
  author = {Alexander A Alemi and Ian Fischer and Joshua V Dillon and Kevin Murphy},
  journal = {arXiv preprint arXiv:1612.00410},
  title = {Deep variational information bottleneck},
  year = {2016},
}

@article{russo2017tutorial,
  author = {Daniel Russo and Benjamin Van Roy and Abbas Kazerouni and Ian Osband and Zheng Wen},
  journal = {arXiv preprint arXiv:1707.02038},
  title = {A tutorial on {Thompson} sampling},
  year = {2017},
}

@misc{boisvert2018gym, author = {Maxime Chevalier-Boisvert}, howpublished =
{\url{https://github.com/maximecb/gym-miniworld}}, title = {Gym-{M}iniworld environment for OpenAI Gym}, year = {2018}, }

@inproceedings{kapturowski2019recurrent,
  author = {Steven Kapturowski and Georg Ostrovski and John Quan and Remi Munos and Will Dabney},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Recurrent experience replay in distributed reinforcement learning},
  year = {2019},
}

@article{maaten2008visualizing,
  author = {Laurens van der Maaten and Geoffrey Hinton},
  journal = {Journal of Machine Learning Research (JMLR)},
  number = {86},
  pages = {2579--2605},
  title = {Visualizing data using {t-SNE}},
  volume = {9},
  year = {2008},
}

@article{badia2020never,
  author = {Adri{\`a} Puigdom{\`e}nech Badia and Pablo Sprechmann and Alex Vitvitskyi and Daniel Guo and Bilal Piot and Steven Kapturowski and Olivier Tieleman and Mart{\'\i}n Arjovsky and Alexander Pritzel and Andrew Bolt and others},
  journal = {arXiv preprint arXiv:2002.06038},
  title = {Never Give Up: Learning Directed Exploration Strategies},
  year = {2020},
}

@article{zhang2020learn,
  author = {Jin Zhang and Jianhao Wang and Hao Hu and Yingfeng Chen and Changjie Fan and Chongjie Zhang},
  journal = {arXiv preprint arXiv:2006.08170},
  title = {Learn to Effectively Explore in Context-Based Meta-{RL}},
  year = {2020},
}

@article{dorfman2020offline,
  author = {Ron Dorfman and Aviv Tamar},
  journal = {arXiv preprint arXiv:2008.02598},
  title = {Offline Meta Reinforcement Learning},
  year = {2020},
}

@article{hiraoka2020meta,
  author = {Takuya Hiraoka and Takahisa Imagawa and Voot Tangkaratt and Takayuki Osa and Takashi Onishi and Yoshimasa Tsuruoka},
  journal = {arXiv preprint arXiv:2006.02608},
  title = {Meta-Model-Based Meta-Policy Optimization},
  year = {2020},
}

@inproceedings{houthooft2018evolved, author = {Rein Houthooft and Yuhua Chen and Phillip Isola and Bradly Stadie and Filip Wolski and Jonathan Ho and Pieter Abbeel}, booktitle = {Advances in Neural Information Processing
Systems (NeurIPS)}, pages = {5400--5409}, title = {Evolved policy gradients}, year = {2018}, }

@article{liu2020imitation,
  author = {Evan Zheran Liu and Milad Hashemi and Kevin Swersky and Parthasarathy Ranganathan and Junwhan Ahn},
  journal = {arXiv preprint arXiv:2006.16239},
  title = {An Imitation Learning Approach for Cache Replacement},
  year = {2020},
}

@article{rieger2019interpretations,
  author = {Laura Rieger and Chandan Singh and W James Murdoch and Bin Yu},
  journal = {arXiv preprint arXiv:1909.13584},
  title = {Interpretations are useful: penalizing explanations to align neural networks with prior knowledge},
  year = {2019},
}

@article{goel2020model,
  author = {Karan Goel and Albert Gu and Yixuan Li and Christopher R{\'e}},
  journal = {arXiv preprint arXiv:2008.06775},
  title = {Model Patching: Closing the Subgroup Performance Gap with Data Augmentation},
  year = {2020},
}

@inproceedings{cidon2016cliffhanger,
  author = {Asaf Cidon and Assaf Eisenman and Mohammad Alizadeh and Sachin Katti},
  booktitle = {13th {USENIX} Symposium on Networked Systems Design and Implementation ({NSDI} 16)},
  pages = {379--392},
  title = {Cliffhanger: Scaling performance cliffs in web memory caches},
  year = {2016},
}

@inproceedings{leibfried2019unified,
  author = {Felix Leibfried and Sergio Pascual-Diaz and Jordi Grau-Moya},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {7869--7880},
  title = {A unified {Bellman} optimality principle combining reward maximization and empowerment},
  year = {2019},
}

@article{sohoni2020no,
  author = {Nimit S Sohoni and Jared A Dunnmon and Geoffrey Angus and Albert Gu and Christopher R{\'e}},
  journal = {arXiv preprint arXiv:2011.12945},
  title = {No Subclass Left Behind: Fine-Grained Robustness in Coarse-Grained Classification Problems},
  year = {2020},
}

@article{pezeshki2020gradient, author = {Mohammad Pezeshki and S{\'e}kou-Oumar Kaba and Yoshua Bengio and Aaron Courville and Doina Precup and Guillaume Lajoie},
journal = {arXiv preprint arXiv:2011.09468},
  title = {Gradient Starvation: A Learning Proclivity in Neural Networks},
  year = {2020},
}

@article{nam2020learning,
  author = {Junhyun Nam and Hyuntak Cha and Sungsoo Ahn and Jaeho Lee and Jinwoo Shin},
  journal = {arXiv preprint arXiv:2007.02561},
  title = {Learning from failure: Training debiased classifier from biased classifier},
  year = {2020},
}

@inproceedings{kim2019multiaccuracy,
  author = {Michael P Kim and Amirata Ghorbani and James Zou},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {247--254},
  title = {Multiaccuracy: Black-box post-processing for fairness in classification},
  year = {2019},
}

@article{cao2020heteroskedastic,
  author = {Kaidi Cao and Yining Chen and Junwei Lu and Nikos Arechiga and Adrien Gaidon and Tengyu Ma},
  journal = {arXiv preprint arXiv:2006.15766},
  title = {Heteroskedastic and imbalanced deep learning with adaptive regularization},
  year = {2020},
}

@article{nagarajan2020understanding,
  author = {Vaishnavh Nagarajan and Anders Andreassen and Behnam Neyshabur},
  journal = {arXiv preprint arXiv:2010.15775},
  title = {Understanding the failure modes of out-of-distribution generalization},
  year = {2020},
}

@article{levy2020large,
  author = {Daniel Levy and Yair Carmon and John C Duchi and Aaron Sidford},
  journal = {arXiv preprint arXiv:2010.05893},
  title = {Large-Scale Methods for Distributionally Robust Optimization},
  year = {2020},
}

@article{zhang2020coping,
  author = {Jingzhao Zhang and Aditya Menon and Andreas Veit and Srinadh Bhojanapalli and Sanjiv Kumar and Suvrit Sra},
  journal = {arXiv preprint arXiv:2010.12230},
  title = {Coping with Label Shift via Distributionally Robust Optimisation},
  year = {2020},
}

@inproceedings{zhang2018generalized,
  author = {Zhilu Zhang and Mert R Sabuncu},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Generalized cross entropy loss for training deep neural networks with noisy labels},
year = {2018},
}

@inproceedings{creager2021environment,
  author = {Elliot Creager and J{\"o}rn-Henrik Jacobsen and Richard Zemel},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {2189--2200},
  title = {Environment inference for invariant learning},
  year = {2021},
}

@article{utama2020towards,
  author = {Prasetya Ajie Utama and Nafise Sadat Moosavi and Iryna Gurevych},
  journal = {arXiv preprint arXiv:2009.12303},
  title = {Towards debiasing {NLU} models from unknown biases},
  year = {2020},
}

@article{yaghoobzadeh2019increasing,
  author = {Yadollah Yaghoobzadeh and Soroush Mehri and Remi Tachet and Timothy J Hazen and Alessandro Sordoni},
  journal = {arXiv preprint arXiv:1911.03861},
  title = {Increasing Robustness to Spurious Correlations using Forgettable Examples},
  year = {2019},
}

% Proper noun protected so sentence-casing styles keep the capital.
@inproceedings{nie2021play,
  author = {Allen Nie and Emma Brunskill and Chris Piech},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Play to Grade: Testing Coding Games as Classifying {Markov} Decision Process},
  year = {2021},
}

@inproceedings{wang2021alchemy,
  author = {Jane X Wang and Michael King and Nicolas Pierre Mickael Porcel and Zeb Kurth-Nelson and Tina Zhu and Charlie Deck and Peter Choy and Mary Cassin and Malcolm Reynolds and H Francis Song and others},
  booktitle = {Thirty-fifth Conference on Neural Information Processing Systems Datasets and Benchmarks Track (Round 2)},
  title = {Alchemy: A benchmark and analysis toolkit for meta-reinforcement learning agents},
  year = {2021},
}

@inproceedings{arndt2020meta,
  author = {Karol Arndt and Murtaza Hazara and Ali Ghadirzadeh and Ville Kyrki},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages = {2725--2731},
  title = {Meta reinforcement learning for sim-to-real domain adaptation},
  year = {2020},
}

@inproceedings{schoettler2020meta,
  author = {Gerrit Schoettler and Ashvin Nair and Juan Aparicio Ojea and Sergey Levine and Eugen Solowjow},
  booktitle =
{International Conference on Intelligent Robots and Systems (IROS)},
  pages = {9728--9735},
  title = {Meta-reinforcement learning for robotic industrial insertion tasks},
  year = {2020},
}

% Surname is Popovic with an acute accent on the c; the export had accented an i instead.
@inproceedings{orourke2014hint,
  author = {Eleanor O'Rourke and Christy Ballweber and Zoran Popovi{\'c}},
  booktitle = {Proceedings of the First ACM Conference on Learning @ Scale},
  pages = {51--60},
  title = {Hint systems may negatively impact performance in educational games},
  year = {2014},
}

@article{wu2021prototransformer,
  author = {Mike Wu and Noah Goodman and Chris Piech and Chelsea Finn},
  journal = {arXiv preprint arXiv:2107.14035},
  title = {{ProtoTransformer}: A Meta-Learning Approach to Providing Student Feedback},
  year = {2021},
}

@article{malik2019generative,
  author = {Ali Malik and Mike Wu and Vrinda Vasavada and Jinpeng Song and Madison Coots and John Mitchell and Noah Goodman and Chris Piech},
  journal = {arXiv preprint arXiv:1905.09916},
  title = {Generative Grading: Near Human-level Accuracy for Automated Feedback on Richly Structured Problems},
  year = {2019},
}

@article{bhatia2016automated,
  author = {Sahil Bhatia and Rishabh Singh},
  journal = {arXiv preprint arXiv:1603.06129},
  title = {Automated correction for syntax errors in programming assignments using recurrent neural networks},
  year = {2016},
}

% Venue string matches the other ICML entries in this file.
@inproceedings{piech2015learning,
  author = {Chris Piech and Jonathan Huang and Andy Nguyen and Mike Phulsuksombati and Mehran Sahami and Leonidas Guibas},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1093--1102},
  title = {Learning program embeddings to propagate feedback on student code},
  year = {2015},
}

@article{rivers2017data,
  author = {Kelly Rivers and Kenneth R Koedinger},
  journal = {International Journal of Artificial Intelligence in Education},
  number = {1},
  pages = {37--64},
  title = {Data-driven hint generation in vast solution spaces: a self-improving {Python} programming tutor},
  volume = {27},
  year = {2017},
}
@article{paassen2017continuous,
  author = {Benjamin Paa{\ss}en and Barbara Hammer and Thomas William Price and Tiffany Barnes and Sebastian Gross and Niels Pinkwart},
  journal = {arXiv preprint arXiv:1708.06564},
  title = {The continuous hint factory -- providing hints in vast and sparsely populated edit distance spaces},
  year = {2017},
}

@inproceedings{godefroid2017learn,
  author = {Patrice Godefroid and Hila Peleg and Rishabh Singh},
  booktitle = {Automated Software Engineering (ASE)},
  pages = {50--59},
  title = {Learn\&fuzz: Machine learning for input fuzzing},
  year = {2017},
}

@inproceedings{godefroid2008automated,
  author = {Patrice Godefroid and Michael Y Levin and David A Molnar and others},
  booktitle = {NDSS},
  pages = {151--166},
  title = {Automated whitebox fuzz testing},
  volume = {8},
  year = {2008},
}

@article{king1976symbolic,
  author = {James C King},
  journal = {Communications of the ACM},
  number = {7},
  pages = {385--394},
  title = {Symbolic execution and program testing},
  volume = {19},
  year = {1976},
}

@inproceedings{zheng2019wuji,
  author = {Yan Zheng and Xiaofei Xie and Ting Su and Lei Ma and Jianye Hao and Zhaopeng Meng and Yang Liu and Ruimin Shen and Yingfeng Chen and Changjie Fan},
  booktitle = {Automated Software Engineering (ASE)},
  pages = {772--784},
  title = {Wuji: Automatic online combat game testing using evolutionary deep reinforcement learning},
  year = {2019},
}

@article{gordillo2021improving,
  author = {Camilo Gordillo and Joakim Bergdahl and Konrad Tollmar and Linus Gissl{\'e}n},
  journal = {arXiv preprint arXiv:2103.13798},
  title = {Improving playtesting coverage via curiosity driven reinforcement learning agents},
  year = {2021},
}

% Volume 100 appeared as a named special issue rather than a numbered one,
% so the issue label is given as text. NOTE(review): confirm against the publisher record.
@article{froyd2012five,
  author = {Jeffrey E Froyd and Phillip C Wankat and Karl A Smith},
  journal = {Proceedings of the IEEE},
  number = {Special Centennial Issue},
  pages = {1344--1360},
  title = {Five major shifts in 100 years of engineering education},
  volume = {100},
  year = {2012},
}

@phdthesis{pfaffman2003manipulating,
  author = {Jay A Pfaffman},
school = {Vanderbilt University},
  title = {Manipulating and measuring student engagement in computer-based instruction},
  year = {2003},
}

% Filed like the other NeurIPS papers in this file: inproceedings with the shared booktitle string.
@inproceedings{piech2015deep,
  author = {Chris Piech and Jonathan Bassen and Jonathan Huang and Surya Ganguli and Mehran Sahami and Leonidas J Guibas and Jascha Sohl-Dickstein},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Deep knowledge tracing},
  volume = {28},
  year = {2015},
}

% First author is written in Last, First form so the trailing lowercase initial stays with the given names.
@inproceedings{d2008more,
  author = {Baker, Ryan S. J. d. and Albert T Corbett and Vincent Aleven},
  booktitle = {International Conference on Intelligent Tutoring Systems},
  pages = {406--415},
  title = {More accurate student modeling through contextual estimation of slip and guess probabilities in {Bayesian} knowledge tracing},
  year = {2008},
}

@inproceedings{villano1992probabilistic,
  author = {Michael Villano},
  booktitle = {International Conference on Intelligent Tutoring Systems},
  pages = {491--498},
  title = {Probabilistic student models: {Bayesian} belief networks and knowledge space theory},
  year = {1992},
}

@article{anderson1990cognitive,
  author = {John R Anderson and C Franklin Boyle and Albert T Corbett and Matthew W Lewis},
  journal = {Artificial Intelligence},
  number = {1},
  pages = {7--49},
  title = {Cognitive modeling and intelligent tutoring},
  volume = {42},
  year = {1990},
}

@article{balakrishnan2013predicting,
  author = {Girish Balakrishnan and Derrick Coetzee},
  journal = {Science},
  pages = {57--58},
  title = {Predicting student retention in massive open online courses using hidden {Markov} models},
  volume = {53},
  year = {2013},
}

@article{sass2018structural,
  author = {Daniel A Sass and Felicia Castro-Villarreal and Steve Wilkerson and Norma Guerra and Jeremy Sullivan},
  journal = {The Review of Higher Education},
  number = {1},
  pages = {103--135},
  title = {A structural model for predicting student retention},
  volume = {42},
  year = {2018},
}

@article{delen2011predicting,
  author = {Dursun Delen},
  journal = {Journal of College Student
Retention: Research, Theory \& Practice},
  number = {1},
  pages = {17--35},
  title = {Predicting student attrition with data mining methods},
  volume = {13},
  year = {2011},
}

@article{aulck2016predicting,
  author = {Lovenoor Aulck and Nishant Velagapudi and Joshua Blumenstock and Jevin West},
  journal = {arXiv preprint arXiv:1606.06364},
  title = {Predicting student dropout in higher education},
  year = {2016},
}

@article{nwana1990intelligent,
  author = {Hyacinth S Nwana},
  journal = {Artificial Intelligence Review},
  number = {4},
  pages = {251--277},
  title = {Intelligent tutoring systems: an overview},
  volume = {4},
  year = {1990},
}

% Organisation as author: the extra brace pair keeps it one indivisible name.
@misc{code2022org,
  author = {{Code.org}},
  howpublished = {\url{https://code.org/about}},
  title = {Code.org},
  year = {2022},
}

@inproceedings{singh2013automated,
  author = {Rishabh Singh and Sumit Gulwani and Armando Solar-Lezama},
  booktitle = {Proceedings of the 34th ACM SIGPLAN Conference on Programming Language Design and Implementation},
  pages = {15--26},
  title = {Automated feedback generation for introductory programming assignments},
  year = {2013},
}

@inproceedings{wang2017data,
  author = {Ke Wang and Benjamin Lin and Bjorn Rettig and Paul Pardi and Rishabh Singh},
  booktitle = {Proceedings of the Fourth (2017) ACM Conference on Learning @ Scale},
  pages = {257--260},
  title = {Data-driven feedback generator for online programing courses},
  year = {2017},
}

@inproceedings{glassman2015overcode,
  author = {Elena L Glassman and Jeremy Scott and Rishabh Singh and Philip J Guo and Robert C Miller},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  number = {2},
  pages = {1--35},
  title = {{OverCode}: Visualizing variation in student solutions to programming problems at scale},
  year = {2015},
}

@article{zheng2020ai,
  author = {Stephan Zheng and Alexander Trott and Sunil Srinivasa and Nikhil Naik and Melvin Gruesbeck and David C Parkes and Richard Socher},
  journal = {arXiv preprint arXiv:2004.13332},
  title = {The {AI} {Economist}: Improving equality and productivity with {AI}-driven tax policies},
  year = {2020},
}

@article{bansal2017emergent,
  author = {Trapit Bansal and Jakub Pachocki and Szymon Sidor and Ilya Sutskever and Igor Mordatch},
  journal = {arXiv preprint arXiv:1710.03748},
  title = {Emergent complexity via multi-agent competition},
  year = {2017},
}

@article{baker2019emergent,
  author = {Bowen Baker and Ingmar Kanitscheider and Todor Markov and Yi Wu and Glenn Powell and Bob McGrew and Igor Mordatch},
  journal = {arXiv preprint arXiv:1909.07528},
  title = {Emergent tool use from multi-agent autocurricula},
  year = {2019},
}

% Initials are separated so this author is spelled the same way as in hawkins2015you.
@article{monroe2017colors,
  author = {Will Monroe and Robert X. D. Hawkins and Noah D Goodman and Christopher Potts},
  journal = {arXiv preprint arXiv:1703.10186},
  title = {Colors in Context: A Pragmatic Neural Model for Grounded Language Understanding},
  year = {2017},
}

@inproceedings{ullman2016pragmatics,
  author = {Tomer D Ullman and Yang Xu and Noah D Goodman},
  booktitle = {Proceedings of the 38th Annual Conference of the Cognitive Science Society},
  title = {The Pragmatics of Spatial Language},
  year = {2016},
}

@article{horn1984toward,
  author = {Laurence Horn},
  journal = {Meaning, form, and use in context: Linguistic applications},
  pages = {11--42},
  title = {Toward a new taxonomy for pragmatic inference: {Q}-based and {R}-based implicature},
  year = {1984},
}

@book{allen2014reasoning,
  author = {James Allen and Henry Kautz and Richard Pelavin and Josh Tenenberg},
  publisher = {Morgan Kaufmann},
  title = {Reasoning about plans},
  year = {2014},
}

@inproceedings{allen2007plow,
  author = {James Allen and Nathanael Chambers and George Ferguson and Lucian Galescu and Hyuckchul Jung and Mary Swift and William Taysom},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {1514--1519},
  title = {{PLOW}: A collaborative task learning agent},
  year = {2007},
}

@article{perrault1980plan,
  author = {C Raymond Perrault and James F Allen},
  journal = {Computational
Linguistics},
  number = {3},
  pages = {167--182},
  title = {A plan-based analysis of indirect speech acts},
  volume = {6},
  year = {1980},
}

@book{lewis2008convention,
  author = {David Lewis},
  publisher = {John Wiley \& Sons},
  title = {Convention: A philosophical study},
  year = {2008},
}

% A monograph, so the press goes in publisher and its city in address.
% The exported volume and page numbers did not describe a journal issue and are dropped.
@book{clark1996using,
  author = {Herbert H Clark},
  publisher = {Cambridge University Press},
  address = {Cambridge},
  title = {Using language},
  year = {1996},
}

@article{van2003questioning,
  author = {Robert Van Rooy},
  journal = {Linguistics and Philosophy},
  number = {6},
  pages = {727--763},
  title = {Questioning to resolve decision problems},
  volume = {26},
  year = {2003},
}

@book{franke2009signal,
  author = {Michael Franke},
  publisher = {Institute for Logic, Language and Computation},
  title = {Signal to act: Game theory in pragmatics},
  year = {2009},
}

@article{crawford1990learning,
  author = {Vincent P Crawford and Hans Haller},
  journal = {Econometrica: Journal of the Econometric Society},
  pages = {571--595},
  title = {Learning how to cooperate: Optimal play in repeated coordination games},
  year = {1990},
}

% Venue spelled out to match the other Cognitive Science Society entries in this file.
@inproceedings{kao2014formalizing,
  author = {Justine T Kao and Leon Bergen and Noah Goodman},
  booktitle = {Proceedings of the 36th Annual Conference of the Cognitive Science Society},
  title = {Formalizing the Pragmatics of Metaphor Understanding},
  year = {2014},
}

@inproceedings{qing2014gradable,
  author = {Ciyang Qing and Michael Franke},
  booktitle = {Semantics and Linguistic Theory},
  pages = {23--41},
  title = {Gradable adjectives, vagueness, and optimal language use: A speaker-oriented model},
  volume = {24},
  year = {2014},
}

@article{goodman2016pragmatic,
  author = {Noah D Goodman and Michael C Frank},
  journal = {Trends in Cognitive Sciences},
  number = {11},
  pages = {818--829},
  title = {Pragmatic language interpretation as probabilistic inference},
  volume = {20},
  year = {2016},
}

@inproceedings{foerster2016learning,
  author = {Jakob Foerster and Yannis M Assael and Nando de Freitas and Shimon Whiteson},
  booktitle = {Advances in
Neural Information Processing Systems (NeurIPS)},
  pages = {2137--2145},
  title = {Learning to communicate with deep multi-agent reinforcement learning},
  year = {2016},
}

@inproceedings{lazaridou2017multi,
  author = {Angeliki Lazaridou and Alexander Peysakhovich and Marco Baroni},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Multi-agent cooperation and the emergence of (natural) language},
  year = {2017},
}

@inproceedings{mordatch2018emergence,
  author = {Igor Mordatch and Pieter Abbeel},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Emergence of Grounded Compositional Language in Multi-Agent Populations},
  year = {2018},
}

@inproceedings{sukhbaatar2016learning,
  author = {Sainbayar Sukhbaatar and Rob Fergus and others},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2244--2252},
  title = {Learning multiagent communication with backpropagation},
  year = {2016},
}

@inproceedings{peshkin2000learning,
  author = {Leonid Peshkin and Kee-Eung Kim and Nicolas Meuleau and Leslie Pack Kaelbling},
  booktitle = {Proceedings of the Sixteenth Conference on Uncertainty in Artificial Intelligence},
  pages = {489--496},
  title = {Learning to cooperate via policy search},
  year = {2000},
}

% Initials are separated so abbreviating styles keep both of them.
@book{box2011bayesian,
  author = {George E. P. Box and George C Tiao},
  publisher = {John Wiley \& Sons},
  title = {Bayesian inference in statistical analysis},
  volume = {40},
  year = {2011},
}

@book{shoham2008multiagent,
  author = {Yoav Shoham and Kevin Leyton-Brown},
  publisher = {Cambridge University Press},
  title = {Multiagent systems: Algorithmic, game-theoretic, and logical foundations},
  year = {2008},
}

@article{bernheim1984rationalizable,
  author = {B Douglas Bernheim},
  journal = {Econometrica: Journal of the Econometric Society},
  pages = {1007--1028},
  title = {Rationalizable strategic behavior},
  year = {1984},
}

@article{pearce1984rationalizable,
  author = {David G Pearce},
  journal =
{Econometrica: Journal of the Econometric Society},
  pages = {1029--1050},
  title = {Rationalizable strategic behavior and the problem of perfection},
  year = {1984},
}

@article{nowak1999evolutionary,
  author = {Martin A Nowak and Joshua B Plotkin and David C Krakauer},
  journal = {Journal of Theoretical Biology},
  number = {2},
  pages = {147--162},
  title = {The evolutionary language game},
  volume = {200},
  year = {1999},
}

@article{huttegger2010evolutionary,
  author = {Simon M Huttegger and Brian Skyrms and Rory Smead and Kevin J. S. Zollman},
  journal = {Synthese},
  number = {1},
  pages = {177--191},
  title = {Evolutionary dynamics of {Lewis} signaling games: signaling systems vs. partial pooling},
  volume = {172},
  year = {2010},
}

% Word spacing restored in the container description; the entry type is left as exported.
@article{kuhn2016extensive,
  author = {H Kuhn},
  journal = {In H. Kuhn and A. Tucker, editors, Contributions to the Theory of Games},
  pages = {193--216},
  title = {Extensive games and the problem of information},
  year = {2016},
}

% German nouns are brace-protected so sentence-casing styles do not lowercase them.
@inproceedings{zermelo1913anwendung,
  author = {Ernst Zermelo},
  booktitle = {Proceedings of the Fifth International Congress of Mathematicians},
  pages = {501--504},
  title = {{\"U}ber eine {Anwendung} der {Mengenlehre} auf die {Theorie} des {Schachspiels}},
  volume = {2},
  year = {1913},
}

@article{aumann1995backward,
  author = {Robert J Aumann},
  journal = {Games and Economic Behavior},
  number = {1},
  pages = {6--19},
  title = {Backward induction and common knowledge of rationality},
  volume = {8},
  year = {1995},
}

% TeX quote ligatures replace the straight double quotes, which typeset as two closing quotes.
@article{harsanyi2004games,
  author = {John C Harsanyi},
  journal = {Management Science},
  pages = {1804--1817},
  title = {Games with incomplete information played by {``Bayesian''} players},
  volume = {50},
  year = {2004},
}

@inproceedings{vogel2013implicatures,
  author = {Adam Vogel and Christopher Potts and Dan Jurafsky},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {74--80},
  title = {Implicatures and Nested Beliefs in Approximate Decentralized-{POMDP}s},
  year = {2013},
}

@article{grosz1986attention,
  author = {Barbara J
Grosz and Candace L Sidner},
  journal = {Computational Linguistics},
  number = {3},
  pages = {175--204},
  title = {Attention, intentions, and the structure of discourse},
  volume = {12},
  year = {1986},
}

@article{bobrow1977gus,
  author = {Daniel G Bobrow and Ronald M Kaplan and Martin Kay and Donald A Norman and Henry Thompson and Terry Winograd},
  journal = {Artificial Intelligence},
  number = {2},
  pages = {155--173},
  title = {{GUS}, a frame-driven dialog system},
  volume = {8},
  year = {1977},
}

% Three hyphens give the em dash that separates the system name from the subtitle.
@article{weizenbaum1966eliza,
  author = {Joseph Weizenbaum},
  journal = {Communications of the ACM},
  number = {1},
  pages = {36--45},
  title = {{ELIZA}---a computer program for the study of natural language communication between man and machine},
  volume = {9},
  year = {1966},
}

@article{allen1980analyzing,
  author = {James F Allen and C Raymond Perrault},
  journal = {Artificial Intelligence},
  number = {3},
  pages = {143--178},
  title = {Analyzing intention in utterances},
  volume = {15},
  year = {1980},
}

@article{allen2001toward,
  author = {James F Allen and Donna K Byron and Myroslava Dzikovska and George Ferguson and Lucian Galescu and Amanda Stent},
  journal = {AI Magazine},
  number = {4},
  title = {Toward conversational human-computer interaction},
  volume = {22},
  year = {2001},
}

@article{colby1971artificial,
  author = {Kenneth Mark Colby and Sylvia Weber and Franklin Dennis Hilf},
  journal = {Artificial Intelligence},
  number = {1},
  pages = {1--25},
  title = {Artificial paranoia},
  volume = {2},
  year = {1971},
}

% The accent needs its backslash; without it the name prints a literal apostrophe.
@book{perea2012epistemic,
  author = {Andr{\'e}s Perea},
  publisher = {Cambridge University Press},
  title = {Epistemic game theory: reasoning and choice},
  year = {2012},
}

@article{cao2013overview,
  author = {Yongcan Cao and Wenwu Yu and Wei Ren and Guanrong Chen},
  journal = {IEEE Transactions on Industrial Informatics},
  number = {1},
  pages = {427--438},
  title = {An overview of recent progress in the study of distributed multi-agent coordination},
  volume = {9},
  year = {2013},
}
@article{stone1998towards,
  author = {Peter Stone and Manuela Veloso},
  journal = {International Journal of Human-Computer Studies},
  number = {1},
  pages = {83--104},
  title = {Towards collaborative and adversarial learning: A case study in robotic soccer},
  volume = {48},
  year = {1998},
}

@inproceedings{lauer2000algorithm,
  author = {Martin Lauer and Martin Riedmiller},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {535--542},
  title = {An algorithm for distributed reinforcement learning in cooperative multi-agent systems},
  year = {2000},
}

@article{littman2001value,
  author = {Michael L Littman},
  journal = {Cognitive Systems Research},
  number = {1},
  pages = {55--66},
  title = {Value-function reinforcement learning in {Markov} games},
  volume = {2},
  year = {2001},
}

@article{louizos2015variational,
  author = {Christos Louizos and Kevin Swersky and Yujia Li and Max Welling and Richard Zemel},
  journal = {arXiv preprint arXiv:1511.00830},
  title = {The variational fair autoencoder},
  year = {2015},
}

@inproceedings{bolukbasi2016man,
  author = {Tolga Bolukbasi and Kai-Wei Chang and James Y Zou and Venkatesh Saligrama and Adam T Kalai},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {4349--4357},
  title = {Man is to computer programmer as woman is to homemaker? {Debiasing} word embeddings},
  year = {2016},
}

% Proper noun protected so sentence-casing styles keep the capital.
@inproceedings{maurer2009empirical,
  author = {Andreas Maurer and Massimiliano Pontil},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Empirical {Bernstein} bounds and sample variance penalization},
  year = {2009},
}

@article{rothblum2018probably,
  author = {Guy N Rothblum and Gal Yona},
  journal = {arXiv preprint arXiv:1803.03242},
  title = {Probably Approximately Metric-Fair Learning},
  year = {2018},
}

@book{clark1991grounding,
  author = {Herbert H. Clark and Susan E.
Brennan},
  pages = {127--149},
  publisher = {Perspectives on Socially Shared Cognition},
  title = {Grounding in Communication},
  year = {1991},
}

@inproceedings{andreas2016reasoning,
  author = {Jacob Andreas and Dan Klein},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1173--1182},
  title = {Reasoning about Pragmatics with Neural Listeners and Speakers},
  year = {2016},
}

@inproceedings{andreas2016learning,
  author = {Jacob Andreas and Marcus Rohrbach and Trevor Darrell and Dan Klein},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {1545--1554},
  title = {Learning to Compose Neural Networks for Question Answering},
  year = {2016},
}

@article{busoniu2008comprehensive,
  author = {Lucian Busoniu and Robert Babuska and Bart De Schutter},
  journal = {IEEE Transactions on Systems, Man, and Cybernetics, Part C},
  number = {2},
  pages = {156--172},
  title = {A comprehensive survey of multiagent reinforcement learning},
  volume = {38},
  year = {2008},
}

% The umlaut is wrapped as a brace group so BibTeX treats it as one letter when sorting and labelling.
% In the title the whole word after the question mark is protected, not a single letter.
@inproceedings{hawkins2015you,
  author = {Robert X. D. Hawkins and Andreas Stuhlm{\"u}ller and Judith Degen and Noah D. Goodman},
  booktitle = {Proceedings of the Thirty-Seventh Annual Conference of the Cognitive Science Society},
  title = {Why do you ask? {Good} questions provoke informative answers},
  year = {2015},
}

@inproceedings{zhang2013coordinating,
  author = {Chongjie Zhang and Victor Lesser},
  booktitle = {Proceedings of the 2013 International Conference on Autonomous Agents and Multi-agent Systems},
  pages = {1101--1108},
  title = {Coordinating Multi-agent Reinforcement Learning with Limited Communication},
  year = {2013},
}

@inproceedings{tan1993multi,
  author = {Ming Tan},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {330--337},
  title = {Multi-Agent Reinforcement Learning: Independent vs.
Cooperative Agents},
  year = {1993},
}

@book{dekel2015epistemic,
  author = {Eddie Dekel and Marciano Siniscalchi},
  pages = {619--702},
  publisher = {Handbook of Game Theory with Economic Applications},
  title = {Epistemic game theory},
  volume = {4},
  year = {2015},
}

@inproceedings{kilbertus2017avoiding,
  author = {Niki Kilbertus and Mateo Rojas Carulla and Giambattista Parascandolo and Moritz Hardt and Dominik Janzing and Bernhard Sch{\"o}lkopf},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {656--666},
  title = {Avoiding discrimination through causal reasoning},
  year = {2017},
}

% Initials are separated so this author is spelled the same way as in hawkins2015you.
@article{hawkins2015conducting,
  author = {Robert X. D. Hawkins},
  journal = {Behavior Research Methods},
  number = {4},
  pages = {966--976},
  title = {Conducting real-time multiplayer experiments on the web},
  volume = {47},
  year = {2015},
}

@article{bennett1962probability,
  author = {George Bennett},
  journal = {Journal of the American Statistical Association (JASA)},
  number = {297},
  pages = {33--45},
  title = {Probability inequalities for the sum of independent random variables},
  volume = {57},
  year = {1962},
}

% Accents need their backslash; without it the names print literal apostrophes.
@article{audibert2009exploration,
  author = {Jean-Yves Audibert and R{\'e}mi Munos and Csaba Szepesv{\'a}ri},
  journal = {Theoretical Computer Science},
  number = {19},
  pages = {1876--1902},
  title = {Exploration--exploitation tradeoff using variance estimates in multi-armed bandits},
  volume = {410},
  year = {2009},
}

@inproceedings{wang2013learning,
  author = {Tong Wang and Cynthia Rudin and Daniel Wagner and Rich Sevieri},
  booktitle = {European Conference on Machine Learning (ECML)},
  pages = {515--530},
  title = {Learning to detect patterns of crime},
  year = {2013},
}

@inproceedings{zafar2017fairness,
  author = {Muhammad Bilal Zafar and Isabel Valera and Manuel Gomez Rodriguez and Krishna P Gummadi},
  booktitle = {World Wide Web (WWW)},
  pages = {1171--1180},
  title = {Fairness beyond disparate treatment \& disparate impact: Learning classification without disparate
mistreatment},
  year = {2017},
}

@book{kenney2013mathematics,
  author = {John Francis Kenney},
  publisher = {D. Van Nostrand Company Inc; Toronto; Princeton; New Jersey; London; New York,; Affiliated East-West Press Pvt-Ltd; New Delhi},
  title = {Mathematics of statistics},
  year = {2013},
}

@article{kamiran2012data,
  author = {Faisal Kamiran and Toon Calders},
  journal = {Knowledge and Information Systems},
  number = {1},
  pages = {1--33},
  title = {Data preprocessing techniques for classification without discrimination},
  volume = {33},
  year = {2012},
}

% Proceedings of the IEEE is a journal, so this is an article with volume and issue.
@article{young2013pomdp,
  author = {Steve Young and Milica Ga{\v{s}}i{\'c} and Blaise Thomson and Jason D Williams},
  journal = {Proceedings of the IEEE},
  number = {5},
  pages = {1160--1179},
  title = {{POMDP}-based statistical spoken dialog systems: A review},
  volume = {101},
  year = {2013},
}

% Venue name put back into reading order from the inverted catalogue form.
@inproceedings{calders2009building,
  author = {Toon Calders and Faisal Kamiran and Mykola Pechenizkiy},
  booktitle = {IEEE International Conference on Data Mining Workshops (ICDMW)},
  pages = {13--18},
  title = {Building classifiers with independency constraints},
  year = {2009},
}

@article{zliobaite2015relation,
  author = {Indre Zliobaite},
  journal = {arXiv preprint arXiv:1505.05723},
  title = {On the relation between accuracy and fairness in binary classification},
  year = {2015},
}

@article{zhang2016identifying,
  author = {Zhe Zhang and Daniel B Neill},
  journal = {arXiv preprint arXiv:1611.08292},
  title = {Identifying significant predictive bias in classifiers},
  year = {2016},
}

% Not a personal name: the extra brace pair stops BibTeX splitting it into name parts.
@misc{law1983sensitive,
  author = {{official staff interpretations}},
  title = {Division of consumer and community affairs. 2011-07.
12 {CFR} supplement {I} to part 202},
  year = {1983},
}

@article{massart1990tight,
  author = {Pascal Massart},
  journal = {The Annals of Probability},
  pages = {1269--1283},
  title = {The tight constant in the {Dvoretzky-Kiefer-Wolfowitz} inequality},
  year = {1990},
}

@article{delage2010distributionally,
  author = {Erick Delage and Yinyu Ye},
  journal = {Operations Research},
  number = {3},
  pages = {595--612},
  title = {Distributionally robust optimization under moment uncertainty with application to data-driven problems},
  volume = {58},
  year = {2010},
}

@article{wang2016likelihood,
  author = {Zizhuo Wang and Peter W Glynn and Yinyu Ye},
  journal = {Computational Management Science},
  number = {2},
  pages = {241--261},
  title = {Likelihood robust optimization for data-driven problems},
  volume = {13},
  year = {2016},
}

@article{esfahani2018data,
  author = {Peyman Mohajerin Esfahani and Daniel Kuhn},
  journal = {Mathematical Programming},
  number = {1},
  pages = {115--166},
  title = {Data-driven distributionally robust optimization using the {Wasserstein} metric: Performance guarantees and tractable reformulations},
  volume = {171},
  year = {2018},
}

@book{berk2012criminal,
  author = {Richard Berk},
  publisher = {Springer Science \& Business Media},
  title = {Criminal justice forecasts of risk: A machine learning approach},
  year = {2012},
}

@book{becker2010economics,
  author = {Gary S Becker},
  publisher = {University of Chicago Press},
  title = {The economics of discrimination},
  year = {2010},
}

@article{corbett2018measure,
  author = {Sam Corbett-Davies and Sharad Goel},
  journal = {arXiv preprint arXiv:1808.00023},
  title = {The measure and mismeasure of fairness: A critical review of fair machine learning},
  year = {2018},
}

@article{arrow1973theory,
  author = {Kenneth Arrow},
  journal = {Discrimination in labor markets},
  number = {10},
  pages = {3--33},
  title = {The theory of discrimination},
  volume = {3},
  year = {1973},
}

@article{phelps1972statistical,
  author = {Edmund S Phelps},
  journal = {The
American Economic Review},
  number = {4},
  pages = {659--661},
  title = {The statistical theory of racism and sexism},
  volume = {62},
  year = {1972},
}

% Venue string matches the other Fairness, Accountability and Transparency entries in this file.
@inproceedings{madras2019fairness,
  author = {David Madras and Elliot Creager and Toniann Pitassi and Richard Zemel},
  booktitle = {Conference on Fairness, Accountability and Transparency},
  pages = {349--358},
  title = {Fairness through causal awareness: Learning causal latent-variable models for biased data},
  year = {2019},
}

@inproceedings{ustun2019fairness,
  author = {Berk Ustun and Yang Liu and David Parkes},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {6373--6382},
  title = {Fairness without harm: Decoupled classifiers with preference guarantees},
  year = {2019},
}

@inproceedings{lipton2018does,
  author = {Zachary Lipton and Julian McAuley and Alexandra Chouldechova},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {8125--8135},
  title = {Does mitigating {ML}'s impact disparity require treatment disparity?},
  year = {2018},
}

% Title uses a single brace pair so the bibliography style decides the casing.
@book{pearl2000causality,
  author = {Judea Pearl},
  publisher = {Springer},
  title = {Causality: Models, Reasoning and Inference},
  volume = {29},
  year = {2000},
}

@inproceedings{dwork2018decoupled,
  author = {Cynthia Dwork and Nicole Immorlica and Adam Tauman Kalai and Max Leiserson},
  booktitle = {Conference on Fairness, Accountability and Transparency},
  pages = {119--133},
  title = {Decoupled classifiers for group-fair and efficient machine learning},
  year = {2018},
}

% Journal name stored in full rather than as a legal-citation abbreviation.
@article{lehr2017playing,
  author = {David Lehr and Paul Ohm},
  journal = {UC Davis Law Review},
  pages = {653--717},
  title = {Playing with the data: what legal scholars should learn about machine learning},
  volume = {51},
  year = {2017},
}

@inproceedings{domingos2000unified,
  author = {Pedro Domingos},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {231--238},
  title = {A unified bias-variance decomposition},
  year = {2000},
}
@techreport{abel2017classical, author = {Andrew B Abel}, institution = {Working Paper}, title = {Classical measurement error with several regressors}, year = {2017}, } @article{miller1981inverse, author = {Kenneth S Miller}, journal = {Mathematics magazine}, number = {2}, pages = {67--72}, title = {On the inverse of the sum of matrices}, volume = {54}, year = {1981}, } @book{carroll2006measurement, author = {Raymond J Carroll and David Ruppert and Leonard A Stefanski and Ciprian M Crainiceanu}, publisher = {Chapman and Hall/CRC}, title = {Measurement error in nonlinear models: a modern perspective}, year = {2006}, } @book{o2016weapons, author = {Cathy O'Neil}, publisher = {Broadway Books}, title = {Weapons of math destruction: How big data increases inequality and threatens democracy}, year = {2016}, } @inproceedings{chouldechova2018case, author = {Alexandra Chouldechova and Diana Benavides-Prado and Oleksandr Fialko and Rhema Vaithianathan}, booktitle = {Conference on Fairness, Accountability and Transparency}, pages = {134--148}, title = {A case study of algorithm-assisted decision making in child maltreatment hotline screening decisions}, year = {2018}, } @book{fuller2009measurement, author = {Wayne A Fuller}, publisher = {John Wiley \& Sons}, title = {Measurement error models}, volume = {305}, year = {2009}, } @book{frisch1934statistical, author = {Ragnar Frisch}, publisher = {Universitetets {\O}konomiske Instituut}, title = {Statistical confluence analysis by means of complete regression systems}, volume = {5}, year = {1934}, } @book{wightman1998lsac, author = {Linda F Wightman and Henry Ramsey}, publisher = {Law School Admission Council}, title = {{LSAC} national longitudinal bar passage study}, year = {1998}, } @article{cortez2008using, author = {Paulo Cortez and Alice Maria Gon{\c{c}}alves Silva}, journal = {Proceedings of 5th FUture BUsiness TEChnology Conference}, title = {Using data mining to predict secondary school student performance}, year = {2008}, 
} @article{redmond2002data, author = {Michael Redmond and Alok Baveja}, journal = {European Journal of Operational Research}, number = {3}, pages = {660--678}, title = {A data-driven software tool for enabling cooperative information sharing among police departments}, volume = {141}, year = {2002}, } @article{sherman1950adjustment, author = {Jack Sherman and Winifred J Morrison}, journal = {The Annals of Mathematical Statistics}, number = {1}, pages = {124--127}, title = {Adjustment of an inverse matrix corresponding to a change in one element of a given matrix}, volume = {21}, year = {1950}, } @inproceedings{chiappa2019path, author = {Silvia Chiappa}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, pages = {7801--7808}, title = {Path-specific counterfactual fairness}, volume = {33}, year = {2019}, } @article{loftus2018causal, author = {Joshua R Loftus and Chris Russell and Matt J Kusner and Ricardo Silva}, journal = {arXiv preprint arXiv:1805.05859}, title = {Causal reasoning for algorithmic fairness}, year = {2018}, } @inproceedings{nabi2018fair, author = {Razieh Nabi and Ilya Shpitser}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {Fair inference on outcomes}, year = {2018}, } @article{pierson2017fast, author = {Emma Pierson and Sam Corbett-Davies and Sharad Goel}, journal = {arXiv preprint arXiv:1702.08536}, title = {Fast threshold tests for detecting discrimination}, year = {2017}, } @article{simoiu2017problem, author = {Camelia Simoiu and Sam Corbett-Davies and Sharad Goel and others}, journal = {The Annals of Applied Statistics}, number = {3}, pages = {1193--1216}, title = {The problem of infra-marginality in outcome tests for discrimination}, volume = {11}, year = {2017}, } @inproceedings{calmon2017optimized, author = {Flavio Calmon and Dennis Wei and Bhanukiran Vinzamuri and Karthikeyan Natesan Ramamurthy and Kush R Varshney}, booktitle = {Advances in Neural Information Processing 
Systems (NeurIPS)}, pages = {3992--4001}, title = {Optimized pre-processing for discrimination prevention}, year = {2017}, } @article{chouldechova2018frontiers, author = {Alexandra Chouldechova and Aaron Roth}, journal = {arXiv preprint arXiv:1810.08810}, title = {The frontiers of fairness in machine learning}, year = {2018}, } @article{bechavod2017penalizing, author = {Yahav Bechavod and Katrina Ligett}, journal = {arXiv preprint arXiv:1707.00044}, title = {Penalizing unfairness in binary classification}, year = {2017}, } @article{clarke2005phantom, author = {Kevin A Clarke}, journal = {Conflict management and peace science}, number = {4}, pages = {341--352}, title = {The phantom menace: Omitted variable bias in econometric research}, volume = {22}, year = {2005}, } @inproceedings{canetti2019soft, author = {Ran Canetti and Aloni Cohen and Nishanth Dikkala and Govind Ramnarayan and Sarah Scheffler and Adam Smith}, booktitle = {Proceedings of the Conference on Fairness, Accountability, and Transparency}, pages = {309--318}, title = {From soft classifiers to hard decisions: How fair can we be?}, year = {2019}, } @article{gan2017equivalence, author = {Shengjun Gan and Yuqin Sun and Yongge Tian}, journal = {Communications in Statistics-Theory and Methods}, number = {11}, pages = {5368--5383}, title = {Equivalence of predictors under real and over-parameterized linear models}, volume = {46}, year = {2017}, } @article{shah2018minimum, author = {Vatsal Shah and Anastasios Kyrillidis and Sujay Sanghavi}, journal = {stat}, title = {Minimum norm solutions do not always generalize well for over-parameterized problems}, volume = {1050}, year = {2018}, } @article{jung2018omitted, author = {Jongbin Jung and Sam Corbett-Davies and Ravi Shroff and Sharad Goel}, journal = {arXiv preprint arXiv:1809.05651}, title = {Omitted and Included Variable Bias in Tests for Disparate Impact}, year = {2018}, } @article{jammalamadaka2007inclusion, author = {S Rao Jammalamadaka and D Sengupta}, 
journal = {Statistics \& probability letters}, number = {12}, pages = {1235--1247}, title = {Inclusion and exclusion of data or parameters in the general linear model}, volume = {77}, year = {2007}, } @article{haslett1996updating, author = {Stephen Haslett}, journal = {Linear algebra and its applications}, pages = {329--349}, title = {Updating linear models with dependent errors to include additional data and/or parameters}, volume = {237}, year = {1996}, } @article{bertrand2004emily, author = {Marianne Bertrand and Sendhil Mullainathan}, journal = {American economic review}, number = {4}, pages = {991--1013}, title = {Are Emily and Greg more employable than Lakisha and Jamal? A field experiment on labor market discrimination}, volume = {94}, year = {2004}, } @article{greiner2011causal, author = {D James Greiner and Donald B Rubin}, journal = {Review of Economics and Statistics}, number = {3}, pages = {775--785}, title = {Causal effects of perceived immutable characteristics}, volume = {93}, year = {2011}, } @article{sen2016race, author = {Maya Sen and Omar Wasow}, journal = {Annual Review of Political Science}, number = {1}, pages = {499--522}, title = {Race as a bundle of sticks: Designs that estimate effects of seemingly immutable characteristics}, volume = {19}, year = {2016}, } @article{holland1986statistics, author = {Paul W Holland}, journal = {Journal of the American statistical Association}, number = {396}, pages = {945--960}, title = {Statistics and causal inference}, volume = {81}, year = {1986}, } @article{freedman2004graphical, author = {David A Freedman}, journal = {Evaluation Review}, number = {4}, pages = {267--293}, title = {Graphical models for causation, and the identification problem}, volume = {28}, year = {2004}, } @article{rosenbaum1984consequences, author = {Paul R Rosenbaum}, journal = {Journal of the Royal Statistical Society: Series A (General)}, number = {5}, pages = {656--666}, title = {The consequences of adjustment for a concomitant 
variable that has been affected by the treatment}, volume = {147}, year = {1984}, } @article{holland2003causation, author = {Paul W Holland}, journal = {ETS Research Report Series}, number = {1}, title = {Causation and race}, volume = {2003}, year = {2003}, } @inproceedings{kleinberg2019simplicity, author = {Jon Kleinberg and Sendhil Mullainathan}, booktitle = {Proceedings of the 2019 ACM Conference on Economics and Computation}, pages = {807--808}, title = {Simplicity creates inequity: implications for fairness, stereotypes, and interpretability}, year = {2019}, } @inproceedings{wang2019balanced, author = {Tianlu Wang and Jieyu Zhao and Mark Yatskar and Kai-Wei Chang and Vicente Ordonez}, booktitle = {International Conference on Computer Vision (ICCV)}, pages = {5310--5319}, title = {Balanced datasets are not enough: Estimating and mitigating gender bias in deep image representations}, year = {2019}, } @article{yurochkin2020sensei, author = {Mikhail Yurochkin and Yuekai Sun}, journal = {arXiv preprint arXiv:2006.14168}, title = {SenSeI: Sensitive Set Invariance for Enforcing Individual Fairness}, year = {2020}, } @inproceedings{dixon2018measuring, author = {Lucas Dixon and John Li and Jeffrey Sorensen and Nithum Thain and Lucy Vasserman}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, pages = {67--73}, title = {Measuring and mitigating unintended bias in text classification}, year = {2018}, } @inproceedings{garg2019counterfactual, author = {Sahaj Garg and Vincent Perot and Nicole Limtiaco and Ankur Taly and Ed H Chi and Alex Beutel}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, pages = {219--226}, title = {Counterfactual fairness in text classification through robustness}, year = {2019}, } @article{elhabian2008moving, author = {Shireen Y Elhabian and Khaled M El-Sayed and Sumaya H Ahmed}, journal = {Recent patents on computer science}, number = {1}, pages = {32--54}, title = {Moving object 
detection in spatial domain using background removal techniques-state-of-art}, volume = {1}, year = {2008}, } @article{beutel2017data, author = {Alex Beutel and Jilin Chen and Zhe Zhao and Ed H Chi}, journal = {arXiv preprint arXiv:1707.00075}, title = {Data decisions and theoretical implications when adversarially learning fair representations}, year = {2017}, } @inproceedings{zhao2019inherent, author = {H. Zhao and Geoff Gordon}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Inherent Tradeoffs in Learning Fair Representations}, year = {2019}, } @inproceedings{dutta2020ista, author = {Sanghamitra Dutta and Dennis Wei and Hazar Yueksel and Pin-Yu Chen and Sijia Liu and Kush R. Varshney}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Is There a Trade-Off Between Fairness and Accuracy? A Perspective Using Mismatched Hypothesis Testing}, year = {2020}, } @article{madras2018learning, author = {David Madras and Elliot Creager and Toniann Pitassi and Richard Zemel}, journal = {arXiv preprint arXiv:1802.06309}, title = {Learning adversarially fair and transferable representations}, year = {2018}, } @article{creager2019flexibly, author = {Elliot Creager and David Madras and J{\"o}rn-Henrik Jacobsen and Marissa A Weis and Kevin Swersky and Toniann Pitassi and Richard Zemel}, journal = {arXiv preprint arXiv:1906.02589}, title = {Flexibly fair representation learning by disentanglement}, year = {2019}, } @article{mcnamara2017provably, author = {Daniel McNamara and Cheng Soon Ong and Robert C Williamson}, journal = {arXiv preprint arXiv:1710.04394}, title = {Provably fair representations}, year = {2017}, } @article{sun2019mitigating, author = {Tony Sun and Andrew Gaut and Shirlyn Tang and Yuxin Huang and Mai ElSherief and Jieyu Zhao and Diba Mirza and Elizabeth Belding and Kai-Wei Chang and William Yang Wang}, journal = {arXiv preprint arXiv:1906.08976}, title = {Mitigating gender bias in natural language 
processing: Literature review}, year = {2019}, } @article{zhao2018learning, author = {Jieyu Zhao and Yichao Zhou and Zeyu Li and Wei Wang and Kai-Wei Chang}, journal = {arXiv preprint arXiv:1809.01496}, title = {Learning gender-neutral word embeddings}, year = {2018}, } @inproceedings{quadrianto2019discovering, author = {Novi Quadrianto and Viktoriia Sharmanska and Oliver Thomas}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {8227--8236}, title = {Discovering fair representations in the data domain}, year = {2019}, } @inproceedings{gunasekar2017implicit, author = {Suriya Gunasekar and Blake E Woodworth and Srinadh Bhojanapalli and Behnam Neyshabur and Nati Srebro}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {6151--6159}, title = {Implicit regularization in matrix factorization}, year = {2017}, } @inproceedings{oymak2019overparameterized, author = {Samet Oymak and Mahdi Soltanolkotabi}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {4951--4960}, title = {Overparameterized nonlinear learning: Gradient descent takes the shortest path?}, year = {2019}, } @inproceedings{hardt2016strategic, author = {Moritz Hardt and Nimrod Megiddo and Christos Papadimitriou and Mary Wootters}, booktitle = {Proceedings of the 2016 ACM conference on innovations in theoretical computer science}, pages = {111--122}, title = {Strategic classification}, year = {2016}, } @inproceedings{jung2020fair, author = {Christopher Jung and Sampath Kannan and Changhwa Lee and Mallesh Pai and Aaron Roth and Rakesh Vohra}, booktitle = {Proceedings of the 21st ACM Conference on Economics and Computation}, pages = {677--678}, title = {Fair prediction with endogenous behavior}, year = {2020}, } @article{bessi2016users, author = {Alessandro Bessi and Fabiana Zollo and Michela Del Vicario and Michelangelo Puliga and Antonio Scala and Guido Caldarelli and Brian Uzzi and Walter Quattrociocchi}, journal = {PloS one}, 
number = {8}, title = {Users polarization on Facebook and Youtube}, volume = {11}, year = {2016}, }

% Magazine article; the colon separates the headline from its subtitle.
@article{bojinov2020avoid,
  author = {Iavor Bojinov and Guillaume Saint-Jacques and Martin Tingley},
  journal = {Harvard Business Review},
  number = {2},
  pages = {48--53},
  title = {Avoid the Pitfalls of {A/B} Testing: Make sure your experiments recognize customers' varying needs},
  volume = {98},
  year = {2020},
}

% Venue string is spelled identically in both COLT entries below.
@inproceedings{luo2018efficient,
  author = {Haipeng Luo and Chen-Yu Wei and Alekh Agarwal and John Langford},
  booktitle = {Conference on Learning Theory (COLT)},
  pages = {1739--1776},
  title = {Efficient contextual bandits in non-stationary worlds},
  year = {2018},
}

% Third author: given names "Jennifer Wortman", surname "Vaughan".
@inproceedings{raghavan2018externalities,
  author = {Manish Raghavan and Aleksandrs Slivkins and Jennifer Wortman Vaughan and Zhiwei Steven Wu},
  booktitle = {Conference on Learning Theory (COLT)},
  pages = {1724--1738},
  title = {The externalities of exploration and how data diversity helps exploitation},
  year = {2018},
}

% Accented letters are written as LaTeX escapes, like the other accented
% names in this file; the product name is brace-protected so styles that
% sentence-case titles keep its capitalisation.
@article{abadi2015tensorflow,
  author = {Mart{\'\i}n Abadi and Ashish Agarwal and Paul Barham and Eugene Brevdo
            and Zhifeng Chen and Craig Citro and Gregory S. Corrado and Andy Davis
            and Jeffrey Dean and Matthieu Devin and Sanjay Ghemawat and Ian J. Goodfellow
            and Andrew Harp and Geoffrey Irving and Michael Isard and Yangqing Jia
            and Rafal J{\'o}zefowicz and Lukasz Kaiser and Manjunath Kudlur and Josh Levenberg
            and Dan Man{\'e} and Rajat Monga and Sherry Moore and Derek Gordon Murray
            and Chris Olah and Mike Schuster and Jonathon Shlens and Benoit Steiner
            and Ilya Sutskever and Kunal Talwar and Paul A. Tucker and Vincent Vanhoucke
            and Vijay Vasudevan and Fernanda B. Vi{\'e}gas and Oriol Vinyals and Pete Warden
            and Martin Wattenberg and Martin Wicke and Yuan Yu and Xiaoqiang Zheng},
  journal = {arXiv preprint arXiv:1603.04467},
  title = {{TensorFlow}: Large-Scale Machine Learning on Heterogeneous Distributed Systems},
  year = {2015},
}

@inproceedings{liu2016evaluate, author = {Chia-Wei Liu and Ryan Lowe and Iulian V.
Serban and Michael Noseworthy and Laurent Charlin and Joelle Pineau}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {How {NOT} To Evaluate Your Dialogue System: An Empirical Study of Unsupervised Evaluation Metrics for Dialogue Response Generation}, year = {2016}, }

@inproceedings{li2016diversity,
  author = {Jiwei Li and Michel Galley and Chris Brockett and Jianfeng Gao and William B. Dolan},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages = {110--119},
  title = {A Diversity-Promoting Objective Function for Neural Conversation Models},
  year = {2016},
}

@inproceedings{serban2017hierarchical,
  author = {Iulian Serban and Alessandro Sordoni and Ryan Lowe and Laurent Charlin and Joelle Pineau and Aaron C. Courville and Yoshua Bengio},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {A Hierarchical Latent Variable Encoder-Decoder Model for Generating Dialogues},
  year = {2017},
}

% NOTE(review): the journal field carries no arXiv identifier; add one once confirmed.
@article{sankaran2016temporal,
  author = {Baskaran Sankaran and Haitao Mi and Yaser Al-Onaizan and Abe Ittycheriah},
  journal = {arXiv},
  title = {Temporal Attention Model for Neural Machine Translation},
  year = {2016},
}

% The accented given name is a brace group starting with the accent command,
% so it typesets as an e-acute instead of a literal apostrophe.
@inproceedings{kiddon2016globally,
  author = {Chlo{\'e} Kiddon and Luke S. Zettlemoyer and Yejin Choi},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Globally Coherent Text Generation with Neural Checklist Models},
  year = {2016},
}

@inproceedings{tu2016modeling,
  author = {Zhaopeng Tu and Zhengdong Lu and Yang Liu and Xiaohua Liu and Hang Li},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Modeling Coverage for Neural Machine Translation},
  year = {2016},
}

@article{williams2016dstc, author = {Jason D.
Williams and Antoine Raux and Matthew Henderson}, journal = {Dialogue and Discourse}, title = {The Dialog State Tracking Challenge Series: A Review}, volume = {7}, year = {2016}, } @article{li2016user, author = {Xiujun Li and Zachary C. Lipton and Bhuwan Dhingra and Lihong Li and Jianfeng Gao and Yun-Nung Chen}, journal = {arXiv}, title = {A User Simulator for Task-Completion Dialogues}, year = {2016}, } @inproceedings{henaff2017tracking, author = {Mikael Henaff and Jason Weston and Arthur Szlam and Antoine Bordes and Yann LeCun}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Tracking the World State with Recurrent Entity Networks}, year = {2017}, } @inproceedings{mei2016what, author = {Hongyuan Mei and Mohit Bansal and Matthew R. Walter}, booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)}, title = {What to talk about and how? Selective Generation using {LSTM}s with Coarse-to-Fine Alignment}, year = {2016}, } @inproceedings{serban2017multiresolution, author = {Iulian Serban and Tim Klinger and Gerald Tesauro and Kartik Talamadupula and Bowen Zhou and Yoshua Bengio and Aaron C. Courville}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {Multiresolution Recurrent Neural Networks: An Application to Dialogue Response Generation}, year = {2017}, } @inproceedings{williams2017dialog, author = {Jason D. 
Williams and Kavoshi Asadi and Geoffrey Zweig}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Hybrid Code Networks: Practical and Efficient End-to-End Dialog Control with Supervised and Reinforcement Learning}, year = {2017}, } @inproceedings{dhingra2017information, author = {Bhuwan Dhingra and Lihong Li and Xiujun Li and Jianfeng Gao and Yun-Nung Chen and Faisal Ahmed and Li Deng}, booktitle = {Association for Computational Linguistics (ACL)}, title = {End-to-End Reinforcement Learning of Dialogue Agents for Information Access}, year = {2017}, } @article{maluuba2016frames, author = {Layla El Asri and Hannes Schulz and Shikhar Sharma and Jeremie Zumer and Justin Harris and Emery Fine and Rahul Mehrotra and Kaheer Suleman}, journal = {Maluuba Technical Report}, title = {Frames: A Corpus for Adding Memory to Goal-Oriented Dialogue Systems}, year = {2016}, } @inproceedings{bordes2017learning, author = {Antoine Bordes and Jason Weston}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Learning End-to-End Goal-Oriented Dialog}, year = {2017}, } @inproceedings{li2016rl, author = {Jiwei Li and Will Monroe and Alan Ritter and Daniel Jurafsky and Michel Galley and Jianfeng Gao}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Deep Reinforcement Learning for Dialogue Generation}, year = {2016}, } @inproceedings{ivanovic2005dialogue, author = {Edward Ivanovic}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Dialogue Act Tagging for Instant Messaging Chat Sessions}, year = {2005}, } @inproceedings{keizer2017negotiation, author = {Simon Keizer and Markus Guhe and Heriberto Cuayahuitl and Ioannis Efstathiou and Klaus-Peter Engelbrecht and Mihai Dobre and Alex Lascarides and Oliver Lemon}, booktitle = {European Association for Computational Linguistics (EACL)}, title = {Evaluating Persuasion Strategies and Deep Reinforcement Learning Methods for Negotiation 
Dialogue Agents}, year = {2017}, }

@inproceedings{mei2017coherent,
  author = {Hongyuan Mei and Mohit Bansal and Matthew R. Walter},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Coherent Dialogue with Attention-Based Language Models},
  year = {2017},
}

% The corpus name is brace-protected so sentence-casing styles keep its capital.
@article{lowe2017ubuntu,
  author = {Ryan Thomas Lowe and Nissan Pow and Iulian Serban and Laurent Charlin and Chia-Wei Liu and Joelle Pineau},
  journal = {Dialogue and Discourse},
  title = {Training End-to-End Dialogue Systems with the {Ubuntu} Dialogue Corpus},
  volume = {8},
  year = {2017},
}

@article{su2016continuous,
  author = {Pei-hao Su and Milica Gasic and Nikola Mrksic and Lina Maria Rojas-Barahona and Stefan Ultes and David Vandyke and Tsung-Hsien Wen and Steve J. Young},
  journal = {arXiv preprint arXiv:1606.02689},
  title = {Continuously Learning Neural Dialogue Management},
  year = {2016},
}

@article{clark1986collaborative,
  author = {Herbert H. Clark and Deanna Wilkes-Gibbs},
  journal = {Cognition},
  title = {Referring as a Collaborative Process},
  volume = {22},
  year = {1986},
}

@inproceedings{shen2017style,
  author = {Tianxiao Shen and Tao Lei and Regina Barzilay and Tommi Jaakkola},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Style Transfer from Non-Parallel Text by Cross-Alignment},
  year = {2017},
}

@inproceedings{fu2018style,
  author = {Zhenxin Fu and Xiaoye Tan and Nanyun Peng and Dongyan Zhao and Rui Yan},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Style Transfer in Text: Exploration and Evaluation},
  year = {2018},
}

% Four authors, each separated by exactly one "and".
@inproceedings{vincent2008denoise,
  author = {Pascal Vincent and Hugo Larochelle and Yoshua Bengio and Pierre-Antoine Manzagol},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Extracting and Composing Robust Features with Denoising Autoencoders},
  year = {2008},
}

@article{lample2017unsupervised, author = {Guillaume Lample and Ludovic Denoyer
and Marc'Aurelio Ranzato}, journal = {arXiv preprint arXiv:1711.00043}, title = {Unsupervised Machine Translation Using Monolingual Corpora Only}, year = {2017}, } @inproceedings{zhu2017cycle, author = {Zhu, Jun-Yan and Park, Taesung and Isola, Phillip and Efros, Alexei A}, booktitle = {International Conference on Computer Vision (ICCV)}, title = {Unpaired Image-to-Image Translation using Cycle-Consistent Adversarial Networks}, year = {2017}, } @article{artetxe2017nmt, author = {Mikel Artetxe and Gorka Labaka and Eneko Agirre and Kyunghyun Cho}, journal = {arXiv preprint arXiv:1710.11041}, title = {Unsupervised Neural Machine Translation}, year = {2017}, } @article{pavlick2017style, author = {Ellie Pavlick and Joel Tetreault}, journal = {Transactions of the Association for Computational Linguistics (TACL)}, title = {An Empirical Analysis of Formality in Online Communication}, volume = {4}, year = {2017}, } @inproceedings{recasens2013bias, author = {Marta Recasens and Cristian Danescu-Niculescu-Mizil and Dan Jurafsky}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Linguistic Models for Analyzing and Detecting Biased Language}, year = {2013}, } @article{newman2003lying, author = {Matthew L. Newman and James W. Pennebaker and Diane S. Berry and J. Michael Richards}, journal = {Personality and Social Psychology Bulletin}, title = {Lying Words: Predicting Deception From Linguistic Styles}, volume = {29}, year = {2003}, } @inproceedings{schwartz2017roc, author = {Roy Schwartz and Maarten Sap and Yannis Konstas and Li Zilles and Yejin Choi and Noah A. Smith}, booktitle = {Computational Natural Language Learning (CoNLL)}, title = {The Effect of Different Writing Tasks on Linguistic Style: A Case Study of the {ROC} Story Cloze Task}, year = {2017}, } @inproceedings{lewis2017deal, author = {Mike Lewis and Denis Yarats and Yann N. 
Dauphin and Devi Parikh and Dhruv Batra}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Deal or No Deal? End-to-End Learning for Negotiation Dialogues}, year = {2017}, }

% The accented given name uses a proper accent escape, and the middle initials
% are space-separated so each one is parsed as its own name token.
@inproceedings{das2017visdial,
  author = {Abhishek Das and Satwik Kottur and Khushi Gupta and Avi Singh and Deshraj Yadav and Jos{\'e} M. F. Moura and Devi Parikh and Dhruv Batra},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Visual Dialog},
  year = {2017},
}

@inproceedings{lu2017best,
  author = {Jiasen Lu and Anitha Kannan and Jianwei Yang and Devi Parikh and Dhruv Batra},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Best of Both Worlds: Transferring Knowledge from Discriminative Learning to a Generative Visual Dialog Model},
  year = {2017},
}

% Only the acronym is braced; the colon stays outside the group so styles
% can recognise it and keep the capital on the first word of the subtitle.
@article{matthew2012adadelta,
  author = {Matthew D. Zeiler},
  journal = {arXiv preprint arXiv:1212.5701},
  title = {{ADADELTA}: An Adaptive Learning Rate Method},
  year = {2012},
}

@article{igor2017attribute,
  author = {Igor Melnyk and Cicero Nogueira dos Santos and Kahini Wadhawan and Inkit Padhi and Abhishek Kumar},
  journal = {arXiv preprint arXiv:1711.09395},
  title = {Improved Neural Text Attribute Transfer with Non-parallel Data},
  year = {2017},
}

@inproceedings{guillaume2017fader,
  author = {Guillaume Lample and Neil Zeghidour and Nicolas Usunier and Antoine Bordes and Ludovic Denoyer and Marc'Aurelio Ranzato},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Fader Networks: Manipulating Images by Sliding Attributes},
  year = {2017},
}

% The model name is brace-protected so its internal capital survives title recasing.
@inproceedings{gan2017style,
  author = {Chuang Gan and Zhe Gan and Xiaodong He and Jianfeng Gao and Li Deng},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {{StyleNet}: Generating Attractive Visual Captions with Styles},
  year = {2017},
}

@inproceedings{zhao2018regularized, author = {Junbo Zhao and Yoon Kim and Kelly Zhang and Alexander M.
Rush and Yann LeCun}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Adversarially Regularized Autoencoders}, year = {2018}, } @inproceedings{he2016amazonreview, author = {Ruining He and Julian McAuley}, booktitle = {World Wide Web (WWW)}, title = {Ups and Downs: Modeling the Visual Evolution of Fashion Trends with One-class Collaborative Filtering}, year = {2016}, } @inproceedings{devault2015toward, author = {David DeVault and Johnathan Mell and Jonathan Gratch}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {Toward Natural Turn-taking in a Virtual Human Negotiation Agent}, year = {2015}, } @inproceedings{wen2017latent, author = {Tsung-Hsien Wen and Yishu Miao and Phil Blunsom and Steve Young}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Latent Intention Dialogue Models}, year = {2017}, } @inproceedings{zhao2018unsupervised, author = {Tiancheng Zhao and Kyusong Lee and Maxine Eskenazi}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Unsupervised Discrete Sentence Representation Learning for Interpretable Neural Dialog Generation}, year = {2018}, } @inproceedings{cao2018emergent, author = {Kris Cao and Angeliki Lazaridou and Marc Lanctot and Joel Z Leibo and Karl Tuyls and Stephen Clark}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Emergent Communication through Negotiation}, year = {2018}, } @inproceedings{cao2017latent, author = {Kris Cao and Stephen Clark}, booktitle = {European Association for Computational Linguistics (EACL)}, title = {Latent Variable Dialogue Models and Their Diversity}, year = {2017}, } @inproceedings{zhao2017learning, author = {Tiancheng Zhao and Ran Zhao and Maxine Eskenazi}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Learning Discourse-level Diversity for Neural Dialog Models using Conditional Variational Autoencoders}, year = {2017}, } 
@article{jang2017categorical,
  author = {Eric Jang and Shixiang Gu and Ben Poole},
  journal = {arXiv preprint arXiv:1611.01144},
  title = {Categorical Reparameterization with {G}umbel-Softmax},
  year = {2017},
}

% Accent macro restored (the backslash had been lost) and initials separated.
@inproceedings{das2017learning,
  author = {Abhishek Das and Satwik Kottur and Jos{\'e} M. F. Moura and Stefan Lee and Dhruv Batra},
  booktitle = {International Conference on Computer Vision (ICCV)},
  title = {Learning Cooperative Visual Dialog Agents with Deep Reinforcement Learning},
  year = {2017},
}

% Accented letters are written as LaTeX escapes so classic BibTeX sorts and labels them correctly.
@inproceedings{cuayahuitl2015strategic,
  author = {Heriberto Cuay{\'a}huitl and Simon Keizer and Oliver Lemon},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Strategic Dialogue Management via Deep Reinforcement Learning},
  year = {2015},
}

@inproceedings{afantenos2012modelling,
  author = {Stergos Afantenos and Nicholas Asher and Farah Benamara and Anais Cadilhac and Cedric D{\'e}gremont and Pascal Denis and Markus Guhe and Simon Keizer and Alex Lascarides and Oliver Lemon and others},
  booktitle = {Proceedings of SemDial 2012: Workshop on the Semantics and Pragmatics of Dialogue},
  pages = {167--168},
  title = {Modelling Strategic Conversation: Model, Annotation Design and Corpus},
  year = {2012},
}

@inproceedings{traum2008multi,
  author = {David Traum and Stacy C Marsella and Jonathan Gratch and Jina Lee and Arno Hartholt},
  booktitle = {International Workshop on Intelligent Virtual Agents},
  pages = {117--130},
  title = {Multi-party, Multi-issue, Multi-strategy Negotiation for Multi-modal Virtual Agents},
  year = {2008},
}

@inproceedings{asher2016catan,
  author = {Nicholas Asher and Julie Hunter and Mathieu Morey and Farah Benamara and Stergos Afantenos},
  booktitle = {Language Resources and Evaluation Conference (LREC)},
  title = {Discourse Structure and Dialogue Acts in Multiparty Dialogue: the {STAC} Corpus},
  year = {2016},
}

@inproceedings{efstathiou2014catan,
  author = {Ioannis Efstathiou and Oliver Lemon},
  booktitle = {Special Interest Group on
Discourse and Dialogue (SIGDIAL)},
  title = {Learning Non-Cooperative Dialogue Behaviours},
  year = {2014},
}

@inproceedings{hiraoka2015trading,
  author = {Takuya Hiraoka and Kallirroi Georgila and Elnaz Nouri and David Traum},
  booktitle = {Special Interest Group on Discourse and Dialogue (SIGDIAL)},
  title = {Reinforcement Learning in Multi-Party Trading Dialog},
  year = {2015},
}

@inproceedings{english2005mixed,
  author = {Michael S. English and Peter A. Heeman},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Learning Mixed Initiative Dialog Strategies by Using Reinforcement Learning on Both Conversants},
  year = {2005},
}

@book{brams2003negotiation,
  author = {Steven J Brams},
  publisher = {Psychology Press},
  title = {Negotiation Games: Applying Game Theory to Bargaining and Arbitration},
  year = {2003},
}

@inproceedings{hiraoka2014framing,
  author = {Hiraoka, Takuya and Neubig, Graham and Sakti, Sakriani and Toda, Tomoki and Nakamura, Satoshi},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  title = {Reinforcement Learning of Cooperative Persuasive Dialogue Policies using Framing},
  year = {2014},
}

@inproceedings{nouri2012cultural,
  author = {Nouri, Elnaz and Georgila, Kallirroi and Traum, David},
  booktitle = {The Annual Meeting of the Cognitive Science Society},
  title = {A Cultural Decision-making Model for Negotiation based on Inverse Reinforcement Learning},
  year = {2012},
}

@article{kao2015pun,
  author = {Justine T. Kao and Roger Levy and Noah D.
Goodman},
  journal = {Cognitive Science},
  title = {A Computational Model of Linguistic Humor in Puns},
  year = {2015},
}

@article{veale2004incongruity,
  author = {Veale, Tony},
  journal = {Humor: International Journal of Humor Research},
  title = {Incongruity in humor: Root cause or epiphenomenon?},
  volume = {17},
  year = {2004},
}

@inproceedings{semeval2017pun,
  author = {Samuel Doogan and Aniruddha Ghosh and Hanyang Chen and Tony Veale},
  booktitle = {The 11th International Workshop on Semantic Evaluation},
  title = {Idiom Savant at {S}em{E}val-2017 Task 7: Detection and Interpretation of {E}nglish Puns},
  year = {2017},
}

@article{zhu2015moviebook,
  author = {Yukun Zhu and Ryan Kiros and Richard Zemel and Ruslan Salakhutdinov and Raquel Urtasun and Antonio Torralba and Sanja Fidler},
  journal = {arXiv preprint arXiv:1506.06724},
  title = {Aligning Books and Movies: Towards Story-like Visual Explanations by Watching Movies and Reading Books},
  year = {2015},
}

@article{merity2016pointer,
  author = {Stephen Merity and Caiming Xiong and James Bradbury and Richard Socher},
  journal = {arXiv preprint arXiv:1609.07843},
  title = {Pointer Sentinel Mixture Models},
  year = {2016},
}

@inproceedings{pauls2012treelets,
  author = {Adam Pauls and Dan Klein},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Large-Scale Syntactic Language Modeling with Treelets},
  year = {2012},
}

@inproceedings{ghazvininejad2016poem,
  author = {Marjan Ghazvininejad and Xing Shi and Yejin Choi and Kevin Knight},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Generating Topical Poetry},
  year = {2016},
}

@inproceedings{zhang2014chinese,
  author = {Xingxing Zhang and Mirella Lapata},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Chinese Poetry Generation with Recurrent Neural Networks},
  year = {2014},
}

@inproceedings{peng2019plan,
  author = {Lili Yao and Nanyun Peng and Ralph Weischedel and Kevin Knight and Dongyan Zhao and Rui
Yan},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Plan-And-Write: Towards Better Automatic Storytelling},
  year = {2019},
}

@article{fang2018sounding,
  author = {Fang, Hao and Cheng, Hao and Sap, Maarten and Clark, Elizabeth and Holtzman, Ari and Choi, Yejin and Smith, Noah A and Ostendorf, Mari},
  journal = {arXiv preprint arXiv:1804.10202},
  title = {Sounding Board: A User-Centric and Content-Driven Social Chatbot},
  year = {2018},
}

@phdthesis{binsted1996jape,
  author = {Kim Binsted},
  school = {University of Edinburgh},
  title = {Machine Humour: An Implemented Model of Puns},
  year = {1996},
}

@inproceedings{ritchie2005computational,
  author = {Graeme Ritchie},
  booktitle = {the 10th European Natural Language Generation Workshop},
  title = {Computational Mechanisms for Pun Generation},
  year = {2005},
}

@inproceedings{petrovic2013unsupervised,
  author = {Sasa Petrovic and David Matthews},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Unsupervised Joke Generation from Big Data},
  year = {2013},
}

@inproceedings{valitutti2013adult,
  author = {Alessandro Valitutti and Hannu Toivonen and Antoine Doucet and Jukka M.
Toivanen},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {``Let Everything Turn Well in Your Wife'': Generation of Adult Humor Using Lexical Constraints},
  year = {2013},
}

@inproceedings{ginzburg2015understanding,
  author = {Jonathan Ginzburg and Ellen Breitholtz and Robin Cooper and Julian Hough and Ye Tian},
  booktitle = {Proceedings of the 20th Amsterdam Colloquium},
  title = {Understanding Laughter},
  year = {2015},
}

@inproceedings{peng2018towards,
  author = {Nanyun Peng and Marjan Ghazvininejad and Jonathan May and Kevin Knight},
  booktitle = {NAACL Workshop},
  title = {Towards Controllable Story Generation},
  year = {2018},
}

% Handbook chapter: stored as incollection, with the book title, publisher,
% address and series split into their own fields instead of one journal string.
@incollection{aarons2017puns,
  address = {New York, NY},
  author = {Debra Aarons},
  booktitle = {The Routledge Handbook of Language and Humor},
  publisher = {Routledge},
  series = {Routledge Handbooks in Linguistics},
  title = {Puns and Tacit Linguistic Knowledge},
  year = {2017},
}

@inproceedings{miller2017semeval,
  author = {Tristan Miller and Christian Hempelmann and Iryna Gurevych},
  booktitle = {Proceedings of the 11th International Workshop on Semantic Evaluation},
  title = {{S}em{E}val-2017 Task 7: Detection and Interpretation of {E}nglish Puns},
  year = {2017},
}

@inproceedings{yu2018neural,
  author = {Zhiwei Yu and Jiwei Tan and Xiaojun Wan},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {A Neural Approach to Pun Generation},
  year = {2018},
}

% Technical report: the issuing body belongs in the institution field.
@techreport{manurung2000towards,
  author = {Hisar Manurung and Graeme Ritchie and Henry Thompson},
  institution = {The University of Edinburgh},
  title = {Towards a Computational Model of Poetry Generation},
  year = {2000},
}

@inproceedings{meehan1977tale,
  author = {James R Meehan},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {{TALE-SPIN}, An Interactive Program that Writes Stories},
  year = {1977},
}

@article{levy2013surprisal,
  author = {Roger Levy and Edward Gibson},
  journal = {Frontiers in Psychology},
  title = {Surprisal, the {PDC}, and the Primary
Locus of Processing Difficulty in Relative Clauses},
  volume = {4},
  year = {2013},
}

@incollection{levy2013memory,
  author = {Roger Levy},
  booktitle = {Sentence Processing},
  title = {Memory and Surprisal in Human Sentence Comprehension},
  year = {2013},
}

% Acronyms are brace-protected so sentence-casing styles keep their capitals.
@inproceedings{banerjee2005meteor,
  author = {Satanjeev Banerjee and Alon Lavie},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {{METEOR}: An automatic metric for {MT} evaluation with improved correlation with human judgments},
  year = {2005},
}

@article{languagegans2018,
  author = {Massimo Caccia and Lucas Caccia and William Fedus and Hugo Larochelle and Joelle Pineau and Laurent Charlin},
  journal = {arXiv preprint arXiv:1811.02549},
  title = {Language {GANs} Falling Short},
  year = {2018},
}

@article{fan2018hierarchical,
  author = {Angela Fan and Mike Lewis and Yann Dauphin},
  journal = {arXiv preprint arXiv:1805.04833},
  title = {Hierarchical Neural Story Generation},
  year = {2018},
}

@article{theis2015note,
  author = {Lucas Theis and Aaron van den Oord and Matthias Bethge},
  journal = {arXiv preprint arXiv:1511.01844},
  title = {A note on the evaluation of generative models},
  year = {2015},
}

@article{karras2017progressive,
  author = {Tero Karras and Timo Aila and Samuli Laine and Jaakko Lehtinen},
  journal = {arXiv preprint arXiv:1710.10196},
  title = {Progressive Growing of {GANs} for Improved Quality, Stability, and Variation},
  year = {2017},
}

@article{sajjadi2018precision,
  author = {Mehdi S. M. Sajjadi and Olivier Bachem and Mario Lucic and Olivier Bousquet and Sylvain Gelly},
  journal = {arXiv preprint arXiv:1806.00035},
  title = {Assessing Generative Models via Precision and Recall},
  year = {2018},
}

@inproceedings{clarke2008diversity,
  author = {Charles L. A. Clarke and Maheedhar Kolla and Gordon V.
Cormack and Olga Vechtomova and Azin Ashkan and Stefan B{\"u}ttcher and Ian MacKinnon},
  booktitle = {ACM SIGIR},
  title = {Novelty and diversity in information retrieval evaluation},
  year = {2008},
}

% Journal paper (ACM TSLP), so it is an article with a journal field.
% NOTE(review): volume/number added from the published record; confirm.
@article{nenkova2007pyramid,
  author = {Ani Nenkova and Rebecca J. Passonneau and Kathleen McKeown},
  journal = {ACM Transactions on Speech and Language Processing},
  number = {2},
  title = {The Pyramid Method: Incorporating human content selection variation in summarization evaluation},
  volume = {4},
  year = {2007},
}

@article{yu2017seq,
  author = {Lantao Yu and Weinan Zhang and Jun Wang and Yong Yu},
  journal = {arXiv preprint arXiv:1609.05473},
  title = {{SeqGAN}: Sequence Generative Adversarial Nets with Policy Gradient},
  year = {2017},
}

@article{olsson2018skill,
  author = {Catherine Olsson and Surya Bhupatiraju and Tom Brown and Augustus Odena and Ian Goodfellow},
  journal = {arXiv preprint arXiv:1808.04888},
  title = {Skill Rating for Generative Models},
  year = {2018},
}

@article{klein2017opennmt,
  author = {Guillaume Klein and Yoon Kim and Yuntian Deng and Jean Senellart and Alexander M. Rush},
  journal = {arXiv preprint arXiv:1701.02810},
  title = {Open{NMT}: Open-Source Toolkit for Neural Machine Translation},
  year = {2017},
}

@article{vinyals2015convo,
  author = {Oriol Vinyals and Quoc V. Le},
  journal = {arXiv preprint arXiv:1506.05869},
  title = {A Neural Conversational Model},
  year = {2015},
}

@inproceedings{roemmele2016writing,
  author = {Melissa Roemmele},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Writing Stories with Help from Recurrent Neural Networks},
  year = {2016},
}

% NOTE(review): the 1979 issue is volume 1 (PAMI-1), number 3; the old value
% had the issue number in the volume field. Confirm against the publisher record.
@article{trunk1979problem,
  author = {G. V. Trunk},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  number = {3},
  pages = {306--307},
  title = {A Problem of Dimensionality: A Simple Example},
  volume = {1},
  year = {1979},
}

@inproceedings{gehrmann2018bottom,
  author = {Sebastian Gehrmann and Yuntian Deng and Alexander M.
Rush},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Bottom-Up Abstractive Summarization},
  year = {2018},
}

@article{galley2015delta,
  author = {Michel Galley and Chris Brockett and Alessandro Sordoni and Yangfeng Ji and Michael Auli and Chris Quirk and Margaret Mitchell and Jianfeng Gao and Bill Dolan},
  journal = {arXiv preprint arXiv:1506.06863},
  title = {{deltaBLEU}: A Discriminative Metric for Generation Tasks with Intrinsically Diverse Targets},
  year = {2015},
}

@article{jozefowicz2016exploring,
  author = {Rafal Jozefowicz and Oriol Vinyals and Mike Schuster and Noam Shazeer and Yonghui Wu},
  journal = {arXiv preprint arXiv:1602.02410},
  title = {Exploring the Limits of Language Modeling},
  year = {2016},
}

@book{surowiecki2004wisdom,
  author = {James Surowiecki},
  publisher = {Doubleday and Co},
  title = {The wisdom of crowds: Why the many are smarter than the few and how collective wisdom shapes business, economies, societies, and nations},
  year = {2004},
}

@inproceedings{shima2011diversity,
  author = {Hideki Shima and Teruko Mitamura},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Diversity-aware Evaluation for Paraphrase Patterns},
  year = {2011},
}

% The citation key spelling is kept as-is because documents cite it; the author field has the correct "Heusel".
@inproceedings{huesel2017gans,
  author = {Martin Heusel and Hubert Ramsauer and Thomas Unterthiner and Bernhard Nessler and Sepp Hochreiter},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{GANs} Trained by a Two Time-Scale Update Rule Converge to a Local {Nash} Equilibrium},
  year = {2017},
}

@inproceedings{bruni2017adversarial,
  author = {Elia Bruni and Raquel Fernandez},
  booktitle = {Proceedings of the SIGDIAL 2017 Conference},
  title = {Adversarial Evaluation for Open-Domain Dialogue Generation},
  year = {2017},
}

@inproceedings{kannan2016adversarial,
  author = {Anjuli Kannan and Oriol Vinyals},
  booktitle = {NIPS 2016 Workshop on Adversarial Training},
  title = {Adversarial Evaluation of Dialogue Models},
  year = {2016},
}
@inproceedings{sun2012joint,
  author = {Hong Sun and Ming Zhou},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Joint learning of a dual {SMT} system for paraphrase generation},
  year = {2012},
}

% Surname spelling corrected to "Mellers"; umlauts written as LaTeX escapes.
@inproceedings{ungar2012judgement,
  author = {Lyle Ungar and Barb Mellers and Ville Satop{\"a}{\"a} and Jon Baron and Phil Tetlock and Jaime Ramos and Sam Swift},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {The Good Judgment Project: A Large Scale Test of Different Methods of Combining Expert Predictions},
  year = {2012},
}

@inproceedings{haug2018neural,
  author = {Till Haug and Octavian-Eugen Ganea and Paulina Grnarova},
  booktitle = {European Conference on Information Retrieval},
  title = {Neural Multi-Step Reasoning for Question Answering on Semi-Structured Tables},
  year = {2018},
}

@inproceedings{desai2016program,
  author = {Aditya Desai and Sumit Gulwani and Vineet Hingorani and Nidhi Jain and Amey Karkare and Mark Marron and Sailesh R and Subhajit Roy},
  booktitle = {International Conference on Software Engineering (ICSE)},
  pages = {345--356},
  title = {Program synthesis using natural language},
  year = {2016},
}

@inproceedings{reddy2016transforming,
  author = {Siva Reddy and Oscar T{\"a}ckstr{\"o}m and Michael Collins and Tom Kwiatkowski and Dipanjan Das and Mark Steedman and Mirella Lapata},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {127--140},
  title = {Transforming dependency structures to logical forms for semantic parsing},
  year = {2016},
}

@inproceedings{kocisk2016semantic,
  author = {Tom{\'a}s Kocisk{\'y} and G{\'a}bor Melis and Edward Grefenstette and Chris Dyer and Wang Ling and Phil Blunsom and Karl Moritz Hermann},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1078--1087},
  title = {Semantic Parsing with Semi-Supervised Sequential Autoencoders},
  year = {2016},
}

@inproceedings{wang2006discriminative,
  author = {Ye-Yi Wang and Alex Acero},
booktitle = {InterSpeech},
  title = {Discriminative models for spoken language understanding},
  year = {2006},
}

@techreport{zhu2002learning,
  author = {Xiaojin Zhu and Zoubin Ghahramani},
  institution = {CMU CALD},
  title = {Learning from Labeled and Unlabeled Data with Label Propagation},
  year = {2002},
}

@inproceedings{indyk2004approximate,
  author = {Piotr Indyk},
  booktitle = {Symposium on Discrete Algorithms (SODA)},
  pages = {646--650},
  title = {Approximate nearest neighbor under edit distance via product metrics},
  year = {2004},
}

@inproceedings{nogueira2016end,
  author = {Rodrigo Nogueira and Kyunghyun Cho},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {End-to-End Goal-Driven Web Navigation},
  year = {2016},
}

@inproceedings{yeh2009sikuli,
  author = {Tom Yeh and Tsung-Hsiang Chang and Rob Miller},
  booktitle = {User Interface Software and Technology (UIST)},
  title = {Sikuli: using {GUI} screenshots for search and automation},
  year = {2009},
}

@inproceedings{mnih2016asynchronous,
  author = {Volodymyr Mnih and Adri{\`{a}} Puigdom{\`{e}}nech Badia and Mehdi Mirza and Alex Graves and Timothy P. Lillicrap and Tim Harley and David Silver and Koray Kavukcuoglu},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Asynchronous Methods for Deep Reinforcement Learning},
  year = {2016},
}

@inproceedings{brys2015reinforcement,
  author = {Tim Brys and Anna Harutyunyan and Halit Bener Suay and Sonia Chernova and Matthew E.
Taylor and Ann Now{\'{e}}},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {Reinforcement Learning from Demonstration through Shaping},
  year = {2015},
}

@inproceedings{hussein2017deep,
  author = {Ahmed Hussein and Eyad Elyan and Mohamed Medhat Gaber and Chrisina Jayne},
  booktitle = {International Joint Conference on Neural Networks},
  title = {Deep reward shaping from demonstrations},
  year = {2017},
}

@inproceedings{levine2013guided,
  author = {Sergey Levine and Vladlen Koltun},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Guided Policy Search},
  year = {2013},
}

% Accent macro restored: the backslash had been lost, leaving a literal apostrophe.
@article{ross2014reinforce,
  author = {St{\'{e}}phane Ross and J. Andrew Bagnell},
  journal = {arXiv preprint arXiv:1406.5979},
  title = {Reinforcement and Imitation Learning via Interactive No-Regret Learning},
  year = {2014},
}

@inproceedings{sun2017deeply,
  author = {Wen Sun and Arun Venkatraman and Geoffrey J. Gordon and Byron Boots and J. Andrew Bagnell},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Deeply {AggreVaTeD}: Differentiable Imitation Learning for Sequential Prediction},
  year = {2017},
}

@inproceedings{ziebart2008maximum,
  author = {Brian D. Ziebart and Andrew L. Maas and J. Andrew Bagnell and Anind K. Dey},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Maximum Entropy Inverse Reinforcement Learning},
  year = {2008},
}

@inproceedings{hosu2016playing,
  author = {Ionel-Alexandru Hosu and Traian Rebedea},
  booktitle = {Evaluating General Purpose AI},
  title = {Playing {A}tari Games with Deep Reinforcement Learning and Human Checkpoint Replay},
  year = {2016},
}

@inproceedings{hamilton2017inductive,
  author = {William L. Hamilton and Rex Ying and Jure Leskovec},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Inductive Representation Learning on Large Graphs},
  year = {2017},
}

@inproceedings{kipf2017semi,
  author = {Thomas N.
Kipf and Max Welling},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Semi-Supervised Classification with Graph Convolutional Networks},
  year = {2017},
}

@inproceedings{pham2017column,
  author = {Trang Pham and Truyen Tran and Dinh Phung and Svetha Venkatesh},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Column Networks for Collective Classification},
  year = {2017},
}

% Conference paper: the venue is a booktitle, not a journal.
@inproceedings{hammoudi2016why,
  author = {Mouna Hammoudi and Gregg Rothermel and Paolo Tonella},
  booktitle = {IEEE International Conference on Software Testing, Verification and Validation},
  title = {Why do Record/Replay Tests of Web Applications Break?},
  year = {2016},
}

@article{janner2018representation,
  author = {Michael Janner and Karthik Narasimhan and Regina Barzilay},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Representation Learning for Grounded Spatial Reasoning},
  volume = {6},
  year = {2018},
}

@inproceedings{fried2018unified,
  author = {Daniel Fried and Jacob Andreas and Dan Klein},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Unified Pragmatic Models for Generating and Following Instructions},
  year = {2018},
}

@inproceedings{su2017building,
  author = {Yu Su and Ahmed Hassan Awadallah and Madian Khabsa and Patrick Pantel and Michael Gamon and Mark J.
Encarnaci{\'o}n},
  booktitle = {Conference on Information and Knowledge Management (CIKM)},
  title = {Building Natural Language Interfaces to Web {APIs}},
  year = {2017},
}

@article{yin2016abcnn,
  author = {Wenpeng Yin and Hinrich Sch{\"u}tze and Bing Xiang and Bowen Zhou},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {{ABCNN}: Attention-Based Convolutional Neural Network for Modeling Sentence Pairs},
  volume = {4},
  year = {2016},
}

@inproceedings{yu2018qanet,
  author = {Adams Wei Yu and David Dohan and Minh-Thang Luong and Rui Zhao and Kai Chen and Mohammad Norouzi and Quoc V. Le},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {{QANet}: Combining Local Convolution with Global Self-Attention for Reading Comprehension},
  year = {2018},
}

@inproceedings{kiros2015skip,
  author = {Ryan Kiros and Yukun Zhu and Ruslan Salakhutdinov and Richard S. Zemel and Raquel Urtasun and Antonio Torralba and Sanja Fidler},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Skip-Thought Vectors},
  year = {2015},
}

@inproceedings{zajicek1998blind,
  author = {Mary Zajicek and Chris Powell and Chris Reeves},
  booktitle = {International ACM Conference on Assistive Technologies},
  title = {A Web Navigation Tool for the Blind},
  year = {1998},
}

@misc{soh2017tagui,
  author = {Ken Soh},
  howpublished = {\url{https://github.com/kelaberetiv/TagUI}},
  title = {{TagUI}: {RPA} / {CLI} tool for automating user interactions},
  year = {2017},
}

@inproceedings{spalteholz2008keysurf,
  author = {Leo Spalteholz and Kin Fun Li and Nigel Livingston and Foad Hamidi},
  booktitle = {World Wide Web (WWW)},
  title = {Keysurf: a character controlled browser for people with physical disabilities},
  year = {2008},
}

@article{yu2005haptics,
  author = {Wai Yu and Ravi Kuber and Emma Murphy and Philip Strain and Graham McAllister},
  journal = {Virtual Reality},
  title = {A novel multimodal interface for improving visually
impaired people's web accessibility},
  volume = {9},
  year = {2005},
}

@inproceedings{kumar2007eyepoint,
  author = {Manu Kumar and Andreas Paepcke and Terry Winograd},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {{EyePoint}: practical pointing and selection using gaze and keyboard},
  year = {2007},
}

@inproceedings{ashok2014wizard,
  author = {Vikas Ashok and Yevgen Borodin and Svetlana Stoyanchev and Yury Puzis and I. V. Ramakrishnan},
  booktitle = {Web for All Conference},
  title = {Wizard-of-{O}z evaluation of speech-driven web browsing interface for people with vision impairments},
  year = {2014},
}

@inproceedings{yu2017joint,
  author = {Licheng Yu and Hao Tan and Mohit Bansal and Tamara L. Berg},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {A Joint Speaker-Listener-Reinforcer Model for Referring Expressions},
  year = {2017},
}

% The cedilla is wrapped as a BibTeX special character so the surname is
% treated as starting with a single capital letter for sorting and labels.
@inproceedings{celikyilmaz2014resolving,
  author = {Asli {\c{C}}elikyilmaz and Zhaleh Feizollahi and Dilek Z. Hakkani-T{\"u}r and Ruhi Sarikaya},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Resolving Referring Expressions in Conversational Dialogs for Natural User Interfaces},
  year = {2014},
}

% NOTE(review): surname corrected from "Zarriai{\ss}" to "Zarrie{\ss}"; the key is left unchanged.
@inproceedings{zarriass2017obtaining,
  author = {Sina Zarrie{\ss} and David Schlangen},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Obtaining referential word meanings from visual and distributional information: Experiments on object naming},
  year = {2017},
}

@inproceedings{zavershynskyi2018naps,
  author = {Maksym Zavershynskyi and Alexander Skidanov and Illia Polosukhin},
  booktitle = {Workshop on Neural Abstract Machines \& Program Induction (NAMPI)},
  title = {{NAPS}: Natural Program Synthesis Dataset},
  year = {2018},
}

@inproceedings{yu2018syntaxsqlnet,
  author = {Tao Yu and Michihiro Yasunaga and Kai Yang and Rui Zhang and Dongxu Wang and Zifan Li and Dragomir R.
Radev},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{SyntaxSQLNet}: Syntax Tree Networks for Complex and Cross-Domain Text-to-{SQL} Task},
  year = {2018},
}

@inproceedings{dong2018coarse,
  author = {Li Dong and Mirella Lapata},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Coarse-to-Fine Decoding for Neural Semantic Parsing},
  year = {2018},
}

% Conference paper (ASE), so the venue is a booktitle.
% NOTE(review): the former "volume 30" looked like the conference ordinal and was dropped; confirm.
@inproceedings{oda2015learning,
  author = {Yusuke Oda and Hiroyuki Fudaba and Graham Neubig and Hideaki Hata and Sakriani Sakti and Tomoki Toda and Satoshi Nakamura},
  booktitle = {IEEE/ACM International Conference on Automated Software Engineering (ASE)},
  pages = {574--584},
  title = {Learning to Generate Pseudo-Code from Source Code Using Statistical Machine Translation},
  year = {2015},
}

@inproceedings{hartmann2010what,
  author = {Bj{\"o}rn Hartmann and Daniel MacDougall and Joel Brandt and Scott R. Klemmer},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {What would other programmers do: suggesting solutions to error messages},
  year = {2010},
}

@inproceedings{vasic2019neural,
  author = {Vasic, Marko and Kanade, Aditya and Maniatis, Petros and Bieber, David and Singh, Rishabh},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Neural Program Repair by Jointly Learning to Localize and Repair},
  year = {2019},
}

@inproceedings{brockschmidt2019generative,
  author = {Marc Brockschmidt and Miltiadis Allamanis and Alexander L.
Gaunt and Oleksandr Polozov},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Generative Code Modeling with Graphs},
  year = {2019},
}

@article{mudrakarta2018it,
  author = {Pramod Kaushik Mudrakarta and Ankur Taly and Mukund Sundararajan and Kedar Dhamdhere},
  journal = {arXiv preprint arXiv:1803.04579},
  title = {It was the training data pruning too!},
  year = {2018},
}

@inproceedings{yu2018spider,
  author = {Tao Yu and Rui Zhang and Kai Yang and Michihiro Yasunaga and Dongxu Wang and Zifan Li and James Ma and Irene Li and Qingning Yao and Shanelle Roman and Zilin Zhang and Dragomir R. Radev},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Spider: A Large-Scale Human-Labeled Dataset for Complex and Cross-Domain Semantic Parsing and Text-to-{SQL} Task},
  year = {2018},
}

@article{embley2016converting,
  author = {David W. Embley and Mukkai S. Krishnamoorthy and George Nagy and Sharad C. Seth},
  journal = {International Journal on Document Analysis and Recognition (IJDAR)},
  pages = {119--138},
  title = {Converting heterogeneous statistical tables on the web to searchable databases},
  volume = {19},
  year = {2016},
}

@inproceedings{omari2016lossless,
  author = {Adi Omari and Benny Kimelfeld and Eran Yahav and Sharon Shoham},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  title = {Lossless Separation of Web Pages into Layout Code and Data},
  year = {2016},
}

@article{kreuzer2015quantitative,
  author = {Robert Kreuzer and Jurriaan Hage and A. J.
Feelders},
  journal = {International Conference on Web Engineering (ICWE)},
  title = {A Quantitative Comparison of Semantic Web Page Segmentation Approaches},
  year = {2015},
}

@inproceedings{bing2014web,
  author = {Lidong Bing and Rui Guo and Wai Lam and Zheng-Yu Niu and Haifeng Wang},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {Web page segmentation with structured prediction and its application in web page classification},
  year = {2014},
}

@article{grigalis2014unsupervised,
  author = {Tomas Grigalis and Antanas Cenys},
  journal = {Journal of Universal Computer Science},
  pages = {169--192},
  title = {Unsupervised structured data extraction from template-generated web pages},
  volume = {20},
  year = {2014},
}

@inproceedings{kumar2011bricolage,
  author = {Ranjitha Kumar and Jerry O. Talton and Salman Ahmad and Scott R. Klemmer},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Bricolage: example-based retargeting for web design},
  year = {2011},
}

% Accent macro restored: the backslash had been lost, leaving a literal apostrophe.
@inproceedings{kumar2013webzeitgeist,
  author = {Ranjitha Kumar and Arvind Satyanarayan and C{\'e}sar Torres and Maxine Lim and Salman Ahmad and Scott R. Klemmer and Jerry O. Talton},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Webzeitgeist: design mining the web},
  year = {2013},
}

% Symposium paper: the venue is a booktitle, not a journal.
@inproceedings{spengler2010document,
  author = {Alex Spengler and Patrick Gallinari},
  booktitle = {ACM Symposium on Document Engineering},
  title = {Document structure meets page layout: loopy random fields for web news content extraction},
  year = {2010},
}

@inproceedings{gordon2018iqa,
  author = {Daniel Gordon and Aniruddha Kembhavi and Mohammad Rastegari and Joseph Redmon and Dieter Fox and Ali Farhadi},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {{IQA}: Visual Question Answering in Interactive Environments},
  year = {2018},
}

@inproceedings{hudson2019gqa,
  author = {Drew A. Hudson and Christopher D.
Manning},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {{GQA}: A New Dataset for Real-World Visual Reasoning and Compositional Question Answering},
  year = {2019},
}

@inproceedings{bisk2016evaluating,
  author = {Yonatan Bisk and Siva Reddy and John Blitzer and Julia Hockenmaier and Mark Steedman},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Evaluating Induced {CCG} Parsers on Grounded Semantic Parsing},
  year = {2016},
}

@inproceedings{su2016graphquestions,
  author = {Yu Su and Huan Sun and Brian M. Sadler and Mudhakar Srivatsa and Izzeddin Gur and Zenghui Yan and Xifeng Yan},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {On Generating Characteristic-rich Question Sets for {QA} Evaluation},
  year = {2016},
}

@inproceedings{locascio2016regex,
  author = {Nicholas Locascio and Kumaravelu Narasimhan and Eduardo DeLeon and Nate Kushman and Regina Barzilay},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Neural Generation of Regular Expressions from Natural Language with Minimal Domain Knowledge},
  year = {2016},
}

@inproceedings{polosukhin2018neural,
  author = {Illia Polosukhin and Alexander Skidanov},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Neural Program Search: Solving Programming Tasks from Description and Examples},
  year = {2018},
}

@article{he2006spoken,
  author = {Yulan He and Steve Young},
  journal = {Speech Communication},
  pages = {262--275},
  title = {Spoken language understanding using the hidden vector state model},
  volume = {48},
  year = {2006},
}

@article{hendrix1978developing,
  author = {Gary G Hendrix and Earl D Sacerdoti and Daniel Sagalowicz and Jonathan Slocum},
  journal = {ACM Transactions on Database Systems (TODS)},
  pages = {105--147},
  title = {Developing a natural language interface to complex data},
  volume = {3},
  year = {1978},
}

@inproceedings{szegedy2015googlenet,
  author = {Christian
Szegedy and Wei Liu and Yangqing Jia and Pierre Sermanet and Scott E. Reed and Dragomir Anguelov and Dumitru Erhan and Vincent Vanhoucke and Andrew Rabinovich},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Going deeper with convolutions},
  year = {2015},
}

@inproceedings{he2016resnet,
  author = {Kaiming He and Xiangyu Zhang and Shaoqing Ren and Jian Sun},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Deep Residual Learning for Image Recognition},
  year = {2016},
}

@inproceedings{pieraccini1991stochastic,
  author = {Roberto Pieraccini and Esther Levin and Chin-Hui Lee},
  booktitle = {Human Language Technology (HLT)},
  title = {Stochastic Representation of Conceptual Structure in the {ATIS} Task},
  year = {1991},
}

@inproceedings{raymond2007generative,
  author = {Christian Raymond and Giuseppe Riccardi},
  booktitle = {InterSpeech},
  title = {Generative and discriminative algorithms for spoken language understanding},
  year = {2007},
}

@article{mesnil2014using,
  author = {Gr{\'e}goire Mesnil and Yann Dauphin and Kaisheng Yao and Yoshua Bengio and Li Deng and Dilek Hakkani-Tur and Xiaodong He and Larry Heck and Gokhan Tur and Dong Yu},
  journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
  title = {Using recurrent neural networks for slot filling in spoken language understanding},
  volume = {23},
  year = {2014},
}

% Proper names are brace-protected so sentence-casing styles keep their capitals.
@misc{gabrilovich2013facc1,
  author = {Evgeniy Gabrilovich and Michael Ringgaard and Amarnag Subramanya},
  howpublished = {\url{http://lemurproject.org/clueweb09/}},
  title = {{FACC1}: {Freebase} annotation of {ClueWeb} corpora},
  year = {2013},
}

@inproceedings{fang2015captions,
  author = {Hao Fang and Saurabh Gupta and Forrest Iandola and Rupesh K Srivastava and Li Deng and Piotr Doll{\'a}r and Jianfeng Gao and Xiaodong He and Margaret Mitchell and John C Platt},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {From captions to visual concepts and back},
  year = {2015},
}
% Layout: one field per line, fields in alphabetical order, trailing comma kept.
% Braces inside titles protect acronyms and proper nouns from style recasing.
% Non-ASCII characters are written as LaTeX escapes so classic BibTeX sorts them correctly.

@inproceedings{mao2015deep,
  author = {Junhua Mao and Wei Xu and Yi Yang and Jiang Wang and Zhiheng Huang and Alan Yuille},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Deep captioning with multimodal recurrent neural networks (m-{RNN})},
  year = {2015},
}

@inproceedings{agrawal2016analyzing,
  author = {Aishwarya Agrawal and Dhruv Batra and Devi Parikh},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Analyzing the behavior of visual question answering models},
  year = {2016},
}

@inproceedings{goyal2017making,
  author = {Yash Goyal and Tejas Khot and Douglas Summers-Stay and Dhruv Batra and Devi Parikh},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Making the {V} in {VQA} matter: Elevating the role of image understanding in Visual Question Answering},
  year = {2017},
}

@inproceedings{andreas2016neural,
  author = {Jacob Andreas and Marcus Rohrbach and Trevor Darrell and Dan Klein},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Neural module networks},
  year = {2016},
}

@inproceedings{lopez2013evaluating,
  author = {Vanessa Lopez and Christina Unger and Philipp Cimiano and Enrico Motta},
  booktitle = {World Wide Web (WWW)},
  title = {Evaluating question answering over linked data},
  year = {2013},
}

@article{wang2018robust,
  author = {Chenglong Wang and Kedar Tatwawadi and Marc Brockschmidt and Po-Sen Huang and Yi Mao and Oleksandr Polozov and Rishabh Singh},
  journal = {arXiv preprint arXiv:1807.03100},
  title = {Robust text-to-{SQL} generation with execution-guided decoding},
  year = {2018},
}

@article{robertson2009probabilistic,
  author = {Stephen Robertson and Hugo Zaragoza},
  journal = {Foundations and Trends in Information Retrieval},
  title = {The probabilistic relevance framework: {BM25} and beyond},
  volume = {3},
  year = {2009},
}

@inproceedings{agichtein2000snowball,
  author = {Eugene Agichtein and Luis Gravano},
  booktitle = {Proceedings of the fifth ACM conference on Digital Libraries},
  title = {Snowball: Extracting relations from large plain-text collections},
  year = {2000},
}

@inproceedings{wang2015transition,
  author = {Chuan Wang and Nianwen Xue and Sameer Pradhan},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {A transition-based algorithm for {AMR} parsing},
  year = {2015},
}

@inproceedings{yakout2012infogather,
  author = {Mohamed Yakout and Kris Ganjam and Kaushik Chakrabarti and Surajit Chaudhuri},
  booktitle = {International Conference on Management of Data (SIGMOD)},
  title = {Infogather: entity augmentation and attribute discovery by holistic matching with web tables},
  year = {2012},
}

@inproceedings{dua2019drop,
  author = {Dheeru Dua and Yizhong Wang and Pradeep Dasigi and Gabriel Stanovsky and Sameer Singh and Matt Gardner},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {{DROP}: A Reading Comprehension Benchmark Requiring Discrete Reasoning Over Paragraphs},
  year = {2019},
}

@inproceedings{mitchell2015nell,
  author = {Tom Mitchell and William Cohen and Estevam Hruschka and Partha Talukdar and Bo Yang and Justin Betteridge and Andrew Carlson and B Dalvi and Matt Gardner and Bryan Kisiel and others},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Never-ending learning},
  year = {2015},
}

@inproceedings{yang2018hotpotqa,
  author = {Zhilin Yang and Peng Qi and Saizheng Zhang and Yoshua Bengio and William W Cohen and Ruslan Salakhutdinov and Christopher D Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{HotpotQA}: A dataset for diverse, explainable multi-hop question answering},
  year = {2018},
}

@inproceedings{hermann2014semantic,
  author = {Karl Moritz Hermann and Dipanjan Das and Jason Weston and Kuzman Ganchev},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Semantic frame identification with distributed word representations},
  year = {2014},
}

@article{pasca2003open,
  author = {Marius Pa{\c{s}}ca},
  journal = {Computational Linguistics},
  title = {Open-domain question answering from large text collections},
  volume = {29},
  year = {2003},
}

% A chapter in an edited book, so the book title belongs in booktitle rather than journal.
% NOTE(review): publisher supplied from memory; confirm against the book's front matter.
@incollection{hearst1998automated,
  author = {Marti A Hearst},
  booktitle = {WordNet: An Electronic Lexical Database},
  publisher = {MIT Press},
  title = {Automated discovery of {WordNet} relations},
  year = {1998},
}

@inproceedings{zeng2014relation,
  author = {Daojian Zeng and Kang Liu and Siwei Lai and Guangyou Zhou and Jun Zhao},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  title = {Relation classification via convolutional deep neural network},
  year = {2014},
}

@inproceedings{miwa2016end,
  author = {Makoto Miwa and Mohit Bansal},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {End-to-end relation extraction using {LSTMs} on sequences and tree structures},
  year = {2016},
}

@article{ritter2013modeling,
  author = {Alan Ritter and Luke Zettlemoyer and Mausam and Oren Etzioni},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Modeling missing data in distant supervision for information extraction},
  volume = {1},
  year = {2013},
}

@inproceedings{riedel2011robust,
  author = {Sebastian Riedel and Andrew McCallum},
  booktitle = {Proceedings of the BioNLP Shared Task 2011 Workshop},
  title = {Robust biomedical event extraction with dual decomposition and minimal domain adaptation},
  year = {2011},
}

@article{iyer2019learning,
  author = {Srinivasan Iyer and Alvin Cheung and Luke Zettlemoyer},
  journal = {arXiv preprint arXiv:1904.09086},
  title = {Learning Programmatic Idioms for Scalable Semantic Parsing},
  year = {2019},
}

@inproceedings{li2013joint,
  author = {Qi Li and Heng Ji and Liang Huang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Joint event extraction via structured prediction with global features},
  year = {2013},
}

@inproceedings{chen2015event,
  author = {Yubo Chen and Liheng Xu and Kang Liu and Daojian Zeng and Jun Zhao},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Event extraction via dynamic multi-pooling convolutional neural networks},
  year = {2015},
}

@inproceedings{gamon2013identifying,
  author = {Michael Gamon and Tae Yano and Xinying Song and Johnson Apacible and Patrick Pantel},
  booktitle = {Conference on Information and Knowledge Management (CIKM)},
  title = {Identifying salient entities in web pages},
  year = {2013},
}

@inproceedings{shen2014webpage,
  author = {Chengyao Shen and Qi Zhao},
  booktitle = {European Conference on Computer Vision (ECCV)},
  title = {Webpage saliency},
  year = {2014},
}

@inproceedings{bhagavatula2015tabel,
  author = {Chandra Sekhar Bhagavatula and Thanapon Noraset and Doug Downey},
  booktitle = {International Semantic Web Conference (ISWC)},
  title = {{TabEL}: entity linking in web tables},
  year = {2015},
}

@inproceedings{madaan2016numerical,
  author = {Aman Madaan and Ashish Mittal and Ganesh Ramakrishnan and Sunita Sarawagi},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Numerical relation extraction with minimal supervision},
  year = {2016},
}

@inproceedings{govindaraju2013understanding,
  author = {Vidhya Govindaraju and Ce Zhang and Christopher R{\'e}},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Understanding tables in context using standard {NLP} toolkits},
  year = {2013},
}

@phdthesis{zhang2015deepdive,
  author = {Ce Zhang},
  school = {University of Wisconsin-Madison},
  title = {{DeepDive}: a data management system for automatic knowledge base construction},
  year = {2015},
}

@inproceedings{labutov2018learning,
  author = {Igor Labutov and Bishan Yang and Tom Mitchell},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Learning to Learn Semantic Parsers from Natural Language Supervision},
  year = {2018},
}

@inproceedings{wang2017program,
  author = {Xinyu Wang and Isil Dillig and Rishabh Singh},
  booktitle = {Principles of Programming Languages (POPL)},
  title = {Program synthesis using abstraction refinement},
  year = {2017},
}

@inproceedings{misra2018policy,
  author = {Dipendra Misra and Ming-Wei Chang and Xiaodong He and Wen-tau Yih},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Policy Shaping and Generalized Update Equations for Semantic Parsing from Denotations},
  year = {2018},
}

@inproceedings{neelakantan2017learning,
  author = {Arvind Neelakantan and Quoc V Le and Martin Abadi and Andrew McCallum and Dario Amodei},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Learning a natural language interface with neural programmer},
  year = {2017},
}

@article{dhamdhere2017abductive,
  author = {Kedar Dhamdhere and Kevin S McCurley and Mukund Sundararajan and Ankur Taly},
  journal = {arXiv preprint arXiv:1709.03036},
  title = {Abductive Matching in Question Answering},
  year = {2017},
}

@inproceedings{dhamdhere2017analyza,
  author = {Kedar Dhamdhere and Kevin S McCurley and Ralfi Nahmias and Mukund Sundararajan and Qiqi Yan},
  booktitle = {Proceedings of the 22nd International Conference on Intelligent User Interfaces},
  title = {Analyza: Exploring data with conversation},
  year = {2017},
}

@inproceedings{biloki2019neural,
  author = {Jacob Biloki and Chen Liang and Ni Lao},
  booktitle = {Deep Reinforcement Learning Meets Structured Prediction Workshop at ICLR 2019},
  title = {Neural Program Planner for Structured Predictions},
  year = {2019},
}

@article{agarwal2019learning,
  author = {Rishabh Agarwal and Chen Liang and Dale Schuurmans and Mohammad Norouzi},
  journal = {arXiv preprint arXiv:1902.07198},
  title = {Learning to Generalize from Sparse and Underspecified Rewards},
  year = {2019},
}

@inproceedings{mou2017coupling,
  author = {Lili Mou and Zhengdong Lu and Hang Li and Zhi Jin},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Coupling distributed and symbolic execution for natural language queries},
  year = {2017},
}

@inproceedings{iyyer2017search,
  author = {Mohit Iyyer and Wen-tau Yih and Ming-Wei Chang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Search-based neural structured learning for sequential question answering},
  year = {2017},
}

@inproceedings{dong2018confidence,
  author = {Li Dong and Chris Quirk and Mirella Lapata},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Confidence modeling for neural semantic parsing},
  year = {2018},
}

@inproceedings{lehnert1977conceptual,
  author = {Wendy G Lehnert},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {A conceptual theory of question answering},
  year = {1977},
}

@article{hirschman2001natural,
  author = {Lynette Hirschman and Robert Gaizauskas},
  journal = {Natural Language Engineering},
  title = {Natural language question answering: the view from here},
  volume = {7},
  year = {2001},
}

@inproceedings{abiteboul1997querying,
  author = {Serge Abiteboul},
  booktitle = {International Conference on Database Theory},
  title = {Querying semi-structured data},
  year = {1997},
}

@article{mchugh1997lore,
  author = {Jason McHugh and Serge Abiteboul and Roy Goldman and Dallan Quass and Jennifer Widom},
  journal = {SIGMOD record},
  title = {Lore: A database management system for semistructured data},
  volume = {26},
  year = {1997},
}

@article{burke1997question,
  author = {Robin D Burke and Kristian J Hammond and Vladimir Kulyukin and Steven L Lytinen and Noriko Tomuro and Scott Schoenberg},
  journal = {AI magazine},
  title = {Question answering from frequently asked question files: Experiences with the {FAQ} finder system},
  volume = {18},
  year = {1997},
}

@article{soricut2006automatic,
  author = {Radu Soricut and Eric Brill},
  journal = {Information Retrieval},
  title = {Automatic question answering using the web: Beyond the factoid},
  volume = {9},
  year = {2006},
}

@inproceedings{kwiatkowski2019natural,
  author = {Tom Kwiatkowski and Jennimaria Palomaki and Olivia Redfield and Michael Collins and Ankur Parikh and Chris Alberti and Danielle Epstein and Illia Polosukhin and Matthew Kelcey and Jacob Devlin and Kenton Lee and Kristina N. Toutanova and Llion Jones and Ming-Wei Chang and Andrew Dai and Jakob Uszkoreit and Quoc Le and Slav Petrov},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Natural Questions: A Benchmark for Question Answering Research},
  year = {2019},
}

@inproceedings{cafarella2009data,
  author = {Michael J Cafarella and Alon Halevy and Nodira Khoussainova},
  booktitle = {Very Large Data Bases (VLDB)},
  title = {Data integration for the relational web},
  year = {2009},
}

@inproceedings{katz2002omnibase,
  author = {Boris Katz and Sue Felshin and Deniz Yuret and Ali Ibrahim and Jimmy Lin and Gregory Marton and Alton Jerome McFarland and Baris Temelkuran},
  booktitle = {International Conference on Application of Natural Language to Information Systems},
  title = {Omnibase: Uniform access to heterogeneous data for question answering},
  year = {2002},
}

@inproceedings{yang2016stacked,
  author = {Zichao Yang and Xiaodong He and Jianfeng Gao and Li Deng and Alex Smola},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Stacked attention networks for image question answering},
  year = {2016},
}

% Comma form keeps the two-word surname together when BibTeX splits the name.
@article{jones1972tfidf,
  author = {Sparck Jones, Karen},
  journal = {Journal of documentation},
  title = {A statistical interpretation of term specificity and its application in retrieval},
  volume = {28},
  year = {1972},
}

@article{carpineto2012expansion,
  author = {Claudio Carpineto and Giovanni Romano},
  journal = {ACM Computing Surveys (CSUR)},
  title = {A survey of automatic query expansion in information retrieval},
  volume = {44},
  year = {2012},
}

@inproceedings{cao2006adapting,
  author = {Yunbo Cao and Jun Xu and Tie-Yan Liu and Hang Li and Yalou Huang and Hsiao-Wuen Hon},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {Adapting ranking {SVM} to document retrieval},
  year = {2006},
}

@inproceedings{yue2007support,
  author = {Yisong Yue and Thomas Finley and Filip Radlinski and Thorsten Joachims},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {A support vector method for optimizing average precision},
  year = {2007},
}

@inproceedings{haveliwala2002topic,
  author = {Taher H Haveliwala},
  booktitle = {World Wide Web (WWW)},
  title = {Topic-sensitive {PageRank}},
  year = {2002},
}

@inproceedings{gyongyi2004combating,
  author = {Zolt{\'a}n Gy{\"o}ngyi and Hector Garcia-Molina and Jan Pedersen},
  booktitle = {Very Large Data Bases (VLDB)},
  title = {Combating web spam with {TrustRank}},
  year = {2004},
}

@inproceedings{zhang2020pegasus,
  author = {Jingqing Zhang and Yao Zhao and Mohammad Saleh and Peter Liu},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {{PEGASUS}: Pre-training with Extracted Gap-sentences for Abstractive Summarization},
  year = {2020},
}

@article{flower1981cognitive,
  author = {Linda Flower and John R Hayes},
  journal = {College composition and communication},
  title = {A cognitive process theory of writing},
  volume = {32},
  year = {1981},
}

% The booktitle carries no leading "In": bibliography styles add that word themselves.
@inproceedings{glass1999challenges,
  author = {James Glass},
  booktitle = {Proceedings of the 1999 IEEE ASRU Workshop},
  title = {Challenges for spoken dialogue systems},
  year = {1999},
}

% "and others" is the BibTeX token for a truncated author list; the style renders "et al.".
@inproceedings{clark2019makes,
  author = {Leigh Clark and Nadia Pantidi and Orla Cooney and Philip Doyle and Diego Garaialde and Justin Edwards and Brendan Spillane and Emer Gilmartin and Christine Murad and Cosmin Munteanu and others},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {What makes a good conversation? challenges in designing truly conversational agents},
  year = {2019},
}

@inproceedings{clarksmith2021choose,
  author = {Elizabeth Clark and Noah A. Smith},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Choose Your Own Adventure: Paired Suggestions in Collaborative Writing for Evaluating Story Generation Models},
  year = {2021},
}

@inproceedings{lengevin2021heuristic,
  author = {Raina Langevin and Ross J Lordon and Thi Avrahami and Benjamin R Cowan and Tad Hirsch and Gary Hsieh},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Heuristic evaluation of conversational agents},
  year = {2021},
}

@inproceedings{bentley2018understanding,
  author = {Frank Bentley and Chris Luvogt and Max Silverman and Rushani Wirasinghe and Brooke White and Danielle Lottridge},
  booktitle = {Proceedings of the ACM on Interactive, Mobile, Wearable and Ubiquitous Technologies},
  title = {Understanding the Long-Term Use of Smart Speaker Assistants},
  year = {2018},
}

% The year follows the proceedings named in booktitle (MobileHCI '17); the key keeps its
% historical "2018" so existing citations still resolve.
% NOTE(review): confirm the publication year against the proceedings record.
@inproceedings{cowan2018help,
  author = {Benjamin R. Cowan and Nadia Pantidi and David Coyle and Kellie Morrissey and Peter Clarke and Sara Al-Shehri and David Earley and Natasha Bandeira},
  booktitle = {Proceedings of the 19th International Conference on Human-Computer Interaction with Mobile Devices and Services (MobileHCI '17)},
  title = {``What Can {I} Help You with?'': Infrequent Users' Experiences of Intelligent Personal Assistants},
  year = {2017},
}

@inproceedings{jain2018farmchat,
  author = {Mohit Jain and Pratyush Kumar and Ishita Bhansali and Q Vera Liao and Khai Truong and Shwetak Patel},
  booktitle = {ACM Conference on Interactive, Mobile, Wearable and Ubiquitous Technologies},
  title = {{FarmChat}: A Conversational Agent to Answer Farmer Queries},
  year = {2018},
}

@inproceedings{pillutla2021mauve,
  author = {Krishna Pillutla and Swabha Swayamdipta and Rowan Zellers and John Thickstun and Sean Welleck and Yejin Choi and Zaid Harchaoui},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{MAUVE}: Measuring the Gap Between Neural Text and Human Text using Divergence Frontiers},
  year = {2021},
}
% Layout: one field per line, fields in alphabetical order, trailing comma kept.
% Braces inside titles protect acronyms and proper nouns from style recasing.
% Non-ASCII characters are written as LaTeX escapes so classic BibTeX sorts them correctly.

@inproceedings{horvitz1999principles,
  author = {Eric Horvitz},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Principles of Mixed-Initiative User Interfaces},
  year = {1999},
}

@article{brynjolfsson2022turing,
  author = {Erik Brynjolfsson},
  journal = {Daedalus},
  title = {The {Turing} Trap: The Promise \& Peril of Human-Like Artificial Intelligence},
  volume = {151},
  year = {2022},
}

@article{janlert2017meaning,
  author = {Lars-Erik Janlert and Erik Stolterman},
  journal = {Human--Computer Interaction},
  title = {The Meaning of Interactivity---Some Proposals for Definitions and Measures},
  volume = {32},
  year = {2017},
}

@inproceedings{clark2018creative,
  author = {Elizabeth Clark and Anne Spencer Ross and Chenhao Tan and Yangfeng Ji and Noah A. Smith},
  booktitle = {23rd International Conference on Intelligent User Interfaces},
  title = {Creative writing with a machine in the loop: Case studies on slogans and stories},
  year = {2018},
}

@article{clark2019state,
  author = {Leigh Clark and Phillip Doyle and Diego Garaialde and Emer Gilmartin and Stephan Schl{\"o}gl and Jens Edlund and Matthew Aylett and Joao Cabral and Cosmin Munteanu and Benjamin Cowan},
  journal = {Interacting with Computers},
  title = {The State of Speech in {HCI}: Trends, Themes and Challenges},
  volume = {31},
  year = {2019},
}

@inproceedings{thomas2020expressions,
  author = {Paul Thomas and Daniel McDuff and Mary Czerwinski and Nick Craswell},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {Expressions of Style in Information Seeking Conversation with an Agent},
  year = {2020},
}

@article{deriu2021survey,
  author = {Jan Deriu and Alvaro Rodrigo and Arantxa Otegi and Guillermo Echegoyen and Sophie Rosset and Eneko Agirre and Mark Cieliebak},
  journal = {Artificial Intelligence Review},
  title = {Survey on evaluation methods for dialogue systems},
  volume = {54},
  year = {2021},
}

@article{huang2020challenges,
  author = {Minlie Huang and Xiaoyan Zhu and Jianfeng Gao},
  journal = {ACM Transactions on Information Systems (TOIS)},
  title = {Challenges in building intelligent open-domain dialog systems},
  volume = {38},
  year = {2020},
}

@inproceedings{roller2021recipes,
  author = {Stephen Roller and Emily Dinan and Naman Goyal and Da Ju and Mary Williamson and Yinhan Liu and Jing Xu and Myle Ott and Eric Michael Smith and Y-Lan Boureau and Jason Weston},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Recipes for Building an Open-Domain Chatbot},
  year = {2021},
}

% The arXiv identifier lives in eprint/archiveprefix: a journal field has no meaning on a
% conference paper and is ignored by the standard styles.
% NOTE(review): venue normalised to the EMNLP name used elsewhere in this file; confirm.
@inproceedings{deriu2020spot,
  archiveprefix = {arXiv},
  author = {Jan Deriu and Don Tuggener and Pius von D{\"a}niken and Jon Ander Campos and Alvaro Rodrigo and Thiziri Belkacem and Aitor Soroa and Eneko Agirre and Mark Cieliebak},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  eprint = {2010.02140},
  title = {Spot the bot: A robust and efficient framework for the evaluation of conversational dialogue systems},
  year = {2020},
}

@inproceedings{hu2021alexaprize,
  author = {Shui Hu and Yang Liu and Anna Gottardi and Behnam Hedayatnia and Anju Khatri and Anjali Chadha and Qinlang Chen and Pankaj Rajan and Ali Binici and Varun Somani and Yao Lu and Prerna Dwivedi and Lucy Hu and Hangjie Shi and Sattvik Sahai and Mihail Eric and Karthik Gopalakrishnan and Seokhwan Kim and Spandana Gella and Alexandros Papangelis and Patrick Lange and Di Jin and Nicole Chartier and Mahdi Namazifar and Aishwarya Padmakumar and Sarik Ghazarian and Shereen Oraby and Anjali Narayan-Chen and Yuheng Du and Lauren Stubell and Savanna Stiff and Kate Bland and Arindam Mandal and Reza Ghanadan and Dilek Hakkani-T{\"u}r},
  booktitle = {Alexa Prize SocialBot Grand Challenge 4 Proceedings},
  title = {Further advances in open domain dialog systems in the {Fourth Alexa Prize SocialBot Grand Challenge}},
  year = {2021},
}

@inproceedings{smith2022human,
  author = {Eric Smith and Orion Hsu and Rebecca Qian and Stephen Roller and Y-Lan Boureau and Jason Weston},
  booktitle = {Proceedings of the 4th Workshop on NLP for Conversational AI},
  title = {Human Evaluation of Conversations is an Open Problem: comparing the sensitivity of various methods for evaluating dialogue agents},
  year = {2022},
}

@article{konstan2004introduction,
  author = {Joseph A Konstan},
  journal = {ACM Transactions on Information Systems (TOIS)},
  title = {Introduction to recommender systems: Algorithms and evaluation},
  volume = {22},
  year = {2004},
}

@article{hancock2020communication,
  author = {Jeffrey T Hancock and Mor Naaman and Karen Levy},
  journal = {Journal of Computer-Mediated Communication},
  title = {{AI}-mediated communication: Definition, research agenda, and ethical considerations},
  year = {2020},
}

@article{goldberg1992using,
  author = {David Goldberg and David Nichols and Brian M Oki and Douglas Terry},
  journal = {Communications of the ACM},
  title = {Using collaborative filtering to weave an information tapestry},
  volume = {35},
  year = {1992},
}

@article{white2009exploratory,
  author = {Ryen W White and Resa A Roth},
  journal = {Synthesis lectures on information concepts, retrieval, and services},
  title = {Exploratory search: Beyond the query-response paradigm},
  volume = {1},
  year = {2009},
}

@article{kelly2009methods,
  author = {Diane Kelly},
  journal = {Foundations and Trends in Information Retrieval},
  title = {Methods for evaluating interactive information retrieval systems with users},
  volume = {3},
  year = {2009},
}

% NOTE(review): journal given as Science Robotics, to which volume 2 (2017) corresponds; confirm.
@article{mataric2017socially,
  author = {Maja J Mataric},
  journal = {Science Robotics},
  title = {Socially assistive robotics: Human augmentation versus automation},
  volume = {2},
  year = {2017},
}

@article{spink1997study,
  author = {Amanda Spink},
  journal = {Journal of the american society for information science},
  title = {Study of interactive feedback during mediated information retrieval},
  volume = {48},
  year = {1997},
}

@article{settles2012active,
  author = {Burr Settles},
  journal = {Synthesis lectures on artificial intelligence and machine learning},
  title = {Active learning},
  volume = {6},
  year = {2012},
}

@inproceedings{amershi2011effective,
  author = {Saleema Amershi and James Fogarty and Ashish Kapoor and Desney Tan},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Effective end-user interaction with machine learning},
  year = {2011},
}

@inproceedings{rashkin2019towards,
  author = {Hannah Rashkin and Eric Michael Smith and Margaret Li and Y-Lan Boureau},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Towards Empathetic Open-domain Conversation Models: a New Benchmark and Dataset},
  year = {2019},
}

@article{hassani2020artificial,
  author = {Hossein Hassani and Emmanuel Sirimal Silva and Stephane Unger and Maedeh TajMazinani and Stephen Mac Feely},
  journal = {{AI}},
  title = {Artificial intelligence ({AI}) or intelligence augmentation ({IA}): what is the future?},
  volume = {1},
  year = {2020},
}

% Report type and number are separate fields so the style can format them.
% NOTE(review): "SRI" expanded to Stanford Research Institute; confirm.
@techreport{engelbart1962augmenting,
  author = {Douglas C Engelbart},
  institution = {Stanford Research Institute},
  number = {AFOSR-3223},
  title = {Augmenting human intellect: A conceptual framework},
  type = {Summary Report},
  year = {1962},
}

@article{skagestad1993thinking,
  author = {Peter Skagestad},
  journal = {Journal of Social and Evolutionary Systems},
  title = {Thinking with machines: Intelligence augmentation, evolutionary epistemology, and semiotic},
  volume = {16},
  year = {1993},
}

@article{skagestad1996mind,
  author = {Peter Skagestad},
  journal = {Semiotica},
  title = {The mind's machines: The {Turing} machine, the {Memex}, and the personal computer},
  volume = {111},
  year = {1996},
}

@inproceedings{chen2019gmail,
  author = {Mia Xu Chen and Benjamin N Lee and Gagan Bansal and Yuan Cao and Shuyuan Zhang and Justin Lu and Jackie Tsay and Yinan Wang and Andrew M Dai and Zhifeng Chen and others},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  title = {Gmail smart compose: Real-time assisted writing},
  year = {2019},
}
% Layout: one field per line, fields in alphabetical order, trailing comma kept.
% Braces inside titles protect acronyms and proper nouns from style recasing.

@inproceedings{brown2016designing,
  author = {Deana Brown and Rebecca E. Grinter},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Designing for Transient Use: A Human-in-the-Loop Translation Platform for Refugees},
  year = {2016},
}

% Comma form keeps the surname "Di Fede" together; in First-Last form the capitalised
% particle would be read as a given name.
% NOTE(review): venue given as the Creativity and Cognition conference; confirm.
@inproceedings{fede2022ideamachine,
  author = {Di Fede, Giulia and Davide Rocchesso and Steven P. Dow and Salvatore Andolina},
  booktitle = {Conference on Creativity and Cognition (C\&C)},
  publisher = {ACM},
  title = {The Idea Machine: {LLM}-based Expansion, Rewriting, Combination, and Suggestion of Ideas},
  year = {2022},
}

@inproceedings{jakesch2019perception,
  author = {Maurice Jakesch and Megan French and Xiao Ma and Jeffrey T. Hancock and Mor Naaman},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {{AI}-Mediated Communication: How the Perception That Profile Text Was Written by {AI} Affects Trustworthiness},
  year = {2019},
}

@inproceedings{miller1968response,
  author = {Robert B Miller},
  booktitle = {Proceedings of the December 9--11, 1968, fall joint computer conference, part I},
  title = {Response time in man-computer conversational transactions},
  year = {1968},
}

@book{shneiderman2010designing,
  author = {Ben Shneiderman and Catherine Plaisant},
  publisher = {Pearson},
  title = {Designing the user interface: Strategies for effective human-computer interaction},
  year = {2010},
}

@book{nielsen1994usability,
  author = {Jakob Nielsen},
  publisher = {Morgan Kaufmann},
  title = {Usability engineering},
  year = {1994},
}

@inproceedings{card1991information,
  author = {Stuart K Card and George G Robertson and Jock D Mackinlay},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {The information visualizer, an information workspace},
  year = {1991},
}

@article{jakesch2022human,
  author = {Maurice Jakesch and Jeffrey Hancock and Mor Naaman},
  journal = {arXiv preprint arXiv:2206.07271},
  title = {Human Heuristics for {AI}-Generated Language Are Flawed},
  year = {2022},
}

@article{ethayarajh2022human,
  author = {Kawin Ethayarajh and Dan Jurafsky},
  journal = {arXiv preprint arXiv:2205.11930},
  title = {How Human is Human Evaluation? Improving the Gold Standard for {NLG} with Utility Theory},
  year = {2022},
}

@book{lakoff2009more,
  author = {George Lakoff and Mark Turner},
  publisher = {University of Chicago Press},
  title = {More than cool reason: A field guide to poetic metaphor},
  year = {2009},
}

@article{mio1997metaphor,
  author = {Jeffery Scott Mio},
  journal = {Metaphor and symbol},
  title = {Metaphor and politics},
  volume = {12},
  year = {1997},
}

% NOTE(review): journal given as Science Education, to which volume 96 (2012) corresponds; confirm.
@article{niebert2012understanding,
  author = {Kai Niebert and Sabine Marsch and David F Treagust},
  journal = {Science Education},
  title = {Understanding needs embodiment: A theory-guided reanalysis of the role of metaphors and analogies in understanding science},
  volume = {96},
  year = {2012},
}

@inproceedings{gero2019metaphoria,
  author = {Katy Ilonka Gero and Lydia B Chilton},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Metaphoria: An algorithmic companion for metaphor creation},
  year = {2019},
}

@inproceedings{gero2018challenges,
  author = {Katy Gero and Lydia Chilton},
  booktitle = {Proceedings of the Workshop on Figurative Language Processing},
  title = {Challenges in finding metaphorical connections},
  year = {2018},
}

@book{glucksberg2001understanding,
  author = {Sam Glucksberg and Matthew S McGlone},
  publisher = {Oxford University Press},
  title = {Understanding figurative language: From metaphor to idioms},
  year = {2001},
}

@inproceedings{maynez2020faithfulness,
  author = {Joshua Maynez and Shashi Narayan and Bernd Bohnet and Ryan McDonald},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {On Faithfulness and Factuality in Abstractive Summarization},
  year = {2020},
}

% Preprint cited in the same "arXiv preprint arXiv:<id>" form as the other arXiv entries.
% NOTE(review): confirm the arXiv identifier.
@article{sheng2021societal,
  author = {Emily Sheng and Kai{-}Wei Chang and Premkumar Natarajan and Nanyun Peng},
  journal = {arXiv preprint arXiv:2105.04054},
  title = {Societal Biases in Language Generation: Progress and Challenges},
  year = {2021},
}
% Entries gero2022design through rabinovich2017abstract, one field per line.
% NOTE(review): the file header marks this file as auto-generated; keep the
% upstream source in sync with any manual change made here.

@inproceedings{gero2022design,
  author = {Katy Gero and Alex Calderwood and Charlotte Li and Lydia Chilton},
  booktitle = {Proceedings of the First Workshop on Intelligent and Interactive Writing Assistants (In2Writing 2022)},
  title = {A Design Space for Writing Support Tools Using a Cognitive Process Model of Writing},
  year = {2022},
}

@inproceedings{buschbeck2020parallel,
  author = {Bianka Buschbeck and Miriam Exel},
  booktitle = {Proceedings of the 7th Workshop on Asian Translation},
  title = {A Parallel Evaluation Data Set of Software Documentation with Document Structure Annotation},
  year = {2020},
}

@inproceedings{zhou2021commonsense,
  author = {Pei Zhou and Karthik Gopalakrishnan and Behnam Hedayatnia and Seokhwan Kim and Jay Pujara and Xiang Ren and Yang Liu and Dilek Hakkani-Tur},
  booktitle = {Proceedings of the 22nd Annual Meeting of the Special Interest Group on Discourse and Dialogue},
  title = {Commonsense-Focused Dialogues for Response Generation: An Empirical Study},
  year = {2021},
}

@inproceedings{pagnoni2021understanding,
  author = {Artidoro Pagnoni and Vidhisha Balachandran and Yulia Tsvetkov},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Understanding Factuality in Abstractive Summarization with {FRANK}: A Benchmark for Factuality Metrics},
  year = {2021},
}

@inproceedings{narayan2018dont,
  author = {Shashi Narayan and Shay B. Cohen and Mirella Lapata},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Don{'}t Give Me the Details, Just the Summary! Topic-Aware Convolutional Neural Networks for Extreme Summarization},
  year = {2018},
}

@article{buschek2021nine,
  author = {Daniel Buschek and Lukas Mecke and Florian Lehmann and Hai Dang},
  journal = {arXiv preprint arXiv:2104.00358},
  title = {Nine Potential Pitfalls when Designing Human-{AI} Co-Creative Systems},
  year = {2021},
}

@inproceedings{akoury2020storium,
  author = {Nader Akoury and Shufan Wang and Josh Whiting and Stephen Hood and Nanyun Peng and Mohit Iyyer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{STORIUM}: A Dataset and Evaluation Platform for Machine-in-the-Loop Story Generation},
  year = {2020},
}

@article{liu2021pre,
  author = {Pengfei Liu and Weizhe Yuan and Jinlan Fu and Zhengbao Jiang and Hiroaki Hayashi and Graham Neubig},
  journal = {arXiv},
  title = {{Pre-train}, Prompt, and Predict: A Systematic Survey of Prompting Methods in Natural Language Processing},
  year = {2021},
}

@article{berthelot2021adamatch,
  author = {David Berthelot and Rebecca Roelofs and Kihyuk Sohn and Nicholas Carlini and Alex Kurakin},
  journal = {arXiv preprint arXiv:2106.04732},
  title = {{AdaMatch}: A Unified Approach to Semi-Supervised Learning and Domain Adaptation},
  year = {2021},
}

@inproceedings{cubuk2020randaugment,
  author = {Ekin D Cubuk and Barret Zoph and Jonathon Shlens and Quoc V Le},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {702--703},
  title = {Randaugment: Practical automated data augmentation with a reduced search space},
  year = {2020},
}

@article{zhang2021semi,
  author = {Yabin Zhang and Haojian Zhang and Bin Deng and Shuai Li and Kui Jia and Lei Zhang},
  journal = {arXiv preprint arXiv:2106.00417},
  title = {Semi-supervised Models are Strong Unsupervised Domain Adaptation Learners},
  year = {2021},
}

@misc{jiang2020tll,
  author = {Junguang Jiang and Baixu Chen and Bo Fu and Mingsheng Long},
  howpublished = {\url{https://github.com/thuml/Transfer-Learning-Library}},
  title = {Transfer Learning library},
  year = {2020},
}

@inproceedings{herzig2017multi,
  author = {Jonathan Herzig and Jonathan Berant},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Neural Semantic Parsing over Multiple Knowledge-bases},
  year = {2017},
}

@inproceedings{bao2016constraint,
  author = {Junwei Bao and Nan Duan and Zhao Yan and Ming Zhou and Tiejun Zhao},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  title = {Constraint-Based Question Answering with Knowledge Graph},
  year = {2016},
}

@inproceedings{onishi2016wdw,
  author = {Takeshi Onishi and Hai Wang and Mohit Bansal and Kevin Gimpel and David McAllester},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Who did what: A large-scale person-centered cloze dataset},
  year = {2016},
}

@article{kwok2001scaling,
  author = {Cody Kwok and Oren Etzioni and Daniel S. Weld},
  journal = {ACM Transactions on Information Systems (TOIS)},
  pages = {242--262},
  title = {Scaling question answering to the web},
  volume = {19},
  year = {2001},
}

@book{bird2009nltk,
  author = {Steven Bird and Edward Loper and Ewan Klein},
  publisher = {O'Reilly Media Inc.},
  title = {Natural Language Processing with Python},
  year = {2009},
}

@inproceedings{press2017language,
  author = {Ofir Press and Amir Bar and Ben Bogin and Jonathan Berant and Lior Wolf},
  booktitle = {First Workshop on Learning to Generate Natural Language@ICML},
  title = {Language Generation with Recurrent Generative Adversarial Networks without Pre-training},
  year = {2017},
}

@inproceedings{talmor2017evaluating,
  author = {Alon Talmor and Mor Geva and Jonathan Berant},
  booktitle = {*SEM},
  title = {Evaluating Semantic Parsing against a Simple Web-based Question Answering Model},
  year = {2017},
}

@inproceedings{xiong2017dynamic,
  author = {Caiming Xiong and Victor Zhong and Richard Socher},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Dynamic Coattention Networks For Question Answering},
  year = {2017},
}

@inproceedings{levy2017zero,
  author = {Omer Levy and Minjoon Seo and Eunsol Choi and Luke Zettlemoyer},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  title = {Zero-Shot Relation Extraction via Reading Comprehension},
  year = {2017},
}

@inproceedings{trischler2017newsqa,
  author = {Adam Trischler and Tong Wang and Xingdi Yuan and Justin Harris and Alessandro Sordoni and Philip Bachman and Kaheer Suleman},
  booktitle = {Workshop on Representation Learning for NLP},
  title = {{NewsQA}: A Machine Comprehension Dataset},
  year = {2017},
}

@inproceedings{nguyen2016ms,
  author = {Tri Nguyen and Mir Rosenberg and Xia Song and Jianfeng Gao and Saurabh Tiwary and Rangan Majumder and Li Deng},
  booktitle = {Workshop on Cognitive Computing at NIPS},
  title = {{MS MARCO}: A human generated machine reading comprehension dataset},
  year = {2016},
}

@article{dunn2017searchqa,
  author = {Matthew Dunn and Levent Sagun and Mike Higgins and Ugur Guney and Volkan Cirik and Kyunghyun Cho},
  journal = {arXiv},
  title = {{SearchQA}: A New {Q}\&{A} Dataset Augmented with Context from a Search Engine},
  year = {2017},
}

@inproceedings{joshi2017triviaqa,
  author = {Mandar Joshi and Eunsol Choi and Daniel Weld and Luke Zettlemoyer},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {{TriviaQA}: A Large Scale Distantly Supervised Challenge Dataset for Reading Comprehension},
  year = {2017},
}

@inproceedings{miller2016keyvalue,
  author = {Alexander Miller and Adam Fisch and Jesse Dodge and Amir Hossein Karimi and Antoine Bordes and Jason Weston},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Key-value memory networks for directly reading documents},
  year = {2016},
}

@inproceedings{rabinovich2017abstract,
  author = {Maxim Rabinovich and Mitchell Stern and Dan Klein},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Abstract Syntax Networks for Code Generation and Semantic Parsing},
  year = {2017},
}
% Entries das2017question through liu2019multi, one field per line.
% NOTE(review): the file header marks this file as auto-generated; keep the
% upstream source in sync with any manual change made here.

@inproceedings{das2017question,
  author = {Rajarshi Das and Manzil Zaheer and Siva Reddy and Andrew McCallum},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Question Answering on Knowledge Bases and Text using Universal Schema and Memory Networks},
  year = {2017},
}

@inproceedings{beltagy2014probabilistic,
  author = {Islam Beltagy and Katrin Erk and Raymond J. Mooney},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Probabilistic Soft Logic for Semantic Textual Similarity},
  year = {2014},
}

@article{lewis2013combining,
  author = {Mike Lewis and Mark Steedman},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Combining distributional and logical semantics},
  volume = {1},
  year = {2013},
}

@inproceedings{demeester2016lifted,
  author = {Thomas Demeester and Tim Rockt{\"{a}}schel and Sebastian Riedel},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Lifted Rule Injection for Relation Embeddings},
  year = {2016},
}

@article{santoro2017simple,
  author = {Adam Santoro and David Raposo and David GT Barrett and Mateusz Malinowski and Razvan Pascanu and Peter Battaglia and Timothy Lillicrap},
  journal = {arXiv},
  title = {A simple neural network module for relational reasoning},
  year = {2017},
}

@inproceedings{yih2016value,
  author = {Wen-tau Yih and Matthew Richardson and Chris Meek and Ming-Wei Chang and Jina Suh},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {The Value of Semantic Parse Labeling for Knowledge Base Question Answering},
  year = {2016},
}

@inproceedings{krishnamurthy2017neural,
  author = {Jayant Krishnamurthy and Pradeep Dasigi and Matt Gardner},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Neural Semantic Parsing with Type Constraints for Semi-Structured Tables},
  year = {2017},
}

@inproceedings{bahdanau2017actor,
  author = {Dzmitry Bahdanau and Philemon Brakel and Kelvin Xu and Anirudh Goyal and Ryan Lowe and Joelle Pineau and Aaron Courville and Yoshua Bengio},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {An actor-critic algorithm for sequence prediction},
  year = {2017},
}

@inproceedings{fang2017learning,
  author = {Meng Fang and Yuan Li and Trevor Cohn},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Learning how to Active Learn: A Deep Reinforcement Learning Approach},
  year = {2017},
}

@inproceedings{dai2015semi,
  author = {Andrew M. Dai and Quoc V. Le},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Semi-supervised sequence learning},
  year = {2015},
}

@inproceedings{dyer2016recurrent,
  author = {Chris Dyer and Adhiguna Kuncoro and Miguel Ballesteros and Noah A Smith},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Recurrent neural network grammars},
  year = {2016},
}

@inproceedings{lee2016global,
  author = {Kenton Lee and Mike Lewis and Luke Zettlemoyer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Global neural {CCG} parsing with optimality guarantees},
  year = {2016},
}

@inproceedings{devlin2016captioning,
  author = {Jacob Devlin and Hao Cheng and Hao Fang and Saurabh Gupta and Li Deng and Xiaodong He and Geoffrey Zweig and Margaret Mitchell},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Language Models for Image Captioning: The Quirks and What Works},
  year = {2016},
}

@inproceedings{rocktaschel2015injecting,
  author = {Tim Rockt{\"a}schel and Sameer Singh and Sebastian Riedel},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Injecting Logical Background Knowledge into Embeddings for Relation Extraction},
  year = {2015},
}

@article{hu2016harnessing,
  author = {Zhiting Hu and Xuezhe Ma and Zhengzhong Liu and Eduard Hovy and Eric Xing},
  journal = {arXiv preprint arXiv:1603.06318},
  title = {Harnessing deep neural networks with logic rules},
  year = {2016},
}

@inproceedings{lai2017race,
  author = {Guokun Lai and Qizhe Xie and Hanxiao Liu and Yiming Yang and Eduard Hovy},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{RACE}: Large-scale {ReAding} Comprehension Dataset From Examinations},
  year = {2017},
}

@inproceedings{cheng2017learning,
  author = {Jianpeng Cheng and Siva Reddy and Vijay Saraswat and Mirella Lapata},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Learning Structured Natural Language Representations for Semantic Parsing},
  year = {2017},
}

@inproceedings{johnson2017inferring,
  author = {Justin Johnson and Bharath Hariharan and Laurens van der Maaten and Judy Hoffman and Li Fei-Fei and C Lawrence Zitnick and Ross Girshick},
  booktitle = {International Conference on Computer Vision (ICCV)},
  title = {Inferring and Executing Programs for Visual Reasoning},
  year = {2017},
}

@inproceedings{suhr2017nlvr,
  author = {Alane Suhr and Mike Lewis and James Yeh and Yoav Artzi},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {A Corpus of Natural Language for Visual Reasoning},
  year = {2017},
}

@article{andrychowicz2017hindsight,
  author = {Marcin Andrychowicz and Filip Wolski and Alex Ray and Jonas Schneider and Rachel Fong and Peter Welinder and Bob McGrew and Josh Tobin and Pieter Abbeel and Wojciech Zaremba},
  journal = {arXiv preprint arXiv:1707.01495},
  title = {Hindsight Experience Replay},
  year = {2017},
}

@article{kazemi2017show,
  author = {Vahid Kazemi and Ali Elqursh},
  journal = {arXiv preprint arXiv:1704.03162},
  title = {Show, Ask, Attend, and Answer: A Strong Baseline For Visual Question Answering},
  year = {2017},
}

@article{noh2016training,
  author = {Hyeonwoo Noh and Bohyung Han},
  journal = {arXiv preprint arXiv:1606.03647},
  title = {Training recurrent answering units with joint loss minimization for vqa},
  year = {2016},
}

@article{wu2017visual,
  author = {Qi Wu and Damien Teney and Peng Wang and Chunhua Shen and Anthony Dick and Anton van den Hengel},
  journal = {Computer Vision and Image Understanding},
  title = {Visual question answering: A survey of methods and datasets},
  year = {2017},
}

@inproceedings{pasunuru2017reinforced,
  author = {Ramakanth Pasunuru and Mohit Bansal},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Reinforced Video Captioning with Entailment Rewards},
  year = {2017},
}

@inproceedings{xu2016question,
  author = {Kun Xu and Siva Reddy and Yansong Feng and Songfang Huang and Dongyan Zhao},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Question answering on freebase via relation extraction and textual evidence},
  year = {2016},
}

@inproceedings{gardner2017open,
  author = {Matt Gardner and Jayant Krishnamurthy},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Open-Vocabulary Semantic Parsing with both Distributional Statistics and Formal Knowledge},
  year = {2017},
}

@inproceedings{fan2017transfer,
  author = {Xing Fan and Emilio Monti and Lambert Mathias and Markus Dreyer},
  booktitle = {Workshop on Representation Learning for NLP},
  title = {Transfer Learning for Neural Semantic Parsing},
  year = {2017},
}

@inproceedings{su2017cross,
  author = {Yu Su and Xifeng Yan},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Cross-domain Semantic Parsing via Paraphrasing},
  year = {2017},
}

@inproceedings{hashimoto2017joint,
  author = {Kazuma Hashimoto and Caiming Xiong and Yoshimasa Tsuruoka and Richard Socher},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {A joint many-task model: Growing a neural network for multiple {NLP} tasks},
  year = {2017},
}

@article{ruder2017overview,
  author = {Sebastian Ruder},
  journal = {arXiv preprint arXiv:1706.05098},
  title = {An overview of multi-task learning in deep neural networks},
  year = {2017},
}

@article{buck2017ask,
  author = {Christian Buck and Jannis Bulian and Massimiliano Ciaramita and Andrea Gesmundo and Neil Houlsby and Wojciech Gajewski and Wei Wang},
  journal = {arXiv preprint arXiv:1705.07830},
  title = {Ask the Right Questions: Active Question Reformulation with Reinforcement Learning},
  year = {2017},
}

@inproceedings{nogueira2017task,
  author = {Rodrigo Nogueira and Kyunghyun Cho},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Task-oriented query reformulation with reinforcement learning},
  year = {2017},
}

@inproceedings{choe2016parsing,
  author = {Do Kook Choe and Eugene Charniak},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Parsing as Language Modeling},
  year = {2016},
}

@article{linzen2016assessing,
  author = {Tal Linzen and Emmanuel Dupoux and Yoav Goldberg},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Assessing the ability of {LSTMs} to learn syntax-sensitive dependencies},
  volume = {4},
  year = {2016},
}

@inproceedings{lewis1994sequential,
  author = {David D Lewis and William A Gale},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {A sequential algorithm for training text classifiers},
  year = {1994},
}

@inproceedings{west2014knowledge,
  author = {Robert West and Evgeniy Gabrilovich and Kevin Murphy and Shaohua Sun and Rahul Gupta and Dekang Lin},
  booktitle = {Proceedings of the 23rd international conference on World wide web},
  title = {Knowledge base completion via search-based question answering},
  year = {2014},
}

@article{vieira2017learning,
  author = {Tim Vieira and Jason Eisner},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  pages = {263--278},
  title = {Learning to Prune: Exploring the Frontier of Fast and Accurate Parsing},
  volume = {5},
  year = {2017},
}

@misc{squad2016url,
  author = {Pranav Rajpurkar},
  howpublished = {\url{https://rajpurkar.github.io/SQuAD-explorer/}},
  title = {{SQuAD}},
  year = {2016},
}

@article{baltruvsaitis2017multimodal,
  author = {Tadas Baltru{\v{s}}aitis and Chaitanya Ahuja and Louis-Philippe Morency},
  journal = {arXiv preprint arXiv:1705.09406},
  title = {Multimodal Machine Learning: A Survey and Taxonomy},
  year = {2017},
}

% NOTE(review): volume 2167 with journal "Machine Learning" looks inconsistent
% (possibly a proceedings-series volume number) -- TODO confirm the venue upstream.
@article{turney2001mining,
  author = {Peter Turney},
  journal = {Machine Learning},
  pages = {491--502},
  title = {Mining the web for synonyms: {PMI}-{IR} versus {LSA} on {TOEFL}},
  volume = {2167},
  year = {2001},
}

@article{littlestone1994weighted,
  author = {Nick Littlestone and Manfred K Warmuth},
  journal = {Information and computation},
  number = {2},
  pages = {212--261},
  title = {The weighted majority algorithm},
  volume = {108},
  year = {1994},
}

@article{beltagy2017representing,
  author = {Islam Beltagy and Stephen Roller and Pengxiang Cheng and Katrin Erk and Raymond J Mooney},
  journal = {Computational Linguistics},
  title = {Representing meaning with a combination of logical and distributional models},
  volume = {42},
  year = {2017},
}

@inproceedings{hu2017learning,
  author = {Ronghang Hu and Jacob Andreas and Marcus Rohrbach and Trevor Darrell and Kate Saenko},
  booktitle = {International Conference on Computer Vision (ICCV)},
  title = {Learning to reason: End-to-end module networks for visual question answering},
  year = {2017},
}

@inproceedings{johnson2017clevr,
  author = {Justin Johnson and Bharath Hariharan and Laurens van der Maaten and Li Fei-Fei and C Lawrence Zitnick and Ross Girshick},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {{CLEVR}: A diagnostic dataset for compositional language and elementary visual reasoning},
  year = {2017},
}

@inproceedings{wang2017gated,
  author = {Wenhui Wang and Nan Yang and Furu Wei and Baobao Chang and Ming Zhou},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Gated self-matching networks for reading comprehension and question answering},
  year = {2017},
}

@article{zhong2017seq2sql,
  author = {Victor Zhong and Caiming Xiong and Richard Socher},
  journal = {arXiv preprint arXiv:1709.00103},
  title = {Seq2{SQL}: Generating Structured Queries from Natural Language using Reinforcement Learning},
  year = {2017},
}

@article{welbl2017constructing,
  author = {Johannes Welbl and Pontus Stenetorp and Sebastian Riedel},
  journal = {arXiv preprint arXiv:1710.06481},
  title = {Constructing Datasets for Multi-hop Reading Comprehension Across Documents},
  year = {2017},
}

@inproceedings{clark2018simple,
  author = {Christopher Clark and Matt Gardner},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Simple and effective multi-paragraph reading comprehension},
  year = {2018},
}

@article{andor2016globally,
  author = {Daniel Andor and Chris Alberti and David Weiss and Aliaksei Severyn and Alessandro Presta and Kuzman Ganchev and Slav Petrov and Michael Collins},
  journal = {arXiv preprint arXiv:1603.06042},
  title = {Globally normalized transition-based neural networks},
  year = {2016},
}

@inproceedings{chen2017reading,
  author = {Danqi Chen and Adam Fisch and Jason Weston and Antoine Bordes},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Reading {W}ikipedia to Answer Open-Domain Questions},
  year = {2017},
}

@article{watanabe2017question,
  author = {Yusuke Watanabe and Bhuwan Dhingra and Ruslan Salakhutdinov},
  journal = {arXiv preprint arXiv:1703.08885},
  title = {Question Answering from Unstructured Text by Retrieval and Comprehension},
  year = {2017},
}

@inproceedings{xiao2016sequence,
  author = {Chunyang Xiao and Marc Dymetman and Claire Gardent},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Sequence-based Structured Prediction for Semantic Parsing},
  year = {2016},
}

@inproceedings{cohen2017inducing,
  author = {Mor Cohen and Avi Calciularu and Idan Rejwan and Jonathan Berant},
  booktitle = {Workshop on Learning and Reasoning: Principles \& Applications to Everyday Spatial and Temporal Knowledge},
  title = {Inducing Regular Grammars Using Recurrent Neural Networks},
  year = {2017},
}

@inproceedings{goldman2018weakly,
  author = {Omer Goldman and Veronika Latcinnik and Udi Naveh and Amir Globerson and Jonathan Berant},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Weakly-supervised Semantic Parsing with Abstract Examples},
  year = {2018},
}

@article{kovcisky2017narrativeqa,
  author = {Tom{\'a}{\v{s}} Ko{\v{c}}isk{\'y} and Jonathan Schwarz and Phil Blunsom and Chris Dyer and Karl Moritz Hermann and Gabor Melis and Edward Grefenstette},
  journal = {arXiv preprint arXiv:1712.07040},
  title = {The {NarrativeQA} Reading Comprehension Challenge},
  year = {2017},
}

@inproceedings{hewlett2017accurate,
  author = {Daniel Hewlett and Llion Jones and Alexandre Lacoste and others},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {2011--2020},
  title = {Accurate Supervised and Semi-Supervised Machine Reading for Long Documents},
  year = {2017},
}

@article{hessel2017rainbow,
  author = {Matteo Hessel and Joseph Modayil and Hado Van Hasselt and Tom Schaul and Georg Ostrovski and Will Dabney and Dan Horgan and Bilal Piot and Mohammad Azar and David Silver},
  journal = {arXiv preprint arXiv:1710.02298},
  title = {Rainbow: Combining Improvements in Deep Reinforcement Learning},
  year = {2017},
}

@inproceedings{van2016deep,
  author = {Hado van Hasselt and Arthur Guez and David Silver},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {2094--2100},
  title = {Deep Reinforcement Learning with Double {Q}-Learning},
  volume = {16},
  year = {2016},
}

@inproceedings{wang2016dueling,
  author = {Ziyu Wang and Tom Schaul and Matteo Hessel and Hado Van Hasselt and Marc Lanctot and Nando De Freitas},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Dueling network architectures for deep reinforcement learning},
  year = {2016},
}

@inproceedings{lao2015learning,
  author = {Ni Lao and Einat Minkov and William Cohen},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Learning relational features with backward random walks},
  year = {2015},
}

@inproceedings{cheng2016long,
  author = {Jianpeng Cheng and Li Dong and Mirella Lapata},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Long short-term memory-networks for machine reading},
  year = {2016},
}

@inproceedings{salant2018contextualized,
  author = {Shimi Salant and Jonathan Berant},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Contextualized Word Representations for Reading Comprehension},
  year = {2018},
}

@inproceedings{wang2018r3,
  author = {Shuohang Wang and Mo Yu and Xiaoxiao Guo and Zhiguo Wang and Tim Klinger and Wei Zhang and Shiyu Chang and Gerald Tesauro and Bowen Zhou and Jing Jiang},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {{R3}: Reinforced Ranker-Reader for Open-Domain Question Answering},
  year = {2018},
}

@inproceedings{ba2015multiple,
  author = {Jimmy Ba and Volodymyr Mnih and Koray Kavukcuoglu},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Multiple object recognition with visual attention},
  year = {2015},
}

@inproceedings{swayamdipta2018multi,
  author = {Swabha Swayamdipta and Ankur P Parikh and Tom Kwiatkowski},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Multi-Mention Learning for Reading Comprehension with Neural Cascades},
  year = {2018},
}

@inproceedings{das2018go,
  author = {Rajarshi Das and Shehzaad Dhuliawala and Manzil Zaheer and Luke Vilnis and Ishan Durugkar and Akshay Krishnamurthy and Alex Smola and Andrew McCallum},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Go for a Walk and Arrive at the Answer: Reasoning Over Paths in Knowledge Bases using Reinforcement Learning},
  year = {2018},
}

@inproceedings{yu2017skim,
  author = {Adams Wei Yu and Hongrae Lee and Quoc V. Le},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Learning to Skim Text},
  year = {2017},
}

@inproceedings{seo2018neural,
  author = {Minjoon Seo and Sewon Min and Ali Farhadi and Hannaneh Hajishirzi},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Neural Speed Reading via Skim-{RNN}},
  year = {2018},
}

@inproceedings{campos2018skip,
  author = {Victor Campos and Brendan Jou and Xavier Giro-i-Nieto and Jordi Torres and Shih-Fu Chang},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Skip {RNN}: Learning to Skip State Updates in Recurrent Neural Networks},
  year = {2018},
}

@inproceedings{bradbury2017quasi,
  author = {James Bradbury and Stephen Merity and Caiming Xiong and Richard Socher},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Quasi-recurrent neural networks},
  year = {2017},
}

@inproceedings{richardson2018polyglot,
  author = {Kyle Richardson and Jonathan Berant and Jonas Kuhn},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Polyglot Semantic Parsing in {API}s},
  year = {2018},
}

@inproceedings{koshorek2018segmentation,
  author = {Omri Koshorek and Noam Mor and Adir Cohen and Michael Rotman and Jonathan Berant},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Text Segmentation as a Supervised Learning Task},
  year = {2018},
}

@inproceedings{talmor2018web,
  author = {Alon Talmor and Jonathan Berant},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {The Web as Knowledge-base for Answering Complex Questions},
  year = {2018},
}

@inproceedings{herzig2018mapping,
  author = {Roei Herzig and Moshiko Raboh and Gal Chechik and Jonathan Berant and Amir Globerson},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Mapping Images to Scene Graphs with Permutation-Invariant Structured Prediction},
  year = {2018},
}

@inproceedings{herzig2018zeroshot,
  author = {Jonathan Herzig and Jonathan Berant},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Decoupling Structure and Lexicon for Zero-Shot Semantic Parsing},
  year = {2018},
}

@inproceedings{geva2018long,
  author = {Mor Geva and Jonathan Berant},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  title = {Learning to Search in Long Documents using Document Structure},
  year = {2018},
}

@inproceedings{liang2018mapo,
  author = {Chen Liang and Mohammad Norouzi and Jonathan Berant and Quoc Le and Ni Lao},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Memory Augmented Policy Optimization for Program Synthesis with Generalization},
  year = {2018},
}

@inproceedings{berant2019explaining,
  author = {Jonathan Berant and Daniel Deutch and Amir Globerson and Tova Milo and Tomer Wolfson},
  booktitle = {International Conference on Data Engineering (ICDE)},
  title = {Explaining Queries over Web Tables to Non-Experts},
  year = {2019},
}

@inproceedings{bisk2016natural,
  author = {Yonatan Bisk and Deniz Yuret and Daniel Marcu},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Natural language communication with robots},
  year = {2016},
}

@inproceedings{suhr2018situated,
  author = {Alane Suhr and Yoav Artzi},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Situated Mapping of Sequential Instructions to Actions with Single-step Reward Observation},
  year = {2018},
}

@inproceedings{misra2018mapping,
  author = {Dipendra Misra and Andrew Bennett and Valts Blukis and Eyvind Niklasson and Max Shatkhin and Yoav Artzi},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Mapping Instructions to Actions in {3D} Environments with Visual Goal Prediction},
  year = {2018},
}

@inproceedings{anderson2018vision,
  author = {Peter Anderson and Qi Wu and Damien Teney and Jake Bruce and Mark Johnson and Niko S{\"u}nderhauf and Ian Reid and Stephen Gould and Anton van den Hengel},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Vision-and-language navigation: Interpreting visually-grounded navigation instructions in real environments},
  year = {2018},
}

@inproceedings{tan2018source,
  author = {Hao Tan and Mohit Bansal},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Source-target inference models for spatial instruction understanding},
  year = {2018},
}

@inproceedings{wiseman2016beam,
  author = {Sam Wiseman and Alexander M. Rush},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Sequence-to-Sequence Learning as Beam-Search Optimization},
  year = {2016},
}

@inproceedings{goyal2018continuous,
  author = {Kartik Goyal and Graham Neubig and Chris Dyer and Taylor Berg-Kirkpatrick},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {A continuous relaxation of beam search for end-to-end training of neural sequence models},
  year = {2018},
}

@inproceedings{yang2018breaking,
  author = {Yilin Yang and Liang Huang and Mingbo Ma},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Breaking the beam search curse: A study of (re-) scoring methods and stopping criteria for neural machine translation},
  year = {2018},
}

@article{devries2018talk,
  author = {Harm de Vries and Kurt Shuster and Dhruv Batra and Devi Parikh and Jason Weston and Douwe Kiela},
  journal = {arXiv preprint arXiv:1807.03367},
  title = {Talk the Walk: Navigating {New York City} through Grounded Dialogue},
  year = {2018},
}

@inproceedings{bogin2018emergence,
  author = {Ben Bogin and Mor Geva and Jonathan Berant},
  booktitle = {Emergent Communication Workshop@NIPS},
  title = {Emergence of Communication in an Interactive World with Consistent Speakers},
  year = {2018},
}

@inproceedings{muhlgay2019value,
  author = {Dor Muhlgay and Jonathan Herzig and Jonathan Berant},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Value-based Search in Execution Space for Mapping Instructions to Programs},
  year = {2019},
}

@inproceedings{talmor2019commonsenseqa,
  author = {Alon Talmor and Jonathan Herzig and Nicholas Lourie and Jonathan Berant},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {{CommonsenseQA}: A Question Answering Challenge Targeting Commonsense Knowledge},
  year = {2019},
}

@inproceedings{tevet2019evaluating,
  author = {Guy Tevet and Gavriel Habib and Vered Shwartz and Jonathan Berant},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Evaluating Text {GAN}s as Language Models},
  year = {2019},
}

@inproceedings{jacovi2019blackbox,
  author = {Alon Jacovi and Guy Hadash and Einat Kermany and Boaz Carmeli and Ofer Lavi and George Kour and Jonathan Berant},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Neural network gradient-based learning of black-box function interfaces},
  year = {2019},
}

@article{abujabal2018comqa,
  author = {Abdalghani Abujabal and Rishiraj Saha Roy and Mohamed Yahya and Gerhard Weikum},
  journal = {arXiv preprint arXiv:1809.09528},
  title = {{ComQA}: A Community-sourced Dataset for Complex Factoid Question Answering with Paraphrase Clusters},
  year = {2018},
}

@article{gardner2018allennlp,
  author = {Matt Gardner and Joel Grus and Mark Neumann and Oyvind Tafjord and Pradeep Dasigi and Nelson Liu and Matthew Peters and Michael Schmitz and Luke Zettlemoyer},
  journal = {arXiv preprint arXiv:1803.07640},
  title = {{AllenNLP}: A deep semantic natural language processing platform},
  year = {2018},
}

@inproceedings{geva2019discofuse,
  author = {Mor Geva and Eric Malmi and Idan Szpektor and Jonathan Berant},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Disco{F}use: A Large-Scale Dataset for Discourse-based Sentence Fusion},
  year = {2019},
}

@inproceedings{gorodissky2019white,
  author = {Or Gorodissky and Yotam Gil and Yoav Chai and Jonathan Berant},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {White-to-Black: Efficient Distillation of Black-Box Adversarial Attacks},
  year = {2019},
}

@article{fruchterman1991graph,
  author = {Thomas MJ Fruchterman and Edward M Reingold},
  journal = {Software: Practice and experience},
  number = {11},
  pages = {1129--1164},
  title = {Graph drawing by force-directed placement},
  volume = {21},
  year = {1991},
}

@inproceedings{finegan2018improving,
  author = {Catherine Finegan-Dollak and Jonathan K Kummerfeld and Li Zhang and Karthik Ramanathan and Sesh Sadasivam and Rui Zhang and Dragomir Radev},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Improving text-to-sql evaluation methodology},
  year = {2018},
}

@inproceedings{li2016gated,
  author = {Yujia Li and Daniel Tarlow and Marc Brockschmidt and Richard Zemel},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Gated graph sequence neural networks},
  year = {2016},
}

@article{decao2018question,
  author = {Nicola De Cao and Wilker Aziz and Ivan Titov},
  journal = {arXiv preprint arXiv:1808.09920},
  title = {Question answering by reasoning across documents with graph convolutional networks},
  year = {2018},
}

@article{yogatama2019learning,
  author = {Dani Yogatama and Cyprien de Masson d'Autume and Jerome Connor and Tomas Kocisky and Mike Chrzanowski and Lingpeng Kong and Angeliki Lazaridou and Wang Ling and Lei Yu and Chris Dyer and others},
  journal = {arXiv preprint arXiv:1901.11373},
  title = {Learning and Evaluating General Linguistic Intelligence},
  year = {2019},
}

@article{liu2019multi,
  author = {Xiaodong Liu and Pengcheng He and Weizhu Chen and Jianfeng Gao},
  journal = {arXiv preprint arXiv:1901.11504},
  title = {Multi-Task Deep Neural Networks for Natural Language Understanding},
  year = {2019},
}
@article{pan2019improving,
  author = {Xiaoman Pan and Kai Sun and Dian Yu and Heng Ji and Dong Yu},
  journal = {arXiv preprint arXiv:1902.00993},
  title = {Improving Question Answering with External Knowledge},
  year = {2019},
}

@article{reddy2018coqa,
  author = {Siva Reddy and Danqi Chen and Christopher D Manning},
  journal = {arXiv preprint arXiv:1808.07042},
  title = {{CoQA}: A conversational question answering challenge},
  year = {2018},
}

% The system name is braced so its capitalization survives sentence-casing styles.
@article{xu2017sqlnet,
  author = {Xiaojun Xu and Chang Liu and Dawn Song},
  journal = {arXiv preprint arXiv:1711.04436},
  title = {{SQLNet}: Generating structured queries from natural language without reinforcement learning},
  year = {2017},
}

@inproceedings{sorokin2018modeling,
  author = {Daniil Sorokin and Iryna Gurevych},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  title = {Modeling semantics with gated graph neural networks for knowledge base question answering},
  year = {2018},
}

@inproceedings{latentgraph2020raboh,
  author = {Moshiko Raboh and Roei Herzig and Gal Chechik and Jonathan Berant and Amir Globerson},
  booktitle = {Winter Conference on Applications of Computer Vision (WACV)},
  title = {Differentiable Scene Graphs},
  year = {2020},
}

@inproceedings{chung2018supervised,
  author = {Yu-An Chung and Hung-Yi Lee and James Glass},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Supervised and unsupervised transfer learning for question answering},
  year = {2018},
}

@article{sun2018improving,
  author = {Kai Sun and Dian Yu and Dong Yu and Claire Cardie},
  journal = {arXiv preprint arXiv:1810.13441},
  title = {Improving Machine Reading Comprehension with General Reading Strategies},
  year = {2018},
}

@article{chronopoulou2019transfer,
  author = {Alexandra Chronopoulou and Christos Baziotis and Alexandros Potamianos},
  journal = {arXiv preprint arXiv:1902.10547},
  title = {An Embarrassingly Simple Approach for Transfer Learning from Pretrained Language Models},
  year =
{2019}, }

@article{phang2018sentence,
  author = {Jason Phang and Thibault Fevry and Samuel R Bowman},
  journal = {arXiv preprint arXiv:1811.01088},
  title = {Sentence encoders on stilts: Supplementary training on intermediate labeled-data tasks},
  year = {2018},
}

@inproceedings{howard2018universal,
  author = {Jeremy Howard and Sebastian Ruder},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Universal language model fine-tuning for text classification},
  year = {2018},
}

@inproceedings{lin2018denoising,
  author = {Yankai Lin and Haozhe Ji and Zhiyuan Liu and Maosong Sun},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {1736--1745},
  title = {Denoising distantly supervised open-domain question answering},
  volume = {1},
  year = {2018},
}

@inproceedings{das2019multi,
  author = {Rajarshi Das and Shehzaad Dhuliawala and Manzil Zaheer and Andrew McCallum},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Multi-step Retriever-Reader Interaction for Scalable Open-domain Question Answering},
  year = {2019},
}

@article{talmor2018repartitioning,
  author = {Alon Talmor and Jonathan Berant},
  journal = {arXiv preprint arXiv:1807.09623},
  title = {Repartitioning of the {ComplexWebQuestions} Dataset},
  year = {2018},
}

@inproceedings{bogin2019representing,
  author = {Ben Bogin and Matt Gardner and Jonathan Berant},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Representing Schema Structure with Graph Neural Networks for Text-to-{SQL} Parsing},
  year = {2019},
}

@inproceedings{talmor2019generalization,
  author = {Alon Talmor and Jonathan Berant},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Multi{QA}: An Empirical Investigation of Generalization and Transfer in Reading Comprehension},
  year = {2019},
}

@article{lin2019grammar,
  author = {Kevin Lin and Ben Bogin and Mark Neumann and Jonathan Berant and Matt Gardner},
  journal = {arXiv preprint arXiv:1905.13326},
  title
= {Grammar-based Neural Text-to-{SQL} Generation}, year = {2019}, }

@inproceedings{bogin2019global,
  author = {Ben Bogin and Matt Gardner and Jonathan Berant},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Global Reasoning over Database Structures for Text-to-{SQL} Parsing},
  year = {2019},
}

@inproceedings{geva2019annotator,
  author = {Mor Geva and Yoav Goldberg and Jonathan Berant},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Are We Modeling the Task or the Annotator? An Investigation of Annotator Bias in Natural Language Understanding Datasets},
  year = {2019},
}

@inproceedings{herzig2019detect,
  author = {Jonathan Herzig and Jonathan Berant},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Don't paraphrase, detect! Rapid and Effective Data Collection for Semantic Parsing},
  year = {2019},
}

@inproceedings{koshorek2019active,
  author = {Omri Koshorek and Gabriel Stanovsky and Yichu Zhou and Vivek Srikumar and Jonathan Berant},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  title = {On the Limits of Learning to Actively Learn Semantic Representations},
  year = {2019},
}

@article{garder2019qaforamt,
  author = {Matt Gardner and Jonathan Berant and Hannaneh Hajishirzi and Alon Talmor and Sewon Min},
  journal = {arXiv preprint arXiv:1909.11291},
  title = {Question Answering is a Format; When is it Useful?},
  year = {2019},
}

% TACL's 2020 issue is volume 8; the mixed-case name is braced so that
% sentence-casing styles leave it intact.
@article{talmor2020olmpics,
  author = {Alon Talmor and Yanai Elazar and Yoav Goldberg and Jonathan Berant},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {{oLMpics} -- On what Language Model Pre-training Captures},
  volume = {8},
  year = {2020},
}

@article{wolfson2020break,
  author = {Tomer Wolfson and Mor Geva and Ankit Gupta and Matt Gardner and Yoav Goldberg and Daniel Deutch and Jonathan Berant},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Break It
Down: A Question Understanding Benchmark}, volume = {8}, year = {2020}, }

@article{gardner2020contrast,
  author = {Matt Gardner and Yoav Artzi and Victoria Basmova and Jonathan Berant and Ben Bogin and Sihao Chen and Pradeep Dasigi and Dheeru Dua and Yanai Elazar and Ananth Gottumukkala and Nitish Gupta and Hanna Hajishirzi and Gabriel Ilharco and Daniel Khashabi and Kevin Lin and Jiangming Liu and Nelson F. Liu and Phoebe Mulcaire and Qiang Ning and Sameer Singh and Noah A. Smith and Sanjay Subramanian and Reut Tsarfaty and Eric Wallace and Ally Zhang and Ben Zhou},
  journal = {arXiv preprint arXiv:2004.02709},
  title = {Evaluating {NLP} Models via Contrast Sets},
  year = {2020},
}

@article{tevet2020diversity,
  author = {Guy Tevet and Jonathan Berant},
  journal = {arXiv preprint arXiv:2004.02990},
  title = {Evaluating the Evaluation of Diversity in Natural Language Generation},
  year = {2020},
}

@inproceedings{geva2020injecting,
  author = {Mor Geva and Ankit Gupta and Jonathan Berant},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Injecting Numerical Reasoning Skills into Language Models},
  year = {2020},
}

@article{latcinnik2020explaining,
  author = {Veronica Latcinnik and Jonathan Berant},
  journal = {arXiv preprint arXiv:2004.05569},
  title = {Explaining Question Answering Models through Text Generation},
  year = {2020},
}

@inproceedings{subramanian2020interpretability,
  author = {Sanjay Subramanian and Ben Bogin and Nitish Gupta and Tomer Wolfson and Sameer Singh and Jonathan Berant and Matt Gardner},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Achieving Interpretability in Compositional Neural Networks},
  year = {2020},
}

@article{segal2020multispan,
  author = {Elad Segal and Avia Efrat and Mor Shoham and Amir Globerson and Jonathan Berant},
  journal = {arXiv preprint arXiv:1909.13375},
  title = {A Simple and Effective Model for Answering Multi-span Questions},
  year = {2020},
}

@article{gupta2020gmat,
  author = {Ankit Gupta
and Jonathan Berant}, journal = {arXiv preprint arXiv:2006.03274}, title = {{GMAT}: Global Memory Augmentation for Transformers}, year = {2020}, }

% Author spelling matches the "Oyvind Tafjord" used elsewhere in this file.
@article{talmor2020teaching,
  author = {Alon Talmor and Oyvind Tafjord and Peter Clark and Yoav Goldberg and Jonathan Berant},
  journal = {arXiv preprint arXiv:2006.06609},
  title = {Teaching Pre-Trained Models to Systematically Reason Over Implicit Knowledge},
  year = {2020},
}

@article{bogin2020latent,
  author = {Ben Bogin and Sanjay Subramanian and Matt Gardner and Jonathan Berant},
  journal = {arXiv preprint arXiv:2007.00266},
  title = {Latent Compositional Representations Improve Systematic Generalization in Grounded Question Answering},
  year = {2020},
}

% Venue is given in natural word order rather than the inverted export form.
@inproceedings{papernot2016limitations,
  author = {Nicolas Papernot and Patrick McDaniel and Somesh Jha and Matt Fredrikson and Z Berkay Celik and Ananthram Swami},
  booktitle = {IEEE European Symposium on Security and Privacy (EuroS\&P)},
  pages = {372--387},
  title = {The limitations of deep learning in adversarial settings},
  year = {2016},
}

@article{tramer2017ensemble,
  author = {Florian Tram{\`e}r and Alexey Kurakin and Nicolas Papernot and Dan Boneh and Patrick McDaniel},
  journal = {arXiv preprint arXiv:1705.07204},
  title = {Ensemble Adversarial Training: Attacks and Defenses},
  year = {2017},
}

@article{nayebi2017biologically,
  author = {Aran Nayebi and Surya Ganguli},
  journal = {arXiv preprint arXiv:1703.09202},
  title = {Biologically inspired protection of deep networks from adversarial attacks},
  year = {2017},
}

% The quoted paper title uses TeX opening and closing quote marks so it
% typesets with proper quotation marks and correct spacing.
@article{brendel2017comment,
  author = {Wieland Brendel and Matthias Bethge},
  journal = {arXiv preprint arXiv:1704.01547},
  title = {Comment on ``Biologically inspired protection of deep networks from adversarial attacks''},
  year = {2017},
}

@article{papernot2017extending,
  author = {Nicolas Papernot and Patrick McDaniel},
  journal = {arXiv preprint arXiv:1705.05264},
  title = {Extending Defensive Distillation},
  year = {2017},
}

@article{shaham2015understanding,
author = {Uri Shaham and Yutaro Yamada and Sahand Negahban}, journal = {arXiv preprint arXiv:1511.05432}, title = {Understanding adversarial training: Increasing local stability of neural nets through robust optimization}, year = {2015}, }

% The system name is braced so its capitalization survives sentence-casing styles.
@article{meng2017magnet,
  author = {Dongyu Meng and Hao Chen},
  journal = {arXiv preprint arXiv:1705.09064},
  title = {{MagNet}: a Two-Pronged Defense against Adversarial Examples},
  year = {2017},
}

@inproceedings{cisse2017parseval,
  author = {Moustapha Cisse and Piotr Bojanowski and Edouard Grave and Yann Dauphin and Nicolas Usunier},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {854--863},
  title = {Parseval networks: Improving robustness to adversarial examples},
  year = {2017},
}

@article{pang2017robust,
  author = {Tianyu Pang and Chao Du and Jun Zhu},
  journal = {arXiv preprint arXiv:1706.00633},
  title = {Robust Deep Learning via Reverse Cross-Entropy Training and Thresholding Test},
  year = {2017},
}

@inproceedings{pulina2010abstraction,
  author = {Luca Pulina and Armando Tacchella},
  booktitle = {Computer Aided Verification (CAV)},
  pages = {243--257},
  title = {An abstraction-refinement approach to verification of artificial neural networks},
  year = {2010},
}

@inproceedings{huang2017safety,
  author = {Xiaowei Huang and Marta Kwiatkowska and Sen Wang and Min Wu},
  booktitle = {Computer Aided Verification (CAV)},
  pages = {3--29},
  title = {Safety verification of deep neural networks},
  year = {2017},
}

@inproceedings{ehlers2017formal,
  author = {Ruediger Ehlers},
  booktitle = {International Symposium on Automated Technology for Verification and Analysis (ATVA)},
  pages = {269--286},
  title = {Formal verification of piece-wise linear feed-forward neural networks},
  year = {2017},
}

% The acronym is braced so it is not lowercased by sentence-casing styles.
@article{lomuscio2017approach,
  author = {Alessio Lomuscio and Lalit Maganti},
  journal = {arXiv preprint arXiv:1706.07351},
  title = {An approach to reachability analysis for feed-forward {ReLU} neural networks},
  year = {2017},
}
@article{grosse2017statistical,
  author = {Kathrin Grosse and Praveen Manoharan and Nicolas Papernot and Michael Backes and Patrick McDaniel},
  journal = {arXiv preprint arXiv:1702.06280},
  title = {On the (statistical) detection of adversarial examples},
  year = {2017},
}

@article{li2016adversarial,
  author = {Xin Li and Fuxin Li},
  journal = {arXiv preprint arXiv:1612.07767},
  title = {Adversarial examples detection in deep networks with convolutional filter statistics},
  year = {2016},
}

@inproceedings{hendrycks2017early,
  author = {Dan Hendrycks and Kevin Gimpel},
  booktitle = {International Conference on Learning Representations Workshop (ICLR)},
  title = {Early Methods for Detecting Adversarial Images},
  year = {2017},
}

@article{feinman2017detecting,
  author = {Reuben Feinman and Ryan R Curtin and Saurabh Shintre and Andrew B Gardner},
  journal = {arXiv preprint arXiv:1703.00410},
  title = {Detecting Adversarial Samples from Artifacts},
  year = {2017},
}

@inproceedings{anguita2013har,
  author = {Davide Anguita and Alessandro Ghio and Luca Oneto and Xavier Parra and Jorge L. Reyes-Ortiz},
  booktitle = {21st European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning (ESANN)},
  title = {A Public Domain Dataset for Human Activity Recognition Using Smartphones},
  year = {2013},
}

@article{lyapunov1992general,
  author = {Aleksandr Mikhailovich Lyapunov},
  journal = {International Journal of Control},
  number = {3},
  pages = {531--534},
  title = {The general problem of the stability of motion},
  volume = {55},
  year = {1992},
}

@phdthesis{lyapunov1892general,
  author = {Aleksandr Mikhailovich Lyapunov},
  school = {Kharkov Mathematical Society},
  title = {The general problem of the stability of motion (in Russian)},
  year = {1892},
}

@article{tedrake2010lqrtrees,
  author = {Russ Tedrake and Ian R. Manchester and Mark M. Tobenkin and John W.
Roberts}, journal = {International Journal of Robotics Research}, pages = {1038--1052}, title = {{LQR}-Trees: Feedback motion planning via sums of squares verification}, volume = {29}, year = {2010}, }

@article{tobenkin2011invariant,
  author = {Mark M. Tobenkin and Ian R. Manchester and Russ Tedrake},
  journal = {IFAC Proceedings Volumes},
  title = {Invariant funnels around trajectories using sum-of-squares programming},
  volume = {44},
  year = {2011},
}

% The proper noun is braced so it is not lowercased by sentence-casing styles.
@inproceedings{papachristodoulou2002construction,
  author = {Antonis Papachristodoulou and Stephen Prajna},
  booktitle = {IEEE Conference on Decision and Control},
  title = {On the construction of {Lyapunov} functions using the sum of squares decomposition},
  year = {2002},
}

@article{papachristodoulou2005analysis,
  author = {Antonis Papachristodoulou and Stephen Prajna},
  journal = {Positive polynomials in control},
  title = {Analysis of non-polynomial systems using the sum of squares decomposition},
  year = {2005},
}

@article{katz2017towards,
  author = {Guy Katz and Clark Barrett and David L. Dill and Kyle Julian and Mykel J. Kochenderfer},
  journal = {arXiv},
  title = {Towards proving the adversarial robustness of deep neural networks},
  year = {2017},
}

@techreport{okelly2016apex,
  author = {Matthew O'Kelly and Houssam Abbas and Sicun Gao and Shin'ichi Shiraishi and Shinpei Kato and Rahul Mangharam},
  institution = {University of Pennsylvania},
  title = {{APEX}: Autonomous Vehicle Plan Verification and Execution},
  year = {2016},
}

@techreport{okelly2017computer,
  author = {Matthew O'Kelly and Houssam Abbas and Rahul Mangharam},
  institution = {University of Pennsylvania},
  title = {Computer-Aided Design for Safe Autonomous Vehicles},
  year = {2017},
}

@inproceedings{sharif2016accessorize,
  author = {Mahmood Sharif and Sruti Bhagavatula and Lujo Bauer and Michael K.
Reiter}, booktitle = {ACM SIGSAC Conference on Computer and Communications Security}, pages = {1528--1540}, title = {Accessorize to a crime: Real and stealthy attacks on state-of-the-art face recognition}, year = {2016}, }

@article{carlini2017ground,
  author = {Nicholas Carlini and Guy Katz and Clark Barrett and David L. Dill},
  journal = {arXiv},
  title = {Ground-Truth Adversarial Examples},
  year = {2017},
}

@article{xiong2016achieving,
  author = {Wayne Xiong and Jasha Droppo and Xuedong Huang and Frank Seide and Mike Seltzer and Andreas Stolcke and Dong Yu and Geoffrey Zweig},
  journal = {arXiv},
  title = {Achieving human parity in conversational speech recognition},
  year = {2016},
}

@article{miyato2015distributional,
  author = {Takeru Miyato and Shin-ichi Maeda and Masanori Koyama and Ken Nakae and Shin Ishii},
  journal = {arXiv},
  title = {Distributional smoothing with virtual adversarial training},
  year = {2015},
}

@article{chen2017ead,
  author = {Pin-Yu Chen and Yash Sharma and Huan Zhang and Jinfeng Yi and Cho-Jui Hsieh},
  journal = {arXiv},
  title = {{EAD}: Elastic-Net Attacks to Deep Neural Networks via Adversarial Examples},
  year = {2017},
}

@article{goodfellow2016cleverhans,
  author = {Ian Goodfellow and Nicolas Papernot and Patrick McDaniel},
  journal = {arXiv},
  title = {cleverhans v2.0.0: an adversarial machine learning library},
  year = {2016},
}

@article{rice1953classes,
  author = {Henry Gordon Rice},
  journal = {Transactions of the American Mathematical Society},
  number = {2},
  pages = {358--366},
  title = {Classes of recursively enumerable sets and their decision problems},
  volume = {74},
  year = {1953},
}

@inproceedings{barak2012hypercontractivity,
  author = {Boaz Barak and Fernando Brand{\~a}o and Aram Harrow and Jonathan Kelner and David Steurer and Yuan Zhou},
  booktitle = {Symposium on Theory of Computing (STOC)},
  pages = {307--326},
  title = {Hypercontractivity, sum-of-squares proofs, and their applications},
  year = {2012},
}

@inproceedings{regev2017learning,
author = {Oded Regev and Aravindan Vijayaraghavan}, booktitle = {Foundations of Computer Science (FOCS)}, title = {On Learning Mixtures of Well-Separated Gaussians}, year = {2017}, }

@inproceedings{kothari2018outlier,
  author = {Pravesh Kothari and David Steurer},
  booktitle = {Symposium on Theory of Computing (STOC)},
  title = {Outlier-robust moment-estimation via sum-of-squares},
  year = {2018},
}

@inproceedings{kothari2018agnostic,
  author = {Pravesh Kothari and Jacob Steinhardt},
  booktitle = {Symposium on Theory of Computing (STOC)},
  title = {Better Agnostic Clustering via Tensor Norms},
  year = {2018},
}

@article{huber1964robust,
  author = {Peter J. Huber},
  journal = {The Annals of Mathematical Statistics},
  number = {1},
  pages = {73--101},
  title = {Robust estimation of a location parameter},
  volume = {35},
  year = {1964},
}

% Initials are space-separated so both survive name abbreviation.
@article{box1953robust,
  author = {George E. P. Box},
  journal = {Biometrika},
  pages = {318--335},
  title = {Non-normality and tests on variances},
  volume = {40},
  year = {1953},
}

@article{newcomb1886generalized,
  author = {Simon Newcomb},
  journal = {American Journal of Mathematics},
  number = {4},
  pages = {343--366},
  title = {A Generalized Theory of the Combination of Observations so as to Obtain the Best Result},
  volume = {8},
  year = {1886},
}

% The proper noun is braced so it is not lowercased by sentence-casing styles.
@inproceedings{elyaniv2011finance,
  author = {Ran El-Yaniv and Dmitry Pidan},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Selective Prediction of Financial Trends with Hidden {Markov} Models},
  year = {2011},
}

% No volume field: a preprint has no volume, and a placeholder value would be
% printed as if it were a real one.
@article{zhang2019molecular,
  author = {Yao Zhang and Alpha A. Lee},
  journal = {CoRR},
  title = {Bayesian semi-supervised learning for uncertainty-calibrated prediction of molecular properties and active learning},
  year = {2019},
}

@inproceedings{varshney2011risk,
  author = {K. R.
Varshney}, booktitle = {2011 IEEE Statistical Signal Processing Workshop (SSP)}, title = {A risk bound for ensemble classification with a reject option}, year = {2011}, }

% The model name is braced so its capitalization survives sentence-casing styles.
@inproceedings{geifman2019selectivenet,
  author = {Yonatan Geifman and Ran El-Yaniv},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {{SelectiveNet}: A Deep Neural Network with an Integrated Reject Option},
  year = {2019},
}

% The accented letter is written as a LaTeX escape, like the other accented
% names in this file, so classic 8-bit BibTeX sorts and prints it correctly.
@article{khan2001diagnosis,
  author = {Javed Khan and Jun S. Wei and Markus Ringn{\'e}r and Lao H. Saal and Marc Ladanyi and Frank Westermann and Frank Berthold and Manfred Schwab and Cristina R. Antonescu and Carsten Peterson and Paul S. Meltzer},
  journal = {Nature Medicine},
  title = {Classification and diagnostic prediction of cancers using gene expression profiling and artificial neural networks},
  year = {2001},
}

@article{hanczar2008gene,
  author = {Blaise Hanczar and Edward R. Dougherty},
  journal = {Bioinformatics},
  title = {Classification with reject option in gene expression data},
  year = {2008},
}

@article{uyumazturk2019deep,
  author = {Bora Uyumazturk and Amirhossein Kiani and Pranav Rajpurkar and Alex Wang and Robyn L. Ball and Rebecca Gao and Yifan Yu and Erik Jones and Curtis P. Langlotz and Brock Martin and Gerald J. Berry and Michael G. Ozawa and Florette K. Hazard and Ryanne A. Brown and Simon B. Chen and Mona Wood and Libby S. Allard and Lourdes Ylagan and Andrew Y. Ng and Jeanne Shen},
  journal = {arXiv},
  title = {Deep Learning for the Digital Pathologic Diagnosis of Cholangiocarcinoma and Hepatocellular Carcinoma: Evaluating the Impact of a Web-based Diagnostic Assistant},
  year = {2019},
}

% Venue name spelled "Retrieval".
@inproceedings{su2019risk,
  author = {Lixin Su and Jiafeng Guo and Yixin Fan and Yanyan Lan and Xueqi Cheng},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {Controlling Risk of Web Question Answering},
  year = {2019},
}

@article{jurczyk2016selqa,
  author = {Tomasz Jurczyk and Michael Zhai and Jinho D.
Choi}, journal = {arXiv}, title = {SelQA: A New Benchmark for Selection-based Question Answering}, year = {2016}, }

@article{tenney2019bert,
  author = {Ian Tenney and Dipanjan Das and Ellie Pavlick},
  journal = {arXiv},
  title = {{BERT} Rediscovers the Classical {NLP} Pipeline},
  year = {2019},
}

@inproceedings{hewitt2019structural,
  author = {John Hewitt and Christopher D. Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {A Structural Probe for Finding Syntax in Word Representations},
  year = {2019},
}

% The language name is braced so it is not lowercased by sentence-casing styles.
@article{qi2020stanza,
  author = {Peng Qi and Yuhao Zhang and Yuhui Zhang and Jason Bolton and Christopher D. Manning},
  journal = {arXiv},
  title = {Stanza: A {Python} Natural Language Processing Toolkit for Many Human Languages},
  year = {2020},
}

@inproceedings{finn2017modelagnostic,
  author = {Chelsea Finn and Pieter Abbeel and Sergey Levine},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Model-Agnostic Meta-Learning for Fast Adaptation of Deep Networks},
  year = {2017},
}

@article{dalal2018safe,
  author = {Gal Dalal and Krishnamurthy Dvijotham and Matej Vecerik and Todd Hester and Cosmin Paduraru and Yuval Tassa},
  journal = {arXiv},
  title = {Safe Exploration in Continuous Action Spaces},
  year = {2018},
}

@article{lipton2016sisyphean,
  author = {Zachary C.
Lipton and Kamyar Azizzadenesheli and Abhishek Kumar and Lihong Li and Jianfeng Gao and Li Deng}, journal = {arXiv}, title = {Combating Reinforcement Learning's Sisyphean Curse with Intrinsic Fear}, year = {2016}, }

@inproceedings{richter2017novelty,
  author = {Charles Richter and Nicholas Roy},
  booktitle = {Robotics: Science and Systems},
  title = {Safe Visual Navigation via Deep Learning and Novelty Detection},
  year = {2017},
}

@article{achiam2019benchmarking,
  author = {Joshua Achiam and Dario Amodei},
  journal = {arXiv},
  title = {Benchmarking Safe Exploration in Deep Reinforcement Learning},
  year = {2019},
}

@article{kahn2017uncertaintyaware,
  author = {Gregory Kahn and Adam Villaflor and Vitchyr Pong and Pieter Abbeel and Sergey Levine},
  journal = {arXiv},
  title = {Uncertainty-Aware Reinforcement Learning for Collision Avoidance},
  year = {2017},
}

% The method name is braced so it is not lowercased by sentence-casing styles.
@article{fu2017ex2,
  author = {Justin Fu and John D. Co-Reyes and Sergey Levine},
  journal = {arXiv},
  title = {{EX2}: Exploration with Exemplar Models for Deep Reinforcement Learning},
  year = {2017},
}

@article{lee2019efficient,
  author = {Lisa Lee and Benjamin Eysenbach and Emilio Parisotto and Eric Xing and Sergey Levine and Ruslan Salakhutdinov},
  journal = {arXiv},
  title = {Efficient Exploration via State Marginal Matching},
  year = {2019},
}

@article{ranzato2015sequence,
  author = {Marc'Aurelio Ranzato and Sumit Chopra and Michael Auli and Wojciech Zaremba},
  journal = {arXiv preprint arXiv:1511.06732},
  title = {Sequence level training with recurrent neural networks},
  year = {2015},
}

@article{clark2016deep,
  author = {Kevin Clark and Christopher D Manning},
  journal = {arXiv preprint arXiv:1609.08667},
  title = {Deep reinforcement learning for mention-ranking coreference models},
  year = {2016},
}

@article{narasimhan2015language,
  author = {Karthik Narasimhan and Tejas Kulkarni and Regina Barzilay},
  journal = {arXiv preprint arXiv:1506.08941},
  title = {Language understanding for text-based games using deep reinforcement
learning}, year = {2015}, }

@article{narasimhan2016improving,
  author = {Karthik Narasimhan and Adam Yala and Regina Barzilay},
  journal = {arXiv preprint arXiv:1603.07954},
  title = {Improving information extraction by acquiring external evidence with reinforcement learning},
  year = {2016},
}

% Venue string matches the NeurIPS spelling used by the other entries in this file.
@inproceedings{norouzi2016reward,
  author = {Mohammad Norouzi and Samy Bengio and Navdeep Jaitly and Mike Schuster and Yonghui Wu and Dale Schuurmans and others},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1723--1731},
  title = {Reward augmented maximum likelihood for neural structured prediction},
  year = {2016},
}

% Venue string matches the NeurIPS spelling used by the other entries in this file.
@inproceedings{osband2016deep,
  author = {Ian Osband and Charles Blundell and Alexander Pritzel and Benjamin Van Roy},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {4026--4034},
  title = {Deep exploration via bootstrapped {DQN}},
  year = {2016},
}

@article{nachum2016improving,
  author = {Ofir Nachum and Mohammad Norouzi and Dale Schuurmans},
  journal = {arXiv preprint arXiv:1611.09321},
  title = {Improving Policy Gradient by Exploring Under-appreciated Rewards},
  year = {2016},
}

% Journal name uses its full title casing.
@article{williams1992simple,
  author = {Ronald J Williams},
  journal = {Machine Learning},
  number = {3},
  pages = {229--256},
  title = {Simple statistical gradient-following algorithms for connectionist reinforcement learning},
  volume = {8},
  year = {1992},
}

@article{williams1991function,
  author = {Ronald J Williams and Jing Peng},
  journal = {Connection Science},
  number = {3},
  pages = {241--268},
  title = {Function optimization using connectionist reinforcement learning algorithms},
  volume = {3},
  year = {1991},
}

% Publisher name is given once.
@book{liu2008monte,
  author = {Jun S Liu},
  publisher = {Springer Science \& Business Media},
  title = {{M}onte {C}arlo strategies in scientific computing},
  year = {2008},
}

@inproceedings{venkatraman2015improving,
  author = {Arun Venkatraman and Martial Hebert and J Andrew Bagnell},
  booktitle = {Association
for the Advancement of Artificial Intelligence (AAAI)}, pages = {3024--3030}, title = {Improving Multi-Step Prediction of Learned Time Series Models}, year = {2015}, }

@inproceedings{bengio2015scheduled,
  author = {Samy Bengio and Oriol Vinyals and Navdeep Jaitly and Noam Shazeer},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1171--1179},
  title = {Scheduled sampling for sequence prediction with recurrent neural networks},
  year = {2015},
}

@inproceedings{bellemare2016unifying,
  author = {Marc Bellemare and Sriram Srinivasan and Georg Ostrovski and Tom Schaul and David Saxton and Remi Munos},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1471--1479},
  title = {Unifying count-based exploration and intrinsic motivation},
  year = {2016},
}

@inproceedings{abadi2016tensorflow,
  author = {Martin Abadi and Paul Barham and Jianmin Chen and Zhifeng Chen and Andy Davis and Jeffrey Dean and Matthieu Devin and Sanjay Ghemawat and Geoffrey Irving and Michael Isard and others},
  booktitle = {Proceedings of the 12th USENIX Symposium on Operating Systems Design and Implementation (OSDI).
Savannah, Georgia, USA}, title = {TensorFlow: A system for large-scale machine learning}, year = {2016}, }

@phdthesis{levine2014motor,
  author = {Sergey Levine},
  school = {Stanford University},
  title = {Motor Skill Learning with Local Trajectory Methods},
  year = {2014},
}

@article{riedel2016programming,
  author = {Sebastian Riedel and Matko Bosnjak and Tim Rockt{\"a}schel},
  journal = {CoRR, abs/1605.06640},
  title = {Programming with a differentiable forth interpreter},
  year = {2016},
}

% Publisher and city are separate fields. This single-volume book carries no
% volume or number, which standard styles reject when both are set on a book.
@book{sutton1998reinforcement,
  address = {Cambridge, MA},
  author = {Richard S Sutton and Andrew G Barto},
  publisher = {MIT Press},
  title = {Reinforcement learning: An introduction},
  year = {1998},
}

@inproceedings{coulom2006efficient,
  author = {Remi Coulom},
  booktitle = {International Conference on Computers and Games},
  pages = {72--83},
  title = {Efficient selectivity and backup operators in {M}onte-{C}arlo tree search},
  year = {2006},
}

@article{osband2014generalization,
  author = {Ian Osband and Benjamin Van Roy and Zheng Wen},
  journal = {arXiv preprint arXiv:1402.0635},
  title = {Generalization and exploration via randomized value functions},
  year = {2014},
}

@article{kearns2002near,
  author = {Michael Kearns and Satinder Singh},
  journal = {Machine Learning},
  number = {2},
  pages = {209--232},
  title = {Near-optimal reinforcement learning in polynomial time},
  volume = {49},
  year = {2002},
}

% Proper nouns are braced so they are not lowercased by sentence-casing styles.
@phdthesis{duff2002optimal,
  author = {Michael O'Gordon Duff},
  school = {University of Massachusetts Amherst},
  title = {Optimal Learning: Computational procedures for {Bayes}-adaptive {Markov} decision processes},
  year = {2002},
}

@inproceedings{kingma2015adam,
  author = {Diederik Kingma and Jimmy Ba},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Adam: A method for stochastic optimization},
  year = {2015},
}

@inproceedings{smith2006minimum,
  author = {David A Smith and Jason Eisner},
  booktitle = {International Conference on Computational Linguistics
and Association for Computational Linguistics (COLING/ACL)}, pages = {787--794}, title = {Minimum risk annealing for training log-linear models}, year = {2006}, }

@article{shen2015minimum,
  author = {Shiqi Shen and Yong Cheng and Zhongjun He and Wei He and Hua Wu and Maosong Sun and Yang Liu},
  journal = {arXiv preprint arXiv:1512.02433},
  title = {Minimum risk training for neural machine translation},
  year = {2015},
}

@inproceedings{glorot2010understanding,
  author = {Xavier Glorot and Yoshua Bengio},
  booktitle = {International Conference on Artificial Intelligence and Statistics},
  title = {Understanding the difficulty of training deep feedforward neural networks},
  year = {2010},
}

@inproceedings{shao2017generating,
  author = {Louis Shao and Stephan Gouws and Denny Britz and Anna Goldie and Brian Strope and Ray Kurzweil},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {2210--2219},
  title = {Generating High-Quality and Informative Conversation Responses with Sequence-to-Sequence Models},
  year = {2017},
}

@article{gehring2017convolutional,
  author = {Jonas Gehring and Michael Auli and David Grangier and Denis Yarats and Yann N Dauphin},
  journal = {arXiv preprint arXiv:1705.03122},
  title = {Convolutional Sequence to Sequence Learning},
  year = {2017},
}

@article{vaswani2017attention,
  author = {Ashish Vaswani and Noam Shazeer and Niki Parmar and Jakob Uszkoreit and Llion Jones and Aidan N Gomez and Lukasz Kaiser and Illia Polosukhin},
  journal = {arXiv preprint arXiv:1706.03762},
  title = {Attention Is All You Need},
  year = {2017},
}

% Publisher name is given once.
@book{jurafsky2000speech,
  author = {Daniel Jurafsky and James H Martin},
  publisher = {Prentice Hall},
  title = {Speech and language processing: An introduction to natural language processing, computational linguistics, and speech recognition},
  year = {2000},
}

@inproceedings{kalchbrenner2013recurrent,
  author = {Nal Kalchbrenner and Phil Blunsom},
  booktitle = {Empirical Methods in Natural Language
Processing (EMNLP)}, pages = {1700--1709}, title = {Recurrent Continuous Translation Models}, year = {2013}, }

@inproceedings{koehn2007moses,
  author = {Philipp Koehn and Hieu Hoang and Alexandra Birch and Chris Callison-Burch and Marcello Federico and Nicola Bertoldi and Brooke Cowan and Wade Shen and Christine Moran and Richard Zens and others},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {177--180},
  title = {Moses: Open source toolkit for statistical machine translation},
  year = {2007},
}

@article{hahn2000challenges,
  author = {Udo Hahn and Inderjeet Mani},
  journal = {Computer},
  title = {The challenges of automatic summarization},
  volume = {33},
  year = {2000},
}

% The acronym is capitalized and braced so styles keep it as written.
@article{nallapati2016abstractive,
  author = {Ramesh Nallapati and Bowen Zhou and Caglar Gulcehre and Bing Xiang and others},
  journal = {arXiv preprint arXiv:1602.06023},
  title = {Abstractive text summarization using sequence-to-sequence {RNN}s and beyond},
  year = {2016},
}

@article{doersch2016tutorial,
  author = {Carl Doersch},
  journal = {arXiv preprint arXiv:1606.05908},
  title = {Tutorial on variational autoencoders},
  year = {2016},
}

% Publisher name is given once.
@book{euzenat2007ontology,
  author = {Jerome Euzenat and Pavel Shvaiko and others},
  publisher = {Springer},
  title = {Ontology matching},
  volume = {18},
  year = {2007},
}

@book{stone2014amazon,
  author = {Brad Stone and Spencer Soper},
  publisher = {Bloomberg L.
P.}, title = {Amazon Unveils a Listening, Talking, Music-Playing Speaker for Your Home}, year = {2014}, }

@article{hester2017learning,
  author = {Todd Hester and Matej Vecerik and Olivier Pietquin and Marc Lanctot and Tom Schaul and Bilal Piot and Andrew Sendonaris and Gabriel Dulac-Arnold and Ian Osband and John Agapiou and others},
  journal = {arXiv preprint arXiv:1704.03732},
  title = {Learning from Demonstrations for Real World Reinforcement Learning},
  year = {2017},
}

@inproceedings{hester2018deep,
  author = {Todd Hester and Matej Vecerik and Olivier Pietquin and Marc Lanctot and Tom Schaul and Bilal Piot and Andrew Sendonaris and Gabriel Dulac{-}Arnold and Ian Osband and John Agapiou and Joel Z. Leibo and Audrunas Gruslys},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Deep {Q}-learning from Demonstrations},
  year = {2018},
}

% Farahmand is written in "Last, First" form: in "First Last" form BibTeX
% reads the lowercase token "massoud" as a von particle of the surname.
@inproceedings{kim2013learning,
  author = {Beomjoon Kim and Farahmand, Amir-massoud and Joelle Pineau and Doina Precup},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2859--2867},
  title = {Learning from limited demonstrations},
  year = {2013},
}

@article{pomerleau1991efficient,
  author = {Dean A Pomerleau},
  journal = {Neural Computation},
  number = {1},
  pages = {88--97},
  title = {Efficient training of artificial neural networks for autonomous navigation},
  volume = {3},
  year = {1991},
}

% Publisher was emitted twice by the export; a single name is kept.
@book{goodfellow2016deep,
  author = {Ian Goodfellow and Yoshua Bengio and Aaron Courville},
  publisher = {MIT Press},
  title = {Deep Learning},
  year = {2016},
}

@inproceedings{bitzer2010using,
  author = {Sebastian Bitzer and Matthew Howard and Sethu Vijayakumar},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  pages = {3219--3225},
  title = {Using dimensionality reduction to exploit constraints in reinforcement learning},
  year = {2010},
}

@inproceedings{deka2016erica,
  author = {Biplab Deka and Zifeng Huang and Ranjitha Kumar},
  booktitle = {User
Interface Software and Technology (UIST)}, pages = {767--776}, title = {{ERICA}: Interaction Mining Mobile Apps}, year = {2016}, }

@inproceedings{atkeson1997robot,
  author = {Christopher G Atkeson and Stefan Schaal},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {12--20},
  title = {Robot learning from demonstration},
  volume = {97},
  year = {1997},
}

@inproceedings{kuznetsova2013generalizing,
  author = {Polina Kuznetsova and Vicente Ordonez and Alexander C Berg and Tamara L Berg and Yejin Choi},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {790--796},
  title = {Generalizing Image Captions for Image-Text Parallel Corpus},
  year = {2013},
}

@article{hodosh2013framing,
  author = {Micah Hodosh and Peter Young and Julia Hockenmaier},
  journal = {Journal of Artificial Intelligence Research (JAIR)},
  pages = {853--899},
  title = {Framing image description as a ranking task: Data, models and evaluation metrics},
  volume = {47},
  year = {2013},
}

@inproceedings{mason2014domain,
  author = {Rebecca Mason and Eugene Charniak},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  pages = {2--10},
  title = {Domain-Specific Image Captioning},
  year = {2014},
}

@article{kolesnyk2016generating,
  author = {Vladyslav Kolesnyk and Tim Rockt{\"a}schel and Sebastian Riedel},
  journal = {arXiv preprint arXiv:1606.01404},
  title = {Generating natural language inference chains},
  year = {2016},
}

@article{yuan2017machine,
  author = {Xingdi Yuan and Tong Wang and Caglar Gulcehre and Alessandro Sordoni and Philip Bachman and Sandeep Subramanian and Saizheng Zhang and Adam Trischler},
  journal = {arXiv preprint arXiv:1705.02012},
  title = {Machine Comprehension by Text-to-Text Neural Question Generation},
  year = {2017},
}

@inproceedings{ali2010automation,
  author = {Husam Ali and Yllias Chali and Sadid A Hasan},
  booktitle = {Proceedings of QG2010: The Third Workshop on Question Generation},
  pages = {58--67},
  title = {Automation of question generation
from sentences}, year = {2010}, }

@inproceedings{mannem2010question,
  author = {Prashanth Mannem and Rashmi Prasad and Aravind Joshi},
  booktitle = {Proceedings of QG2010: The Third Workshop on Question Generation},
  pages = {84--91},
  title = {Question generation from paragraphs at {UPenn}: {QGSTEC} system description},
  year = {2010},
}

% Venue corrected: this paper appeared at NAACL 2018 (pages 1112--1122), not ACL.
@inproceedings{williams2018broad,
  author = {Adina Williams and Nikita Nangia and Samuel Bowman},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {1112--1122},
  title = {A Broad-Coverage Challenge Corpus for Sentence Understanding through Inference},
  year = {2018},
}

@inproceedings{dozat2017stanford,
  author = {Timothy Dozat and Peng Qi and Christopher D Manning},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  pages = {20--30},
  title = {Stanford's Graph-based Neural Dependency Parser at the {CoNLL} 2017 Shared Task},
  year = {2017},
}

@article{conneau2017supervised,
  author = {Alexis Conneau and Douwe Kiela and Holger Schwenk and Loic Barrault and Antoine Bordes},
  journal = {arXiv preprint arXiv:1705.02364},
  title = {Supervised learning of universal sentence representations from natural language inference data},
  year = {2017},
}

@inproceedings{poliak2018hypothesis,
  author = {Adam Poliak and Jason Naradowsky and Aparajita Haldar and Rachel Rudinger and Benjamin Van Durme},
  booktitle = {Joint Conference on Lexical and Computational Semantics},
  title = {Hypothesis Only Baselines in Natural Language Inference},
  year = {2018},
}

@incollection{dagan2006pascal,
  author = {Ido Dagan and Oren Glickman and Bernardo Magnini},
  booktitle = {Machine learning challenges.
evaluating predictive uncertainty, visual object classification, and recognising textual entailment}, pages = {177--190}, title = {The {PASCAL} recognising textual entailment challenge}, year = {2006}, }

@inproceedings{tapaswi2016movieqa,
  author = {Makarand Tapaswi and Yukun Zhu and Rainer Stiefelhagen and Antonio Torralba and Raquel Urtasun and Sanja Fidler},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {4631--4640},
  title = {{MovieQA}: Understanding stories in movies through question-answering},
  year = {2016},
}

% Title quotes use TeX-style opening and closing quotes; the export had
% stray straight double-quote characters glued to the preceding words.
@inproceedings{pavlick2016most,
  author = {Ellie Pavlick and Chris Callison-Burch},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {2164--2173},
  title = {Most ``babies'' are ``little'' and most ``problems'' are ``huge'': Compositional Entailment in Adjective-Nouns},
  volume = {1},
  year = {2016},
}

@article{lai2017natural,
  author = {Alice Lai and Yonatan Bisk and Julia Hockenmaier},
  journal = {arXiv preprint arXiv:1710.02925},
  title = {Natural Language Inference from Multiple Premises},
  year = {2017},
}

@inproceedings{bojar2017findings,
  author = {Ond{\v{r}}ej Bojar and Rajen Chatterjee and Christian Federmann and Yvette Graham and Barry Haddow and Shujian Huang and Matthias Huck and Philipp Koehn and Qun Liu and Varvara Logacheva and others},
  booktitle = {Proceedings of the Second Conference on Machine Translation},
  pages = {169--214},
  title = {Findings of the 2017 conference on machine translation ({WMT17})},
  year = {2017},
}

@inproceedings{chandrasekar1996motivations,
  author = {Raman Chandrasekar and Christine Doran and Bangalore Srinivas},
  booktitle = {Proceedings of the 16th conference on Computational linguistics-Volume 2},
  pages = {1041--1044},
  title = {Motivations and methods for text simplification},
  year = {1996},
}

@article{hannun2014deep,
  author = {Awni Hannun and Carl Case and Jared Casper and Bryan Catanzaro and Greg Diamos and Erich Elsen and Ryan Prenger and Sanjeev Satheesh and Shubho Sengupta and Adam
Coates and others}, journal = {arXiv preprint arXiv:1412.5567}, title = {Deep speech: Scaling up end-to-end speech recognition}, year = {2014}, }

@article{boulanger2012modeling,
  author = {Nicolas Boulanger-Lewandowski and Yoshua Bengio and Pascal Vincent},
  journal = {arXiv preprint arXiv:1206.6392},
  title = {Modeling temporal dependencies in high-dimensional sequences: Application to polyphonic music generation and transcription},
  year = {2012},
}

@inproceedings{johnson2016perceptual,
  author = {Justin Johnson and Alexandre Alahi and Li Fei-Fei},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages = {694--711},
  title = {Perceptual losses for real-time style transfer and super-resolution},
  year = {2016},
}

@inproceedings{taskar2005learning,
  author = {Ben Taskar and Vassil Chatalbashev and Daphne Koller and Carlos Guestrin},
  booktitle = {Proceedings of the 22nd international conference on Machine learning},
  pages = {896--903},
  title = {Learning structured prediction models: A large margin approach},
  year = {2005},
}

@article{oord2016pixel,
  author = {Aaron van den Oord and Nal Kalchbrenner and Koray Kavukcuoglu},
  journal = {arXiv preprint arXiv:1601.06759},
  title = {Pixel recurrent neural networks},
  year = {2016},
}

@inproceedings{nivre2003efficient,
  author = {Joakim Nivre},
  booktitle = {Proceedings of the 8th International Workshop on Parsing Technologies (IWPT)},
  title = {An efficient algorithm for projective dependency parsing},
  year = {2003},
}

% The exported publisher string mixed series, city and publisher (twice);
% it is split into separate fields. The exporter's volume 1 / number 10 were
% dropped: standard styles reject both on a book, and with a series present
% the volume would print as "volume 1 of" the series.
@book{friedman2001elements,
  address = {New York, NY, USA},
  author = {Jerome Friedman and Trevor Hastie and Robert Tibshirani},
  publisher = {Springer},
  series = {Springer Series in Statistics},
  title = {The elements of statistical learning},
  year = {2001},
}

% Publisher and year were each emitted twice by the export.
@book{gelman1995bayesian,
  author = {Andrew Gelman and John B Carlin and Hal S Stern and Donald B Rubin},
  publisher = {Chapman and Hall/CRC},
  title = {Bayesian data analysis},
  year = {1995},
}

@article{breiman1977variable,
  author = {Leo Breiman and William Meisel and Edward Purcell},
  journal = {Technometrics},
  number = {2},
  pages = {135--144},
  title = {Variable kernel estimates of multivariate densities},
  volume = {19},
  year = {1977},
}

% Publisher and year were each emitted twice by the export.
@book{wand1994kernel,
  author = {Matt P Wand and M Chris Jones},
  publisher = {Chapman and Hall/CRC},
  title = {Kernel smoothing},
  year = {1994},
}

@article{graves2014neural,
  author = {Alex Graves and Greg Wayne and Ivo Danihelka},
  journal = {arXiv preprint arXiv:1410.5401},
  title = {Neural {Turing} machines},
  year = {2014},
}

@inproceedings{sutskever2011generating,
  author = {Ilya Sutskever and James Martens and Geoffrey E Hinton},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1017--1024},
  title = {Generating text with recurrent neural networks},
  year = {2011},
}

@article{graves2013generating,
  author = {Alex Graves},
  journal = {arXiv preprint arXiv:1308.0850},
  title = {Generating sequences with recurrent neural networks},
  year = {2013},
}

@article{deemter2005real,
  author = {Kees Van Deemter and Mari{\"e}t Theune and Emiel Krahmer},
  journal = {Computational Linguistics},
  number = {1},
  pages = {15--24},
  title = {Real versus template-based natural language generation: A false opposition?},
  volume = {31},
  year = {2005},
}

@article{dvzeroski2004combining,
  author = {Saso D{\v{z}}eroski and Bernard {\v{Z}}enko},
  journal = {Machine learning},
  number = {3},
  pages = {255--273},
  title = {Is combining classifiers with stacking better than selecting the best one?},
  volume = {54},
  year = {2004},
}

@article{vijayakumar2016diverse,
  author = {Ashwin K Vijayakumar and Michael Cogswell and Ramprasath R Selvaraju and Qing Sun and Stefan Lee and David Crandall and Dhruv Batra},
  journal = {arXiv preprint arXiv:1610.02424},
  title = {Diverse beam search: Decoding diverse solutions from neural sequence models},
  year = {2016},
}

@inproceedings{gimpel2013systematic,
  author = {Kevin Gimpel
and Dhruv Batra and Chris Dyer and Gregory Shakhnarovich}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, pages = {1100--1111}, title = {A systematic exploration of diversity in machine translation}, year = {2013}, }

% Journal name spelled as in deemter2005real so both entries render alike.
@article{brill1995transformation,
  author = {Eric Brill},
  journal = {Computational Linguistics},
  number = {4},
  pages = {543--565},
  title = {Transformation-based error-driven learning and natural language processing: A case study in part-of-speech tagging},
  volume = {21},
  year = {1995},
}

@article{khandelwal2018sharp,
  author = {Urvashi Khandelwal and He He and Peng Qi and Dan Jurafsky},
  journal = {arXiv preprint arXiv:1805.04623},
  title = {Sharp nearby, fuzzy far away: How neural language models use context},
  year = {2018},
}

% The glued initials "TAMT" are split so styles can abbreviate them.
@article{deb2002fast,
  author = {Kalyanmoy Deb and Amrit Pratap and Sameer Agarwal and T. A. M. T. Meyarivan},
  journal = {IEEE Transactions on Evolutionary Computation},
  number = {2},
  pages = {182--197},
  title = {A fast and elitist multiobjective genetic algorithm: {NSGA}-{II}},
  volume = {6},
  year = {2002},
}

@article{abolafia2018neural,
  author = {Daniel A Abolafia and Mohammad Norouzi and Quoc V Le},
  journal = {arXiv preprint arXiv:1801.03526},
  title = {Neural Program Synthesis with Priority Queue Training},
  year = {2018},
}

@article{thota2021cda,
  author = {Mamatha Thota and Georgios Leontidis},
  journal = {arXiv},
  title = {Contrastive Domain Adaptation},
  year = {2021},
}

@inproceedings{caron2020swav,
  author = {Mathilde Caron and Ishan Misra and Julien Mairal and Priya Goyal and Piotr Bojanowski and Armand Joulin},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {9912--9924},
  title = {Unsupervised Learning of Visual Features by Contrasting Cluster Assignments},
  volume = {33},
  year = {2020},
}

@article{wang2021cdcl,
  author = {Rui Wang and Zuxuan Wu and Zejia Weng and Jingjing Chen and Guo-Jun Qi and Yu-Gang Jiang},
  journal = {arXiv},
  title = {Cross-domain Contrastive Learning for
Unsupervised Domain Adaptation}, year = {2021}, }

% Self-supervised and contrastive representation learning references.

@inproceedings{radford2021clip,
  author = {Alec Radford and Jong Wook Kim and Chris Hallacy and Aditya Ramesh and Gabriel Goh and Sandhini Agarwal and Girish Sastry and Amanda Askell and Pamela Mishkin and Jack Clark and Gretchen Krueger and Ilya Sutskever},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {8748--8763},
  title = {Learning Transferable Visual Models From Natural Language Supervision},
  volume = {139},
  year = {2021},
}

@inproceedings{he2020moco,
  author = {Kaiming He and Haoqi Fan and Yuxin Wu and Saining Xie and Ross Girshick},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Momentum Contrast for Unsupervised Visual Representation Learning},
  year = {2020},
}

@inproceedings{prabhu2021sentry,
  author = {Viraj Prabhu and Shivam Khare and Deeksha Karthik and Judy Hoffman},
  booktitle = {International Conference on Computer Vision (ICCV)},
  title = {Selective Entropy Optimization via Committee Consistency for Unsupervised Domain Adaptation},
  year = {2021},
}

@inproceedings{gidaris2018rotation,
  author = {Spyros Gidaris and Praveer Singh and Nikos Komodakis},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Unsupervised Representation Learning by Predicting Image Rotations},
  year = {2018},
}

@inproceedings{caron2021emerging,
  author = {Mathilde Caron and Hugo Touvron and Ishan Misra and Herve Jegou and Julien Mairal and Piotr Bojanowski and Armand Joulin},
  booktitle = {International Conference on Computer Vision (ICCV)},
  title = {Emerging Properties in Self-Supervised Vision Transformers},
  year = {2021},
}

@inproceedings{zbontar2021barlow,
  author = {Jure Zbontar and Li Jing and Ishan Misra and Yann LeCun and Stephane Deny},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Barlow Twins: Self-Supervised Learning via Redundancy Reduction},
  volume = {139},
  year = {2021},
}

@article{haochen2022beyond,
  author =
{Jeff Z. HaoChen and Colin Wei and Ananya Kumar and Tengyu Ma}, journal = {arXiv}, title = {Beyond Separability: Analyzing the Linear Transferability of Contrastive Representations to Related Subpopulations}, year = {2022}, }

% Second author's surname restored to O'Connor; the apostrophe was lost in export.
@article{blodgett2017racial,
  author = {Su Lin Blodgett and Brendan O'Connor},
  journal = {arXiv preprint arXiv:1707.00061},
  title = {Racial Disparity in Natural Language Processing: A Case Study of Social Media {A}frican-{A}merican {E}nglish},
  year = {2017},
}

@article{gallego2015online,
  author = {Guillermo Gallego and Anran Li and Van-Anh Truong and Xinshang Wang},
  journal = {arXiv preprint arXiv:1511.01837},
  title = {Online Resource Allocation with Customer Choice},
  year = {2015},
}

@article{joseph2017fair,
  author = {Matthew Joseph and Michael Kearns and Jamie Morgenstern and Seth Neel and Aaron Roth},
  journal = {arXiv preprint arXiv:1610.09559},
  title = {Fair Algorithms for Infinite and Contextual Bandits},
  year = {2017},
}

@techreport{jaillet2011online,
  author = {Patrick Jaillet and Xin Lu},
  institution = {Massachusetts Institute of Technology},
  title = {Online Resource Allocation Problems},
  year = {2011},
}

% Third author's surname corrected from "Frankling" to "Franklin".
@inproceedings{krishnan2014recommender,
  author = {Sanjay Krishnan and Jay Patel and Michael Franklin and Ken Goldberg},
  booktitle = {ACM Conference on Recommender Systems (RECSYS)},
  title = {A methodology for learning, analyzing, and mitigating social influence bias in recommender systems},
  year = {2014},
}

@article{adomavicius2014bias,
  author = {Gediminas Adomavicius and Jesse Bockstedt and Shawn Curley and Jingjing Zhang},
  journal = {CEUR Workshop Proceedings},
  pages = {2--9},
  title = {De-Biasing User Preference Ratings in Recommender Systems},
  volume = {1253},
  year = {2014},
}

@article{priamuthu2012online,
  author = {Selwyn Piramuthu and Gaurav Kapoor and Wei Zhou and Sjouke Mauw},
  journal = {Decision Support Systems},
  pages = {418--424},
  title = {Input online review data and related bias in recommender systems},
  volume = {53},
  year =
{2012}, }

% Year was emitted twice by the export; a single value is kept.
@inproceedings{sharma2015causal,
  author = {Amit Sharma and Jake Hofman and Duncan Watts},
  booktitle = {ACM Conference on Economics and Computation},
  title = {Estimating the Causal Impact of Recommendation Systems from Observational Data},
  year = {2015},
}

% Third author's surname corrected from "Sugiyami" to "Sugiyama".
@book{rubens2011active,
  author = {Neil Rubens and Dain Kaplan and Masashi Sugiyama},
  publisher = {Springer},
  title = {Active Learning in Recommender Systems},
  year = {2011},
}

@inproceedings{yao2017parity,
  author = {Sirui Yao and Bert Huang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Beyond Parity: Fairness Objectives for Collaborative Filtering},
  year = {2017},
}

@inproceedings{landeiro2016confounder,
  author = {Virgile Landeiro and Aron Culotta},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Robust Text Classification in the Presence of Confounding Bias},
  year = {2016},
}

% Journal article: typed as an article with the venue in the journal field.
@article{goel2016stopandfrisk,
  author = {Sharad Goel and Justin M. Rao and Ravi Shroff},
  journal = {The Annals of Applied Statistics},
  title = {Precinct or Prejudice? Understanding Racial Disparities in New York City's Stop-and-Frisk Policy},
  year = {2016},
}

@inproceedings{roemmele2011copa,
  author = {Melissa Roemmele and Cosmin Adrian Bejan and Andrew S. Gordon},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Choice of Plausible Alternatives: An Evaluation of Commonsense Causal Reasoning},
  year = {2011},
}

@inproceedings{sap2019atomic,
  author = {Maarten Sap and Ronan LeBras and Emily Allaway and Chandra Bhagavatula and Nicholas Lourie and Hannah Rashkin and Brendan Roof and Noah A.
Smith and Yejin Choi}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {{ATOMIC}: An Atlas of Machine Commonsense for If-Then Reasoning}, year = {2019}, }

@misc{nyclu2019data,
  author = {NYCLU},
  howpublished = {https://www.nyclu.org/en/stop-and-frisk-data},
  title = {Stop-and-Frisk Data},
  year = {2019},
}

% The journal articles below were exported as conference papers with the
% journal name in booktitle; they are typed as articles with a journal field.
% Curly Unicode quotes in titles are replaced by their TeX equivalents.

@article{zhao2016teen,
  author = {Jessie Zhao and May Lau and David Vermette and David Liang and Glenn Flores},
  journal = {Journal of Adolescent Research},
  title = {Communication Between {A}sian {A}merican Adolescents and Health Care Providers About Sexual Activity, Sexually Transmitted Infections, and Pregnancy Prevention},
  year = {2016},
}

@article{zech2018radio,
  author = {John R. Zech and Marcus A. Badgeley and Manway Liu and Anthony B. Costa and Joseph J. Titano and Eric Karl Oermann},
  journal = {PLOS Medicine},
  title = {Variable generalization performance of a deep learning model to detect pneumonia in chest radiographs: A cross-sectional study},
  year = {2018},
}

@article{honein2001accutane,
  author = {M. A. Honein and L. J. Paulozzi and J. D. Erickson},
  journal = {Teratology},
  title = {Continued occurrence of {Accutane} exposed pregnancies},
  year = {2001},
}

% First author's surname corrected from "Gelmand" to "Gelman".
@article{gelman2007police,
  author = {Andrew Gelman and Jeffrey Fagan and Alex Kiss},
  journal = {Journal of the American Statistical Association},
  title = {An Analysis of the New York City Police Department's ``Stop-and-Frisk'' Policy in the Context of Claims of Racial Bias},
  year = {2007},
}

@article{kozor2014drug,
  author = {Rebecca Kozor and Stuart M. Grieve and Stefan Buchholz and Sharlene Kaye and Shane Darke and Ravinay Bhindi and Gemma A. Figtree},
  journal = {PLoS ONE},
  title = {Regular Cocaine Use Is Associated with Increased Systolic Blood Pressure, Aortic Stiffness and Left Ventricular Mass in Young Otherwise Healthy Individuals},
  year = {2014},
}

@article{schulz2008unobserved,
  author = {Laura E. Schulz and Noah D. Goodman and Joshua B. Tenenbaum and Adrianna C. Jenkins},
  journal = {Cognition},
  title = {Going beyond the evidence: Abstract laws and preschoolers' responses to anomalous data},
  year = {2008},
}

@article{saxe2007causal,
  author = {Rebecca Saxe and Tania Tzelnic and Susan Carey},
  journal = {Developmental Psychology},
  title = {Knowing Who Dunnit: Infants Identify the Causal Agent in an Unseen Causal Interaction},
  year = {2007},
}

% Second author's surname corrected from "Stuhmuller".
@article{ullman2018physics,
  author = {Tomer D. Ullman and Andreas Stuhlm{\"u}ller and Noah D. Goodman and Joshua B. Tenenbaum},
  journal = {Cognitive Psychology},
  title = {Learning physical parameters from dynamic scenes},
  year = {2018},
}

@article{van2013confounder,
  author = {Tyler J. VanderWeele and Ilya Shpitser},
  journal = {Annals of Statistics},
  title = {On the definition of a confounder},
  year = {2013},
}

@article{jarvik1991nicotine,
  author = {Murray E. Jarvik},
  journal = {British Journal of Addiction},
  title = {Beneficial effects of nicotine},
  year = {1991},
}

@article{van2012effect,
  author = {Tyler J. VanderWeele},
  journal = {Epidemiologic Methods},
  title = {Confounding and effect modification: distribution and measure},
  year = {2012},
}

% Author given names and the last title word were misspelt in the export.
@book{angrist2009econometrics,
  author = {Joshua D. Angrist and J{\"o}rn-Steffen Pischke},
  publisher = {Princeton University Press},
  title = {Mostly Harmless Econometrics: An Empiricist's Companion},
  year = {2009},
}

@book{van2015causal,
  author = {Tyler J.
VanderWeele}, publisher = {Oxford University Press}, title = {Explanation in Causal Inference: Methods for Mediation and Interaction}, year = {2015}, }

@inproceedings{singh2019fair,
  author = {Harvineet Singh and Rina Singh and Vishwali Mhasawade and Rumi Chunara},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Fair Predictors under Distribution Shift},
  year = {2019},
}

% The four journal articles below were exported as a conference paper or as
% books with the journal name in booktitle or publisher; they are typed as
% articles with a journal field.

@article{ghassemi2019health,
  author = {Marzyeh Ghassemi and Tristan Naumann and Peter Schulam and Andrew L Beam and Irene Y Chen and Rajesh Ranganath},
  journal = {The Lancet Digital Health},
  pages = {157--159},
  title = {Practical guidance on artificial intelligence for health-care data},
  year = {2019},
}

% Last author's surname corrected from "Bolmand" to "Bolman".
@article{gerritsen2015addiction,
  author = {Marielle Gerritsen and Nadine Berndt and Lilian Lechner and Hein de Vries and Aart Mudde and Catherine Bolman},
  journal = {Journal of Addiction Medicine},
  pages = {308--316},
  title = {Self-report of Smoking Cessation in Cardiac Patients},
  year = {2015},
}

@article{gordis1969reliability,
  author = {Leon Gordis and Milton Markowitz and Abraham M. Lilienfeld},
  journal = {Medical Care},
  pages = {49--54},
  title = {The Inaccuracy in Using Interviews to Estimate Patient Reliability in Taking Medications at Home},
  year = {1969},
}

@article{hoeck2015counterfactual,
  author = {Nicole Van Hoeck and Patrick D. Watson and Aron K. Barbey},
  journal = {Frontiers in Human Neuroscience},
  title = {Cognitive neuroscience of human counterfactual reasoning},
  year = {2015},
}

% Third author is Wen-tau Yih. "Last, First" form is used because BibTeX
% splits names at hyphens and would read lowercase "tau" as a von particle.
@inproceedings{white2015questions,
  author = {Ryen W. White and Matthew Richardson and Yih, Wen-tau},
  booktitle = {World Wide Web (WWW)},
  pages = {135--136},
  title = {Questions vs.
Queries in Informational Search Tasks}, year = {2015}, }

@inproceedings{kiela2021dynabench,
  author = {Douwe Kiela and Max Bartolo and Yixin Nie and Divyansh Kaushik and Atticus Geiger and Zhengxuan Wu and Bertie Vidgen and Grusha Prasad and Amanpreet Singh and Pratik Ringshia and Zhiyi Ma and Tristan Thrush and Sebastian Riedel and Zeerak Waseem and Pontus Stenetorp and Robin Jia and Mohit Bansal and Christopher Potts and Adina Williams},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {4110--4124},
  title = {Dynabench: Rethinking Benchmarking in {NLP}},
  year = {2021},
}

@article{bartolo2020beat,
  author = {Max Bartolo and Alastair Roberts and Johannes Welbl and Sebastian Riedel and Pontus Stenetorp},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  pages = {662--678},
  title = {Beat the {AI}: Investigating Adversarial Human Annotation for Reading Comprehension},
  volume = {8},
  year = {2020},
}

% Title: Unicode apostrophe replaced by an ASCII one and the trailing space removed.
@inproceedings{teevan2007information,
  author = {Jaime Teevan and Eytan Adar and Rosie Jones and Michael A. S. Potts},
  booktitle = {Annual Conference of the Association for Computing Machinery Special Interest Group in Information Retrieval},
  title = {Information Re-Retrieval: Repeat Queries in {Yahoo's} Logs},
  year = {2007},
}

@inproceedings{huang2009query,
  author = {Jeff Huang and Efthimis N.
Efthimiadis}, booktitle = {Proceedings of the 18th ACM Conference on Information and Knowledge Management}, title = {Analyzing and evaluating query reformulation strategies in web search logs}, year = {2009}, }

@inproceedings{lau1999patterns,
  author = {Tessa Lau and Eric Horvitz},
  booktitle = {User Modeling},
  pages = {119--128},
  title = {Patterns of Search: Analyzing and Modeling Web Query Refinement},
  year = {1999},
}

% First author's given name corrected from "Xuanhai" to "Xuanhui".
@inproceedings{wang2008query,
  author = {Xuanhui Wang and ChengXiang Zhai},
  booktitle = {Proceedings of the 17th ACM Conference on Information and Knowledge Management},
  title = {Mining term association patterns from search logs for effective query reformulation},
  year = {2008},
}

% Unicode curly quotes in the title replaced by TeX quotes.
@inproceedings{pang2011query,
  author = {Bo Pang and Ravi Kumar},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Search in the Lost Sense of ``Query'': Question Formulation in Web Search Queries and its Temporal Changes},
  year = {2011},
}

% Journal article, so typed as an article. The ampersand in the journal name
% is escaped because a bare one is a LaTeX alignment character. Second
% author's surname corrected from "Ozmultu" to "Ozmutlu".
@article{spink2002question,
  author = {Amanda Spink and H. Cenk Ozmutlu},
  journal = {Information Processing \& Management},
  title = {Characteristics of question format web queries: an exploratory study},
  year = {2002},
}

@inproceedings{liu2013search,
  author = {Jian Liu and Yiqun Liu and Min Zhang and Shaoping Ma},
  booktitle = {Proceedings of the 22nd ACM Conference on Information and Knowledge Management},
  title = {How Do Users Grow Up along with Search Engines?: A Study of Long-term Users' Behavior},
  year = {2013},
}

@inproceedings{jacovi2020faithful,
  author = {Alon Jacovi and Yoav Goldberg},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Towards Faithfully Interpretable {NLP} Systems: How Should We Define and Evaluate Faithfulness?},
  year = {2020},
}

% Last author's surname corrected from "Lescovec" to "Leskovec".
@inproceedings{lakkaraju2019faithful,
  author = {Himabindu Lakkaraju and Ece Kamar and Rich Caruana and Jure Leskovec},
  booktitle = {Proceedings of the 2019 AAAI/ACM Conference on AI, Ethics, and Society},
  title = {Faithful and Customizable Explanations of Black Box Models},
  year = {2019},
}

@inproceedings{bansal2021teammate,
  author = {Gagan Bansal and Besmira Nushi and Ece Kamar and Eric Horvitz and Daniel S. Weld},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Is the Most Accurate {AI} the Best Teammate? Optimizing {AI} for Teamwork},
  year = {2021},
}

% Journal article, so typed as an article; the journal name matches the
% spelling used by hodosh2013framing.
@article{ginsberg2014fill,
  author = {Matthew L. Ginsberg},
  journal = {Journal of Artificial Intelligence Research (JAIR)},
  pages = {851--886},
  title = {{Dr.Fill}: Crosswords and an Implemented Solver for Singly Weighted {CSPs}},
  year = {2014},
}

@inproceedings{rozner2021cryptic,
  author = {Joshua Rozner and Christopher Potts and Kyle Mahowald},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Decrypting Cryptic Crosswords: Semantically Complex Wordplay},
  year = {2021},
}

% Journal article, so typed as an article with a journal field.
@article{littman2002puzzles,
  author = {Michael L. Littman and Greg A. Keim and Noam Shazeer},
  journal = {Artificial Intelligence},
  pages = {23--55},
  title = {A probabilistic approach to solving crossword puzzles},
  year = {2002},
}

@inproceedings{wallace2022crossword,
  author = {Eric Wallace and Nicholas Tomlin and Albert Xu and Kevin Yang and Eshaan Pathak and Matthew L. Ginsberg and Dan Klein},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Automated Crossword Solving},
  year = {2022},
}

% Rocktaschel is spelled with the umlaut escape, as in kolesnyk2016generating.
@inproceedings{urbanek2019fantasy,
  author = {Jack Urbanek and Angela Fan and Siddharth Karamcheti and Saachi Jain and Samuel Humeau and Emily Dinan and Tim Rockt{\"a}schel and Douwe Kiela and Arthur Szlam and Jason Weston},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Learning to Speak and Act in a Fantasy Text Adventure Game},
  year = {2019},
}

@inproceedings{frans2021charades,
  author = {Kevin Frans},
  booktitle = {IEEE Conference on Games (CoG)},
  pages = {1--2},
  title = {{AI} Charades: Language Models as Interactive Game Environments},
  year = {2021},
}

% The ampersand in the venue name is escaped for LaTeX.
@inproceedings{chattopadhyay2017human,
  author = {Prithvijit Chattopadhyay and Deshraj Yadav and Viraj Prabhu and Arjun Chandrasekaran and Abhishek Das and Stefan Lee and Dhruv Batra and Devi Parikh},
  booktitle = {AAAI Conference on Human Computation \& Crowdsourcing},
  title = {Evaluating Visual Conversational Agents via Cooperative Human-{AI} Games},
  year = {2017},
}

@inproceedings{ammanabrolu2019quest,
  author = {Prithviraj Ammanabrolu and William Broniec and Alex Mueller and Jeremy Paul and Mark Riedl},
  booktitle = {Proceedings of the 4th Workshop on Computational Creativity in Language Generation},
  title = {Toward Automated Quest Generation in Text-Adventure Games},
  year = {2019},
}

% Sixth author's given name corrected from "Wener" to "Werner".
@inproceedings{gero2020mental,
  author = {Katy Ilonka Gero and Zahra Ashktorab and Casey Dugan and Qian Pan and James Johnson and Werner Geyer and Maria Ruiz and Sarah Miller and David R Millen and Murray Campbell and Sadhana Kumaravel and Wei Zhang},
  booktitle =
{Conference on Human Factors in Computing Systems (CHI)}, title = {Mental Models of {AI} Agents in a Cooperative Game Setting}, year = {2020}, }

@inproceedings{ashktorab2020collaboration,
  author = {Zahra Ashktorab and Q. Vera Liao and Casey Dugan and James Johnson and Qian Pan and Wei Zhang and Sadhana Kumaravel and Murray Campbell},
  booktitle = {Proceedings of ACM Human-Computer Interaction (CSCW)},
  title = {Human-{AI} Collaboration in a Cooperative Game Setting: Measuring Social Perception and Outcomes},
  year = {2020},
}

% Journal article, so typed as an article with a journal field.
@article{hua2020unicorns,
  author = {Minh Hua and Rita Raley},
  journal = {Digital Humanities Quarterly},
  title = {Playing With Unicorns: {AI} Dungeon and Citizen {NLP}},
  year = {2020},
}

@inproceedings{seo2014program,
  author = {Hyunmin Seo and Caitlin Sadowski and Sebastian Elbaum and Edward Aftandilian and Robert Bowdidge},
  booktitle = {International Conference on Software Engineering (ICSE)},
  title = {Programmers' Build Errors: A Case Study at {Google}},
  year = {2014},
}

@inproceedings{ding2020patching,
  author = {Yangruibo Ding and Baishakhi Ray and Premkumar Devanbu and Vincent J.
Hellendoorn}, booktitle = {Automated Software Engineering (ASE)}, title = {Patching as Translation: the Data and the Metaphor}, year = {2020}, }

% Second author's surname corrected to "Bhattacharyya"; system name protected
% so sentence-casing styles keep its capitals.
@article{hajipour2019samplefix,
  author = {Hossein Hajipour and Apratim Bhattacharyya and Mario Fritz},
  journal = {arXiv preprint arXiv:1906.10502},
  title = {{SampleFix}: Learning to Correct Programs by Sampling Diverse Fixes},
  year = {2019},
}

@inproceedings{gupta2019deep,
  author = {Rahul Gupta and Aditya Kanade and Shirish Shevade},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Deep reinforcement learning for programming language correction},
  year = {2019},
}

@inproceedings{pradel2018deepbugs,
  author = {Michael Pradel and Koushik Sen},
  booktitle = {Object-Oriented Programming, Systems, Languages, and Applications (OOPSLA)},
  title = {{DeepBugs}: A learning approach to name-based bug detection},
  year = {2018},
}

@inproceedings{ahmed2018compilation,
  author = {Umair Z Ahmed and Pawan Kumar and Amey Karkare and Purushottam Kar and Sumit Gulwani},
  booktitle = {International Conference on Software Engineering (ICSE)},
  title = {Compilation error repair: for the student programs, from the student programs},
  year = {2018},
}

@inproceedings{bader2019getafix,
  author = {Johannes Bader and Andrew Scott and Michael Pradel and Satish Chandra},
  booktitle = {Object-Oriented Programming, Systems, Languages, and Applications (OOPSLA)},
  title = {Getafix: Learning to fix bugs automatically},
  year = {2019},
}

@inproceedings{edunov2018understanding,
  author = {Sergey Edunov and Myle Ott and Michael Auli and David Grangier},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Understanding back-translation at scale},
  year = {2018},
}

@article{artetxe2018unsupervised,
  author = {Mikel Artetxe and Gorka Labaka and Eneko Agirre},
  journal = {arXiv preprint arXiv:1809.01272},
  title = {Unsupervised statistical machine translation},
  year = {2018},
}

@inproceedings{lachaux2020unsupervised,
author = {Marie-Anne Lachaux and Baptiste Roziere and Lowik Chanussot and Guillaume Lample}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Unsupervised Translation of Programming Languages}, year = {2020}, }

@inproceedings{lample2018phrase,
  author = {Guillaume Lample and Myle Ott and Alexis Conneau and Ludovic Denoyer and Marc'Aurelio Ranzato},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Phrase-based \& neural unsupervised machine translation},
  year = {2018},
}

@inproceedings{yang2020improving,
  author = {Kevin Yang and Wengong Jin and Kyle Swanson and Regina Barzilay and Tommi Jaakkola},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Improving Molecular Design by Stochastic Iterative Target Augmentation},
  year = {2020},
}

@inproceedings{jin2019learning,
  author = {Wengong Jin and Kevin Yang and Regina Barzilay and Tommi Jaakkola},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Learning multimodal graph-to-graph translation for molecular optimization},
  year = {2019},
}

@inproceedings{min2019discrete,
  author = {Sewon Min and Danqi Chen and Hannaneh Hajishirzi and Luke Zettlemoyer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {A discrete hard {EM} approach for weakly supervised question answering},
  year = {2019},
}

% Author list corrected: the export repeated the authors of min2019discrete.
% NOTE(review): confirm the author list against the ACL Anthology record.
@inproceedings{zhong2020grounded,
  author = {Victor Zhong and Mike Lewis and Sida I. Wang and Luke Zettlemoyer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Grounded adaptation for zero-shot executable semantic parsing},
  year = {2020},
}

@inproceedings{yasunaga2017graph,
  author = {Michihiro Yasunaga and Rui Zhang and Kshitijh Meelu and Ayush Pareek and Krishnan Srinivasan and Dragomir Radev},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  title = {Graph-based neural multi-document summarization},
  year = {2017},
}
@inproceedings{xie2020unsupervised,
  author = {Qizhe Xie and Zihang Dai and Eduard Hovy and Minh-Thang Luong and Quoc V Le},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Unsupervised data augmentation for consistency training},
  year = {2020},
}

@article{antoniou2017data,
  author = {Antreas Antoniou and Amos Storkey and Harrison Edwards},
  journal = {arXiv preprint arXiv:1711.04340},
  title = {Data augmentation generative adversarial networks},
  year = {2017},
}

@inproceedings{mcclosky2006effective,
  author = {David McClosky and Eugene Charniak and Mark Johnson},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Effective self-training for parsing},
  year = {2006},
}

@inproceedings{xu2020autoqa,
  author = {Silei Xu and Sina J Semnani and Giovanni Campagna and Monica S Lam},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Auto{QA}: From databases to {QA} semantic parsers with only synthetic training data},
  year = {2020},
}

@inproceedings{hellendoorn2019code,
  author = {Vincent J Hellendoorn and Sebastian Proksch and Harald C Gall and Alberto Bacchelli},
  booktitle = {International Conference on Software Engineering (ICSE)},
  title = {When code completion fails: A case study on real-world completions},
  year = {2019},
}

@inproceedings{sun2016deep,
  author = {Baochen Sun and Kate Saenko},
  booktitle = {European Conference on Computer Vision (ECCV)},
  title = {Deep coral: Correlation alignment for deep domain adaptation},
  year = {2016},
}

@inproceedings{pascanu2013difficulty,
  author = {Razvan Pascanu and Tomas Mikolov and Yoshua Bengio},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {On the difficulty of training recurrent neural networks},
  year = {2013},
}

@article{taylor1953cloze,
  author = {Wilson L.
Taylor},
  journal = {Journalism Bulletin},
  number = {4},
  pages = {415--433},
  title = {``{C}loze procedure'': A new tool for measuring readability},
  volume = {30},
  year = {1953},
}

@article{deyes1984towards,
  author = {Tony Deyes},
  journal = {Applied Linguistics},
  number = {2},
  pages = {128--137},
  title = {Towards an authentic `discourse cloze'},
  volume = {5},
  year = {1984},
}

@inproceedings{massalin1987superoptimizer,
  author = {Henry Massalin},
  booktitle = {Architectural Support for Programming Languages and Operating Systems (ASPLOS)},
  title = {Superoptimizer -- A Look at the Smallest Program},
  year = {1987},
}

@inproceedings{vadas2005programming,
  author = {David Vadas and James R. Curran},
  booktitle = {Australasian Language Technology Workshop (ALTA)},
  title = {Programming With Unrestricted Natural Language},
  year = {2005},
}

@inproceedings{bansal2006automatic,
  author = {Sorav Bansal and Alex Aiken},
  booktitle = {Architectural Support for Programming Languages and Operating Systems (ASPLOS)},
  title = {Automatic Generation of Peephole Superoptimizers},
  year = {2006},
}

@inproceedings{solar2006combinatorial,
  author = {Armando Solar-Lezama and Liviu Tancau and Rastislav Bodik and Vijay Saraswat and Sanjit Seshia},
  booktitle = {Architectural Support for Programming Languages and Operating Systems (ASPLOS)},
  title = {Combinatorial Sketching for Finite Programs},
  year = {2006},
}

@inproceedings{little2007keyword,
  author = {Greg Little and Robert C.
Miller},
  booktitle = {Automated Software Engineering (ASE)},
  title = {Keyword Programming in {Java}},
  year = {2007},
}

@phdthesis{armando2008sketch,
  author = {Armando Solar-Lezama},
  school = {University of California at Berkeley},
  title = {Program Synthesis by Sketching},
  year = {2008},
}

@inproceedings{tate2009equality,
  author = {Ross Tate and Michael Stepp and Zachary Tatlock and Sorin Lerner},
  booktitle = {Principles of Programming Languages (POPL)},
  title = {Equality Saturation: a New Approach to Optimization},
  year = {2009},
}

@inproceedings{jha2010oracle,
  author = {Susmit Jha and Sumit Gulwani and Sanjit A. Seshia and Ashish Tiwari},
  booktitle = {International Conference on Software Engineering (ICSE)},
  title = {Oracle-Guided Component-Based Program Synthesis},
  year = {2010},
}

@inproceedings{schkufza2013stochastic,
  author = {Eric Schkufza and Rahul Sharma and Alex Aiken},
  booktitle = {Architectural Support for Programming Languages and Operating Systems (ASPLOS)},
  title = {Stochastic Superoptimization},
  year = {2013},
}

@inproceedings{feser2015synthesizing,
  author = {John K. Feser and Swarat Chaudhuri and Isil Dillig},
  booktitle = {Programming Language Design and Implementation (PLDI)},
  title = {Synthesizing Data Structure Transformations from Input-Output Examples},
  year = {2015},
}

@inproceedings{rudinger2015script,
  author = {Rachel Rudinger and Pushpendre Rastogi and Francis Ferraro and Benjamin Van Durme},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Script Induction as Language Modeling},
  year = {2015},
}

@inproceedings{yaghmazadeh2016hierarchy,
  author = {Navid Yaghmazadeh and Christian Klinger and Isil Dillig and Swarat Chaudhuri},
  booktitle = {Programming Language Design and Implementation (PLDI)},
  title = {Synthesizing Transformations on Hierarchically Structured Data},
  year = {2016},
}

@inproceedings{feng2017api,
  author = {Yu Feng and Ruben Martins and Yuepeng Wang and Isil Dillig and Thomas W.
Reps},
  booktitle = {Principles of Programming Languages (POPL)},
  title = {Component-Based Synthesis for Complex APIs},
  year = {2017},
}

@inproceedings{parisotto2017sql,
  author = {Emilio Parisotto and Abdel-rahman Mohamed and Rishabh Singh and Lihong Li and Dengyong Zhou and Pushmeet Kohli},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Neuro-symbolic Program Synthesis},
  year = {2017},
}

@inproceedings{wang2017sql,
  author = {Chenglong Wang and Alvin Cheung and Rastislav Bodik},
  booktitle = {Programming Language Design and Implementation (PLDI)},
  title = {Synthesizing Highly Expressive {SQL} Queries from Input-Output Examples},
  year = {2017},
}

@inproceedings{devlin2017robustfill,
  author = {Jacob Devlin and Jonathan Uesato and Surya Bhupatiraju and Rishabh Singh and Abdel-rahman Mohamed and Pushmeet Kohli},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {RobustFill: Neural Program Learning Under Noisy I/O},
  year = {2017},
}

@article{devlin2017varreplace,
  author = {Jacob Devlin and Jonathan Uesato and Rishabh Singh and Pushmeet Kohli},
  journal = {arXiv preprint arXiv:1710.11054},
  title = {Semantic Code Repair Using Neuro-Symbolic Transformation Networks},
  year = {2017},
}

@inproceedings{gupta2017deepfix,
  author = {Rahul Gupta and Soham Pal and Aditya Kanade and Shirish K.
Shevade},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Deepfix: Fixing Common {C} Language Errors by Deep Learning},
  year = {2017},
}

@inproceedings{yaghmazadeh2017sqlizer,
  author = {Navid Yaghmazadeh and Yuepeng Wang and Isil Dillig and Thomas Dillig},
  booktitle = {Object-Oriented Programming, Systems, Languages, and Applications (OOPSLA)},
  title = {SQLizer: Query Synthesis from Natural Language},
  year = {2017},
}

@inproceedings{chambers2008narrative,
  author = {Nathanael Chambers and Dan Jurafsky},
  booktitle = {Human Language Technology and Association for Computational Linguistics (HLT/ACL)},
  title = {Unsupervised Learning of Narrative Event Chains},
  year = {2008},
}

@inproceedings{bhatia2018synfix,
  author = {Sahil Bhatia and Pushmeet Kohli and Rishabh Singh},
  booktitle = {International Conference on Software Engineering (ICSE)},
  title = {Neuro-Symbolic Program Corrector for Introductory Programming Assignments},
  year = {2018},
}

@inproceedings{lin2018nl2bash,
  author = {Xi Victoria Lin and Chenglong Wang and Luke S. Zettlemoyer and Michael D. Ernst},
  booktitle = {Language Resources and Evaluation Conference (LREC)},
  title = {NL2Bash: A Corpus and Semantic Parser for Natural Language Interface to the Linux Operating System},
  year = {2018},
}

@inproceedings{iyer2018mapping,
  author = {Srinivasan Iyer and Ioannis Konstas and Alvin Cheung and Luke S.
Zettlemoyer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Mapping Language to Code in Programmatic Context},
  year = {2018},
}

@inproceedings{allamanis2018varmisuse,
  author = {Miltiadis Allamanis and Marc Brockschmidt and Mahmoud Khademi},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Learning to Represent Programs with Graphs},
  year = {2018},
}

@inproceedings{svyatkovskiy2019pythia,
  author = {Alexey Svyatkovskiy and Ying Zhao and Shengyu Fu and Neel Sundaresan},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  title = {Pythia: {AI}-assisted Code Completion System},
  year = {2019},
}

@inproceedings{baziotis2019seq,
  author = {Christos Baziotis and Ion Androutsopoulos and Ioannis Konstas and Alexandros Potamianos},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {SEQ\({}^{\mbox{3}}\): Differentiable Sequence-to-Sequence-to-Sequence Autoencoder for Unsupervised Abstractive Sentence Compression},
  year = {2019},
}

@inproceedings{west2019bottlesum,
  author = {Peter West and Ari Holtzman and Jan Buys and Yejin Choi},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {BottleSum: Self-Supervised and Unsupervised Sentence Summarization using the Information Bottleneck Principle},
  year = {2019},
}

@inproceedings{yang2019xlnet,
  author = {Zhilin Yang and Zihang Dai and Yiming Yang and Jaime Carbonell and Ruslan Salakhutdinov and Quoc V.
Le},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{XLN}et: Generalized Autoregressive Pretraining for Language Understanding},
  year = {2019},
}

@article{zhu2019text,
  author = {Wanrong Zhu and Zhiting Hu and Eric Xing},
  journal = {arXiv preprint arXiv:1901.00158},
  title = {Text Infilling},
  year = {2019},
}

@inproceedings{ippolito2019unsupervised,
  author = {Daphne Ippolito and David Grangier and Chris Callison-Burch and Douglas Eck},
  booktitle = {NAACL Workshop on Narrative Understanding},
  pages = {37--43},
  title = {Unsupervised Hierarchical Story Infilling},
  year = {2019},
}

@article{ai2019haim,
  author = {AI21},
  journal = {AI21 Labs Blog},
  title = {{HAIM}: A Modest Step Towards Controllable Text Generation},
  year = {2019},
}

@article{liu2019tigs,
  author = {Dayiheng Liu and Jie Fu and Pengfei Liu and Jiancheng Lv},
  journal = {arXiv preprint arXiv:1905.10752},
  title = {{TIGS}: An Inference Algorithm for Text Infilling with Gradient Search},
  year = {2019},
}

@article{wolf2019transformers,
  author = {Thomas Wolf and Lysandre Debut and Victor Sanh and Julien Chaumond and Clement Delangue and Anthony Moi and Pierric Cistac and Tim Rault and R{\'e}mi Louf and Morgan Funtowicz and Jamie Brew},
  journal = {arXiv preprint arXiv:1910.03771},
  title = {{HuggingFace}'s Transformers: State-of-the-art Natural Language Processing},
  year = {2019},
}

@article{wang2019bert,
  author = {Alex Wang and Kyunghyun Cho},
  journal = {arXiv preprint arXiv:1902.04094},
  title = {{BERT} has a mouth, and it must speak: {BERT} as a {M}arkov random field language model},
  year = {2019},
}

@article{raffel2019exploring,
  author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J.
Liu},
  journal = {arXiv preprint arXiv:1910.10683},
  title = {Exploring the limits of transfer learning with a unified text-to-text transformer},
  year = {2019},
}

@article{gu2019insertion,
  author = {Jiatao Gu and Qi Liu and Kyunghyun Cho},
  journal = {arXiv preprint arXiv:1902.01370},
  title = {Insertion-based Decoding with automatically Inferred Generation Order},
  year = {2019},
}

@article{stern2019insertion,
  author = {Mitchell Stern and William Chan and Jamie Kiros and Jakob Uszkoreit},
  journal = {arXiv preprint arXiv:1902.03249},
  title = {Insertion Transformer: Flexible Sequence Generation via Insertion Operations},
  year = {2019},
}

@article{shih2019xl,
  author = {Yong-Siang Shih and Wei-Cheng Chang and Yiming Yang},
  journal = {arXiv preprint arXiv:1910.10479},
  title = {{XL}-{E}ditor: Post-editing Sentences with {XLNet}},
  year = {2019},
}

@inproceedings{ghazvininejad2019mask,
  author = {Marjan Ghazvininejad and Omer Levy and Yinhan Liu and Luke Zettlemoyer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Mask-{P}redict: Parallel decoding of conditional masked language models},
  year = {2019},
}

@article{mansimov2019generalized,
  author = {Elman Mansimov and Alex Wang and Kyunghyun Cho},
  journal = {arXiv preprint arXiv:1905.12790},
  title = {A Generalized Framework of Sequence Generation with Application to Undirected Sequence Models},
  year = {2019},
}

@article{gu2019levenshtein,
  author = {Jiatao Gu and Changhan Wang and Jake Zhao},
  journal = {arXiv preprint arXiv:1905.11006},
  title = {{Levenshtein} Transformer},
  year = {2019},
}

@article{joshi2019spanbert,
  author = {Mandar Joshi and Danqi Chen and Yinhan Liu and Daniel S.
Weld and Luke Zettlemoyer and Omer Levy},
  journal = {arXiv preprint arXiv:1907.10529},
  title = {Span{BERT}: Improving Pre-training by Representing and Predicting Spans},
  year = {2019},
}

@inproceedings{mccarthy2002ls,
  author = {Diana McCarthy},
  booktitle = {{SIGLEX}/{SENSEVAL} Workshop on Word Sense Disambiguation: Recent Successes and Future Directions},
  title = {Lexical Substitution as a Task for {WSD} Evaluation},
  year = {2002},
}

@inproceedings{mccarthy2007semeval,
  author = {Diana McCarthy and Roberto Navigli},
  booktitle = {Workshop on Semantic Evaluations},
  title = {Sem{E}val-2007 Task 10: {E}nglish Lexical Substitution Task},
  year = {2007},
}

@inproceedings{kremer2014coinco,
  author = {Gerhard Kremer and Katrin Erk and Sebastian Pad{\'o} and Stefan Thater},
  booktitle = {European Chapter of the Association for Computational Linguistics (EACL)},
  title = {What Substitutes Tell Us -- Analysis of an ``All-Words'' Lexical Substitution Corpus},
  year = {2014},
}

@inproceedings{zhou2019bbls,
  author = {Wangchunshu Zhou and Tao Ge and Ke Xu and Furu Wei and Ming Zhou},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {{BERT}-based Lexical Substitution},
  year = {2019},
}

@article{arefyev2020lssurvey,
  author = {Nikolay Arefyev and Boris Sheludko and Alexander Podolskiy and Alexander Panchenko},
  journal = {arXiv},
  title = {A Comparative Study of Lexical Substitution Approaches based on Neural Language Models},
  year = {2020},
}

@article{sharoff2006corpora,
  author = {S.
Sharoff},
  journal = {International Journal of Corpus Linguistics},
  pages = {435--462},
  title = {Open-source Corpora: Using the net to fish for linguistic data},
  volume = {11},
  year = {2006},
}

@inproceedings{ide2008masc,
  author = {Nancy Ide and Collin Baker and Christiane Fellbaum and Charles Fillmore and Rebecca Passonneau},
  booktitle = {Language Resources and Evaluation Conference (LREC)},
  title = {{MASC}: the Manually Annotated Sub-Corpus of {A}merican {E}nglish},
  year = {2008},
}

@inproceedings{ide2010masc,
  author = {Nancy Ide and Collin Baker and Christiane Fellbaum and Rebecca Passonneau},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {The Manually Annotated Sub-Corpus: A Community Resource for and by the People},
  year = {2010},
}

@techreport{kishida2005gap,
  author = {Kazuaki Kishida},
  institution = {National Institute of Informatics},
  title = {Property of Average Precision and its Generalization: An Examination of Evaluation Indicator for Information Retrieval Experiments},
  year = {2005},
}

@article{webber2010rbo,
  author = {William Webber and Alistair Moffat and Justin Zobel},
  journal = {ACM Transactions on Information Systems (TOIS)},
  title = {A Similarity Measure for Indefinite Rankings},
  year = {2010},
}

@book{murphy2010nearsynonym,
  author = {M.
Lynne Murphy},
  publisher = {Cambridge University Press},
  title = {Lexical Meaning},
  year = {2010},
}

@misc{ai2020wordtune,
  author = {AI21},
  howpublished = {\url{https://www.wordtune.com/}},
  title = {Wordtune (accessed 2020 {O}ct 30)},
  year = {2020},
}

@misc{speer2018wordfreq,
  author = {Robyn Speer and Joshua Chin and Andrew Lin and Sara Jewett and Lance Nathan},
  howpublished = {\url{https://doi.org/10.5281/zenodo.1443582}},
  title = {Luminoso{I}nsight/wordfreq: v2.2},
  year = {2018},
}

@inproceedings{thater2010contextualizing,
  author = {Thater, Stefan and F{\"u}rstenau, Hagen and Pinkal, Manfred},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Contextualizing semantic representations using syntactically enriched vector models},
  year = {2010},
}

@inproceedings{smith2011cloze,
  author = {Nathaniel Smith and Roger Levy},
  booktitle = {Proceedings of the Annual Meeting of the Cognitive Science Society},
  title = {Cloze but no cigar: The complex relationship between cloze, corpus, and subjective probabilities in language processing},
  year = {2011},
}

@inproceedings{eisape2020cloze,
  author = {Tiwalayo Eisape and Noga Zaslavsky and Roger Levy},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  title = {Cloze Distillation Improves Psychometric Predictive Power},
  year = {2020},
}

@article{navigli2009word,
  author = {Roberto Navigli},
  journal = {ACM Computing Surveys (CSUR)},
  title = {Word sense disambiguation: A survey},
  year = {2009},
}

@article{edmonds2002near,
  author = {Philip Edmonds and Graeme Hirst},
  journal = {Computational Linguistics},
  title = {Near-synonymy and lexical choice},
  year = {2002},
}

@article{kilgarriff1997wordsense,
  author = {A.
Kilgarriff},
  journal = {Computers and the Humanities},
  title = {{I} Don't Believe in Word Senses},
  year = {1997},
}

@inproceedings{pavlick2015ppdb,
  author = {Ellie Pavlick and Pushpendre Rastogi and Juri Ganitkevitch and Benjamin Van Durme and Chris Callison-Burch},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {{PPDB} 2.0: Better paraphrase ranking, fine-grained entailment relations, word embeddings, and style classification},
  year = {2015},
}

@inproceedings{wieting2018paranmt,
  author = {John Wieting and Kevin Gimpel},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {{P}ara{NMT}-50{M}: Pushing the Limits of Paraphrastic Sentence Embeddings with Millions of Machine Translations},
  year = {2018},
}

@article{pavlick2019inherent,
  author = {Ellie Pavlick and Tom Kwiatkowski},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Inherent Disagreements in Human Textual Inferences},
  volume = {7},
  year = {2019},
}

@inproceedings{nie2020learn,
  author = {Yixin Nie and Xiang Zhou and Mohit Bansal},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {What Can We Learn from Collective Human Opinions on Natural Language Inference Data?},
  year = {2020},
}

@inproceedings{dimarco1993nearsynonym,
  author = {Chrysanne DiMarco and Graeme Hirst and Manfred Stede},
  booktitle = {AAAI Spring Symposium on Building Lexicons for Machine Translation},
  title = {The semantic and stylistic differentiation of synonyms and near-synonyms},
  year = {1993},
}

@book{hayakawa1994ctrw,
  author = {Samuel Ichiye Hayakawa},
  publisher = {Collins Reference},
  title = {Choose the Right Word: A Contemporary Guide to Selecting the Precise Word for Every Situation},
  year = {1994},
}

@misc{brants2006ngram,
  author = {Thorsten Brants and Alex Franz},
  title = {Web 1{T} 5-gram version 1},
  year = {2006},
}

@inproceedings{melamud2015modeling,
  author = {Melamud, Oren and Dagan, Ido and Goldberger, Jacob},
booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Modeling word meaning in context with substitute vectors},
  year = {2015},
}

@inproceedings{szarvas2013learning,
  author = {Szarvas, Gy{\"o}rgy and Busa-Fekete, R{\'o}bert and H{\"u}llermeier, Eyke},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Learning to rank lexical substitutions},
  year = {2013},
}

@inproceedings{hintz2016language,
  author = {Hintz, Gerold and Biemann, Chris},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Language transfer learning for supervised lexical substitution},
  year = {2016},
}

@book{kipfer2013roget,
  author = {Barbara Ann Kipfer},
  publisher = {Random House Publishing Group},
  title = {Roget's 21st Century Thesaurus, Third Edition},
  year = {2013},
}

@phdthesis{miller2016thesis,
  author = {Tristan Miller},
  school = {Technische Universit{\"a}t Darmstadt},
  title = {Adjusting Sense Representations for Word Sense Disambiguation and Automatic Pun Interpretation},
  year = {2016},
}

@inproceedings{assael2019restoring,
  author = {Yannis Assael and Thea Sommerschield and Jonathan Prag},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Restoring ancient text using deep learning: a case study on {Greek} epigraphy},
  year = {2019},
}

@inproceedings{clark2018neural,
  author = {Clark, Elizabeth and Ji, Yangfeng and Smith, Noah A.},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Neural Text Generation in Stories Using Entity Representations as Context},
  year = {2018},
}

@inproceedings{buschek2021impact,
  author = {Buschek, Daniel and Z{\"u}rn, Martin and Eiband, Malin},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {The Impact of Multiple Parallel Phrase Suggestions on Email Input and Composition Behaviour of Native and Non-Native {E}nglish Writers},
  year = {2021},
}

@article{wang2021evaluation,
  author = {Lu Wang and Munif Ishad Mujib
and Jake Williams and George Demiris and Jina Huh-Yoo},
  journal = {arXiv preprint arXiv:2107.13115},
  title = {An Evaluation of Generative Pre-Training Model-based Therapy Chatbot for Caregivers},
  year = {2021},
}

@inproceedings{wu2022aichain,
  author = {Tongshuang Wu and Michael Terry and Carrie J. Cai},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {{AI} Chains: Transparent and Controllable Human-{AI} Interaction by Chaining Large Language Model Prompts},
  year = {2022},
}

@inproceedings{zhou2021medical,
  author = {Meng Zhou and Zechen Li and Bowen Tan and Guangtao Zeng and Wenmian Yang and Xuehai He and Zeqian Ju and Subrato Chakravorty and Shu Chen and Xingyi Yang and Yichen Zhang and Qingyang Wu and Zhou Yu and Kun Xu and Eric Xing and Pengtao Xie},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {On the Generation of Medical Dialogs for {COVID}-19},
  year = {2021},
}

@article{bly1999design,
  author = {Bly, Sara and Churchill, Elizabeth F},
  journal = {Interactions},
  number = {2},
  pages = {23--31},
  title = {Design through matchmaking: technology in search of users},
  volume = {6},
  year = {1999},
}

@inproceedings{yang2020reexamining,
  author = {Yang, Qian and Steinfeld, Aaron and Ros{\'e}, Carolyn and Zimmerman, John},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Re-Examining Whether, Why, and How Human-{AI} Interaction Is Uniquely Difficult to Design},
  year = {2020},
}

@inproceedings{yang2019sketch,
  author = {Yang, Qian and Cranshaw, Justin and Amershi, Saleema and Iqbal, Shamsi T.
and Teevan, Jaime},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Sketching {NLP}: A Case Study of Exploring the Right Things To Design with Language Intelligence},
  year = {2019},
}

@inproceedings{gehrmann2021gem,
  author = {Sebastian Gehrmann and Tosin Adewumi and Karmanya Aggarwal and Pawan Sasanka Ammanamanchi and Anuoluwapo Aremu and Antoine Bosselut and Khyathi Raghavi Chandu and Miruna-Adriana Clinciu and Dipanjan Das and Kaustubh Dhole and Wanyu Du and Esin Durmus and Ond{\v{r}}ej Du{\v{s}}ek and Chris Chinenye Emezue and Varun Gangal and Cristina Garbacea and Tatsunori Hashimoto and Yufang Hou and Yacine Jernite and Harsh Jhamtani and Yangfeng Ji and Shailza Jolly and Mihir Kale and Dhruv Kumar and Faisal Ladhak and Aman Madaan and Mounica Maddela and Khyati Mahajan and Saad Mahamood and Bodhisattwa Prasad Majumder and Pedro Henrique Martins and Angelina McMillan-Major and Simon Mille and Emiel van Miltenburg and Moin Nadeem and Shashi Narayan and Vitaly Nikolaev and Andre Niyongabo Rubungo and Salomey Osei and Ankur Parikh and Laura Perez-Beltrachini and Niranjan Ramesh Rao and Vikas Raunak and Juan Diego Rodriguez and Sashank Santhanam and Jo{\~a}o Sedoc and Thibault Sellam and Samira Shaikh and Anastasia Shimorina and Marco Antonio Sobrevilla Cabezudo and Hendrik Strobelt and Nishant Subramani and Wei Xu and Diyi Yang and Akhila Yerukola and Jiawei Zhou},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {The {GEM} Benchmark: Natural Language Generation, its Evaluation and Metrics},
  year = {2021},
}

@book{buxton2010sketching,
  author = {Buxton, Bill},
  publisher = {Morgan Kaufmann},
  title = {Sketching user experiences: getting the design right and the right design},
  year = {2010},
}

@inproceedings{gaver1991affordance,
  author = {William W.
Gaver},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Technology affordances},
  year = {1991},
}

@inproceedings{ozenc2010support,
  author = {Ozenc, Fatih Kursat and Kim, Miso and Zimmerman, John and Oney, Stephen and Myers, Brad},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {How to support designers in getting hold of the immaterial material of software},
  year = {2010},
}

@inproceedings{martelaro2020arduino,
  author = {Martelaro, Nikolas and Zamfirescu-Pereira, J. D. and Goedicke, David and Sirkin, David and Ju, Wendy},
  booktitle = {Extended Abstracts of Conference on Human Factors in Computing Systems (CHI EA)},
  title = {Make This! Introduction to Electronics Prototyping Using {Arduino}},
  year = {2020},
}

@inproceedings{fiebrink2010wekinator,
  author = {Fiebrink, Rebecca and Cook, Perry R},
  booktitle = {International Society for Music Information Retrieval (ISMIR)},
  title = {The {W}ekinator: a system for real-time, interactive machine learning in music},
  year = {2010},
}

@inproceedings{carney2020teachable,
  author = {Carney, Michelle and Webster, Barron and Alvarado, Irene and Phillips, Kyle and Howell, Noura and Griffith, Jordan and Jongejan, Jonas and Pitaru, Amit and Chen, Alexander},
  booktitle = {Extended Abstracts of Conference on Human Factors in Computing Systems (CHI EA)},
  title = {Teachable Machine: Approachable Web-Based Tool for Exploring Machine Learning Classification},
  year = {2020},
}

@inproceedings{holstein2020replayenactments,
  author = {Holstein, Kenneth and Harpstead, Erik and Gulotta, Rebecca and Forlizzi, Jodi},
  booktitle = {ACM Designing Interactive Systems Conference (DIS)},
  title = {Replay Enactments: Exploring Possible Futures through Historical Data},
  year = {2020},
}

@book{schon1984reflective,
  author = {Sch{\"o}n, Donald A},
  publisher = {Basic Books},
  title = {The reflective practitioner: How professionals think in action},
  year = {1984},
}

% TOCHI is a journal, so this is an article entry with a journal field
% rather than a proceedings paper with a booktitle.
@article{lim2008anatomy,
  author = {Lim, Youn-Kyung and Stolterman, Erik and Tenenberg, Josh},
  journal = {ACM Transactions on Computer-Human Interaction (TOCHI)},
  number = {2},
  title = {The anatomy of prototypes: Prototypes as filters, prototypes as manifestations of design ideas},
  volume = {15},
  year = {2008},
}

@article{fan2020englishcentric,
  author = {Angela Fan and Shruti Bhosale and Holger Schwenk and Zhiyi Ma and Ahmed El-Kishky and Siddharth Goyal and Mandeep Baines and Onur Celebi and Guillaume Wenzek and Vishrav Chaudhary and Naman Goyal and Tom Birch and Vitaliy Liptchinsky and Sergey Edunov and Edouard Grave and Michael Auli and Armand Joulin},
  journal = {arXiv preprint arXiv:2010.11125},
  title = {Beyond {E}nglish-Centric Multilingual Machine Translation},
  year = {2020},
}

@misc{lieber2021jurassic,
  author = {Opher Lieber and Or Sharir and Barak Lenz and Yoav Shoham},
  howpublished = {\url{https://uploads-ssl.webflow.com/60fd4503684b466578c0d307/61138924626a6981ee09caf6_jurassic_tech_paper.pdf}},
  title = {Jurassic-1: Technical Details and Evaluation},
  year = {2021},
}

@inproceedings{calderwood2020novelists,
  author = {Calderwood, Alex and Qiu, Vivian and Gero, Katy Ilonka and Chilton, Lydia B},
  booktitle = {Proceedings of the Workshops on Human-AI Co-Creation with Generative Models and User-Aware Conversational Agents},
  title = {How Novelists Use Generative Language Models: An Exploratory User Study},
  year = {2020},
}

@inproceedings{wu2020importance,
  author = {Wu, Qingyang and Li, Lei and Zhou, Hao and Zeng, Ying and Yu, Zhou},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Importance-aware learning for neural headline editing},
  year = {2020},
}

@misc{openai2023playground,
  author = {OpenAI},
  howpublished = {\url{https://platform.openai.com/playground}},
  title = {{O}pen{AI} playground},
  year = {2023},
}

@inproceedings{roemmele2018writing,
  author = {Roemmele, Melissa and Gordon, Andrew S.},
  booktitle = {Intelligent User Interfaces (IUI)},
  title = {Automated Assistance for
Creative Writing with an {RNN} Language Model},
  year = {2018},
}

@article{cuadra2021look,
  author = {Cuadra, Andrea and Lee, Hansol and Cho, Jason and Ju, Wendy},
  journal = {arXiv preprint arXiv:2104.07153},
  title = {Look at Me When {I} Talk to You: A Video Dataset to Enable Voice Assistants to Recognize Errors},
  year = {2021},
}

@inproceedings{semmens2019vehicle,
  author = {Semmens, Rob and Martelaro, Nikolas and Kaveti, Pushyami and Stent, Simon and Ju, Wendy},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Is Now A Good Time? An Empirical Study of Vehicle-Driver Communication Timing},
  year = {2019},
}

@inproceedings{theodorou2021disability,
  author = {Theodorou, Lida and Massiceti, Daniela and Zintgraf, Luisa and Stumpf, Simone and Morrison, Cecily and Cutrell, Edward and Harris, Matthew Tobias and Hofmann, Katja},
  booktitle = {ACM SIGACCESS Conference on Computers and Accessibility (ASSETS)},
  title = {Disability-First Dataset Creation: Lessons from Constructing a Dataset for Teachable Object Recognition with Blind and Low Vision Data Collectors},
  year = {2021},
}

@inproceedings{yang2018ux,
  author = {Yang, Qian and Scuito, Alex and Zimmerman, John and Forlizzi, Jodi and Steinfeld, Aaron},
  booktitle = {ACM Designing Interactive Systems Conference (DIS)},
  title = {Investigating How Experienced {UX} Designers Effectively Work with Machine Learning},
  year = {2018},
}

% Institutional author: the extra pair of braces keeps the name from being
% split into first/last name parts.
@misc{purdue2021owl,
  author = {{Purdue Online Writing Lab}},
  howpublished = {\url{https://owl.purdue.edu/owl/general_writing/academic_writing/essay_writing/argumentative_essays.html}},
  title = {Argumentative Essays},
  year = {2021},
}

@misc{reddit2021writingprompts,
  author = {Reddit},
  howpublished = {\url{https://www.reddit.com/r/WritingPrompts}},
  title = {WritingPrompts},
  year = {2021},
}

% Institutional author: the extra pair of braces keeps the name from being
% split into first/last name parts.
@misc{nyt2021argument,
  author = {{The New York Times}},
  howpublished = {\url{https://www.nytimes.com/2021/02/01/learning/300-questions-and-images-to-inspire-argument-writing.html}},
  title = {300
Questions and Images to Inspire Argument Writing},
  year = {2021},
}

@article{storch2002patterns,
  author = {Storch, Neomy},
  journal = {Language Learning},
  number = {1},
  pages = {119--158},
  title = {Patterns of interaction in {ESL} pair work},
  volume = {52},
  year = {2002},
}

@article{ippolito2022wordcraft,
  author = {Daphne Ippolito and Ann Yuan and Andy Coenen and Sehmon Burnam},
  journal = {arXiv preprint arXiv:2211.05030},
  title = {Creative Writing with an {AI}-Powered Writing Assistant: Perspectives from Professional Writers},
  year = {2022},
}

@article{wei2022cot,
  author = {Jason Wei and Xuezhi Wang and Dale Schuurmans and Maarten Bosma and Brian Ichter and Fei Xia and Ed Chi and Quoc Le and Denny Zhou},
  journal = {arXiv preprint arXiv:2201.11903},
  title = {Chain-of-Thought Prompting Elicits Reasoning in Large Language Models},
  year = {2022},
}

@inproceedings{lu2022prompt,
  author = {Yao Lu and Max Bartolo and Alastair Moore and Sebastian Riedel and Pontus Stenetorp},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Fantastically Ordered Prompts and Where to Find Them: Overcoming Few-Shot Prompt Order Sensitivity},
  year = {2022},
}

@inproceedings{shen2020blank,
  author = {Shen, Tianxiao and Quach, Victor and Barzilay, Regina and Jaakkola, Tommi},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Blank Language Models},
  year = {2020},
}

@article{jansen2009patterns,
  author = {Jansen, Bernard J and Booth, Danielle L and Spink, Amanda},
  journal = {Journal of the American Society for Information Science and Technology},
  number = {7},
  pages = {1358--1371},
  title = {Patterns of query reformulation during web searching},
  volume = {60},
  year = {2009},
}

@inproceedings{jiang2013users,
  author = {Jiang, Jiepu and Jeng, Wei and He, Daqing},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {How do users respond to voice input errors?
Lexical and phonetic query reformulation in voice search}, year = {2013}, }

@article{dibia2022aligning,
  author = {Dibia, Victor and Fourney, Adam and Bansal, Gagan and Poursabzi-Sangdeh, Forough and Liu, Han and Amershi, Saleema},
  journal = {arXiv preprint arXiv:2210.16494},
  title = {Aligning Offline Metrics and Human Judgments of Value of {AI}-Pair Programmers},
  year = {2022},
}

@book{mani1999advances,
  author = {Mani, Inderjeet},
  publisher = {MIT Press},
  title = {Advances in Automatic Text Summarization},
  year = {1999},
}

% The accent is written as a braced group so it counts as a single letter for sorting and labels.
@article{sparck1999automatic,
  author = {Sp{\"a}rck Jones, Karen},
  journal = {Advances in automatic text summarization},
  pages = {1--12},
  title = {Automatic summarizing: factors and directions},
  year = {1999},
}

@book{nenkova2012survey,
  author = {Nenkova, Ani and McKeown, Kathleen},
  pages = {43--76},
  publisher = {Springer},
  title = {A survey of text summarization techniques},
  year = {2012},
}

@article{avinesh2018sherlock,
  author = {Avinesh, P. V. S. and Binnig, Carsten and H{\"a}ttasch, Benjamin and Meyer, Christian M and {\"O}zyurt, Orkan},
  journal = {Proceedings of the VLDB Endowment},
  pages = {1902--1905},
  title = {Sherlock: A System for Interactive Summarization of Large Text Collections},
  volume = {11},
  year = {2018},
}

@inproceedings{shapira2021extending,
  author = {Ori Shapira and Ramakanth Pasunuru and Hadar Ronen and Mohit Bansal and Yael Amsterdamer and Ido Dagan},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Extending Multi-Document Summarization Evaluation to the Interactive Setting},
  year = {2021},
}

@inproceedings{shapira2022interactive,
  author = {Ori Shapira and Ramakanth Pasunuru and Mohit Bansal and Ido Dagan and Yael Amsterdamer},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Interactive Query-Assisted Summarization via Deep Reinforcement Learning},
  year = {2022},
}

@inproceedings{grusky2018newsroom,
  author = {Max Grusky and Mor Naaman and Yoav Artzi},
booktitle = {North American Association for Computational Linguistics (NAACL)}, title = {{N}ewsroom: A Dataset of 1.3 Million Summaries with Diverse Extractive Strategies}, year = {2018}, }

@inproceedings{chakrabarty2022copoet,
  author = {Chakrabarty, Tuhin and Padmakumar, Vishakh and He, He},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Help me write a poem: Instruction Tuning as a Vehicle for Collaborative Poetry Writing},
  year = {2022},
}

@book{lakoff1980metaphors,
  author = {Lakoff, George and Johnson, Mark},
  publisher = {University of Chicago Press},
  title = {Metaphors we live by},
  year = {1980},
}

@book{jones1995evaluating,
  author = {Sp{\"a}rck Jones, Karen and Galliers, Julia R.},
  publisher = {Springer Verlag},
  title = {Evaluating Natural Language Processing Systems: An Analysis and Review},
  year = {1995},
}

@article{liberman2010obituary,
  author = {Liberman, Mark},
  journal = {Computational Linguistics},
  title = {Obituary: {Fred Jelinek}},
  volume = {36},
  year = {2010},
}

% Author spellings follow the ones used for the same people in bowman2022measuring.
@article{ganguli2022red,
  author = {Deep Ganguli and Liane Lovitt and Jackson Kernion and Amanda Askell and Yuntao Bai and Saurav Kadavath and Benjamin Mann and Ethan Perez and Nicholas Schiefer and Kamal Ndousse and Andy Jones and Sam Bowman and Anna Chen and Tom Conerly and Nova DasSarma and Dawn Drain and Nelson Elhage and Sheer El-Showk and Stanislav Fort and Zac Hatfield-Dodds and T. J. Henighan and Danny Hernandez and Tristan Hume and Josh Jacobson and Scott Johnston and Shauna Kravec and Catherine Olsson and Sam Ringer and Eli Tran-Johnson and Dario Amodei and Tom B.
Brown and Nicholas Joseph and Sam McCandlish and Christopher Olah and Jared Kaplan and Jack Clark}, journal = {arXiv preprint arXiv:2209.07858}, title = {Red Teaming Language Models to Reduce Harms: Methods, Scaling Behaviors, and Lessons Learned}, year = {2022}, }

@inproceedings{kirk2022handling,
  author = {Hannah Rose Kirk and Abeba Birhane and Bertie Vidgen and Leon Derczynski},
  booktitle = {Findings of Empirical Methods in Natural Language Processing (Findings of EMNLP)},
  title = {Handling and Presenting Harmful Text in {NLP} Research},
  year = {2022},
}

@inproceedings{jakesch2023cowriting,
  author = {Jakesch, Maurice and Bhat, Advait and Buschek, Daniel and Zalmanson, Lior and Naaman, Mor},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Co-Writing with Opinionated Language Models Affects Users' Views},
  year = {2023},
}

@article{wenker2022wrote,
  author = {Wenker, Kilian},
  journal = {arXiv preprint arXiv:2210.06470},
  title = {Who Wrote this? How Smart Replies Impact Language and Agency in the Workplace},
  year = {2022},
}

@article{allam2014impact,
  author = {Allam, Ahmed and Schulz, Peter Johannes and Nakamoto, Kent and others},
  journal = {Journal of Medical Internet Research},
  number = {4},
  title = {The impact of search engine selection and sorting criteria on vaccination beliefs and attitudes: two experiments manipulating {Google} output},
  volume = {16},
  year = {2014},
}

@misc{wmt2006wmt,
  author = {WMT},
  title = {Proceedings on the Workshop on Statistical Machine Translation},
  year = {2006},
}

@article{gunasekara2020overview,
  author = {Chulaka Gunasekara and Seokhwan Kim and Luis Fernando D'Haro and Abhinav Rastogi and Yun-Nung Chen and Mihail Eric and Behnam Hedayatnia and Karthik Gopalakrishnan and Yang Liu and Chao-Wei Huang and Dilek Hakkani-T{\"u}r and Jinchao Li and Qi Zhu and Lingxiao Luo and Lars Liden and Kaili Huang and Shahin Shayandeh and Runze Liang and Baolin Peng and Zheng Zhang and Swadheen Shukla and Minlie Huang and
Jianfeng Gao and Shikib Mehri and Yulan Feng and Carla Gordon and Seyed Hossein Alavi and David Traum and Maxine Eskenazi and Ahmad Beirami and Eunjoon Cho and Paul A. Crook and Ankita De and Alborz Geramifard and Satwik Kottur and Seungwhan Moon and Shivani Poddar and Rajen Subba}, journal = {arXiv preprint arXiv:2011.06486}, title = {Overview of the Ninth Dialog System Technology Challenge: {DSTC9}}, year = {2020}, }

@misc{dilek2021alexa,
  author = {Dilek Hakkani-T{\"u}r},
  howpublished = {\url{https://www.amazon.science/alexa-prize/proceedings/alexa-prize-socialbot-grand-challenge-year-iv}},
  title = {Alexa Prize Socialbot Grand Challenge Year {IV}},
  year = {2021},
}

@misc{gottardi2022alexa,
  author = {Anna Gottardi and Osman Ipek and Giuseppe Castellucci and Shui Hu and Lavina Vaz and Yao Lu and Anju Khatri and Anjali Chadha and Desheng Zhang and Sattvik Sahai and Prerna Dwivedi and Hangjie Shi and Lucy Hu and Andy Huang and Luke Dai and Bofei Yang and Varun Somani and Pankaj Rajan and Ron Rezac and Michael Johnston and Savanna Stiff and Leslie Ball and David Carmel and Yang Liu and Dilek Hakkani-T{\"u}r and Oleg Rokhlenko and Kate Bland and Eugene Agichtein and Reza Ghanadan and Yoelle Maarek},
  howpublished = {\url{https://www.amazon.science/publications/alexa-lets-work-together-introducing-the-first-alexa-prize-taskbot-challenge-on-conversational-task-assistance}},
  title = {Alexa, let's work together: Introducing the first Alexa Prize TaskBot Challenge on conversational task assistance},
  year = {2022},
}

@article{gehrmann2022gemv2,
  author = {Sebastian Gehrmann and Abhik Bhattacharjee and Abinaya Mahendiran and Alex Wang and Alexandros Papangelis and Aman Madaan and Angelina McMillan-Major and Anna V.
Shvets and Ashish Upadhyay and Bingsheng Yao and Bryan Wilie and Chandra Bhagavatula and Chaobin You and Craig Thomson and Cristina Garbacea and Dakuo Wang and Daniel Deutsch and Deyi Xiong and Di Jin and Dimitra Gkatzia and Dragomir Radev and Elizabeth Clark and Esin Durmus and Faisal Ladhak and Filip Ginter and Genta Indra Winata and Hendrik Strobelt and Hiroaki Hayashi and Jekaterina Novikova and Jenna Kanerva and Jenny Chim and Jiawei Zhou and Jordan Clive and Joshua Maynez and Jo{\~a}o Sedoc and Juraj Juraska and Kaustubh D. Dhole and Khyathi Raghavi Chandu and Leonardo F. R. Ribeiro and Lewis Tunstall and Li Zhang and Mahima Pushkarna and Mathias Creutz and Michael White and Mihir Kale and Moussa Kamal Eddine and Nico Daheim and Nishant Subramani and Ondrej Dusek and Paul Pu Liang and Pawan Sasanka Ammanamanchi and Qinqin Zhu and Ratish Puduppully and Reno Kriz and Rifat Shahriyar and Ronald Cardenas and Saad Mahamood and Salomey Osei and Samuel Cahyawijaya and Sanja {\v{S}}tajner and S{\'e}bastien Montella and Shailza and Shailza Jolly and Simon Mille and Tahmid Hasan and Tianhao Shen and Tosin P. Adewumi and Vikas Raunak and Vipul Raheja and Vitaly Nikolaev and Vivian Tsai and Yacine Jernite and Yi Xu and Yisi Sang and Yixin Liu and Yufang Hou}, journal = {arXiv preprint arXiv:2206.11249}, title = {{GEM}v2: Multilingual {NLG} Benchmarking in a Single Line of Code}, year = {2022}, }

@article{hoeve2021towards,
  author = {Maartje ter Hoeve and Evgeny Kharitonov and Dieuwke Hupkes and Emmanuel Dupoux},
  journal = {arXiv preprint arXiv:2112.11911},
  title = {Towards Interactive Language Modeling},
  year = {2021},
}

@inproceedings{hadfieldmenell2016cooperative,
  author = {Hadfield-Menell, Dylan and Russell, Stuart J and Abbeel, Pieter and Dragan, Anca},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Cooperative Inverse Reinforcement Learning},
  year = {2016},
}

@article{salton1970evaluation,
  author = {G.
Salton}, journal = {Information Storage and Retrieval}, number = {1}, pages = {29--44}, title = {Evaluation problems in interactive information retrieval}, volume = {6}, year = {1970}, }

% ASK is an acronym in this title, so it is brace-protected against style recasing.
@article{belkin1982ask,
  author = {Nicholas J. Belkin and Robert N. Oddy and Helen M. Brooks},
  journal = {Journal of Documentation},
  pages = {61--71},
  title = {{ASK} for Information Retrieval: Part {I}. Background and Theory},
  volume = {38},
  year = {1982},
}

@article{kuhlthau1991inside,
  author = {Kuhlthau, Carol C.},
  journal = {Journal of the American Society for Information Science},
  number = {5},
  pages = {361--371},
  title = {Inside the search process: Information seeking from the user's perspective},
  volume = {42},
  year = {1991},
}

@book{ingwersen1992information,
  author = {Ingwersen, Peter},
  publisher = {Taylor Graham},
  title = {Information retrieval interaction},
  year = {1992},
}

@article{marchionini2006exploratory,
  author = {Marchionini, Gary},
  journal = {Communications of the ACM},
  pages = {41--46},
  title = {Exploratory Search: From Finding to Understanding},
  volume = {49},
  year = {2006},
}

@incollection{micarelli2007personalized,
  author = {Alessandro Micarelli and Fabio Gasparetti and Filippo Sciarrone and Susan Gauch},
  booktitle = {The adaptive web},
  pages = {195--230},
  title = {Personalized search on the world wide web},
  year = {2007},
}

@inproceedings{croft2019importance,
  author = {Croft, W. Bruce},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {The Importance of Interaction for Information Retrieval},
  year = {2019},
}

@incollection{kamm1994user,
  author = {Kamm, Candace},
  booktitle = {Voice Communication between Humans and Machines},
  pages = {422--442},
  title = {User Interfaces for Voice Applications},
  year = {1994},
}

@book{cohen2004voice,
  author = {Cohen, Michael and Giangola, James P.
and Balogh, Jennifer}, publisher = {Addison-Wesley}, title = {Voice User Interface Design}, year = {2004}, }

@book{harris2004voice,
  author = {Harris, R. A.},
  publisher = {Elsevier Science},
  title = {Voice Interaction Design: Crafting the New Conversational Speech Systems},
  year = {2004},
}

% Only the proper nouns in the title are brace-protected, so a style may still apply its own casing.
@article{virtanen2020scipy,
  author = {Virtanen, Pauli and Gommers, Ralf and Oliphant, Travis E. and Haberland, Matt and Reddy, Tyler and Cournapeau, David and Burovski, Evgeni and Peterson, Pearu and Weckesser, Warren and Bright, Jonathan and {van der Walt}, St{\'e}fan J. and Brett, Matthew and Wilson, Joshua and Millman, K. Jarrod and Mayorov, Nikolay and Nelson, Andrew R. J. and Jones, Eric and Kern, Robert and Larson, Eric and Carey, C J and Polat, {\.I}lhan and Feng, Yu and Moore, Eric W. and {VanderPlas}, Jake and Laxalde, Denis and Perktold, Josef and Cimrman, Robert and Henriksen, Ian and Quintero, E. A. and Harris, Charles R. and Archibald, Anne M. and Ribeiro, Ant{\^o}nio H. and Pedregosa, Fabian and {van Mulbregt}, Paul and {SciPy 1.0 Contributors}},
  journal = {Nature Methods},
  pages = {261--272},
  title = {{SciPy} 1.0: Fundamental Algorithms for Scientific Computing in {Python}},
  volume = {17},
  year = {2020},
}

@misc{rcoreteam2020r,
  author = {{R Core Team}},
  howpublished = {\url{https://www.R-project.org}},
  title = {{R}: A Language and Environment for Statistical Computing},
  year = {2020},
}

@article{bland1995multiple,
  author = {Bland, J Martin and Altman, Douglas G},
  journal = {BMJ},
  number = {6973},
  title = {Multiple significance tests: the {B}onferroni method},
  volume = {310},
  year = {1995},
}

@misc{nyt2022chatgpt,
  author = {{New York Times}},
  howpublished = {\url{https://www.nytimes.com/2022/12/05/technology/chatgpt-ai-twitter.html}},
  title = {The Brilliance and Weirdness of {ChatGPT}},
  year = {2022},
}

@article{shneiderman1997direct,
  author = {Ben Shneiderman and Pattie Maes},
  journal = {ACM Interactions},
  title = {Direct manipulation vs.
interface agents}, year = {1997}, }

@book{shneiderman2022human,
  author = {Ben Shneiderman},
  publisher = {{OUP} {O}xford},
  title = {Human-Centered {AI}},
  year = {2022},
}

@article{paranjape2020neural,
  author = {Paranjape, Ashwin and See, Abigail and Kenealy, Kathleen and Li, Haojun and Hardy, Amelia and Qi, Peng and Sadagopan, Kaushik Ram and Phu, Nguyet Minh and Soylu, Dilara and Manning, Christopher D},
  journal = {arXiv preprint arXiv:2008.12348},
  title = {Neural generation meets real people: Towards emotionally engaging mixed-initiative conversations},
  year = {2020},
}

@article{shuster2022blenderbot,
  author = {Shuster, Kurt and Xu, Jing and Komeili, Mojtaba and Ju, Da and Smith, Eric Michael and Roller, Stephen and Ung, Megan and Chen, Moya and Arora, Kushal and Lane, Joshua and Behrooz, Morteza and Ngan, William and Poff, Spencer and Goyal, Naman and Szlam, Arthur and Boureau, Y-Lan and Kambadur, Melanie and Weston, Jason},
  journal = {arXiv preprint arXiv:2208.03188},
  title = {{BlenderBot} 3: a deployed conversational agent that continually learns to responsibly engage},
  year = {2022},
}

@article{openai2023gpt4,
  author = {{OpenAI}},
  journal = {arXiv preprint arXiv:2303.08774},
  title = {{GPT}-4 Technical Report},
  year = {2023},
}

@inproceedings{zhou2021paraphrase,
  author = {Jianing Zhou and Suma Bhat},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Paraphrase Generation: A Survey of the State of the Art},
  year = {2021},
}

@inproceedings{yang2018style,
  author = {Zichao Yang and Zhiting Hu and Chris Dyer and Eric P.
Xing and Taylor Berg-Kirkpatrick}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Unsupervised Text Style Transfer using Language Models as Discriminators}, year = {2018}, }

@article{reif2021style,
  author = {Emily Reif and Daphne Ippolito and Ann Yuan and Andy Coenen and Chris Callison-Burch and Jason Wei},
  journal = {arXiv preprint arXiv:2109.03910},
  title = {A Recipe For Arbitrary Text Style Transfer with Large Language Models},
  year = {2021},
}

@article{suzgun2022prompt,
  author = {Mirac Suzgun and Luke Melas-Kyriazi and Dan Jurafsky},
  journal = {arXiv preprint arXiv:2205.11503},
  title = {{Prompt-and-Rerank}: A Method for Zero-Shot and Few-Shot Arbitrary Textual Style Transfer with Small Language Models},
  year = {2022},
}

% Initials are space-separated so each one is parsed as its own name token.
@article{wang2023codet5,
  author = {Yue Wang and Hung Le and Akhilesh Deepak Gotmare and Nghi D. Q. Bui and Junnan Li and Steven C. H. Hoi},
  journal = {arXiv preprint arXiv:2305.07922},
  title = {{CodeT5+}: Open Code Large Language Models for Code Understanding and Generation},
  year = {2023},
}

@misc{openai2022chatgpt,
  author = {{OpenAI}},
  howpublished = {\url{https://openai.com/blog/chatgpt}},
  title = {Introducing {ChatGPT}},
  year = {2022},
}

@inproceedings{birnholtz2013write,
  author = {Birnholtz, Jeremy and Steinhardt, Stephanie and Pavese, Antonella},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Write Here, Write Now!
An Experimental Study of Group Maintenance in Collaborative Writing}, year = {2013}, }

@article{maclean1991design,
  author = {Allan MacLean and Richard M Young and Victoria M E Bellotti and Thomas P Moran},
  journal = {Human-{C}omputer {I}nteraction},
  pages = {201--250},
  title = {Questions, Options, and Criteria: Elements of Design Space Analysis},
  volume = {6},
  year = {1991},
}

@inproceedings{mieczkowski2023thesis,
  author = {Hannah Mieczkowski and Jeffrey Hancock},
  booktitle = {Computer-Supported Cooperative Work And Social Computing (CSCW)},
  title = {Examining Agency, Expertise, and Roles of {AI} Systems in {AI}-Mediated Communication},
  year = {2023},
}

@article{birhane2021value,
  author = {Birhane, Abeba and Kalluri, Pratyusha and Card, Dallas and Agnew, William and Dotan, Ravit and Bao, Michelle},
  journal = {arXiv preprint arXiv:2106.15590},
  title = {The Values Encoded in Machine Learning Research},
  year = {2021},
}

@inproceedings{dang2023choice,
  author = {Dang, Hai and Goller, Sven and Lehmann, Florian and Buschek, Daniel},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Choice Over Control: How Users Write with Large Language Models using Diegetic and Non-Diegetic Prompting},
  year = {2023},
}

@article{liang2023gptdetector,
  author = {Weixin Liang and Mert Yuksekgonul and Yining Mao and Eric Wu and James Zou},
  journal = {arXiv preprint arXiv:2304.02819},
  title = {{GPT} detectors are biased against non-native {E}nglish writers},
  year = {2023},
}

% The quoted phrase in the title is closed before the colon.
@inproceedings{valencia2023aac,
  author = {Valencia, Stephanie and Cave, Richard and Kallarackal, Krystal and Seaver, Katie and Terry, Michael and Kane, Shaun K.},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {``The less {I} type, the better'': How {AI} Language Models can Enhance or Impede Communication for {AAC} Users},
  year = {2023},
}

@inproceedings{liu2022console,
  author = {Liu, Yihe and Mittal, Anushk and Yang, Diyi and Bruckman, Amy},
  booktitle =
{Conference on Human Factors in Computing Systems (CHI)}, title = {Will {AI} Console Me when {I} Lose my Pet? Understanding Perceptions of {AI}-Mediated Email Writing}, year = {2022}, }

@article{moslem2023mt,
  author = {Yasmin Moslem and Rejwanul Haque and John D. Kelleher and Andy Way},
  journal = {arXiv preprint arXiv:2301.13294},
  title = {Adaptive Machine Translation with Large Language Models},
  year = {2023},
}

@inproceedings{goodman2022lampost,
  author = {Goodman, Steven M. and Buehler, Erin and Clary, Patrick and Coenen, Andy and Donsbach, Aaron and Horne, Tiffanie N. and Lahav, Michal and MacDonald, Robert and Michaels, Rain Breaw and Narayanan, Ajit and Pushkarna, Mahima and Riley, Joel and Santana, Alex and Shi, Lei and Sweeney, Rachel and Weaver, Phil and Yuan, Ann and Morris, Meredith Ringel},
  booktitle = {ACM SIGACCESS Conference on Computers and Accessibility (ASSETS)},
  title = {{LaMPost}: Design and Evaluation of an {AI}-assisted Email Writing Prototype for Adults with Dyslexia},
  year = {2022},
}

@article{hohenstein2021communication,
  author = {Jess Hohenstein and Dominic DiFranzo and Rene F. Kizilcec and Zhila Aghajari and Hannah Mieczkowski and Karen Levy and Mor Naaman and Jeff Hancock and Malte Jung},
  journal = {arXiv preprint arXiv:2102.05756},
  title = {Artificial intelligence in communication impacts language and social relationships},
  year = {2021},
}

@article{fabbri2021summeval,
  author = {Fabbri, Alexander R.
and Kry{\'s}ci{\'n}ski, Wojciech and McCann, Bryan and Xiong, Caiming and Socher, Richard and Radev, Dragomir}, journal = {Transactions of the Association for Computational Linguistics (TACL)}, title = {{SummEval}: Re-evaluating Summarization Evaluation}, volume = {9}, year = {2021}, }

% Workshop proceedings paper: the venue is a booktitle rather than a journal.
@inproceedings{jelinek1980interpolated,
  author = {Jelinek, Frederick},
  booktitle = {Proceedings of the Workshop on Pattern Recognition in Practice},
  pages = {381--397},
  title = {Interpolated estimation of {M}arkov source parameters from sparse data},
  year = {1980},
}

@inproceedings{katz1987estimation,
  author = {Katz, Slava},
  booktitle = {International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  title = {Estimation of probabilities from sparse data for the language model component of a speech recognizer},
  year = {1987},
}

@inproceedings{fernandez2007rnn,
  author = {Fern{\'a}ndez, Santiago and Graves, Alex and Schmidhuber, J{\"u}rgen},
  booktitle = {International Conference on Artificial Neural Networks (ICANN)},
  title = {An Application of Recurrent Neural Networks to Discriminative Keyword Spotting},
  year = {2007},
}

@article{goldbert2015primer,
  author = {Yoav Goldberg},
  journal = {arXiv preprint arXiv:1510.00726},
  title = {A Primer on Neural Network Models for Natural Language Processing},
  year = {2015},
}

@article{bavarian2022fill,
  author = {Mohammad Bavarian and Heewoo Jun and Nikolas Tezak and John Schulman and Christine McLeavey and Jerry Tworek and Mark Chen},
  journal = {arXiv preprint arXiv:2207.14255},
  title = {Efficient Training of Language Models to Fill in the Middle},
  year = {2022},
}

@inproceedings{belz2023missing,
  author = {Belz, Anya and Thomson, Craig and Reiter, Ehud},
  booktitle = {ACL Workshop on Insights from Negative Results in {NLP}},
  title = {Missing Information, Unresponsive Authors, Experimental Flaws: The Impossibility of Assessing the Reproducibility of Previous Human Evaluations in {NLP}},
  year = {2023},
}

@article{veselovsky2023aaai,
  author = {Veniamin
Veselovsky and Manoel Horta Ribeiro and Robert West}, journal = {arXiv preprint arXiv:2306.07899}, title = {Artificial Artificial Artificial Intelligence: Crowd Workers Widely Use Large Language Models for Text Production Tasks}, year = {2023}, }

@article{xu2020recipes,
  author = {Xu, Jing and Ju, Da and Li, Margaret and Boureau, Y-Lan and Weston, Jason and Dinan, Emily},
  journal = {arXiv preprint arXiv:2010.07079},
  title = {Recipes for safety in open-domain chatbots},
  year = {2020},
}

@inproceedings{ji2022achieving,
  author = {Ji, Tianbo and Graham, Yvette and Jones, Gareth and Lyu, Chenyang and Liu, Qun},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Achieving Reliable Human Assessment of Open-Domain Dialogue Systems},
  year = {2022},
}

% Accented letters use LaTeX escapes, like the other accented names in this file.
@article{bowman2022measuring,
  author = {Samuel R. Bowman and Jeeyoon Hyun and Ethan Perez and Edwin Chen and Craig Pettit and Scott Heiner and Kamil{\.e} Luko{\v{s}}i{\=u}t{\.e} and Amanda Askell and Andy Jones and Anna Chen and Anna Goldie and Azalia Mirhoseini and Cameron McKinnon and Christopher Olah and Daniela Amodei and Dario Amodei and Dawn Drain and Dustin Li and Eli Tran-Johnson and Jackson Kernion and Jamie Kerr and Jared Mueller and Jeffrey Ladish and Joshua Landau and Kamal Ndousse and Liane Lovitt and Nelson Elhage and Nicholas Schiefer and Nicholas Joseph and Noem{\'\i} Mercado and Nova DasSarma and Robin Larson and Sam McCandlish and Sandipan Kundu and Scott Johnston and Shauna Kravec and Sheer El Showk and Stanislav Fort and Timothy Telleen-Lawton and Tom Brown and Tom Henighan and Tristan Hume and Yuntao Bai and Zac Hatfield-Dodds and Ben Mann and Jared Kaplan},
  journal = {arXiv preprint arXiv:2211.03540},
  title = {Measuring Progress on Scalable Oversight for Large Language Models},
  year = {2022},
}

@inproceedings{peyrard2019simple,
  author = {Peyrard, Maxime},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {A Simple Theoretical Model of Importance for Summarization},
  year = {2019},
}
@inproceedings{cao2018faithful,
  author = {Cao, Ziqiang and Wei, Furu and Li, Wenjie and Li, Sujian},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Faithful to the Original: Fact-Aware Neural Abstractive Summarization},
  year = {2018},
}

@inproceedings{durmus2020feqa,
  author = {Durmus, Esin and He, He and Diab, Mona},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {{FEQA}: A Question Answering Evaluation Framework for Faithfulness Assessment in Abstractive Summarization},
  year = {2020},
}

@inproceedings{nan2021entity,
  author = {Nan, Feng and Nallapati, Ramesh and Wang, Zhiguo and dos Santos, Cicero and Zhu, Henghui and Zhang, Dejiao and McKeown, Kathleen and Xiang, Bing},
  booktitle = {European Association for Computational Linguistics (EACL)},
  title = {Entity-level Factual Consistency of Abstractive Text Summarization},
  year = {2021},
}

@inproceedings{kang2020improved,
  author = {Kang, Daniel and Hashimoto, Tatsunori B},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Improved Natural Language Generation via Loss Truncation},
  year = {2020},
}

@inproceedings{goyal2021annotating,
  author = {Goyal, Tanya and Durrett, Greg},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Annotating and Modeling Fine-grained Factuality in Summarization},
  year = {2021},
}

@inproceedings{nan2021improving,
  author = {Nan, Feng and dos Santos, Cicero and Zhu, Henghui and Ng, Patrick and McKeown, Kathleen and Nallapati, Ramesh and Zhang, Dejiao and Wang, Zhiguo and Arnold, Andrew O and Xiang, Bing},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Improving Factual Consistency of Abstractive Summarization via Question Answering},
  year = {2021},
}

@inproceedings{cao2021cliff,
  author = {Cao, Shuyang and Wang, Lu},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{CLIFF}: Contrastive Learning for Improving
Faithfulness and Factuality in Abstractive Summarization}, year = {2021}, }

@inproceedings{chen2021improving,
  author = {Chen, Sihao and Zhang, Fan and Sone, Kazoo and Roth, Dan},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Improving Faithfulness in Abstractive Summarization with Contrast Candidate Generation and Selection},
  year = {2021},
}

@inproceedings{ladhak2022faithful,
  author = {Ladhak, Faisal and Durmus, Esin and He, He and Cardie, Claire and McKeown, Kathleen},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Faithful or Extractive? On Mitigating the Faithfulness-Abstractiveness Trade-off in Abstractive Summarization},
  year = {2022},
}

@inproceedings{bohm2019better,
  author = {B{\"o}hm, Florian and Gao, Yang and Meyer, Christian M. and Shapira, Ori and Dagan, Ido and Gurevych, Iryna},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Better Rewards Yield Better Summaries: Learning to Summarise Without References},
  year = {2019},
}

% NOTE(review): the author list below looks truncated, and the second name may be a mis-split multi-part name; verify against the published paper.
@inproceedings{campos2022training,
  author = {Campos, Jon Ander and Shern, Jun},
  booktitle = {ACL Workshop on Learning with Natural Language Supervision},
  title = {Training Language Models with Language Feedback},
  year = {2022},
}

@article{chakrabarty2021mermaid,
  author = {Chakrabarty, Tuhin and Zhang, Xurui and Muresan, Smaranda and Peng, Nanyun},
  journal = {arXiv preprint arXiv:2103.06779},
  title = {{MERMAID}: Metaphor Generation with Symbolism and Discriminative Decoding},
  year = {2021},
}

@article{stowe2021metaphor,
  author = {Stowe, Kevin and Chakrabarty, Tuhin and Peng, Nanyun and Muresan, Smaranda and Gurevych, Iryna},
  journal = {arXiv preprint arXiv:2106.01228},
  title = {Metaphor Generation with Conceptual Mappings},
  year = {2021},
}

@inproceedings{stowe2021exploring,
  author = {Stowe, Kevin and Beck, Nils and Gurevych, Iryna},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  title = {Exploring Metaphoric Paraphrase
Generation}, year = {2021}, }

% CamelCase system names and proper nouns in titles are brace-protected against style recasing.
@inproceedings{mittal2022ambipun,
  author = {Anirudh Mittal and Yufei Tian and Nanyun Peng},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {{AmbiPun}: Generating Humorous Puns with Ambiguous Context},
  year = {2022},
}

@article{liu2023geval,
  author = {Yang Liu and Dan Iter and Yichong Xu and Shuohang Wang and Ruochen Xu and Chenguang Zhu},
  journal = {arXiv preprint arXiv:2303.16634},
  title = {{G-Eval}: {NLG} Evaluation using {GPT}-4 with Better Human Alignment},
  year = {2023},
}

@inproceedings{ethayarajh2022authenticity,
  author = {Kawin Ethayarajh and Dan Jurafsky},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {The Authenticity Gap in Human Evaluation},
  year = {2022},
}

@inproceedings{parmar2023instruction,
  author = {Mihir Parmar and Swaroop Mishra and Mor Geva and Chitta Baral},
  booktitle = {European Association for Computational Linguistics (EACL)},
  title = {Don't Blame the Annotator: Bias Already Starts in the Annotation Instructions},
  year = {2023},
}

@article{wojnowicz2016sketching,
  author = {Mike Wojnowicz and Ben Cruz and Xuan Zhao and Brian Wallace and Matt Wolff and Jay Luan and Caleb Crable},
  journal = {arXiv preprint arXiv:1611.05923},
  title = {``{I}nfluence Sketching'': Finding Influential Samples In Large-Scale Regressions},
  year = {2016},
}

@article{goodman2016eu,
  author = {Bryce Goodman and Seth Flaxman},
  journal = {arXiv preprint arXiv:1606.08813},
  title = {{European Union} regulations on algorithmic decision-making and a ``right to explanation''},
  year = {2016},
}

@inproceedings{amershi2015modeltracker,
  author = {Saleema Amershi and Max Chickering and Steven M Drucker and Bongshin Lee and Patrice Simard and Jina Suh},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  pages = {337--346},
  title = {{ModelTracker}: Redesigning performance analysis tools for machine learning},
  year = {2015},
}

@inproceedings{shrikumar2017learning,
author = {Avanti Shrikumar and Peyton Greenside and Anshul Kundaje}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Learning Important Features Through Propagating Activation Differences}, year = {2017}, }

% The MNIST database is a web resource, not a journal article, so its URL is given in howpublished.
@misc{lecun1998mnist,
  author = {Yann LeCun and Corinna Cortes and Christopher J. C. Burges},
  howpublished = {\url{http://yann.lecun.com/exdb/mnist/}},
  title = {The {MNIST} database of handwritten digits},
  year = {1998},
}

@article{liu1989limited,
  author = {Dong C Liu and Jorge Nocedal},
  journal = {Mathematical Programming},
  number = {1},
  pages = {503--528},
  title = {On the limited memory {BFGS} method for large scale optimization},
  volume = {45},
  year = {1989},
}

@article{lecun1998gradient,
  author = {Yann LeCun and L{\'e}on Bottou and Yoshua Bengio and Patrick Haffner},
  journal = {Proceedings of the IEEE},
  number = {11},
  pages = {2278--2324},
  title = {Gradient-based learning applied to document recognition},
  volume = {86},
  year = {1998},
}

@article{springenberg2014striving,
  author = {Jost Tobias Springenberg and Alexey Dosovitskiy and Thomas Brox and Martin Riedmiller},
  journal = {arXiv preprint arXiv:1412.6806},
  title = {Striving for simplicity: The all convolutional net},
  year = {2014},
}

@article{pearlmutter1994fast,
  author = {Barak A Pearlmutter},
  journal = {Neural Computation},
  number = {1},
  pages = {147--160},
  title = {Fast exact multiplication by the {Hessian}},
  volume = {6},
  year = {1994},
}

@article{theano2016theano,
  author = {{Theano Development Team}},
  journal = {arXiv preprint arXiv:1605.02688},
  title = {{Theano}: A {Python} framework for fast computation of mathematical expressions},
  year = {2016},
}

@article{agarwal2016second,
  author = {Naman Agarwal and Brian Bullins and Elad Hazan},
  journal = {arXiv preprint arXiv:1602.03943},
  title = {Second order stochastic optimization in linear time},
  year = {2016},
}

@inproceedings{biggio2012poisoning,
  author = {Battista Biggio and Blaine Nelson and Pavel Laskov},
  booktitle = {International
Conference on Machine Learning (ICML)}, pages = {1467--1474}, title = {Poisoning Attacks Against Support Vector Machines}, year = {2012}, }

@inproceedings{cadamuro2016debugging,
  author = {Gabriel Cadamuro and Ran Gilad-Bachrach and Xiaojin Zhu},
  booktitle = {ICML Workshop on Reliable Machine Learning in the Wild},
  title = {Debugging machine learning models},
  year = {2016},
}

@article{frenay2014classification,
  author = {Beno{\^\i}t Fr{\'e}nay and Michel Verleysen},
  journal = {IEEE Transactions on Neural Networks and Learning Systems},
  pages = {845--869},
  title = {Classification in the presence of label noise: a survey},
  volume = {25},
  year = {2014},
}

@article{biggio2011label,
  author = {Battista Biggio and Blaine Nelson and Pavel Laskov},
  journal = {ACML},
  pages = {97--112},
  title = {Support Vector Machines Under Adversarial Label Noise},
  volume = {20},
  year = {2011},
}

% NOTE(review): the journal field below holds a description of an unpublished memorandum; a different entry type may fit better, to be confirmed.
@article{jaeckel1972infinitesimal,
  author = {Louis A Jaeckel},
  journal = {Unpublished memorandum, Bell Telephone Laboratories, Murray Hill, NJ},
  title = {The infinitesimal jackknife},
  year = {1972},
}

@article{cook1977detection,
  author = {R Dennis Cook},
  journal = {Technometrics},
  pages = {15--18},
  title = {Detection of influential observation in linear regression},
  volume = {19},
  year = {1977},
}

@article{cook1980influence,
  author = {R Dennis Cook and Sanford Weisberg},
  journal = {Technometrics},
  pages = {495--508},
  title = {Characterizations of an empirical influence function for detecting influential cases in regression},
  volume = {22},
  year = {1980},
}

@book{cook1982residuals,
  author = {R Dennis Cook and Sanford Weisberg},
  publisher = {New York: Chapman and Hall},
  title = {Residuals and influence in regression},
  year = {1982},
}

@article{cook1986assessment,
  author = {R Dennis Cook},
  journal = {Journal of the Royal Statistical Society.
Series B (Methodological)}, pages = {133--169}, title = {Assessment of local influence}, year = {1986}, }

@article{thomas1990assessing,
  author = {William Thomas and R Dennis Cook},
  journal = {Technometrics},
  number = {1},
  pages = {59--65},
  title = {Assessing influence on predictions from generalized linear models},
  volume = {32},
  year = {1990},
}

@article{wei1998generalized,
  author = {Bo-Cheng Wei and Yue-Qing Hu and Wing-Kam Fung},
  journal = {Scandinavian Journal of Statistics},
  pages = {25--37},
  title = {Generalized leverage and its applications},
  volume = {25},
  year = {1998},
}

@article{chatterjee1986influential,
  author = {Samprit Chatterjee and Ali S Hadi},
  journal = {Statistical Science},
  pages = {379--393},
  title = {Influential observations, high leverage points, and outliers in linear regression},
  year = {1986},
}

% The proper noun is protected as a whole word.
@inproceedings{liu2014efficient,
  author = {Yong Liu and Shali Jiang and Shizhong Liao},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {324--332},
  title = {Efficient Approximation of Cross-Validation for Kernel Methods using {Bouligand} Influence Function},
  year = {2014},
}

% The placeholder issue number 0 is dropped; initials are spaced so both survive
% abbreviation.
@article{debruyne2008model,
  author = {Michiel Debruyne and Mia Hubert and Johan A. K. Suykens},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {2377--2400},
  title = {Model selection in kernel based regression using the influence function},
  volume = {9},
  year = {2008},
}

@inproceedings{martens2010deep,
  author = {James Martens},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {735--742},
  title = {Deep learning via {Hessian}-free optimization},
  year = {2010},
}

% Typed as misc: standard styles ignore howpublished on manual entries, which
% would silently drop the URL.
@misc{chollet2015keras,
  author = {Fran{\c{c}}ois Chollet},
  howpublished = {\url{https://github.com/fchollet/keras}},
  title = {Keras},
  year = {2015},
}

@inproceedings{szegedy2016rethinking, author = {Christian Szegedy and Vincent Vanhoucke and Sergey Ioffe and Jon Shlens and Zbigniew Wojna}, booktitle = {Computer Vision and Pattern Recognition
(CVPR)}, pages = {2818--2826}, title = {Rethinking the {I}nception architecture for computer vision}, year = {2016}, }

% Initials are spaced so each one survives abbreviation; the workshop name is
% capitalised like the other ACM workshop entry in this file.
@inproceedings{huang2011adversarial,
  author = {Ling Huang and Anthony D Joseph and Blaine Nelson and Benjamin I. P. Rubinstein and J. D. Tygar},
  booktitle = {Proceedings of the 4th ACM Workshop on Security and Artificial Intelligence},
  pages = {43--58},
  title = {Adversarial machine learning},
  year = {2011},
}

@article{ben2010theory,
  author = {Shai Ben-David and John Blitzer and Koby Crammer and Alex Kulesza and Fernando Pereira and Jennifer Wortman Vaughan},
  journal = {Machine Learning},
  number = {1},
  pages = {151--175},
  title = {A theory of learning from different domains},
  volume = {79},
  year = {2010},
}

@article{strack2014impact,
  author = {Beata Strack and Jonathan P DeShazo and Chris Gennings and Juan L Olmo and Sebastian Ventura and Krzysztof J Cios and John N Clore},
  journal = {BioMed Research International},
  title = {Impact of {HbA1c} measurement on hospital readmission rates: {Analysis} of 70,000 clinical database patient records},
  volume = {2014},
  year = {2014},
}

@inproceedings{lakkaraju2017identifying,
  author = {Himabindu Lakkaraju and Ece Kamar and Rich Caruana and Eric Horvitz},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Identifying Unknown Unknowns in the Open World: Representations and Policies for Guided Exploration},
  year = {2017},
}

% Venue written in natural order; the year is already in the year field.
@inproceedings{datta2016algorithmic,
  author = {Anupam Datta and Shayak Sen and Yair Zick},
  booktitle = {IEEE Symposium on Security and Privacy (SP)},
  pages = {598--617},
  title = {Algorithmic transparency via quantitative input influence: Theory and experiments with learning systems},
  year = {2016},
}

@article{adler2016auditing, author = {Philip Adler and Casey Falk and Sorelle A Friedler and Gabriel Rybeck and Carlos Scheidegger and Brandon Smith and Suresh Venkatasubramanian}, journal = {arXiv preprint arXiv:1602.07043}, title = {Auditing Black-box Models
for Indirect Influence}, year = {2016}, }

@article{lundberg2016unexpected,
  author = {Scott Lundberg and Su-In Lee},
  journal = {arXiv preprint arXiv:1611.07478},
  title = {An unexpected unity among methods for interpreting model predictions},
  year = {2016},
}

% Journal name in title case, like the other journal fields in this file.
@article{vstrumbelj2014explaining,
  author = {Erik {\v{S}}trumbelj and Igor Kononenko},
  journal = {Knowledge and Information Systems},
  number = {3},
  pages = {647--665},
  title = {Explaining prediction models and individual predictions with feature contributions},
  volume = {41},
  year = {2014},
}

@article{simonyan2013deep,
  author = {Karen Simonyan and Andrea Vedaldi and Andrew Zisserman},
  journal = {arXiv preprint arXiv:1312.6034},
  title = {Deep inside convolutional networks: Visualising image classification models and saliency maps},
  year = {2013},
}

@inproceedings{kim2016examples, author = {Been Kim and Oluwasanmi O Koyejo and Rajiv Khanna}, booktitle = {Advances In Neural Information Processing Systems}, pages = {2280--2288}, title = {Examples are not enough, learn to criticize!
Criticism for Interpretability}, year = {2016}, }

@inproceedings{caruana2015intelligible,
  author = {Rich Caruana and Yin Lou and Johannes Gehrke and Paul Koch and Marc Sturm and Noemie Elhadad},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {1721--1730},
  title = {Intelligible models for healthcare: Predicting pneumonia risk and hospital 30-day readmission},
  year = {2015},
}

% Comma form keeps the two-word surname together (a capitalised Van is not
% recognised as a name particle).
@article{debruyne2010detecting,
  author = {Michiel Debruyne and Mia Hubert and Van Horebeek, Johan},
  journal = {Computational Statistics \& Data Analysis},
  number = {12},
  pages = {3007--3019},
  title = {Detecting influential observations in Kernel {PCA}},
  volume = {54},
  year = {2010},
}

% The placeholder issue number 0 is dropped.
@article{christmann2004robustness,
  author = {Andreas Christmann and Ingo Steinwart},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {1007--1034},
  title = {On robustness properties of convex risk minimization methods for pattern recognition},
  volume = {5},
  year = {2004},
}

@article{russakovsky2015imagenet,
  author = {Olga Russakovsky and Jia Deng and Hao Su and Jonathan Krause and Sanjeev Satheesh and Sean Ma and Zhiheng Huang and Andrej Karpathy and Aditya Khosla and Michael Bernstein and others},
  journal = {International Journal of Computer Vision},
  number = {3},
  pages = {211--252},
  title = {{ImageNet} large scale visual recognition challenge},
  volume = {115},
  year = {2015},
}

@article{kansagara2011risk,
  author = {Devan Kansagara and Honora Englander and Amanda Salanitro and David Kagen and Cecelia Theobald and Michele Freeman and Sunil Kripalani},
  journal = {JAMA},
  number = {15},
  pages = {1688--1698},
  title = {Risk prediction models for hospital readmission: a systematic review},
  volume = {306},
  year = {2011},
}

@inproceedings{jaakkola1999exploiting, author = {Tommi S Jaakkola and David Haussler and others}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {487--493}, title = {Exploiting generative
models in discriminative classifiers}, year = {1999}, }

@article{li2016understanding,
  author = {Jiwei Li and Will Monroe and Dan Jurafsky},
  journal = {arXiv preprint arXiv:1612.08220},
  title = {Understanding Neural Networks through Representation Erasure},
  year = {2016},
}

% The mixed-case system name is protected from style recasing.
@inproceedings{donahue2014decaf,
  author = {Jeff Donahue and Yangqing Jia and Oriol Vinyals and Judy Hoffman and Ning Zhang and Eric Tzeng and Trevor Darrell},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {647--655},
  title = {{DeCAF}: A Deep Convolutional Activation Feature for Generic Visual Recognition},
  volume = {32},
  year = {2014},
}

@article{diamond2016cvxpy,
  author = {Steven Diamond and Stephen Boyd},
  journal = {Journal of Machine Learning Research (JMLR)},
  number = {83},
  pages = {1--5},
  title = {{CVXPY}: A {Python}-Embedded Modeling Language for Convex Optimization},
  volume = {17},
  year = {2016},
}

@inproceedings{moosavi2016deepfool,
  author = {Seyed-Mohsen Moosavi-Dezfooli and Alhussein Fawzi and Pascal Frossard},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {2574--2582},
  title = {{DeepFool}: a simple and accurate method to fool deep neural networks},
  year = {2016},
}

% The record has a volume and an issue number, so it is typed as a journal
% article; standard styles reject volume plus number on proceedings papers.
@article{lakhina2004diagnosing,
  author = {Anukool Lakhina and Mark Crovella and Christophe Diot},
  journal = {ACM SIGCOMM Computer Communication Review},
  number = {4},
  pages = {219--230},
  title = {Diagnosing network-wide traffic anomalies},
  volume = {34},
  year = {2004},
}

@article{paudice2018detection,
  author = {Andrea Paudice and Luis Mu{\~n}oz-Gonz{\'a}lez and Andras Gyorgy and Emil C Lupu},
  journal = {arXiv preprint arXiv:1802.03041},
  title = {Detection of Adversarial Training Examples in Poisoning Attacks through Anomaly Detection},
  year = {2018},
}

@article{nelson2008exploiting, author = {Blaine Nelson and Marco Barreno and Fuching Jack Chi and Anthony D Joseph and Benjamin IP Rubinstein and Udam Saini and Charles A Sutton and J Doug Tygar and Kai Xia}, journal =
{LEET}, pages = {1--9}, title = {Exploiting Machine Learning to Subvert Your Spam Filter}, volume = {8}, year = {2008}, }

% Journal name in title case, like the other journal fields in this file.
@article{hodge2004survey,
  author = {Victoria Hodge and Jim Austin},
  journal = {Artificial Intelligence Review},
  number = {2},
  pages = {85--126},
  title = {A survey of outlier detection methodologies},
  volume = {22},
  year = {2004},
}

% Comma form keeps the two-word surname together (a capitalised Van is not
% recognised as a name particle).
@article{gupta2016monotonic,
  author = {Maya Gupta and Andrew Cotter and Jan Pfeifer and Konstantin Voevodski and Kevin Canini and Alexander Mangylov and Wojciech Moczydlowski and Van Esbroeck, Alexander},
  journal = {Journal of Machine Learning Research (JMLR)},
  number = {1},
  pages = {3790--3836},
  title = {Monotonic calibrated interpolated look-up tables},
  volume = {17},
  year = {2016},
}

@article{nakamura1988assessment,
  author = {E Nakamura and K Miyao and T Ozeki},
  journal = {Mechanisms of Ageing and Development},
  number = {1},
  pages = {1--18},
  title = {Assessment of biological age by principal component analysis},
  volume = {46},
  year = {1988},
}

@article{kumar2017understanding,
  author = {Pavithra Kumar and Yuqi Tan and Patrick Cahan},
  journal = {Development},
  number = {1},
  pages = {17--32},
  title = {Understanding development and stem cells using single cell-based analyses of gene expression},
  volume = {144},
  year = {2017},
}

% Same spelling of the journal as the other Experimental Gerontology entries.
@article{sprott2010biomarkers,
  author = {Richard L Sprott},
  journal = {Experimental Gerontology},
  number = {1},
  pages = {2--4},
  title = {Biomarkers of aging and disease: introduction and definitions},
  volume = {45},
  year = {2010},
}

@article{belsky2015quantification,
  author = {Daniel W Belsky and Avshalom Caspi and Renate Houts and Harvey J Cohen and David L Corcoran and Andrea Danese and HonaLee Harrington and Salomon Israel and Morgan E Levine and Jonathan D Schaefer and others},
  journal = {Proceedings of the National Academy of Sciences},
  number = {30},
  title = {Quantification of biological aging in young adults},
  volume = {112},
  year = {2015},
}

@article{sudlow2015uk, author = {Cathie Sudlow
and John Gallacher and Naomi Allen and Valerie Beral and Paul Burton and John Danesh and Paul Downey and Paul Elliott and Jane Green and Martin Landray and others}, journal = {PLoS Medicine}, number = {3}, title = {{UK Biobank}: an open access resource for identifying the causes of a wide range of complex diseases of middle and old age}, volume = {12}, year = {2015}, }

% Entries below are laid out one field per line; field values are unchanged.
@article{fry2017comparison,
  author = {Anna Fry and Thomas J Littlejohns and Cathie Sudlow and Nicola Doherty and Ligia Adamska and Tim Sprosen and Rory Collins and Naomi E Allen},
  journal = {American Journal of Epidemiology},
  number = {9},
  pages = {1026--1034},
  title = {Comparison of sociodemographic and health-related characteristics of {UK Biobank} participants with those of the general population},
  volume = {186},
  year = {2017},
}

@article{zhang2016predicting,
  author = {William B Zhang and Zachary Pincus},
  journal = {Aging Cell},
  number = {1},
  pages = {39--48},
  title = {Predicting all-cause mortality from basic physiology in the {Framingham Heart Study}},
  volume = {15},
  year = {2016},
}

@article{trapnell2014dynamics,
  author = {Cole Trapnell and Davide Cacchiarelli and Jonna Grimsby and Prapti Pokharel and Shuqiang Li and Michael Morse and Niall J Lennon and Kenneth J Livak and Tarjei S Mikkelsen and John L Rinn},
  journal = {Nature Biotechnology},
  number = {4},
  title = {The dynamics and regulators of cell fate decisions are revealed by pseudotemporal ordering of single cells},
  volume = {32},
  year = {2014},
}

@article{bendall2014single,
  author = {Sean C Bendall and Kara L Davis and El-ad David Amir and Michelle D Tadmor and Erin F Simonds and Tiffany J Chen and Daniel K Shenfeld and Garry P Nolan and Dana Pe'er},
  journal = {Cell},
  number = {3},
  pages = {714--725},
  title = {Single-cell trajectory detection uncovers progression and regulatory coordination in human {B} cell development},
  volume = {157},
  year = {2014},
}

@article{campbell2017uncovering, author = {Kieran Campbell and Christopher Yau},
journal = {bioRxiv}, title = {Uncovering genomic trajectories with heterogeneous genetic and environmental backgrounds across single-cells and populations}, year = {2017}, }

@article{kraemer2000can,
  author = {Helena Chmura Kraemer and Jerome A Yesavage and Joy L Taylor and David Kupfer},
  journal = {American Journal of Psychiatry},
  number = {2},
  pages = {163--171},
  title = {How can we learn about developmental processes from cross-sectional studies, or can we?},
  volume = {157},
  year = {2000},
}

@article{louis1986explaining,
  author = {Thomas A Louis and James Robins and Douglas W Dockery and Avron Spiro and James H Ware},
  journal = {Journal of Clinical Epidemiology},
  number = {10},
  pages = {831--839},
  title = {Explaining discrepancies between longitudinal and cross-sectional models},
  volume = {39},
  year = {1986},
}

@article{economos1982rate,
  author = {Angelos C Economos},
  journal = {Archives of Gerontology and Geriatrics},
  number = {1},
  pages = {3--27},
  title = {Rate of aging, rate of dying and the mechanism of mortality},
  volume = {1},
  year = {1982},
}

@article{klemera2006new,
  author = {Petr Klemera and Stanislav Doubal},
  journal = {Mechanisms of Ageing and Development},
  number = {3},
  pages = {240--248},
  title = {A new approach to the concept and computation of biological age},
  volume = {127},
  year = {2006},
}

% Journal spelled exactly as in the goodpaster2006loss entry of this file, so
% the same journal does not appear under two names.
@article{levine2012modeling,
  author = {Morgan E Levine},
  journal = {The Journals of Gerontology Series A: Biological Sciences and Medical Sciences},
  number = {6},
  pages = {667--674},
  title = {Modeling the rate of senescence: can estimated biological age predict mortality more accurately than chronological age?},
  volume = {68},
  year = {2012},
}

@article{putin2016deep, author = {Evgeny Putin and Polina Mamoshina and Alexander Aliper and Mikhail Korzinkin and Alexey Moskalev and Alexey Kolosov and Alexander Ostrovskiy and Charles Cantor and Jan Vijg and Alex Zhavoronkov}, journal = {Aging}, number = {5}, title = {Deep biomarkers of human aging: application of deep
neural networks to biomarker development}, volume = {8}, year = {2016}, }

@article{pyrkov2018extracting,
  author = {Timothy V Pyrkov and Konstantin Slipensky and Mikhail Barg and Alexey Kondrashin and Boris Zhurov and Alexander Zenin and Mikhail Pyatnitskiy and Leonid Menshikov and Sergei Markov and Peter O Fedichev},
  journal = {Scientific Reports},
  number = {1},
  title = {Extracting biological age from biomedical data via deep learning: too much of a good thing?},
  volume = {8},
  year = {2018},
}

@article{mcclearn1997biogerontologic,
  author = {Gerald E McClearn},
  journal = {Experimental Gerontology},
  number = {1},
  pages = {3--10},
  title = {Biogerontologic theories},
  volume = {32},
  year = {1997},
}

@article{margolick2015accelerating,
  author = {Joseph B Margolick and Luigi Ferrucci},
  journal = {Experimental Gerontology},
  pages = {78--80},
  title = {Accelerating aging research: how can we measure the rate of biologic aging?},
  volume = {64},
  year = {2015},
}

@inproceedings{hashimoto2016learning,
  author = {Tatsunori Hashimoto and David Gifford and Tommi Jaakkola},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {2417--2426},
  title = {Learning Population-Level Diffusions with Generative {RNNs}},
  year = {2016},
}

% Publisher name and publisher city are kept in separate fields.
@book{waddington1940organisers,
  address = {Cambridge},
  author = {Conrad Hal Waddington},
  publisher = {Cambridge University Press},
  title = {Organisers and Genes},
  year = {1940},
}

@article{nowell1976clonal,
  author = {Peter C Nowell},
  journal = {Science},
  number = {4260},
  pages = {23--28},
  title = {The clonal evolution of tumor cell populations},
  volume = {194},
  year = {1976},
}

@article{comfort1969test,
  author = {Alex Comfort},
  journal = {The Lancet},
  number = {7635},
  pages = {1411--1415},
  title = {Test-battery to measure ageing-rate in man},
  volume = {294},
  year = {1969},
}

@article{furukawa1975assessment, author = {Toshiyuki Furukawa and Michitoshi Inoue and Fumihiko Kajiya and Hiroshi Inada and Seiichi Takasugi and Sugao Fukui and Hiroshi Takeda and Hiroshi
Abe}, journal = {Journal of Gerontology}, number = {4}, pages = {422--434}, title = {Assessment of biological age by multiple regression analysis}, volume = {30}, year = {1975}, }

@article{borkan1980assessment,
  author = {Gary A Borkan and Arthur H Norris},
  journal = {Journal of Gerontology},
  number = {2},
  pages = {177--184},
  title = {Assessment of biological age using a profile of physical parameters},
  volume = {35},
  year = {1980},
}

% Journal spelled as in the putin2016deep entry of this file.
@article{chen2016dna,
  author = {Brian H Chen and Riccardo E Marioni and Elena Colicino and Marjolein J Peters and Cavin K Ward-Caviness and Pei-Chien Tsai and Nicholas S Roetker and Allan C Just and Ellen W Demerath and Weihua Guan and others},
  journal = {Aging},
  number = {9},
  title = {{DNA} methylation-based measures of biological age: meta-analysis predicting time to death},
  volume = {8},
  year = {2016},
}

@article{horvath2013dna,
  author = {Steve Horvath},
  journal = {Genome Biology},
  number = {10},
  title = {{DNA} methylation age of human tissues and cell types},
  volume = {14},
  year = {2013},
}

% Initials are spaced so both survive abbreviation; the study name is protected
% from recasing.
@article{macdonald2004biological,
  author = {Stuart W. S. MacDonald and Roger A Dixon and Anna-Lisa Cohen and Janine E Hazlitt},
  journal = {Gerontology},
  number = {2},
  pages = {64--81},
  title = {Biological age and 12-year cognitive change in older adults: findings from the {Victoria Longitudinal Study}},
  volume = {50},
  year = {2004},
}

@article{gupta2008extracting,
  author = {Anupam Gupta and Ziv Bar-Joseph},
  journal = {IEEE/ACM Transactions on Computational Biology and Bioinformatics (TCBB)},
  number = {2},
  pages = {172--182},
  title = {Extracting dynamics from static cancer expression data},
  volume = {5},
  year = {2008},
}

@article{reid2016pseudotime,
  author = {John E Reid and Lorenz Wernisch},
  journal = {Bioinformatics},
  number = {19},
  pages = {2973--2980},
  title = {Pseudotime estimation: deconfounding single cell time series},
  volume = {32},
  year = {2016},
}

@article{aijo2014methods, author = {Tarmo {\"A}ij{\"o} and Vincent Butty and Zhi
Chen and Verna Salo and Subhash Tripathi and Christopher B Burge and Riitta Lahesmaa and Harri L{\"a}hdesm{\"a}ki}, journal = {Bioinformatics}, number = {12}, title = {Methods for time series analysis of {RNA}-seq data with application to human {Th17} cell differentiation}, volume = {30}, year = {2014}, }

@article{magwene2003reconstructing,
  author = {Paul M Magwene and Paul Lizardi and Junhyong Kim},
  journal = {Bioinformatics},
  number = {7},
  pages = {842--850},
  title = {Reconstructing the temporal ordering of biological samples using microarray data},
  volume = {19},
  year = {2003},
}

@article{qiu2011discovering,
  author = {Peng Qiu and Andrew J Gentles and Sylvia K Plevritis},
  journal = {PLoS Computational Biology},
  number = {4},
  title = {Discovering biological progression underlying microarray samples},
  volume = {7},
  year = {2011},
}

@article{di2009multilevel,
  author = {Chong-Zhi Di and Ciprian M Crainiceanu and Brian S Caffo and Naresh M Punjabi},
  journal = {The Annals of Applied Statistics},
  number = {1},
  title = {Multilevel functional principal component analysis},
  volume = {3},
  year = {2009},
}

% Book chapter: the book title moves from journal to booktitle.
% NOTE(review): publisher supplied from memory; confirm against the source record.
@incollection{greven2011longitudinal,
  author = {Sonja Greven and Ciprian Crainiceanu and Brian Caffo and Daniel Reich},
  booktitle = {Recent Advances in Functional Data Analysis and Related Topics},
  publisher = {Springer},
  title = {Longitudinal functional principal component analysis},
  year = {2011},
}

% Book chapter: the book title moves from journal to booktitle.
% NOTE(review): publisher supplied from memory; confirm against the source record.
@incollection{verbeke1997linear,
  author = {Geert Verbeke},
  booktitle = {Linear Mixed Models in Practice},
  pages = {63--153},
  publisher = {Springer},
  title = {Linear mixed models for longitudinal data},
  year = {1997},
}

@article{bair2006prediction,
  author = {Eric Bair and Trevor Hastie and Debashis Paul and Robert Tibshirani},
  journal = {Journal of the American Statistical Association (JASA)},
  number = {473},
  pages = {119--137},
  title = {Prediction by supervised principal components},
  volume = {101},
  year = {2006},
}

@article{abid2017contrastive, author = {Abubakar Abid and Vivek K Bagaria and Martin J Zhang and James Zou}, journal =
{arXiv preprint arXiv:1709.06716}, title = {Contrastive principal component analysis}, year = {2017}, }

% Comma form keeps the two-word surname together; written as First Last it
% would be split into a middle name and a surname.
@article{jonsen2005robust,
  author = {Ian D Jonsen and Mills Flemming, Joanna and Ransom A Myers},
  journal = {Ecology},
  number = {11},
  pages = {2874--2880},
  title = {Robust state--space modeling of animal movement data},
  volume = {86},
  year = {2005},
}

@article{ram1986government,
  author = {Rati Ram},
  journal = {The American Economic Review},
  number = {1},
  pages = {191--203},
  title = {Government size and economic growth: A new framework and some evidence from cross-section and time-series data},
  volume = {76},
  year = {1986},
}

@article{relethford1978use,
  author = {John H Relethford and Francis C Lees and Pamela J Byard},
  journal = {Human Biology},
  pages = {461--475},
  title = {The use of principal components in the analysis of cross-sectional growth data},
  year = {1978},
}

@misc{euyu2012monomial, author = {EuYu}, howpublished = {\url{https://math.stackexchange.com/q/214401}}, title = {A non-negative matrix has a non-negative inverse.
{What} other properties does it have?}, year = {2012}, }

@inproceedings{you2017deep,
  author = {Seungil You and David Ding and Kevin Canini and Jan Pfeifer and Maya Gupta},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2985--2993},
  title = {Deep Lattice Networks and Partial Monotonic Functions},
  year = {2017},
}

@article{daniels2010monotone,
  author = {Hennie Daniels and Marina Velikova},
  journal = {IEEE Transactions on Neural Networks},
  number = {6},
  pages = {906--917},
  title = {Monotone and partially monotone neural networks},
  volume = {21},
  year = {2010},
}

@article{qu2011generalized,
  author = {Ya-Jun Qu and Bao-Gang Hu},
  journal = {IEEE Transactions on Neural Networks},
  number = {12},
  pages = {2447--2459},
  title = {Generalized constraint neural network regression model subject to linear priors},
  volume = {22},
  year = {2011},
}

% The proper adjective is protected from style recasing.
@article{shively2009bayesian,
  author = {Thomas S Shively and Thomas W Sager and Stephen G Walker},
  journal = {Journal of the Royal Statistical Society: Series B (Statistical Methodology)},
  number = {1},
  pages = {159--175},
  title = {A {Bayesian} approach to non-parametric monotone function estimation},
  volume = {71},
  year = {2009},
}

@article{mozaffarian2011changes,
  author = {Dariush Mozaffarian and Tao Hao and Eric B Rimm and Walter C Willett and Frank B Hu},
  journal = {New England Journal of Medicine},
  number = {25},
  pages = {2392--2404},
  title = {Changes in diet and lifestyle and long-term weight gain in women and men},
  volume = {364},
  year = {2011},
}

% Run-together initials are spaced so every initial survives abbreviation.
@article{hoffmann2015effect,
  author = {Johannes J. M. L. Hoffmann and Karin C. A. M. Nabbe and Nicole M. A. van den Broek},
  journal = {Clinical Chemistry and Laboratory Medicine (CCLM)},
  number = {12},
  title = {Effect of age and gender on reference intervals of red blood cell distribution width ({RDW}) and mean red cell volume ({MCV})},
  volume = {53},
  year = {2015},
}

@article{stanojevic2008reference, author = {Sanja Stanojevic and Angie Wade and Janet Stocks and John
Hankinson and Allan L Coates and Huiqi Pan and Mark Rosenthal and Mary Corey and Patrick Lebecque and Tim J Cole}, journal = {American Journal of Respiratory and Critical Care Medicine}, number = {3}, pages = {253--260}, title = {Reference ranges for spirometry across all ages: a new approach}, volume = {177}, year = {2008}, }

@article{goodpaster2006loss,
  author = {Bret H Goodpaster and Seok Won Park and Tamara B Harris and Steven B Kritchevsky and Michael Nevitt and Ann V Schwartz and Eleanor M Simonsick and Frances A Tylavsky and Marjolein Visser and Anne B Newman},
  journal = {The Journals of Gerontology Series A: Biological Sciences and Medical Sciences},
  number = {10},
  pages = {1059--1064},
  title = {The loss of skeletal muscle strength, mass, and quality in older adults: the health, aging and body composition study},
  volume = {61},
  year = {2006},
}

@inproceedings{munoz2017towards,
  author = {Luis Mu{\~n}oz-Gonz{\'a}lez and Battista Biggio and Ambra Demontis and Andrea Paudice and Vasin Wongrassamee and Emil C Lupu and Fabio Roli},
  booktitle = {Proceedings of the 10th ACM Workshop on Artificial Intelligence and Security},
  pages = {27--38},
  title = {Towards poisoning of deep learning algorithms with back-gradient optimization},
  year = {2017},
}

% Comma form stops the trailing III from being parsed as the surname. The
% acronym and the word after the question mark are protected from recasing.
@article{suciu2018does,
  author = {Octavian Suciu and Radu M{\u{a}}rginean and Yi{\u{g}}itcan Kaya and Daum{\'e} III, Hal and Tudor Dumitra{\c{s}}},
  journal = {arXiv preprint arXiv:1803.06975},
  title = {When Does Machine Learning {FAIL}? {Generalized} Transferability for Evasion and Poisoning Attacks},
  year = {2018},
}

@article{shafahi2018poison, author = {Ali Shafahi and W Ronny Huang and Mahyar Najibi and Octavian Suciu and Christoph Studer and Tudor Dumitras and Tom Goldstein}, journal = {arXiv preprint arXiv:1804.00792}, title = {Poison {F}rogs!
{Targeted} Clean-Label Poisoning Attacks on Neural Networks}, year = {2018}, }

@article{gu2017badnets,
  author = {Tianyu Gu and Brendan Dolan-Gavitt and Siddharth Garg},
  journal = {arXiv preprint arXiv:1708.06733},
  title = {{BadNets}: Identifying vulnerabilities in the machine learning model supply chain},
  year = {2017},
}

@article{chen2017targeted,
  author = {Xinyun Chen and Chang Liu and Bo Li and Kimberly Lu and Dawn Song},
  journal = {arXiv preprint arXiv:1712.05526},
  title = {Targeted backdoor attacks on deep learning systems using data poisoning},
  year = {2017},
}

% Journal name in title case, like the other journal fields in this file.
@article{bard1991some,
  author = {Jonathan F Bard},
  journal = {Journal of Optimization Theory and Applications},
  number = {2},
  pages = {371--378},
  title = {Some properties of the bilevel programming problem},
  volume = {68},
  year = {1991},
}

% Journal spelled as in the ben2010theory entry of this file.
@article{crammer2002learnability,
  author = {Koby Crammer and Yoram Singer},
  journal = {Machine Learning},
  number = {2},
  pages = {201--233},
  title = {On the learnability and design of output codes for multiclass problems},
  volume = {47},
  year = {2002},
}

% Comma form keeps the two-word surname together; the proper noun in the title
% is protected as a whole word.
@article{mirrokni2015tight,
  author = {Vahab Mirrokni and Paes Leme, Renato and Adrian Vladu and Sam Chiu-wai Wong},
  journal = {arXiv preprint arXiv:1512.08602},
  title = {Tight Bounds for Approximate {Carath{\'e}odory} and Beyond},
  year = {2015},
}

@article{barany2012notes,
  author = {Imre B{\'a}r{\'a}ny and Roman Karasev},
  journal = {Discrete \& Computational Geometry},
  number = {3},
  pages = {783--792},
  title = {Notes about the {Carath{\'e}odory} number},
  volume = {48},
  year = {2012},
}

@inproceedings{wang2018learning,
  author = {Yisen Wang and Bo Dai and Lingkai Kong and Xingjun Ma and Sarah Monazam Erfani and James Bailey and Shu-Tao Xia and Le Song and Hongyuan Zha},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  title = {Learning Deep Hidden Nonlinear Dynamics from Aggregate Data},
  year = {2018},
}

@inproceedings{wang2014unsupervised, author = {Xiang Wang and David Sontag and Fei Wang}, booktitle =
{International Conference on Knowledge Discovery and Data Mining (KDD)}, pages = {85--94}, title = {Unsupervised learning of disease progression models}, year = {2014}, }

@article{papernot2018deep,
  author = {Nicolas Papernot and Patrick McDaniel},
  journal = {arXiv preprint arXiv:1803.04765},
  title = {Deep k-nearest neighbors: Towards confident, interpretable and robust deep learning},
  year = {2018},
}

% The author list is complete with three names; the stray trailing
% "and others" from the export is removed.
@article{hsu2012tail,
  author = {Daniel Hsu and Sham Kakade and Tong Zhang},
  journal = {Electronic Communications in Probability},
  title = {A tail inequality for quadratic forms of subgaussian random vectors},
  volume = {17},
  year = {2012},
}

% The surname used as a term is protected from style recasing.
@article{ghorbani2019data,
  author = {Amirata Ghorbani and James Zou},
  journal = {arXiv preprint arXiv:1904.02868},
  title = {Data {Shapley}: Equitable Valuation of Data for Machine Learning},
  year = {2019},
}

@article{jia2019towards,
  author = {Ruoxi Jia and David Dao and Boxin Wang and Frances Ann Hubis and Nick Hynes and Nezihe Merve Gurel and Bo Li and Ce Zhang and Dawn Song and Costas Spanos},
  journal = {arXiv preprint arXiv:1902.10275},
  title = {Towards Efficient Data Valuation Based on the {Shapley} Value},
  year = {2019},
}

@inproceedings{schulam2019can, author = {Peter Schulam and Suchi Saria}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, pages = {1022--1031}, title = {Can You Trust This Prediction?
{Auditing} Pointwise Reliability After Learning}, year = {2019}, }

@article{wang2019repairing,
  author = {Hao Wang and Berk Ustun and Flavio P Calmon},
  journal = {arXiv preprint arXiv:1901.10501},
  title = {Repairing without Retraining: Avoiding Disparate Impact with Counterfactual Distributions},
  year = {2019},
}

@inproceedings{zhou2019effects,
  author = {Jianlong Zhou and Zhidong Li and Huaiwen Hu and Kun Yu and Fang Chen and Zelin Li and Yang Wang},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Effects of Influence on User Trust in Predictive Decision Making},
  year = {2019},
}

@inproceedings{giordano2019swiss,
  author = {Ryan Giordano and William Stephenson and Runjing Liu and Michael Jordan and Tamara Broderick},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  pages = {1139--1147},
  title = {A {Swiss Army} Infinitesimal Jackknife},
  year = {2019},
}

% Single-author paper; the stray trailing "and others" from the export is
% removed so the citation does not render as et al.
@article{pregibon1981logistic,
  author = {Daryl Pregibon},
  journal = {Annals of Statistics},
  number = {4},
  pages = {705--724},
  title = {Logistic regression diagnostics},
  volume = {9},
  year = {1981},
}

@book{boyd2004convex,
  author = {Stephen Boyd and Lieven Vandenberghe},
  publisher = {Cambridge University Press},
  title = {Convex {Optimization}},
  year = {2004},
}

@inproceedings{arrieta2018should, author = {Imanol Arrieta-Ibarra and Leonard Goff and Diego Jim{\'e}nez-Hern{\'a}ndez and Jaron Lanier and E Glen Weyl}, booktitle = {American Economic Association Papers and Proceedings}, pages = {38--42}, title = {Should We Treat Data as Labor?
{Moving} beyond ``Free''}, volume = {108}, year = {2018}, }

@inproceedings{hayes2018contamination,
  author = {Jamie Hayes and Olga Ohrimenko},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {6604--6615},
  title = {Contamination Attacks and Mitigation in Multi-Party Machine Learning},
  year = {2018},
}

@article{rad2018scalable,
  author = {Kamiar Rahnama Rad and Arian Maleki},
  journal = {arXiv preprint arXiv:1801.10243},
  title = {A scalable estimate of the extra-sample prediction error via approximate leave-one-out},
  year = {2018},
}

% The volume number is a series volume, so the series is named alongside it.
% NOTE(review): series name supplied from memory; confirm against the source record.
@book{vershynin2018high,
  author = {Roman Vershynin},
  publisher = {Cambridge University Press},
  series = {Cambridge Series in Statistical and Probabilistic Mathematics},
  title = {High-dimensional probability: An introduction with applications in data science},
  volume = {47},
  year = {2018},
}

% Single-author paper; the stray trailing "and others" from the export is removed.
@article{bach2010self,
  author = {Francis Bach},
  journal = {Electronic Journal of Statistics},
  pages = {384--414},
  title = {Self-concordant analysis for logistic regression},
  volume = {4},
  year = {2010},
}

@inproceedings{chen2018my,
  author = {Irene Chen and Fredrik D Johansson and David Sontag},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {3539--3550},
  title = {Why Is My Classifier Discriminatory?},
  year = {2018},
}

% Journal spelled as in the bair2006prediction entry of this file.
@article{hampel1974influence,
  author = {Frank R Hampel},
  journal = {Journal of the American Statistical Association (JASA)},
  number = {346},
  pages = {383--393},
  title = {The influence curve and its role in robust estimation},
  volume = {69},
  year = {1974},
}

@article{wang2018approximate,
  author = {Shuaiwen Wang and Wenda Zhou and Arian Maleki and Haihao Lu and Vahab Mirrokni},
  journal = {arXiv preprint arXiv:1810.02716},
  title = {Approximate Leave-One-Out for High-Dimensional Non-Differentiable Learning Problems},
  year = {2018},
}

@article{sharchilev2018finding, author = {Boris Sharchilev and Yury Ustinovsky and Pavel Serdyukov and Maarten de Rijke}, journal = {arXiv preprint arXiv:1802.06640}, title = {Finding influential training samples
for gradient boosted decision trees}, year = {2018}, }

@inproceedings{khanna2019interpreting,
  author = {Rajiv Khanna and Been Kim and Joydeep Ghosh and Oluwasanmi Koyejo},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  pages = {3382--3390},
  title = {Interpreting Black Box Predictions using {Fisher} Kernels},
  year = {2019},
}

@inproceedings{mccoy2019right,
  author = {R Thomas McCoy and Ellie Pavlick and Tal Linzen},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Right for the Wrong Reasons: Diagnosing Syntactic Heuristics in Natural Language Inference},
  year = {2019},
}

@inproceedings{buolamwini2018gender,
  author = {Joy Buolamwini and Timnit Gebru},
  booktitle = {Conference on Fairness, Accountability and Transparency},
  pages = {77--91},
  title = {Gender shades: Intersectional accuracy disparities in commercial gender classification},
  year = {2018},
}

% Venue normalised to the AAAI name used by lakkaraju2017identifying in this
% file, replacing the export artifact with its "-Volume 2" suffix.
% NOTE(review): assumes the 20th national conference is AAAI 2005; confirm.
@inproceedings{bagnell2005robust,
  author = {J Andrew Bagnell},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {714--719},
  title = {Robust supervised learning},
  year = {2005},
}

@inproceedings{zhang2017understanding,
  author = {Chiyuan Zhang and Samy Bengio and Moritz Hardt and Benjamin Recht and Oriol Vinyals},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Understanding deep learning requires rethinking generalization},
  year = {2017},
}

@inproceedings{hoffer2017train,
  author = {Elad Hoffer and Itay Hubara and Daniel Soudry},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1731--1741},
  title = {Train longer, generalize better: closing the generalization gap in large batch training of neural networks},
  year = {2017},
}

@techreport{wah2011cub,
  author = {C Wah and S Branson and P Welinder and P Perona and S Belongie},
  institution = {California Institute of Technology},
  title = {The {Caltech}-{UCSD} {Birds}-200-2011 dataset},
  year = {2011},
}
@article{zhou2017places,
  author = {Bolei Zhou and Agata Lapedriza and Aditya Khosla and Aude Oliva and Antonio Torralba},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  number = {6},
  pages = {1452--1464},
  title = {Places: A 10 million image database for scene recognition},
  volume = {40},
  year = {2017},
}

% liu2015deep: booktitle normalised to the ICCV form already used elsewhere in this file.
@inproceedings{liu2015deep,
  author = {Ziwei Liu and Ping Luo and Xiaogang Wang and Xiaoou Tang},
  booktitle = {International Conference on Computer Vision (ICCV)},
  pages = {3730--3738},
  title = {Deep learning face attributes in the wild},
  year = {2015},
}

@inproceedings{byrd2019effect,
  author = {Jonathon Byrd and Zachary Lipton},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {872--881},
  title = {What is the Effect of Importance Weighting in Deep Learning?},
  year = {2019},
}

% shen2016relay: booktitle normalised to the ECCV form already used elsewhere in this file.
@inproceedings{shen2016relay,
  author = {Li Shen and Zhouchen Lin and Qingming Huang},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages = {467--482},
  title = {Relay backpropagation for effective learning of deep convolutional neural networks},
  year = {2016},
}

@article{buda2018systematic,
  author = {Mateusz Buda and Atsuto Maki and Maciej A Mazurowski},
  journal = {Neural Networks},
  pages = {249--259},
  title = {A systematic study of the class imbalance problem in convolutional neural networks},
  volume = {106},
  year = {2018},
}

% bertsekas2009convex: the publisher city had been glued onto the publisher name; split into address.
@book{bertsekas2009convex,
  address = {Belmont, MA},
  author = {Dimitri P Bertsekas},
  publisher = {Athena Scientific},
  title = {Convex Optimization Theory},
  year = {2009},
}

@inproceedings{cao2019learning,
  author = {Kaidi Cao and Colin Wei and Adrien Gaidon and Nikos Arechiga and Tengyu Ma},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Learning Imbalanced Datasets with Label-Distribution-Aware Margin Loss},
  year = {2019},
}

@inproceedings{cui2019class, author = {Yin Cui and Menglin Jia and Tsung-Yi Lin and Yang Song and Serge Belongie}, booktitle = {Computer Vision and
Pattern Recognition (CVPR)}, pages = {9268--9277}, title = {Class-balanced loss based on effective number of samples}, year = {2019}, }

@article{radford2019language,
  author = {Alec Radford and Jeffrey Wu and Rewon Child and David Luan and Dario Amodei and Ilya Sutskever},
  journal = {OpenAI Blog},
  number = {8},
  title = {Language models are unsupervised multitask learners},
  volume = {1},
  year = {2019},
}

% vapnik1992principles: booktitle normalised to the NeurIPS form used by the other entries.
@inproceedings{vapnik1992principles,
  author = {Vladimir Vapnik},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {831--838},
  title = {Principles of risk minimization for learning theory},
  year = {1992},
}

% gururangan2018annotation: this paper appeared at NAACL 2018 (pages 107--112), not ACL.
@inproceedings{gururangan2018annotation,
  author = {Suchin Gururangan and Swabha Swayamdipta and Omer Levy and Roy Schwartz and Samuel Bowman and Noah A Smith},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {107--112},
  title = {Annotation Artifacts in Natural Language Inference Data},
  year = {2018},
}

@inproceedings{naik2018stress,
  author = {Aakanksha Naik and Abhilasha Ravichander and Norman Sadeh and Carolyn Rose and Graham Neubig},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages = {2340--2353},
  title = {Stress Test Evaluation for Natural Language Inference},
  year = {2018},
}

@article{merler2019diversity,
  author = {Michele Merler and Nalini Ratha and Rogerio S Feris and John R Smith},
  journal = {arXiv preprint arXiv:1901.10436},
  title = {Diversity in faces},
  year = {2019},
}

% dosovitskiy2017carla: acronym brace-protected so sentence-casing styles keep it upper-case.
@inproceedings{dosovitskiy2017carla,
  author = {Alexey Dosovitskiy and German Ros and Felipe Codevilla and Antonio Lopez and Vladlen Koltun},
  booktitle = {Conference on Robot Learning},
  pages = {1--16},
  title = {{CARLA}: An Open Urban Driving Simulator},
  year = {2017},
}

@inproceedings{agarwal2018reductions, author = {Alekh Agarwal and Alina Beygelzimer and Miroslav Dudik and John Langford and Hanna Wallach}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {60--69}, title = {A
Reductions Approach to Fair Classification}, year = {2018}, }

@article{hicks2017missing,
  author = {Stephanie C Hicks and F William Townes and Mingxiang Teng and Rafael A Irizarry},
  journal = {Biostatistics},
  number = {4},
  pages = {562--578},
  title = {Missing data and technical variability in single-cell {RNA}-sequencing experiments},
  volume = {19},
  year = {2017},
}

@article{meyer2014identifying,
  author = {Clifford A Meyer and X Shirley Liu},
  journal = {Nature Reviews Genetics},
  number = {11},
  pages = {709--721},
  title = {Identifying and mitigating bias in next-generation sequencing methods for chromatin biology},
  volume = {15},
  year = {2014},
}

@article{brunet2018understanding,
  author = {Marc-Etienne Brunet and Colleen Alkalay-Houlihan and Ashton Anderson and Richard Zemel},
  journal = {arXiv preprint arXiv:1810.03611},
  title = {Understanding the origins of bias in word embeddings},
  year = {2018},
}

@article{giordano2019higher,
  author = {Ryan Giordano and Michael I Jordan and Tamara Broderick},
  journal = {arXiv preprint arXiv:1907.12116},
  title = {A Higher-Order {Swiss Army} Infinitesimal Jackknife},
  year = {2019},
}

@article{badgeley2019deep,
  author = {Marcus A Badgeley and John R Zech and Luke Oakden-Rayner and Benjamin S Glicksberg and Manway Liu and William Gale and Michael V McConnell and Bethany Percha and Thomas M Snyder and Joel T Dudley},
  journal = {npj Digital Medicine},
  title = {Deep learning predicts hip fracture using confounding patient and healthcare variables},
  volume = {2},
  year = {2019},
}

@article{blanchet2019quantifying,
  author = {Jose Blanchet and Karthyek Murthy},
  journal = {Mathematics of Operations Research},
  number = {2},
  pages = {565--600},
  title = {Quantifying distributional model risk via optimal transport},
  volume = {44},
  year = {2019},
}

% devlin2019bert: the paper appeared at NAACL 2019 (pages 4171--4186), not ACL; venue corrected.
@inproceedings{devlin2019bert, author = {Jacob Devlin and Ming-Wei Chang and Kenton Lee and Kristina Toutanova}, booktitle = {North American Association for Computational Linguistics (NAACL)}, pages = {4171--4186},
title = {{BERT}: Pre-training of Deep Bidirectional Transformers for Language Understanding}, year = {2019}, }

@inproceedings{hardt2016train,
  author = {Moritz Hardt and Ben Recht and Yoram Singer},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1225--1234},
  title = {Train faster, generalize better: Stability of stochastic gradient descent},
  year = {2016},
}

@article{heinze2017conditional,
  author = {Christina Heinze-Deml and Nicolai Meinshausen},
  journal = {arXiv preprint arXiv:1710.11469},
  title = {Conditional variance penalties and domain shift robustness},
  year = {2017},
}

@inproceedings{ioffe2015batch,
  author = {Sergey Ioffe and Christian Szegedy},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {448--456},
  title = {Batch Normalization: Accelerating Deep Network Training by Reducing Internal Covariate Shift},
  year = {2015},
}

% lecun2015deep: the missing page range was added.
@article{lecun2015deep,
  author = {Yann LeCun and Yoshua Bengio and Geoffrey Hinton},
  journal = {Nature},
  number = {7553},
  pages = {436--444},
  title = {Deep Learning},
  volume = {521},
  year = {2015},
}

@inproceedings{lampert2009learning,
  author = {Christoph H Lampert and Hannes Nickisch and Stefan Harmeling},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {951--958},
  title = {Learning to detect unseen object classes by between-class attribute transfer},
  year = {2009},
}

% kim2018interpretability: acronym brace-protected so sentence-casing styles keep it upper-case.
@inproceedings{kim2018interpretability,
  author = {Been Kim and Martin Wattenberg and Justin Gilmer and Carrie Cai and James Wexler and Fernanda Viegas and others},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {2668--2677},
  title = {Interpretability Beyond Feature Attribution: Quantitative Testing with Concept Activation Vectors ({TCAV})},
  year = {2018},
}

@inproceedings{bau2017network, author = {David Bau and Bolei Zhou and Aditya Khosla and Aude Oliva and Antonio Torralba}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {6541--6549}, title = {Network dissection:
Quantifying interpretability of deep visual representations}, year = {2017}, }

@inproceedings{fong2017interpretable,
  author = {Ruth C Fong and Andrea Vedaldi},
  booktitle = {International Conference on Computer Vision (ICCV)},
  pages = {3429--3437},
  title = {Interpretable explanations of black boxes by meaningful perturbation},
  year = {2017},
}

@article{nevitt2006osteoarthritis,
  author = {M Nevitt and David T Felson and Gayle Lester},
  journal = {Cohort study protocol},
  title = {The {Osteoarthritis Initiative}},
  year = {2006},
}

@article{pierson2019using,
  author = {Emma Pierson and David Cutler and Jure Leskovec and Sendhil Mullainathan and Ziad Obermeyer},
  journal = {NBER Machine Learning and Healthcare Conference},
  title = {Using machine learning to understand racial and socioeconomic differences in knee pain},
  year = {2019},
}

% kohn2016classifications: glued initials separated so each one is parsed as its own name token;
% journal name restored to its proper capitalisation.
@article{kohn2016classifications,
  author = {M D Kohn and A A Sassoon and N D Fernando},
  journal = {Clinical Orthopaedics and Related Research},
  number = {8},
  pages = {1886--1893},
  title = {Classifications in Brief: {Kellgren-Lawrence} Classification of Osteoarthritis},
  volume = {474},
  year = {2016},
}

% kellgren1957radiological: glued initials separated; the missing page range was added.
@article{kellgren1957radiological,
  author = {J H Kellgren and J S Lawrence},
  journal = {Annals of the Rheumatic Diseases},
  number = {4},
  pages = {494--502},
  title = {Radiological assessment of osteo-arthrosis},
  volume = {16},
  year = {1957},
}

@article{tiulpin2018automatic,
  author = {Aleksei Tiulpin and J{\'e}r{\^o}me Thevenot and Esa Rahtu and Petri Lehenkari and Simo Saarakkala},
  journal = {Scientific Reports},
  number = {1},
  pages = {1--10},
  title = {Automatic knee osteoarthritis diagnosis from plain radiographs: A deep learning-based approach},
  volume = {8},
  year = {2018},
}

% melis2018towards: the surname is the hyphenated Alvarez-Melis; written unhyphenated it was
% parsed as given names "David Alvarez" with surname "Melis".
@inproceedings{melis2018towards,
  author = {David Alvarez-Melis and Tommi Jaakkola},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {7775--7784},
  title = {Towards robust interpretability with self-explaining neural networks},
  year = {2018},
}
% de2018clinically: the non-ASCII curly apostrophe was replaced with an ASCII one (matching the
% spelling of the same author elsewhere in this file), and the compound surname De Fauw is braced
% so it is not split into given name "De" and surname "Fauw".
@article{de2018clinically,
  author = {Jeffrey {De Fauw} and Joseph R Ledsam and Bernardino Romera-Paredes and Stanislav Nikolov and Nenad Tomasev and Sam Blackwell and Harry Askham and Xavier Glorot and Brendan O'Donoghue and Daniel Visentin and others},
  journal = {Nature Medicine},
  number = {9},
  pages = {1342--1350},
  title = {Clinically applicable deep learning for diagnosis and referral in retinal disease},
  volume = {24},
  year = {2018},
}

% yi2018neural: acronym restored to upper-case and brace-protected.
@inproceedings{yi2018neural,
  author = {Kexin Yi and Jiajun Wu and Chuang Gan and Antonio Torralba and Pushmeet Kohli and Josh Tenenbaum},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1031--1042},
  title = {Neural-symbolic {VQA}: Disentangling reasoning from vision and language understanding},
  year = {2018},
}

@inproceedings{zhou2018interpretable,
  author = {Bolei Zhou and Yiyou Sun and David Bau and Antonio Torralba},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages = {119--134},
  title = {Interpretable basis decomposition for visual explanation},
  year = {2018},
}

@inproceedings{huang2016part,
  author = {Shaoli Huang and Zhe Xu and Dacheng Tao and Ya Zhang},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {1173--1182},
  title = {Part-stacked {CNN} for fine-grained visual categorization},
  year = {2016},
}

@inproceedings{sundararajan2017axiomatic,
  author = {Mukund Sundararajan and Ankur Taly and Qiqi Yan},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {3319--3328},
  title = {Axiomatic attribution for deep networks},
  year = {2017},
}

@article{bengio2013representation,
  author = {Yoshua Bengio and Aaron Courville and Pascal Vincent},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  number = {8},
  pages = {1798--1828},
  title = {Representation learning: A review and new perspectives},
  volume = {35},
  year = {2013},
}

@inproceedings{cui2018large, author = {Yin Cui and Yang Song and Chen Sun and Andrew Howard and
Serge Belongie}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {4109--4118}, title = {Large scale fine-grained categorization and domain-specific transfer learning}, year = {2018}, }

% zelenko2003kernel: the placeholder issue number 0 was removed; it is not a real issue and
% would be printed as "3(0)" by most styles.
@article{zelenko2003kernel,
  author = {Dmitry Zelenko and Chinatsu Aone and Anthony Richardella},
  journal = {Journal of Machine Learning Research},
  pages = {1083--1106},
  title = {Kernel methods for relation extraction},
  volume = {3},
  year = {2003},
}

@inproceedings{bunescu2005shortest,
  author = {Razvan C Bunescu and Raymond J Mooney},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {724--731},
  title = {A shortest path dependency kernel for relation extraction},
  year = {2005},
}

@inproceedings{sutton2005joint,
  author = {Charles Sutton and Andrew McCallum},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  title = {Joint Parsing and Semantic Role Labeling},
  year = {2005},
}

% lindley1956measure: the missing volume and issue number were added.
@article{lindley1956measure,
  author = {Dennis V Lindley},
  journal = {The Annals of Mathematical Statistics},
  number = {4},
  pages = {986--1005},
  title = {On a measure of the information provided by an experiment},
  volume = {27},
  year = {1956},
}

@article{japkowicz2002class,
  author = {Nathalie Japkowicz and Shaju Stephen},
  journal = {Intelligent Data Analysis},
  number = {5},
  pages = {429--449},
  title = {The class imbalance problem: A systematic study},
  volume = {6},
  year = {2002},
}

@article{arjovsky2019invariant,
  author = {Martin Arjovsky and L{\'e}on Bottou and Ishaan Gulrajani and David Lopez-Paz},
  journal = {arXiv preprint arXiv:1907.02893},
  title = {Invariant risk minimization},
  year = {2019},
}

@inproceedings{hendrycks2019benchmarking,
  author = {Dan Hendrycks and Thomas Dietterich},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Benchmarking neural network robustness to common corruptions and perturbations},
  year = {2019},
}

@article{yang2020rethinking, author = {Zitong Yang and Yaodong Yu and Chong You and Jacob Steinhardt
and Yi Ma}, journal = {arXiv preprint arXiv:2002.11328}, title = {Rethinking bias-variance trade-off for generalization of neural networks}, year = {2020}, }

% rosset2004margin: booktitle normalised to the NeurIPS form used by the other entries.
@inproceedings{rosset2004margin,
  author = {Saharon Rosset and Ji Zhu and Trevor J Hastie},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1237--1244},
  title = {Margin maximizing loss functions},
  year = {2004},
}

% chawla2002smote: journal name capitalised; acronym brace-protected.
@article{chawla2002smote,
  author = {Nitesh V Chawla and Kevin W Bowyer and Lawrence O Hall and W Philip Kegelmeyer},
  journal = {Journal of Artificial Intelligence Research},
  pages = {321--357},
  title = {{SMOTE}: synthetic minority over-sampling technique},
  volume = {16},
  year = {2002},
}

% haixiang2017learning: the byline prints family names first (Guo, Li, Gu, Huang, Gong), so the
% names are reordered to given-name-first to parse correctly. NOTE(review): confirm against the
% publisher record before relying on the new sort order.
@article{haixiang2017learning,
  author = {Haixiang Guo and Yijing Li and Jennifer Shang and Mingyun Gu and Yuanyue Huang and Bing Gong},
  journal = {Expert Systems with Applications},
  pages = {220--239},
  title = {Learning from class-imbalanced data: Review of methods and applications},
  volume = {73},
  year = {2017},
}

@article{losch2019interpretability,
  author = {Max Losch and Mario Fritz and Bernt Schiele},
  journal = {arXiv preprint arXiv:1907.10882},
  title = {Interpretability beyond classification output: Semantic bottleneck networks},
  year = {2019},
}

@article{chen2020concept,
  author = {Zhi Chen and Yijie Bei and Cynthia Rudin},
  journal = {arXiv preprint arXiv:2002.01650},
  title = {Concept Whitening for Interpretable Image Recognition},
  year = {2020},
}

@inproceedings{bucher2018semantic,
  author = {Maxime Bucher and St{\'e}phane Herbin and Fr{\'e}d{\'e}ric Jurie},
  booktitle = {Asian Conference on Computer Vision},
  pages = {695--712},
  title = {Semantic bottleneck for computer vision tasks},
  year = {2018},
}

@article{goyal2019explaining,
  author = {Yash Goyal and Uri Shalit and Been Kim},
  journal = {arXiv preprint arXiv:1907.07165},
  title = {Explaining classifiers with causal concept effect ({CaCE})},
  year = {2019},
}

@inproceedings{duan2012discovering, author = {Kun Duan and Devi Parikh and David
Crandall and Kristen Grauman}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {3474--3481}, title = {Discovering localized attributes for fine-grained recognition}, year = {2012}, }

@inproceedings{graziani2018regression,
  author = {Mara Graziani and Vincent Andrearczyk and Henning M{\"u}ller},
  booktitle = {Understanding and Interpreting Machine Learning in Medical Image Computing Applications},
  pages = {124--132},
  title = {Regression concept vectors for bidirectional explanations in histopathology},
  year = {2018},
}

@inproceedings{clough2019global,
  author = {James R Clough and Ilkay Oksuz and Esther Puyol-Ant{\'o}n and Bram Ruijsink and Andrew P King and Julia A Schnabel},
  booktitle = {International Conference on Medical Image Computing and Computer-Assisted Intervention},
  pages = {656--664},
  title = {Global and local interpretability for cardiac {MRI} classification},
  year = {2019},
}

@inproceedings{sprague2019interpretable,
  author = {Conner Sprague and Eric B Wendoloski and Ingrid Guch},
  booktitle = {99th American Meteorological Society Annual Meeting},
  title = {Interpretable {AI} for Deep Learning-Based Meteorological Applications},
  year = {2019},
}

@article{o2020generative,
  author = {Matthew O'Shaughnessy and Gregory Canal and Marissa Connor and Mark Davenport and Christopher Rozell},
  journal = {arXiv preprint arXiv:2006.13913},
  title = {Generative causal explanations of black-box classifiers},
  year = {2020},
}

@inproceedings{ghorbani2019towards,
  author = {Amirata Ghorbani and James Wexler and James Y Zou and Been Kim},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {9277--9286},
  title = {Towards automatic concept-based explanations},
  year = {2019},
}

@inproceedings{higgins2017beta, author = {Irina Higgins and Loic Matthey and Arka Pal and Christopher Burgess and Xavier Glorot and Matthew Botvinick and Shakir Mohamed and Alexander Lerchner}, booktitle = {International Conference on Learning
Representations (ICLR)}, title = {beta-vae: Learning basic visual concepts with a constrained variational framework}, year = {2017}, }

@inproceedings{chen2016infogan,
  author = {Xi Chen and Yan Duan and Rein Houthooft and John Schulman and Ilya Sutskever and Pieter Abbeel},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{InfoGAN}: Interpretable representation learning by information maximizing generative adversarial nets},
  year = {2016},
}

@article{joshi2018xgems,
  author = {Shalmali Joshi and Oluwasanmi Koyejo and Been Kim and Joydeep Ghosh},
  journal = {arXiv preprint arXiv:1806.08867},
  title = {{xGEMs}: Generating examplars to explain black-box models},
  year = {2018},
}

@inproceedings{borkan2019nuanced,
  author = {Daniel Borkan and Lucas Dixon and Jeffrey Sorensen and Nithum Thain and Lucy Vasserman},
  booktitle = {World Wide Web (WWW)},
  pages = {491--500},
  title = {Nuanced metrics for measuring unintended bias with real data for text classification},
  year = {2019},
}

@article{mozannar2020consistent,
  author = {Hussein Mozannar and David Sontag},
  journal = {arXiv preprint arXiv:2006.01862},
  title = {Consistent Estimators for Learning to Defer to an Expert},
  year = {2020},
}

% irvin2019chexpert: the dataset name is spelled CheXpert; mixed-case spelling restored and
% brace-protected, as is already done for InfoGAN and xGEMs in this file.
@inproceedings{irvin2019chexpert,
  author = {Jeremy Irvin and Pranav Rajpurkar and Michael Ko and Yifan Yu and Silviana Ciurea-Ilcus and Chris Chute and Henrik Marklund and Behzad Haghgoo and Robyn Ball and Katie Shpanskaya and others},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {590--597},
  title = {{CheXpert}: A large chest radiograph dataset with uncertainty labels and expert comparison},
  volume = {33},
  year = {2019},
}

@article{porcel2018chest,
  author = {Jos{\'e} M Porcel},
  journal = {Tuberculosis and Respiratory Diseases},
  number = {2},
  pages = {106--115},
  title = {Chest tube drainage of the pleural space: a concise review for pulmonologists},
  volume = {81},
  year = {2018},
}

@inproceedings{oakden2020hidden, author =
{Luke Oakden-Rayner and Jared Dunnmon and Gustavo Carneiro and Christopher R{\'e}}, booktitle = {Proceedings of the ACM Conference on Health, Inference, and Learning}, pages = {151--159}, title = {Hidden stratification causes clinically meaningful failures in machine learning for medical imaging}, year = {2020}, }

% huang2017densely: booktitle normalised to the CVPR form used by the other entries; the
% lower-case particles in "van der Maaten" let the surname parse as von + Last instead of
% surname "Maaten" with "Van Der" folded into the given names.
@inproceedings{huang2017densely,
  author = {Gao Huang and Zhuang Liu and Laurens van der Maaten and Kilian Q Weinberger},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {4700--4708},
  title = {Densely connected convolutional networks},
  year = {2017},
}

@article{chen2020ethical,
  author = {Irene Y Chen and Emma Pierson and Sherri Rose and Shalmali Joshi and Kadija Ferryman and Marzyeh Ghassemi},
  journal = {arXiv preprint arXiv:2009.10576},
  title = {Ethical Machine Learning in Health},
  year = {2020},
}

@article{hill2020wrongfully,
  author = {Kashmir Hill},
  journal = {The New York Times},
  title = {Wrongfully Accused by an Algorithm},
  url = {https://www.nytimes.com/2020/06/24/technology/facial-recognition-arrest.html},
  year = {2020},
}

@article{nyt2016jigsaw,
  author = {{The New York Times Company}},
  journal = {The New York Times},
  title = {The Times is Partnering with Jigsaw to Expand Comment Capabilities},
  url = {https://www.nytco.com/press/the-times-is-partnering-with-jigsaw-to-expand-comment-capabilities/},
  year = {2016},
}

@article{broussard2020grades,
  author = {Meredith Broussard},
  journal = {The New York Times},
  title = {When Algorithms Give Real Students Imaginary Grades},
  url = {https://www.nytimes.com/2020/09/08/opinion/international-baccalaureate-algorithm-grades.html},
  year = {2020},
}

% bbc2020gcse: corporate author double-braced like the New York Times entry above; the
% acronym in the title is brace-protected.
@article{bbc2020gcse,
  author = {{BBC}},
  journal = {The British Broadcasting Corporation},
  title = {A-levels and {GCSEs}: How did the exam algorithm work?},
  url = {https://www.bbc.com/news/explainers-53807730},
  year = {2020},
}

@article{npr2018grading, author = {NPR}, journal = {National Public Radio}, title = {More States
Opting To 'Robo-Grade' Student Essays By Computer}, url = {https://www.npr.org/2018/06/30/624373367/more-states-opting-to-robo-grade-student-essays-by-computer}, year = {2018}, }

% de2000reject: the compound surname De Stefano is braced so it is not split; the degraded
% dash in the title is restored as an em dash.
@article{de2000reject,
  author = {Claudio {De Stefano} and Carlo Sansone and Mario Vento},
  journal = {IEEE Transactions on Systems, Man, and Cybernetics, Part C (Applications and Reviews)},
  number = {1},
  pages = {84--94},
  title = {To reject or not to reject: that is the question---an answer in case of neural classifiers},
  volume = {30},
  year = {2000},
}

% bartlett2008classification: the placeholder issue number 0 was removed; it is not a real issue.
@article{bartlett2008classification,
  author = {Peter L Bartlett and Marten H Wegkamp},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {1823--1840},
  title = {Classification with a reject option using a hinge loss},
  volume = {9},
  year = {2008},
}

@inproceedings{raghu2019direct,
  author = {Maithra Raghu and Katy Blumer and Rory Sayres and Ziad Obermeyer and Bobby Kleinberg and Sendhil Mullainathan and Jon Kleinberg},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {5281--5290},
  title = {Direct uncertainty prediction for medical second opinions},
  year = {2019},
}

@inproceedings{geifman2018bias,
  author = {Yonatan Geifman and Guy Uziel and Ran El-Yaniv},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Bias-Reduced Uncertainty Estimation for Deep Neural Classifiers},
  year = {2018},
}

@inproceedings{de2020regression,
  author = {Abir De and Paramita Koley and Niloy Ganguly and Manuel Gomez-Rodriguez},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {2611--2620},
  title = {Regression under Human Assistance},
  year = {2020},
}

% pimentel2014review: glued initials separated so each one is parsed as its own name token.
@article{pimentel2014review,
  author = {Marco A F Pimentel and David A Clifton and Lei Clifton and Lionel Tarassenko},
  journal = {Signal Processing},
  pages = {215--249},
  title = {A review of novelty detection},
  volume = {99},
  year = {2014},
}

@article{hellman1970nearest, author = {Martin E Hellman},
journal = {IEEE Transactions on Systems Science and Cybernetics}, number = {3}, pages = {179--185}, title = {The nearest neighbor classification rule with a reject option}, volume = {6}, year = {1970}, }

% hellman1970probability: proper noun brace-protected so sentence-casing styles keep its capital.
@article{hellman1970probability,
  author = {Martin Hellman and Josef Raviv},
  journal = {IEEE Transactions on Information Theory},
  number = {4},
  pages = {368--372},
  title = {Probability of error, equivocation, and the {Chernoff} bound},
  volume = {16},
  year = {1970},
}

% cordella1995method: the compound surname De Stefano is braced so it is not split.
@article{cordella1995method,
  author = {Luigi Pietro Cordella and Claudio {De Stefano} and Francesco Tortorella and Mario Vento},
  journal = {IEEE Transactions on Neural Networks},
  number = {5},
  pages = {1140--1147},
  title = {A method for improving classification reliability of multilayer perceptrons},
  volume = {6},
  year = {1995},
}

@inproceedings{park2018reducing,
  author = {Ji Ho Park and Jamin Shin and Pascale Fung},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {2799--2804},
  title = {Reducing Gender Bias in Abusive Language Detection},
  year = {2018},
}

@inproceedings{hovy2016social,
  author = {Dirk Hovy and Shannon L Spruit},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {591--598},
  title = {The social impact of natural language processing},
  year = {2016},
}

% koenecke2020racial: the missing volume, issue number and page range were added.
@article{koenecke2020racial,
  author = {Allison Koenecke and Andrew Nam and Emily Lake and Joe Nudell and Minnie Quartey and Zion Mengesha and Connor Toups and John R Rickford and Dan Jurafsky and Sharad Goel},
  journal = {Proceedings of the National Academy of Sciences},
  number = {14},
  pages = {7684--7689},
  title = {Racial disparities in automated speech recognition},
  volume = {117},
  year = {2020},
}

@inproceedings{conneau2019cross,
  author = {Alexis Conneau and Guillaume Lample},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {7059--7069},
  title = {Cross-lingual language model pretraining},
  year = {2019},
}

@inproceedings{conneau2018xnli, author = {Alexis Conneau and Ruty Rinott and Guillaume Lample and Adina
Williams and Samuel Bowman and Holger Schwenk and Veselin Stoyanov}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, pages = {2475--2485}, title = {XNLI: Evaluating Cross-lingual Sentence Representations}, year = {2018}, }

% hu2020xtreme: benchmark name restored to its upper-case spelling and brace-protected.
@article{hu2020xtreme,
  author = {Junjie Hu and Sebastian Ruder and Aditya Siddhant and Graham Neubig and Orhan Firat and Melvin Johnson},
  journal = {arXiv preprint arXiv:2003.11080},
  title = {{XTREME}: A massively multilingual multi-task benchmark for evaluating cross-lingual generalization},
  year = {2020},
}

% clark2020tydi: dataset name brace-protected so sentence-casing styles keep its mixed case.
@article{clark2020tydi,
  author = {Jonathan H Clark and Eunsol Choi and Michael Collins and Dan Garrette and Tom Kwiatkowski and Vitaly Nikolaev and Jennimaria Palomaki},
  journal = {arXiv preprint arXiv:2003.05002},
  title = {{TyDi QA}: A benchmark for information-seeking question answering in typologically diverse languages},
  year = {2020},
}

% ribeiro2020beyond: the whole word is braced instead of single letters inside it.
@inproceedings{ribeiro2020beyond,
  author = {Marco Tulio Ribeiro and Tongshuang Wu and Carlos Guestrin and Sameer Singh},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {4902--4912},
  title = {Beyond Accuracy: Behavioral Testing of {NLP} Models with {CheckList}},
  year = {2020},
}

@article{nestor2019feature,
  author = {Bret Nestor and Matthew McDermott and Willie Boag and Gabriela Berner and Tristan Naumann and Michael C Hughes and Anna Goldenberg and Marzyeh Ghassemi},
  journal = {arXiv preprint arXiv:1908.00690},
  title = {Feature robustness in non-stationary health records: caveats to deployable model performance in common clinical machine learning tasks},
  year = {2019},
}

% veeling2018rotation: booktitle capitalised to match the other entries for this conference in
% this file; acronym in the title brace-protected.
@inproceedings{veeling2018rotation,
  author = {Bastiaan S Veeling and Jasper Linmans and Jim Winkens and Taco Cohen and Max Welling},
  booktitle = {International Conference on Medical Image Computing and Computer-Assisted Intervention},
  pages = {210--218},
  title = {Rotation equivariant {CNNs} for digital pathology},
  year = {2018},
}

@article{tellez2019quantifying, author = {David Tellez and Geert
Litjens and P{\'e}ter B{\'a}ndi and Wouter Bulten and John-Melle Bokhorst and Francesco Ciompi and Jeroen van der Laak}, journal = {Medical Image Analysis}, title = {Quantifying the effects of data augmentation and stain color normalization in convolutional neural networks for computational pathology}, volume = {58}, year = {2019}, }

% bandi2018detection: first author spelled with accents, matching the spelling of the same
% person in the preceding entry; Dutch particle in "van Dijk" lower-cased so the surname
% parses as von + Last.
@article{bandi2018detection,
  author = {P{\'e}ter B{\'a}ndi and Oscar Geessink and Quirine Manson and Marcory van Dijk and Maschenka Balkenhol and Meyke Hermsen and Babak Ehteshami Bejnordi and Byungjae Lee and Kyunghyun Paeng and Aoxiao Zhong and others},
  journal = {IEEE Transactions on Medical Imaging},
  number = {2},
  pages = {550--560},
  title = {From detection of individual metastases to classification of lymph node status at the patient level: the {CAMELYON17} challenge},
  volume = {38},
  year = {2018},
}

% litjens2018camelyon: this data note was published in GigaScience 7(6), not in Science;
% author spelling aligned with the entries above; staining abbreviation brace-protected.
@article{litjens2018camelyon,
  author = {Geert Litjens and P{\'e}ter B{\'a}ndi and Babak Ehteshami Bejnordi and Oscar Geessink and Maschenka Balkenhol and Peter Bult and Altuna Halilovic and Meyke Hermsen and Rob van de Loo and Rob Vogels and others},
  journal = {GigaScience},
  number = {6},
  title = {1399 {H\&E}-stained sentinel lymph node sections of breast cancer patients: the {CAMELYON} dataset},
  volume = {7},
  year = {2018},
}

% tellez2018whole: the umlaut escape had a doubled backslash, which LaTeX reads as a line
% break followed by a literal quote and o; reduced to a single-backslash accent. Journal name
% capitalised to match bandi2018detection; abbreviations in the title brace-protected.
@article{tellez2018whole,
  author = {David Tellez and Maschenka Balkenhol and Irene Otte-H{\"o}ller and Rob van de Loo and Rob Vogels and Peter Bult and Carla Wauters and Willem Vreuls and Suzanne Mol and Nico Karssemeijer and others},
  journal = {IEEE Transactions on Medical Imaging},
  number = {9},
  pages = {2126--2136},
  title = {Whole-slide mitosis detection in {H\&E} breast histology using {PHH3} as a reference to train distilled stain-invariant convolutional networks},
  volume = {37},
  year = {2018},
}

@article{weinstein2013cancer, author = {John N Weinstein and Eric A Collisson and Gordon B Mills and Kenna R Mills Shaw and Brad A Ozenberger and Kyle Ellrott and Ilya Shmulevich and Chris Sander and Joshua M Stuart and Cancer Genome Atlas
Research Network and others}, journal = {Nature genetics}, number = {10}, title = {The cancer genome atlas pan-cancer analysis project}, volume = {45}, year = {2013}, }

@article{esteva2017dermatologist,
  author = {Andre Esteva and Brett Kuprel and Roberto A Novoa and Justin Ko and Susan M Swetter and Helen M Blau and Sebastian Thrun},
  journal = {Nature},
  number = {7639},
  pages = {115--118},
  title = {Dermatologist-level classification of skin cancer with deep neural networks},
  volume = {542},
  year = {2017},
}

% codella2019skin: organisation name and its acronym restored to proper case and brace-protected.
@article{codella2019skin,
  author = {Noel Codella and Veronica Rotemberg and Philipp Tschandl and M Emre Celebi and Stephen Dusza and David Gutman and Brian Helba and Aadi Kalloo and Konstantinos Liopyris and Michael Marchetti and others},
  journal = {arXiv preprint arXiv:1902.03368},
  title = {Skin lesion analysis toward melanoma detection 2018: A challenge hosted by the {International Skin Imaging Collaboration} ({ISIC})},
  year = {2019},
}

% campanella2019clinical: journal name capitalised to match the other Nature Medicine entry
% in this file.
@article{campanella2019clinical,
  author = {Gabriele Campanella and Matthew G Hanna and Luke Geneslaw and Allen Miraflor and Vitor Werneck Krauss Silva and Klaus J Busam and Edi Brogi and Victor E Reuter and David S Klimstra and Thomas J Fuchs},
  journal = {Nature Medicine},
  number = {8},
  pages = {1301--1309},
  title = {Clinical-grade computational pathology using weakly supervised deep learning on whole slide images},
  volume = {25},
  year = {2019},
}

% beck2011systematic: volume 3, issue 108 belongs to Science Translational Medicine, not
% Science; Dutch particles lower-cased so the surnames parse as von + Last.
@article{beck2011systematic,
  author = {Andrew H Beck and Ankur R Sangoi and Samuel Leung and Robert J Marinelli and Torsten O Nielsen and Marc J van de Vijver and Robert B West and Matt van de Rijn and Daphne Koller},
  journal = {Science Translational Medicine},
  number = {108},
  title = {Systematic analysis of breast cancer morphology uncovers stromal features associated with survival},
  volume = {3},
  year = {2011},
}

@article{janowczyk2016deep, author = {Andrew Janowczyk and Anant Madabhushi}, journal = {Journal of pathology informatics}, title = {Deep learning for digital pathology image analysis: A
comprehensive tutorial with selected use cases}, volume = {7}, year = {2016}, }

% gurcan2009histopathological: journal name restored to its proper capitalisation.
@article{gurcan2009histopathological,
  author = {Metin N Gurcan and Laura E Boucheron and Ali Can and Anant Madabhushi and Nasir M Rajpoot and Bulent Yener},
  journal = {IEEE Reviews in Biomedical Engineering},
  pages = {147--171},
  title = {Histopathological image analysis: A review},
  volume = {2},
  year = {2009},
}

@inproceedings{thagaard2020can,
  author = {Jeppe Thagaard and S{\o}ren Hauberg and Bert van der Vegt and Thomas Ebstrup and Johan D Hansen and Anders B Dahl},
  booktitle = {International Conference on Medical Image Computing and Computer-Assisted Intervention},
  pages = {824--833},
  title = {Can you trust predictive uncertainty under real dataset shifts in digital pathology?},
  year = {2020},
}

% phillips2020chexphoto: the dataset name is spelled CheXphoto; mixed-case spelling restored
% and brace-protected.
@article{phillips2020chexphoto,
  author = {Nick A Phillips and Pranav Rajpurkar and Mark Sabini and Rayan Krishnan and Sharon Zhou and Anuj Pareek and Nguyet Minh Phu and Chris Wang and Andrew Y Ng and Matthew P Lungren},
  journal = {arXiv preprint arXiv:2007.06199},
  title = {{CheXphoto}: 10,000+ smartphone photos and synthetic photographic transformations of chest x-rays for benchmarking deep learning robustness},
  year = {2020},
}

@article{zhou2020curse,
  author = {Xiang Zhou and Yixin Nie and Hao Tan and Mohit Bansal},
  journal = {arXiv preprint arXiv:2004.13606},
  title = {The Curse of Performance Instability in Analysis Datasets: Consequences, Source, and Suggestions},
  year = {2020},
}

% bejnordi2017diagnostic: journal acronym restored to upper-case and braced; Dutch particles
% lower-cased (matching "van der Laak" elsewhere in this file) so surnames parse as
% von + Last; glued initials separated.
@article{bejnordi2017diagnostic,
  author = {Babak Ehteshami Bejnordi and Mitko Veta and Paul Johannes van Diest and Bram van Ginneken and Nico Karssemeijer and Geert Litjens and Jeroen A W M van der Laak and Meyke Hermsen and Quirine F Manson and Maschenka Balkenhol and others},
  journal = {{JAMA}},
  number = {22},
  pages = {2199--2210},
  title = {Diagnostic assessment of deep learning algorithms for detection of lymph node metastases in women with breast cancer},
  volume = {318},
  year = {2017},
}
% One field per line; braces inside titles protect acronyms and dataset names
% from styles that sentence-case titles.

@article{veta2019predicting,
  author = {Mitko Veta and Yujing J Heng and Nikolas Stathonikos and Babak Ehteshami Bejnordi and Francisco Beca and Thomas Wollmann and Karl Rohr and Manan A Shah and Dayong Wang and Mikael Rousson and others},
  journal = {Medical image analysis},
  pages = {111--121},
  title = {Predicting breast tumor proliferation from whole-slide images: the {TUPAC16} challenge},
  volume = {54},
  year = {2019},
}

@article{komura2018machine,
  author = {Daisuke Komura and Shumpei Ishikawa},
  journal = {Computational and structural biotechnology journal},
  pages = {34--42},
  title = {Machine learning methods for histopathological image analysis},
  volume = {16},
  year = {2018},
}

@article{veta2016mitosis,
  author = {Mitko Veta and Paul J Van Diest and Mehdi Jiwa and Shaimaa Al-Janabi and Josien PW Pluim},
  journal = {PLoS ONE},
  number = {8},
  title = {Mitosis counting in breast cancer: Object-level interobserver agreement and comparison to an automatic method},
  volume = {11},
  year = {2016},
}

@inproceedings{beede2020human,
  author = {Emma Beede and Elizabeth Baylor and Fred Hersch and Anna Iurchenko and Lauren Wilcox and Paisan Ruamviboonsuk and Laura M Vardoulakis},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  pages = {1--12},
  title = {A Human-Centered Evaluation of a Deep Learning System Deployed in Clinics for the Detection of Diabetic Retinopathy},
  year = {2020},
}

@article{bentaieb2017adversarial,
  author = {A{\"\i}cha BenTaieb and Ghassan Hamarneh},
  journal = {IEEE transactions on medical imaging},
  number = {3},
  pages = {792--802},
  title = {Adversarial stain transfer for histopathology image analysis},
  volume = {37},
  year = {2017},
}

@article{liu2017detecting,
  author = {Yun Liu and Krishna Gadepalli and Mohammad Norouzi and George E Dahl and Timo Kohlberger and Aleksey Boyko and Subhashini Venugopalan and Aleksei Timofeev and Philip Q Nelson and Greg S Corrado and others},
  journal = {arXiv preprint arXiv:1703.02442},
  title = {Detecting cancer metastases on gigapixel pathology images},
  year = {2017},
}

% Chapter in a workshop proceedings volume, so the venue goes in booktitle.
@inproceedings{bug2017context,
  author = {Daniel Bug and Steffen Schneider and Anne Grote and Eva Oswald and Friedrich Feuerhake and Julia Sch{\"u}ler and Dorit Merhof},
  booktitle = {Deep Learning in Medical Image Analysis and Multimodal Learning for Clinical Decision Support},
  pages = {135--142},
  title = {Context-based normalization of histological stains using deep convolutional features},
  year = {2017},
}

@inproceedings{macenko2009method,
  author = {Marc Macenko and Marc Niethammer and James S Marron and David Borland and John T Woosley and Xiaojun Guan and Charles Schmitt and Nancy E Thomas},
  booktitle = {2009 IEEE International Symposium on Biomedical Imaging: From Nano to Macro},
  pages = {1107--1110},
  title = {A method for normalizing histology slides for quantitative analysis},
  year = {2009},
}

@article{henderson2012influence,
  author = {Brian E Henderson and Norman H Lee and Victoria Seewaldt and Hongbing Shen},
  journal = {Nature Reviews Cancer},
  number = {9},
  pages = {648--653},
  title = {The influence of race and ethnicity on the biology of cancer},
  volume = {12},
  year = {2012},
}

@article{kim2020cogs,
  author = {Najoung Kim and Tal Linzen},
  journal = {arXiv preprint arXiv:2010.05465},
  title = {{COGS}: A Compositional Generalization Challenge Based on Semantic Interpretation},
  year = {2020},
}

@article{mckinney2020international,
  author = {Scott Mayer McKinney and Marcin Sieniek and Varun Godbole and Jonathan Godwin and Natasha Antropova and Hutan Ashrafian and Trevor Back and Mary Chesus and Greg C Corrado and Ara Darzi and others},
  journal = {Nature},
  number = {7788},
  pages = {89--94},
  title = {International evaluation of an {AI} system for breast cancer screening},
  volume = {577},
  year = {2020},
}

@article{beery2020iwildcam,
  author = {Sara Beery and Elijah Cole and Arvi Gjoka},
  journal = {arXiv preprint arXiv:2004.10340},
  title = {The {iWildCam} 2020 Competition Dataset},
  year = {2020},
}
% One field per line; braces inside titles protect acronyms and proper nouns
% from styles that sentence-case titles. Non-ASCII characters are written as
% LaTeX escapes, matching the rest of the file.

@inproceedings{li2017deeper,
  author = {Da Li and Yongxin Yang and Yi-Zhe Song and Timothy M Hospedales},
  booktitle = {Proceedings of the IEEE international conference on computer vision},
  pages = {5542--5550},
  title = {Deeper, broader and artier domain generalization},
  year = {2017},
}

@article{hendrycks2020many,
  author = {Dan Hendrycks and Steven Basart and Norman Mu and Saurav Kadavath and Frank Wang and Evan Dorundo and Rahul Desai and Tyler Zhu and Samyak Parajuli and Mike Guo and Dawn Song and Jacob Steinhardt and Justin Gilmer},
  journal = {arXiv preprint arXiv:2006.16241},
  title = {The many faces of robustness: A critical analysis of out-of-distribution generalization},
  year = {2020},
}

@article{obermeyer2019dissecting,
  author = {Ziad Obermeyer and Brian Powers and Christine Vogeli and Sendhil Mullainathan},
  journal = {Science},
  number = {6464},
  pages = {447--453},
  title = {Dissecting racial bias in an algorithm used to manage the health of populations},
  volume = {366},
  year = {2019},
}

@article{bellamy2020evaluating,
  author = {David Bellamy and Leo Celi and Andrew L Beam},
  journal = {arXiv preprint arXiv:2010.01149},
  title = {Evaluating Progress on Machine Learning for Longitudinal Electronic Healthcare Data},
  year = {2020},
}

@article{chen2019can,
  author = {Irene Y Chen and Peter Szolovits and Marzyeh Ghassemi},
  journal = {AMA Journal of Ethics},
  number = {2},
  pages = {167--179},
  title = {Can {AI} help reduce disparities in general medical and mental health care?},
  volume = {21},
  year = {2019},
}

@article{seyyed2020chexclusion,
  author = {Laleh Seyyed-Kalantari and Guanxiong Liu and Matthew McDermott and Marzyeh Ghassemi},
  journal = {arXiv preprint arXiv:2003.00827},
  title = {{CheXclusion}: Fairness gaps in deep chest {X-ray} classifiers},
  year = {2020},
}

@article{larrazabal2020gender,
  author = {Agostina J Larrazabal and Nicol{\'a}s Nieto and Victoria Peterson and Diego H Milone and Enzo Ferrante},
  journal = {Proceedings of the National Academy of Sciences},
  title = {Gender imbalance in medical imaging datasets produces biased classifiers for computer-aided diagnosis},
  year = {2020},
}

@article{davis2017calibration,
  author = {Sharon E Davis and Thomas A Lasko and Guanhua Chen and Edward D Siew and Michael E Matheny},
  journal = {Journal of the American Medical Informatics Association},
  number = {6},
  pages = {1052--1061},
  title = {Calibration drift in regression and machine learning models for acute kidney injury},
  volume = {24},
  year = {2017},
}

@inproceedings{ardila2020common,
  author = {Rosana Ardila and Megan Branson and Kelly Davis and Michael Kohler and Josh Meyer and Michael Henretty and Reuben Morais and Lindsay Saunders and Francis Tyers and Gregor Weber},
  booktitle = {Language Resources and Evaluation Conference (LREC)},
  pages = {4218--4222},
  title = {{Common Voice}: A Massively-Multilingual Speech Corpus},
  year = {2020},
}

% Conference paper, so the venue goes in booktitle rather than journal.
@inproceedings{chung2018voxceleb2,
  author = {Joon Son Chung and Arsha Nagrani and Andrew Zisserman},
  booktitle = {Interspeech},
  pages = {1086--1090},
  title = {{VoxCeleb2}: Deep Speaker Recognition},
  year = {2018},
}

@article{weinberger2015speech,
  author = {Steven Weinberger},
  journal = {George Mason University},
  title = {Speech accent archive},
  year = {2015},
}

@inproceedings{panayotov2015librispeech,
  author = {Vassil Panayotov and Guoguo Chen and Daniel Povey and Sanjeev Khudanpur},
  booktitle = {International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  pages = {5206--5210},
  title = {Librispeech: an {ASR} corpus based on public domain audio books},
  year = {2015},
}

@article{baumann2019spoken,
  author = {Timo Baumann and Arne K{\"o}hn and Felix Hennig},
  journal = {Language Resources and Evaluation},
  number = {2},
  pages = {303--329},
  title = {The {Spoken Wikipedia Corpus} collection: Harvesting, alignment and an application to hyperlistening},
  volume = {53},
  year = {2019},
}

@inproceedings{rabanser2019failing,
  author = {Stephan Rabanser and Stephan G{\"u}nnemann and Zachary Lipton},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1396--1408},
  title = {Failing loudly: An empirical study of methods for detecting dataset shift},
  year = {2019},
}

@inproceedings{kaushik2019learning,
  author = {Divyansh Kaushik and Eduard Hovy and Zachary Lipton},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Learning The Difference That Makes A Difference With Counterfactually-Augmented Data},
  year = {2019},
}

@inproceedings{nekoto2020participatory,
  author = {Wilhelmina Nekoto and Vukosi Marivate and Tshinondiwa Matsila and Timi Fasubaa and Tajudeen Kolawole and Taiwo Fagbohungbe and Solomon Oluwole Akinola and Shamsuddee Hassan Muhammad and Salomon Kabongo and Salomey Osei and Sackey Freshia and Rubungo Andre Niyongabo and Ricky Macharm and Perez Ogayo and Orevaoghene Ahia and Musie Meressa and Mofe Adeyemi and Masabata Mokgesi-Selinga and Lawrence Okegbemi and Laura Jane Martinus and Kolawole Tajudeen and Kevin Degila and Kelechi Ogueji and Kathleen Siminyu and Julia Kreutzer and Jason Webster and Jamiil Toure Ali and Jade Abbott and Iroro Orife and Ignatius Ezeani and Idris Abdulkabir Dangana and Herman Kamper and Hady Elsahar and Goodness Duru and Ghollah Kioko and Espoir Murhabazi and Elan van Biljon and Daniel Whitenack and Christopher Onyefuluchi and Chris Emezue and Bonaventure Dossou and Blessing Sibanda and Blessing Itoro Bassey and Ayodele Olabiyi and Arshath Ramkilowan and Alp {\"O}ktem and Adewale Akinfaderin and Abdallah Bashir},
  booktitle = {Findings of Empirical Methods in Natural Language Processing (Findings of EMNLP)},
  title = {Participatory Research for Low-resourced Machine Translation: A Case Study in {African} Languages},
  year = {2020},
}

% Conference paper, so the venue goes in booktitle rather than journal.
@inproceedings{wu2020variational,
  author = {Mike Wu and Richard L Davis and Benjamin W Domingue and Chris Piech and Noah Goodman},
  booktitle = {International Conference on Educational Data Mining},
  title = {Variational Item Response Theory: Fast, Accurate, and Expressive},
  year = {2020},
}

@inproceedings{kulkarni2014scaling,
  author = {Chinmay E Kulkarni and Richard Socher and Michael S Bernstein and Scott R Klemmer},
  booktitle = {Proceedings of the first ACM conference on Learning@Scale conference},
  pages = {99--108},
  title = {Scaling short-answer grading by combining peer assessment with algorithmic scoring},
  year = {2014},
}

@article{shermis2014state,
  author = {Mark D Shermis},
  journal = {Assessing Writing},
  pages = {53--76},
  title = {State-of-the-art automated essay scoring: Competition, results, and future directions from a {United States} demonstration},
  volume = {20},
  year = {2014},
}

@inproceedings{taghipour2016neural,
  author = {Kaveh Taghipour and Hwee Tou Ng},
  booktitle = {Proceedings of the 2016 conference on empirical methods in natural language processing},
  pages = {1882--1891},
  title = {A neural approach to automated essay scoring},
  year = {2016},
}

@inproceedings{ahadi2015exploring,
  author = {Alireza Ahadi and Raymond Lister and Heikki Haapala and Arto Vihavainen},
  booktitle = {Proceedings of the eleventh annual International Conference on International Computing Education Research},
  pages = {121--130},
  title = {Exploring machine learning methods to automatically identify students in need of assistance},
  year = {2015},
}

@inproceedings{williams2016axis,
  author = {Joseph Jay Williams and Juho Kim and Anna Rafferty and Samuel Maldonado and Krzysztof Z Gajos and Walter S Lasecki and Neil Heffernan},
  booktitle = {Proceedings of the Third (2016) ACM Conference on Learning@Scale},
  pages = {379--388},
  title = {Axis: Generating explanations at scale with learnersourcing and machine learning},
  year = {2016},
}

@article{desmarais2012review,
  author = {Michel C Desmarais and Ryan Baker},
  journal = {User Modeling and User-Adapted Interaction},
  number = {1},
  pages = {9--38},
  title = {A review of recent advances in learner and skill modeling in intelligent learning environments},
  volume = {22},
  year = {2012},
}

@inproceedings{wu2019zero,
  author = {Mike Wu and Milan Mosse and Noah Goodman and Chris Piech},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {782--790},
  title = {Zero shot learning for code education: Rubric sampling with deep learning inference},
  volume = {33},
  year = {2019},
}

@inproceedings{amorim2018automated,
  author = {Evelin Amorim and Marcia Can{\c{c}}ado and Adriano Veloso},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {229--237},
  title = {Automated essay scoring in the presence of biased ratings},
  year = {2018},
}

@article{perelman2014state,
  author = {Les Perelman},
  journal = {Assessing Writing},
  pages = {104--111},
  title = {When ``the state of the art'' is counting words},
  volume = {21},
  year = {2014},
}

% Conference paper, so the venue goes in booktitle rather than journal.
@inproceedings{piech2013tuned,
  author = {Chris Piech and Jonathan Huang and Zhenghao Chen and Chuong Do and Andrew Ng and Daphne Koller},
  booktitle = {International Conference on Educational Data Mining},
  title = {Tuned models of peer assessment in {MOOCs}},
  year = {2013},
}

@article{han2020fortifying,
  author = {Xiaochuang Han and Yulia Tsvetkov},
  journal = {arXiv preprint arXiv:2010.03154},
  title = {Fortifying Toxic Speech Detectors Against Veiled Toxicity},
  year = {2020},
}

@article{kompa2020empirical,
  author = {Benjamin Kompa and Jasper Snoek and Andrew Beam},
  journal = {arXiv preprint arXiv:2010.03039},
  title = {Empirical Frequentist Coverage of Deep Learning Uncertainty Quantification Procedures},
  year = {2020},
}

@inproceedings{long2015learning,
  author = {Mingsheng Long and Yue Cao and Jianmin Wang and Michael Jordan},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {97--105},
  title = {Learning transferable features with deep adaptation networks},
  year = {2015},
}

@inproceedings{wu2019domain,
  author = {Yifan Wu and Ezra Winston and Divyansh Kaushik and Zachary Lipton},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {6872--6881},
  title = {Domain Adaptation with Asymmetrically-Relaxed Distribution Alignment},
  year = {2019},
}

@article{degrave2020ai,
  author = {Alex J DeGrave and Joseph D Janizek and Su-In Lee},
  journal = {medRxiv},
  title = {{AI} for radiographic {COVID-19} detection selects shortcuts over signal},
  year = {2020},
}

@article{li2019anchor,
  author = {Hongyang Li and Daniel Quang and Yuanfang Guan},
  journal = {Genome research},
  number = {2},
  pages = {281--292},
  title = {Anchor: trans-cell type prediction of transcription factor binding sites},
  volume = {29},
  year = {2019},
}

@inproceedings{blitzer2007biographies,
  author = {John Blitzer and Mark Dredze and Fernando Pereira},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {440--447},
  title = {Biographies, {Bollywood}, boom-boxes and blenders: Domain adaptation for sentiment classification},
  year = {2007},
}

@inproceedings{lecun2004learning,
  author = {Yann LeCun and Fu Jie Huang and Leon Bottou},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Learning methods for generic object recognition with invariance to pose and lighting},
  volume = {2},
  year = {2004},
}

@inproceedings{saenko2010adapting,
  author = {Kate Saenko and Brian Kulis and Mario Fritz and Trevor Darrell},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages = {213--226},
  title = {Adapting visual category models to new domains},
  year = {2010},
}

@inproceedings{pan2010cross,
  author = {Sinno Jialin Pan and Xiaochuan Ni and Jian-Tao Sun and Qiang Yang and Zheng Chen},
  booktitle = {Proceedings of the 19th international conference on World wide web},
  pages = {751--760},
  title = {Cross-domain sentiment classification via spectral feature alignment},
  year = {2010},
}

@article{bruzzone2009domain,
  author = {Lorenzo Bruzzone and Mattia Marconcini},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  number = {5},
  pages = {770--787},
  title = {Domain adaptation problems: A {DASVM} classification technique and a circular validation strategy},
  volume = {32},
  year = {2009},
}

@article{yang2008estimating,
  author = {Qiang Yang and Sinno Jialin Pan and Vincent Wenchen Zheng},
  journal = {IEEE Intelligent Systems},
  number = {1},
  pages = {8--13},
  title = {Estimating Location Using {Wi-Fi}},
  volume = {23},
  year = {2008},
}

@inproceedings{gong2012geodesic,
  author = {Boqing Gong and Yuan Shi and Fei Sha and Kristen Grauman},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {2066--2073},
  title = {Geodesic flow kernel for unsupervised domain adaptation},
  year = {2012},
}

@inproceedings{torralba2011unbiased,
  author = {Antonio Torralba and Alexei A Efros},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {1521--1528},
  title = {Unbiased look at dataset bias},
  year = {2011},
}

@inproceedings{beery2018recognition,
  author = {Sara Beery and Grant Van Horn and Pietro Perona},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages = {456--473},
  title = {Recognition in terra incognita},
  year = {2018},
}

@article{courtiol2019deep,
  author = {Pierre Courtiol and Charles Maussion and Matahi Moarii and Elodie Pronier and Samuel Pilcer and Meriem Sefta and Pierre Manceron and Sylvain Toldo and Mikhail Zaslavskiy and Nolwenn Le Stang and others},
  journal = {Nature medicine},
  number = {10},
  pages = {1519--1525},
  title = {Deep learning-based classification of mesothelioma improves prediction of patient outcome},
  volume = {25},
  year = {2019},
}

@inproceedings{hu2020open,
  author = {Weihua Hu and Matthias Fey and Marinka Zitnik and Yuxiao Dong and Hongyu Ren and Bowen Liu and Michele Catasta and Jure Leskovec},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{Open Graph Benchmark}: Datasets for machine learning on graphs},
  year = {2020},
}

@inproceedings{xu2018powerful,
  author = {Keyulu Xu and Weihua Hu and Jure Leskovec and Stefanie Jegelka},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {How Powerful are Graph Neural Networks?},
  year = {2018},
}

@article{damour2020underspecification,
  author = {Alexander D'Amour and Katherine Heller and Dan Moldovan and Ben Adlam and Babak Alipanahi and Alex Beutel and Christina Chen and Jonathan Deaton and Jacob Eisenstein and Matthew D Hoffman and others},
  journal = {arXiv preprint arXiv:2011.03395},
  title = {Underspecification Presents Challenges for Credibility in Modern Machine Learning},
  year = {2020},
}

@article{subbaswamy2020evaluating,
  author = {Adarsh Subbaswamy and Roy Adams and Suchi Saria},
  journal = {arXiv preprint arXiv:2010.15100},
  title = {Evaluating Model Robustness to Dataset Shift},
  year = {2020},
}

@article{borkan2019limitations,
  author = {Daniel Borkan and Lucas Dixon and John Li and Jeffrey Sorensen and Nithum Thain and Lucy Vasserman},
  journal = {arXiv preprint arXiv:1903.02088},
  title = {Limitations of pinned {AUC} for measuring unintended bias},
  year = {2019},
}

@article{he2020towards,
  author = {Yue He and Zheyan Shen and Peng Cui},
  journal = {Pattern Recognition},
  title = {Towards Non-{IID} Image Classification: A Dataset and Baselines},
  volume = {110},
  year = {2020},
}

@inproceedings{damour2020fairness,
  author = {Alexander D'Amour and Hansa Srinivasan and James Atwood and Pallavi Baljekar and D Sculley and Yoni Halpern},
  booktitle = {Proceedings of the 2020 Conference on Fairness, Accountability, and Transparency},
  pages = {525--534},
  title = {Fairness is not static: deeper understanding of long term fairness via simulation studies},
  year = {2020},
}

@inproceedings{liu2018delayed,
  author = {Lydia T Liu and Sarah Dean and Esther Rolf and Max Simchowitz and Moritz Hardt},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Delayed Impact of Fair Machine Learning},
  year = {2018},
}

@article{bellemare2020autonomous,
  author = {Marc G. Bellemare and Salvatore Candido and Pablo Samuel Castro and Jun Gong and Marlos C. Machado and Subhodeep Moitra and Sameera S. Ponda and Ziyu Wang},
  journal = {Nature},
  title = {Autonomous navigation of stratospheric balloons using reinforcement learning},
  volume = {588},
  year = {2020},
}

@article{dan2020scaling,
  author = {Dan Hendrycks and Steven Basart and Mantas Mazeika and Mohammadreza Mostajabi and Jacob Steinhardt and Dawn Song},
  journal = {arXiv preprint arXiv:1911.11132},
  title = {Scaling out-of-distribution detection for real-world settings},
  year = {2020},
}

@article{saerens2002adjusting,
  author = {Marco Saerens and Patrice Latinne and Christine Decaestecker},
  journal = {Neural computation},
  number = {1},
  pages = {21--41},
  title = {Adjusting the outputs of a classifier to new a priori probabilities: a simple procedure},
  volume = {14},
  year = {2002},
}

@inproceedings{zhang2013domain,
  author = {Kun Zhang and Bernhard Sch{\"o}lkopf and Krikamol Muandet and Zhikun Wang},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {819--827},
  title = {Domain adaptation under target and conditional shift},
  year = {2013},
}

@inproceedings{alexandari2020maximum,
  author = {Amr Alexandari and Anshul Kundaje and Avanti Shrikumar},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {222--232},
  title = {Maximum likelihood with bias-corrected calibration is hard-to-beat at label shift adaptation},
  year = {2020},
}

@article{garg2020unified,
  author = {Saurabh Garg and Yifan Wu and Sivaraman Balakrishnan and Zachary C Lipton},
  journal = {arXiv preprint arXiv:2003.07554},
  title = {A Unified View of Label Shift Estimation},
  year = {2020},
}

@inproceedings{rigaki2018bringing,
  author = {Maria Rigaki and Sebastian Garcia},
  booktitle = {2018 IEEE Security and Privacy Workshops (SPW)},
  pages = {70--75},
  title = {Bringing a {GAN} to a knife-fight: Adapting malware communication to avoid detection},
  year = {2018},
}

@article{cuccarese2020functional,
  author = {Michael F Cuccarese and Berton A Earnshaw and Katie Heiser and Ben Fogelson and Chadwick T Davis and Peter F McLean and Hannah B Gordon and Kathleen-Rose Skelly and Fiona L Weathersby and Vlad Rodic and others},
  journal = {bioRxiv},
  title = {Functional immune mapping with deep-learning enabled phenomics applied to immunomodulatory and {COVID-19} drug discovery},
  year = {2020},
}

% Corporate author: the inner braces keep the name from being split into
% given and family parts.
@article{encode2012integrated,
  author = {{ENCODE Project Consortium} and others},
  journal = {Nature},
  number = {7414},
  pages = {57--74},
  title = {An integrated encyclopedia of {DNA} elements in the human genome},
  volume = {489},
  year = {2012},
}

@article{kundaje2015integrative,
  author = {Anshul Kundaje and Wouter Meuleman and Jason Ernst and Misha Bilenky and Angela Yen and Alireza Heravi-Moussavi and Pouya Kheradpour and Zhizhuo Zhang and Jianrong Wang and Michael J Ziller and others},
  journal = {Nature},
  number = {7539},
  pages = {317--330},
  title = {Integrative analysis of 111 reference human epigenomes},
  volume = {518},
  year = {2015},
}

@article{moore2020expanded,
  author = {Jill E Moore and Michael J Purcaro and Henry E Pratt and Charles B Epstein and Noam Shoresh and Jessika Adrian and Trupti Kawli and Carrie A Davis and Alexander Dobin and Rajinder Kaul and others},
  journal = {Nature},
  number = {7818},
  pages = {699--710},
  title = {Expanded encyclopaedias of {DNA} elements in the human and mouse genomes},
  volume = {583},
  year = {2020},
}

% Corporate author: the inner braces keep the name from being split into
% given and family parts.
@article{gtex2020gtex,
  author = {{GTEx Consortium} and others},
  journal = {Science},
  number = {6509},
  pages = {1318--1330},
  title = {The {GTEx Consortium} atlas of genetic regulatory effects across human tissues},
  volume = {369},
  year = {2020},
}

@article{ho2014comparative,
  author = {Joshua WK Ho and Youngsook L Jung and Tao Liu and Burak H Alver and Soohyun Lee and Kohta Ikegami and Kyung-Ah Sohn and Aki Minoda and Michael Y Tolstorukov and Alex Appert and others},
  journal = {Nature},
  number = {7515},
  pages = {449--452},
  title = {Comparative analysis of metazoan chromatin organization},
  volume = {512},
  year = {2014},
}
@article{hubmap2019human, author = {HuBMAP Consortium and others}, journal = {Nature}, number = {7777}, title = {The human body at cellular resolution: the {NIH} Human Biomolecular Atlas Program}, volume = {574}, year = {2019}, } @article{aviv2017human, author = {Regev Aviv and Sarah A Teichmann and Eric S Lander and Amit Ido and Benoist Christophe and Birney Ewan and Bodenmiller Bernd and Peter Campbell and Carninci Piero and Clatworthy Menna and others}, journal = {Elife}, title = {The human cell atlas}, volume = {6}, year = {2017}, } @article{ching2018opportunities, author = {Travers Ching and Daniel S Himmelstein and Brett K Beaulieu-Jones and Alexandr A Kalinin and Brian T Do and Gregory P Way and Enrico Ferrero and Paul-Michael Agapow and Michael Zietz and Michael M Hoffman and others}, journal = {Journal of The Royal Society Interface}, number = {141}, title = {Opportunities and obstacles for deep learning in biology and medicine}, volume = {15}, year = {2018}, } @article{eraslan2019deep, author = {G{\"o}kcen Eraslan and {\v{Z}}iga Avsec and Julien Gagneur and Fabian J Theis}, journal = {Nature Reviews Genetics}, number = {7}, pages = {389--403}, title = {Deep learning: new computational modelling techniques for genomics}, volume = {20}, year = {2019}, } @article{libbrecht2015machine, author = {Maxwell W Libbrecht and William Stafford Noble}, journal = {Nature Reviews Genetics}, number = {6}, pages = {321--332}, title = {Machine learning applications in genetics and genomics}, volume = {16}, year = {2015}, } @article{avsec2019deep, author = {{\v{Z}}iga Avsec and Melanie Weilert and Avanti Shrikumar and Amr Alexandari and Sabrina Krueger and Khyati Dalal and Robin Fropf and Charles McAnany and Julien Gagneur and Anshul Kundaje and Julia Zeitlinger}, journal = {bioRxiv}, title = {Deep learning at base-resolution reveals motif syntax of the cis-regulatory code}, year = {2019}, } @article{zhou2015predicting, author = {Jian Zhou and Olga G Troyanskaya}, journal = 
{Nature methods}, number = {10}, pages = {931--934}, title = {Predicting effects of noncoding variants with deep learning--based sequence model}, volume = {12}, year = {2015}, } @article{kelley2016basset, author = {David R Kelley and Jasper Snoek and John L Rinn}, journal = {Genome research}, number = {7}, pages = {990--999}, title = {Basset: learning the regulatory code of the accessible genome with deep convolutional neural networks}, volume = {26}, year = {2016}, } @article{jaganathan2019predicting, author = {Kishore Jaganathan and Sofia Kyriazopoulou Panagiotopoulou and Jeremy F McRae and Siavash Fazel Darbandi and David Knowles and Yang I Li and Jack A Kosmicki and Juan Arbelaez and Wenwu Cui and Grace B Schwartz and others}, journal = {Cell}, number = {3}, pages = {535--548}, title = {Predicting splicing from primary sequence with deep learning}, volume = {176}, year = {2019}, } @article{srivastava2020sequence, author = {Divyanshi Srivastava and Shaun Mahony}, journal = {Biochimica et Biophysica Acta (BBA)-Gene Regulatory Mechanisms}, number = {6}, title = {Sequence and chromatin determinants of transcription factor binding and the establishment of cell type-specific binding patterns}, volume = {1863}, year = {2020}, } @article{keilwagen2019accurate, author = {Jens Keilwagen and Stefan Posch and Jan Grau}, journal = {Genome biology}, number = {1}, title = {Accurate prediction of cell type-specific transcription factor binding}, volume = {20}, year = {2019}, } @article{quang2019factornet, author = {Daniel Quang and Xiaohui Xie}, journal = {Methods}, pages = {40--47}, title = {FactorNet: a deep learning framework for predicting cell type specific transcription factor binding from nucleotide-resolution sequential data}, volume = {166}, year = {2019}, } @article{li2019leopard, author = {Hongyang Li and Yuanfang Guan}, journal = {bioRxiv}, title = {Leopard: fast decoding cell type-specific transcription factor binding landscape at single-nucleotide resolution}, 
year = {2019}, } @article{raghu2020survey, author = {Maithra Raghu and Eric Schmidt}, journal = {arXiv preprint arXiv:2003.11755}, title = {A survey of deep learning for scientific discovery}, year = {2020}, } @article{rolf2020generalizable, author = {Esther Rolf and Jonathan Proctor and Tamma Carleton and Ian Bolliger and Vaishaal Shankar and Miyabi Ishihara and Benjamin Recht and Solomon Hsiang}, journal = {NBER Working Paper}, number = {28045}, title = {A Generalizable and Accessible Approach to Machine Learning with Global Satellite Imagery}, year = {2020}, } @article{djolonga2020robustness, author = {Josip Djolonga and Jessica Yung and Michael Tschannen and Rob Romijnders and Lucas Beyer and Alexander Kolesnikov and Joan Puigcerver and Matthias Minderer and Alexander D'Amour and Dan Moldovan and others}, journal = {arXiv preprint arXiv:2007.08558}, title = {On robustness and transferability of convolutional neural networks}, year = {2020}, } @inproceedings{wang2019learningrobust, author = {Haohan Wang and Songwei Ge and Zachary Lipton and Eric P Xing}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Learning robust global representations by penalizing local predictive power}, year = {2019}, } @article{miller2020effect, author = {John Miller and Karl Krauth and Benjamin Recht and Ludwig Schmidt}, journal = {arXiv preprint arXiv:2004.14444}, title = {The Effect of Natural Distribution Shift on Question Answering Models}, year = {2020}, } @article{geirhos2018generalisation, author = {Robert Geirhos and Carlos RM Temme and Jonas Rauber and Heiko H Sch{\"u}tt and Matthias Bethge and Felix A Wichmann}, journal = {Advances in neural information processing systems}, pages = {7538--7550}, title = {Generalisation in humans and deep neural networks}, volume = {31}, year = {2018}, } @article{adragna2020fairness, author = {Robert Adragna and Elliot Creager and David Madras and Richard Zemel}, journal = {arXiv preprint arXiv:2011.06485}, 
title = {Fairness and Robustness in Invariant Learning: A Case Study in Toxicity Classification}, year = {2020}, } @article{bohacek1996art, author = {Regine S Bohacek and Colin McMartin and Wayne C Guida}, journal = {Medicinal research reviews}, number = {1}, pages = {3--50}, title = {The art and practice of structure-based drug design: a molecular modeling perspective}, volume = {16}, year = {1996}, } @article{lyu2019ultra, author = {Jiankun Lyu and Sheng Wang and Trent E Balius and Isha Singh and Anat Levit and Yurii S Moroz and Matthew J O’Meara and Tao Che and Enkhjargal Algaa and Kateryna Tolmachova and others}, journal = {Nature}, number = {7743}, pages = {224--229}, title = {Ultra-large library docking for discovering new chemotypes}, volume = {566}, year = {2019}, } @article{mccloskey2020machine, author = {Kevin McCloskey and Eric A Sigel and Steven Kearnes and Ling Xue and Xia Tian and Dennis Moccia and Diana Gikunju and Sana Bazzaz and Betty Chan and Matthew A Clark and others}, journal = {Journal of Medicinal Chemistry}, title = {Machine Learning on {DNA}-Encoded Libraries: A New Paradigm for Hit Finding}, year = {2020}, } @article{attene2013tox21, author = {Matias S Attene-Ramos and Nicole Miller and Ruili Huang and Sam Michael and Misha Itkin and Robert J Kavlock and Christopher P Austin and Paul Shinn and Anton Simeonov and Raymond R Tice and others}, journal = {Drug discovery today}, number = {15}, pages = {716--723}, title = {The Tox21 robotic platform for the assessment of environmental chemicals--from vision to reality}, volume = {18}, year = {2013}, } @article{collins2008transforming, author = {Francis S Collins and George M Gray and John R Bucher}, journal = {Science}, number = {5865}, title = {Transforming environmental health protection}, volume = {319}, year = {2008}, } @article{reker2020practical, author = {Daniel Reker}, journal = {Drug Discovery Today: Technologies}, title = {Practical considerations for active machine learning in drug 
discovery}, year = {2020}, } @inproceedings{agrawal2018don, author = {Aishwarya Agrawal and Dhruv Batra and Devi Parikh and Aniruddha Kembhavi}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {4971--4980}, title = {Don't just assume; look and answer: Overcoming priors for visual question answering}, year = {2018}, } @inproceedings{lewis1992feature, author = {David D Lewis}, booktitle = {Speech and Natural Language: Proceedings of a Workshop Held at Harriman, New York, February 23-26, 1992}, title = {Feature selection and feature extract ion for text categorization}, year = {1992}, } @book{zheng2018feature, author = {Alice Zheng and Amanda Casari}, publisher = {" O'Reilly Media, Inc."}, title = {Feature engineering for machine learning: principles and techniques for data scientists}, year = {2018}, } @book{nixon2019feature, author = {Mark Nixon and Alberto Aguado}, publisher = {Academic press}, title = {Feature extraction and image processing for computer vision}, year = {2019}, } @inproceedings{li2018deep, author = {Ya Li and Xinmei Tian and Mingming Gong and Yajing Liu and Tongliang Liu and Kun Zhang and Dacheng Tao}, booktitle = {European Conference on Computer Vision (ECCV)}, pages = {624--639}, title = {Deep domain generalization via conditional invariant adversarial networks}, year = {2018}, } @inproceedings{li2018domain, author = {Haoliang Li and Sinno Jialin Pan and Shiqi Wang and Alex C Kot}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {5400--5409}, title = {Domain generalization with adversarial feature learning}, year = {2018}, } @inproceedings{balaji2018metareg, author = {Yogesh Balaji and Swami Sankaranarayanan and Rama Chellappa}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {998--1008}, title = {Metareg: Towards domain generalization using meta-regularization}, year = {2018}, } @inproceedings{carlucci2019domain, author = {Fabio M Carlucci and Antonio D'Innocente and 
Silvia Bucci and Barbara Caputo and Tatiana Tommasi},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {2229--2238},
  title = {Domain generalization by solving jigsaw puzzles},
  year = {2019},
}

@inproceedings{li2018learning,
  author = {Da Li and Yongxin Yang and Yi-Zhe Song and Timothy Hospedales},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Learning to generalize: Meta-learning for domain generalization},
  year = {2018},
}

@article{hand2006classifier,
  author = {David J Hand},
  journal = {Statistical science},
  pages = {1--14},
  title = {Classifier technology and the illusion of progress},
  year = {2006},
}

@book{shapiro2014lectures,
  author = {Alexander Shapiro and Darinka Dentcheva and Andrzej Ruszczy{\'n}ski},
  publisher = {SIAM},
  title = {Lectures on stochastic programming: modeling and theory},
  year = {2014},
}

@inproceedings{loshchilov2019decoupled,
  author = {Ilya Loshchilov and Frank Hutter},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Decoupled Weight Decay Regularization},
  year = {2019},
}

@inproceedings{xu2020adversarial,
  author = {Minghao Xu and Jian Zhang and Bingbing Ni and Teng Li and Chengjie Wang and Qi Tian and Wenjun Zhang},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  number = {4},
  pages = {6502--6509},
  title = {Adversarial domain adaptation with domain mixup},
  volume = {34},
  year = {2020},
}

@inproceedings{hendrycks2019augmix,
  author = {Dan Hendrycks and Norman Mu and Ekin D Cubuk and Barret Zoph and Justin Gilmer and Balaji Lakshminarayanan},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Augmix: A simple data processing method to improve robustness and uncertainty},
  year = {2019},
}

@article{bender2018data,
  author = {Emily M Bender and Batya Friedman},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  pages = {587--604},
  title = {Data
statements for natural language processing: Toward mitigating system bias and enabling better science},
  volume = {6},
  year = {2018},
}

@article{berman2018ethical,
  author = {Gabrielle Berman and Sara de la Rosa and Tanya Accone},
  journal = {Innocenti Discussion Paper, UNICEF Office of Research},
  title = {Ethical considerations when using geospatial technologies for evidence generation},
  year = {2018},
}

@inproceedings{mohri2019agnostic,
  author = {Mehryar Mohri and Gary Sivek and Ananda Theertha Suresh},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {4615--4625},
  title = {Agnostic federated learning},
  year = {2019},
}

@article{finlayson2021clinician,
  author = {Samuel G. Finlayson and Adarsh Subbaswamy and Karandeep Singh and John Bowers and Annabel Kupke and Jonathan Zittrain and Isaac S. Kohane and Suchi Saria},
  journal = {New England Journal of Medicine},
  number = {3},
  pages = {283--286},
  title = {The Clinician and Dataset Shift in Artificial Intelligence},
  volume = {385},
  year = {2021},
}

@article{ciga2020self,
  author = {Ozan Ciga and Anne L Martel and Tony Xu},
  journal = {arXiv preprint arXiv:2011.13971},
  title = {Self supervised contrastive learning for digital histopathology},
  year = {2020},
}

@article{azizi2021big,
  author = {Shekoofeh Azizi and Basil Mustafa and Fiona Ryan and Zachary Beaver and Jan Freyberg and Jonathan Deaton and Aaron Loh and Alan Karthikesalingam and Simon Kornblith and Ting Chen and others},
  journal = {arXiv preprint arXiv:2101.05224},
  title = {Big self-supervised models advance medical image classification},
  year = {2021},
}

@inproceedings{ren2018adversarial,
  author = {Jian Ren and Ilker Hacihaliloglu and Eric A Singer and David J Foran and Xin Qi},
  booktitle = {International Conference on Medical Image Computing and Computer-Assisted Intervention},
  pages = {201--209},
  title = {Adversarial domain adaptation for classification of prostate histopathology whole-slide images},
  year = {2018},
}
@article{peikari2018cluster,
  author = {Mohammad Peikari and Sherine Salama and Sharon Nofech-Mozes and Anne L Martel},
  journal = {Scientific reports},
  number = {1},
  pages = {1--13},
  title = {A cluster-then-label semi-supervised learning approach for pathology image classification},
  volume = {8},
  year = {2018},
}

@article{lu2019semi,
  author = {Ming Y Lu and Richard J Chen and Jingwen Wang and Debora Dillon and Faisal Mahmood},
  journal = {arXiv preprint arXiv:1910.10825},
  title = {Semi-supervised histology classification using deep multiple instance learning and contrastive predictive coding},
  year = {2019},
}

@inproceedings{zhang2019whole,
  author = {Yifan Zhang and Hanbo Chen and Ying Wei and Peilin Zhao and Jiezhang Cao and Xinjuan Fan and Xiaoying Lou and Hailing Liu and Jinlong Hou and Xiao Han and others},
  booktitle = {International Conference on Medical Image Computing and Computer-Assisted Intervention},
  pages = {360--368},
  title = {From whole slide imaging to microscopy: Deep microscopy adaptation network for histopathology cancer image classification},
  year = {2019},
}

@article{dehaene2020self,
  author = {Olivier Dehaene and Axel Camara and Olivier Moindrot and Axel de Lavergne and Pierre Courtiol},
  journal = {arXiv preprint arXiv:2012.03583},
  title = {Self-Supervision Closes the Gap Between Weak and Strong Supervision in Histology},
  year = {2020},
}

@article{koohbanani2021self,
  author = {Navid Alemi Koohbanani and Balagopal Unnikrishnan and Syed Ali Khurram and Pavitra Krishnaswamy and Nasir Rajpoot},
  journal = {IEEE Transactions on Medical Imaging},
  title = {Self-Path: Self-supervision for Classification of Pathology Images with Limited Annotations},
  volume = {1},
  year = {2021},
}

@article{shaw2020teacher,
  author = {Shayne Shaw and Maciej Pajak and Aneta Lisowska and Sotirios A Tsaftaris and Alison Q O'Neil},
  journal = {arXiv preprint arXiv:2003.08797},
  title = {Teacher-student chain for efficient semi-supervised histology image classification},
  year =
{2020},
}

@article{akram2018leveraging,
  author = {Saad Ullah Akram and Talha Qaiser and Simon Graham and Juho Kannala and Janne Heikkil{\"a} and Nasir Rajpoot},
  journal = {Computational Pathology and Ophthalmic Medical Image Analysis},
  pages = {69--77},
  title = {Leveraging unlabeled whole-slide-images for mitosis detection},
  volume = {1},
  year = {2018},
}

@inproceedings{zhang2019bridging,
  author = {Yuchen Zhang and Tianle Liu and Mingsheng Long and Michael Jordan},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {7404--7413},
  title = {Bridging theory and algorithm for domain adaptation},
  year = {2019},
}

@inproceedings{long2018conditional,
  author = {Mingsheng Long and Zhangjie Cao and Jianmin Wang and Michael I Jordan},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Conditional Adversarial Domain Adaptation},
  year = {2018},
}

% Venue string matches the other CVPR entries in this file.
@inproceedings{saito2018maximum,
  author = {Kuniaki Saito and Kohei Watanabe and Yoshitaka Ushiku and Tatsuya Harada},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {3723--3732},
  title = {Maximum classifier discrepancy for unsupervised domain adaptation},
  year = {2018},
}

% Venue string matches the other ICML entries in this file.
@inproceedings{long2017deep,
  author = {Mingsheng Long and Han Zhu and Jianmin Wang and Michael I Jordan},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {2208--2217},
  title = {Deep transfer learning with joint adaptation networks},
  year = {2017},
}

% The proper noun is braced so sentence-casing styles keep its capital.
@article{abid2021persistent,
  author = {Abubakar Abid and Maheen Farooqi and James Zou},
  journal = {arXiv preprint arXiv:2101.05783},
  title = {Persistent anti-{Muslim} bias in large language models},
  year = {2021},
}

@article{nadeem2020stereoset,
  author = {Moin Nadeem and Anna Bethke and Siva Reddy},
  journal = {arXiv preprint arXiv:2004.09456},
  title = {Stereoset: Measuring stereotypical bias in pretrained language models},
  year = {2020},
}

@article{gehman2020realtoxicityprompts,
  author = {Samuel
Gehman and Suchin Gururangan and Maarten Sap and Yejin Choi and Noah A Smith},
  journal = {arXiv preprint arXiv:2009.11462},
  title = {Realtoxicityprompts: Evaluating neural toxic degeneration in language models},
  year = {2020},
}

@article{tu2020empirical,
  author = {Lifu Tu and Garima Lalwani and Spandana Gella and He He},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  pages = {621--633},
  title = {An empirical study on robustness to spurious correlations using pre-trained language models},
  volume = {8},
  year = {2020},
}

@article{gururangan2020don,
  author = {Suchin Gururangan and Ana Marasovi{\'c} and Swabha Swayamdipta and Kyle Lo and Iz Beltagy and Doug Downey and Noah A Smith},
  journal = {arXiv preprint arXiv:2004.10964},
  title = {Don't stop pretraining: adapt language models to domains and tasks},
  year = {2020},
}

@article{hull1994database,
  author = {Jonathan J. Hull},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  number = {5},
  pages = {550--554},
  title = {A database for handwritten text recognition research},
  volume = {16},
  year = {1994},
}

% Venue string matches the other CVPR entries in this file.
@inproceedings{cordts2016cityscapes,
  author = {Marius Cordts and Mohamed Omran and Sebastian Ramos and Timo Rehfeld and Markus Enzweiler and Rodrigo Benenson and Uwe Franke and Stefan Roth and Bernt Schiele},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {3213--3223},
  title = {The cityscapes dataset for semantic urban scene understanding},
  year = {2016},
}

% The quoted subtitle uses TeX opening and closing quotes rather than the straight double-quote character.
@inproceedings{chalkidis2020legal,
  author = {Ilias Chalkidis and Manos Fergadiotis and Prodromos Malakasiotis and Nikolaos Aletras and Ion Androutsopoulos},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {2898--2904},
  title = {{LEGAL-BERT}: ``Preparing the Muppets for Court''},
  year = {2020},
}

@article{lee2020biobert,
  author = {Jinhyuk Lee and Wonjin Yoon and Sungdong Kim and Donghyeon Kim and Sunkyu Kim and Chan Ho So and
Jaewoo Kang},
  journal = {Bioinformatics},
  number = {4},
  pages = {1234--1240},
  title = {{BioBERT}: a pre-trained biomedical language representation model for biomedical text mining},
  volume = {36},
  year = {2020},
}

@article{gu2020domain,
  author = {Yu Gu and Robert Tinn and Hao Cheng and Michael Lucas and Naoto Usuyama and Xiaodong Liu and Tristan Naumann and Jianfeng Gao and Hoifung Poon},
  journal = {arXiv preprint arXiv:2007.15779},
  title = {Domain-specific language model pretraining for biomedical natural language processing},
  year = {2020},
}

@article{rong2020self,
  author = {Yu Rong and Yatao Bian and Tingyang Xu and Weiyang Xie and Ying Wei and Wenbing Huang and Junzhou Huang},
  journal = {arXiv preprint arXiv:2007.02835},
  title = {Self-supervised graph transformer on large-scale molecular data},
  year = {2020},
}

@article{robey2021model,
  author = {Alexander Robey and George J Pappas and Hamed Hassani},
  journal = {arXiv preprint arXiv:2102.11436},
  title = {Model-Based Domain Generalization},
  year = {2021},
}

@article{saito2021tune,
  author = {Kuniaki Saito and Donghyun Kim and Piotr Teterwak and Stan Sclaroff and Trevor Darrell and Kate Saenko},
  journal = {arXiv preprint arXiv:2108.10860},
  title = {Tune it the Right Way: Unsupervised Validation of Domain Adaptation via Soft Neighborhood Density},
  year = {2021},
}

@inproceedings{verma2021towards,
  author = {Vikas Verma and Thang Luong and Kenji Kawaguchi and Hieu Pham and Quoc Le},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Towards domain-agnostic contrastive learning},
  year = {2021},
}

@article{chang2021mobility,
  author = {Serina Chang and Emma Pierson and Pang Wei Koh and Jaline Gerardin and Beth Redbird and David Grusky and Jure Leskovec},
  journal = {Nature},
  title = {Mobility network models of {COVID-19} explain inequities and inform reopening},
  year = {2021},
}

@inproceedings{chang2021supporting,
  author = {Serina Y Chang and Mandy L Wilson and Bryan Lewis and Zakaria Mehrab and
Komal K Dudakiya and Emma Pierson and Pang Wei Koh and Jaline Gerardin and Beth Redbird and David Grusky and Jure Leskovec},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  title = {Supporting {COVID-19} policy response with large-scale mobility-based modeling},
  year = {2021},
}

% The mixed-case assay name is braced so sentence-casing styles leave it intact.
@article{koh2017denoising,
  author = {Pang Wei Koh and Emma Pierson and Anshul Kundaje},
  journal = {Bioinformatics},
  title = {Denoising genome-wide histone {ChIP-seq} with convolutional neural networks},
  year = {2017},
}

@article{geirhos2020shortcut,
  author = {Robert Geirhos and J{\"o}rn-Henrik Jacobsen and Claudio Michaelis and Richard Zemel and Wieland Brendel and Matthias Bethge and Felix A Wichmann},
  journal = {Nature Machine Intelligence},
  title = {Shortcut Learning in Deep Neural Networks},
  year = {2020},
}

@inproceedings{kabra2015understanding,
  author = {Mayank Kabra and Alice Robie and Kristin Branson},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {3917--3925},
  title = {Understanding classifier errors by examining influential neighbors},
  year = {2015},
}

@inproceedings{cai2019human,
  author = {Carrie J Cai and Emily Reif and Narayan Hegde and Jason Hipp and Been Kim and Daniel Smilkov and Martin Wattenberg and Fernanda Viegas and Greg S Corrado and Martin C Stumpe and Michael Terry},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  pages = {1--14},
  title = {Human-centered tools for coping with imperfect algorithms during medical decision-making},
  year = {2019},
}

@inproceedings{steed2021image,
  author = {Ryan Steed and Aylin Caliskan},
  booktitle = {ACM Conference on Fairness, Accountability, and Transparency (FAccT)},
  pages = {701--713},
  title = {Image representations learned with unsupervised pre-training contain human-like biases},
  year = {2021},
}

@article{caliskan2017semantics,
  author = {Aylin Caliskan and Joanna J Bryson and Arvind Narayanan},
  journal = {Science},
  number = {6334},
  pages = {183--186},
title = {Semantics derived automatically from language corpora contain human-like biases},
  volume = {356},
  year = {2017},
}

% This article appeared in PNAS; volume, number and pages are those of PNAS.
@article{garg2018word,
  author = {Nikhil Garg and Londa Schiebinger and Dan Jurafsky and James Zou},
  journal = {Proceedings of the National Academy of Sciences},
  number = {16},
  pages = {E3635--E3644},
  title = {Word embeddings quantify 100 years of gender and ethnic stereotypes},
  volume = {115},
  year = {2018},
}

@article{tan2019assessing,
  author = {Yi Chern Tan and L Elisa Celis},
  journal = {arXiv preprint arXiv:1911.01485},
  title = {Assessing social and intersectional biases in contextualized word representations},
  year = {2019},
}

@article{tsai2021conditional,
  author = {Yao-Hung Hubert Tsai and Martin Q Ma and Han Zhao and Kun Zhang and Louis-Philippe Morency and Ruslan Salakhutdinov},
  journal = {arXiv preprint arXiv:2106.02866},
  title = {Conditional Contrastive Learning: Removing Undesirable Information in Self-Supervised Representations},
  year = {2021},
}

@article{mishra2021surprisingly,
  author = {Samarth Mishra and Kate Saenko and Venkatesh Saligrama},
  journal = {arXiv preprint arXiv:2101.12727},
  title = {Surprisingly Simple Semi-Supervised Domain Adaptation with Pretraining and Consistency},
  year = {2021},
}

@inproceedings{xu2019larger,
  author = {Ruijia Xu and Guanbin Li and Jihan Yang and Liang Lin},
  booktitle = {International Conference on Computer Vision (ICCV)},
  pages = {1426--1435},
  title = {Larger norm more transferable: An adaptive feature norm approach for unsupervised domain adaptation},
  year = {2019},
}

% Conference paper: entry type and venue string follow the other NeurIPS entries in this file.
@inproceedings{zhao2018adversarial,
  author = {Han Zhao and Shanghang Zhang and Guanhang Wu and Jos{\'e} MF Moura and Joao P Costeira and Geoffrey J Gordon},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {8559--8570},
  title = {Adversarial multiple source domain adaptation},
  volume = {31},
  year = {2018},
}

@inproceedings{dubey2021adaptive,
  author = {Abhimanyu Dubey and Vignesh Ramanathan and Alex Pentland and Dhruv Mahajan},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title
= {Adaptive Methods for Real-World Domain Generalization},
  year = {2021},
}

% The two-word surname is braced so BibTeX does not treat "Mac" as a given name.
@article{cole2021does,
  author = {Elijah Cole and Xuan Yang and Kimberly Wilber and Oisin {Mac Aodha} and Serge Belongie},
  journal = {arXiv preprint arXiv:2105.05837},
  title = {When Does Contrastive Visual Representation Learning Work?},
  year = {2021},
}

@inproceedings{shen2021connect,
  author = {Kendrick Shen and Robbie Matthew Jones and Ananya Kumar and Sang Michael Xie and Percy Liang},
  booktitle = {NeurIPS Workshop on Distribution Shifts},
  title = {How Does Contrastive Pre-training Connect Disparate Domains?},
  year = {2021},
}

@article{wong2021external,
  author = {Andrew Wong and Erkin Otles and John P Donnelly and Andrew Krumm and Jeffrey McCullough and Olivia DeTroyer-Cooley and Justin Pestrue and Marie Phillips and Judy Konye and Carleen Penoza and others},
  journal = {JAMA Internal Medicine},
  number = {8},
  pages = {1065--1070},
  title = {External validation of a widely implemented proprietary sepsis prediction model in hospitalized patients},
  volume = {181},
  year = {2021},
}

% The acronym is braced so sentence-casing styles keep it upper-case.
@inproceedings{bansal2021does,
  author = {Gagan Bansal and Tongshuang Wu and Joyce Zhou and Raymond Fok and Besmira Nushi and Ece Kamar and Marco Tulio Ribeiro and Daniel Weld},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  pages = {1--16},
  title = {Does the whole exceed its parts? The effect of {AI} explanations on complementary team performance},
  year = {2021},
}

@article{bommasani2023fmti,
  author = {Rishi Bommasani and Kevin Klyman and Shayne Longpre and Sayash Kapoor and Nestor Maslej and Betty Xiong and Daniel Zhang and Percy Liang},
  journal = {arXiv},
  title = {The Foundation Model Transparency Index},
  year = {2023},
}

@article{thickstun2023anticipatory,
  author = {John Thickstun and David
Hall and Chris Donahue and Percy Liang},
  journal = {arXiv},
  title = {Anticipatory Music Transformer},
  year = {2023},
}

@article{shrivastava2023llamas,
  author = {Vaishnavi Shrivastava and Percy Liang and Ananya Kumar},
  journal = {arXiv},
  title = {Llamas Know What {GPTs} Don't Show: Surrogate Models for Confidence Estimation},
  year = {2023},
}

% Given names are written in full, as in the other entries for the same author.
@article{huang2023benchmarking,
  author = {Qian Huang and Jian Vora and Percy Liang and Jure Leskovec},
  journal = {arXiv},
  title = {Benchmarking Large Language Models As {AI} Research Agents},
  year = {2023},
}

@article{yasunaga2023large,
  author = {Michihiro Yasunaga and Xinyun Chen and Yujia Li and Panupong Pasupat and Jure Leskovec and Percy Liang and Ed H. Chi and Denny Zhou},
  journal = {arXiv},
  title = {Large Language Models as Analogical Reasoners},
  year = {2023},
}

@article{li2023benchmarking,
  author = {Xiang Lisa Li and Vaishnavi Shrivastava and Siyan Li and Tatsunori Hashimoto and Percy Liang},
  journal = {arXiv},
  title = {Benchmarking and Improving Generator-Validator Consistency of Language Models},
  year = {2023},
}

@article{fleming2023medalign,
  author = {S. Fleming and A. Lozano and W. Haberkorn and Jenelle A. Jindal and E. Reis and Rahul Thapa and L. Blankemeier and Julian Z. Genkins and E. Steinberg and A. Nayak and Birju S. Patel and Chia-Chun Chiang and A. Callahan and Zepeng Huo and S. Gatidis and S. Adams and Oluseyi Fayanju and Shreya J. Shah and Thomas Savage and Ethan Goh and A. Chaudhari and N. Aghaeepour and Christopher D. Sharp and M. Pfeffer and Percy Liang and Jonathan H. Chen and K. Morse and E. Brunskill and Jason Alan Fries and N.
Shah},
  journal = {arXiv},
  title = {{MedAlign}: A Clinician-Generated Dataset for Instruction Following with Electronic Medical Records},
  year = {2023},
}

@article{gu2023watermarks,
  author = {Chenchen Gu and Xiang Lisa Li and Percy Liang and Tatsunori Hashimoto},
  journal = {arXiv},
  title = {On the Learnability of Watermarks for Language Models},
  year = {2023},
}

@article{kuditipudi2023robust,
  author = {Rohith Kuditipudi and John Thickstun and Tatsunori Hashimoto and Percy Liang},
  journal = {arXiv},
  title = {Robust Distortion-free Watermarks for Language Models},
  year = {2023},
}

@inproceedings{xie2023data,
  author = {Sang Michael Xie and Shibani Santurkar and Tengyu Ma and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Data Selection for Language Models via Importance Resampling},
  year = {2023},
}

@inproceedings{xie2023doremi,
  author = {Sang Michael Xie and Hieu Pham and Xuanyi Dong and Nan Du and Hanxiao Liu and Yifeng Lu and Percy Liang and Quoc V. Le and Tengyu Ma and A. Yu},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{DoReMi}: Optimizing Data Mixtures Speeds Up Language Model Pretraining},
  year = {2023},
}

% The surname carries a hacek, written as a LaTeX accent escape like the other accented names in this file.
@inproceedings{huang2023prodigy,
  author = {Qian Huang and Hongyu Ren and Peng Chen and Gregor Kr{\v{z}}manc and D. Zeng and Percy Liang and Jure Leskovec},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{PRODIGY}: Enabling In-context Learning Over Graphs},
  year = {2023},
}

@inproceedings{huang2023lexinvariant,
  author = {Qian Huang and E. Zelikman and Sarah Chen and Yuhuai Wu and G. Valiant and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Lexinvariant Language Models},
  year = {2023},
}

@inproceedings{toups2023ecosystem,
  author = {Connor Toups and Rishi Bommasani and Kathleen A. Creel and Sarah H.
Bana and Dan Jurafsky and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Ecosystem-level Analysis of Deployed Machine Learning Reveals Homogeneous Outcomes},
  year = {2023},
}

@inproceedings{dubois2023alpacafarm,
  author = {Yann Dubois and Xuechen Li and Rohan Taori and Tianyi Zhang and Ishaan Gulrajani and Jimmy Ba and Carlos Guestrin and Percy Liang and Tatsunori B. Hashimoto},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{AlpacaFarm}: A Simulation Framework for Methods that Learn from Human Feedback},
  year = {2023},
}

@inproceedings{narayanan2023cheaply,
  author = {Deepak Narayanan and Keshav Santhanam and Peter Henderson and Rishi Bommasani and Tony Lee and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Cheaply Evaluating Inference Efficiency Metrics for Autoregressive Transformer {APIs}},
  year = {2023},
}

@inproceedings{lee2023holistic,
  author = {Tony Lee and Michihiro Yasunaga and Chenlin Meng and Yifan Mai and Joon Sung Park and Agrim Gupta and Yunzhi Zhang and Deepak Narayanan and Hannah Teufel and Marco Bellagente and Minguk Kang and Taesung Park and Jure Leskovec and Jun-Yan Zhu and Fei-Fei Li and Jiajun Wu and Stefano Ermon and Percy Liang},
  booktitle = {Neural Information Processing Systems Track on Datasets and Benchmarks (NeurIPS Datasets and Benchmarks)},
  title = {Holistic Evaluation of Text-To-Image Models},
  year = {2023},
}

% No volume is recorded here; a value of 0 would be printed verbatim by bibliography styles.
@article{liu2023lost,
  author = {Nelson F. Liu and Kevin Lin and John Hewitt and Ashwin Paranjape and Michele Bevilacqua and Fabio Petroni and Percy Liang},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Lost in the Middle: How Language Models Use Long Contexts},
  year = {2023},
}

@inproceedings{liu2023evaluating,
  author = {Nelson F.
Liu and Tianyi Zhang and Percy Liang},
  booktitle = {Findings of Empirical Methods in Natural Language Processing (Findings of EMNLP)},
  title = {Evaluating Verifiability in Generative Search Engines},
  year = {2023},
}

% No volume is recorded here; a value of 0 would be printed verbatim by bibliography styles.
@article{lee2023evaluating,
  author = {Mina Lee and Megha Srivastava and Amelia Hardy and John Thickstun and Esin Durmus and Ashwin Paranjape and Ines Gerard-Ursin and Xiang Lisa Li and Faisal Ladhak and Frieda Rong and Rose E. Wang and Minae Kwon and Joon Sung Park and Hancheng Cao and Tony Lee and Rishi Bommasani and Michael Bernstein and Percy Liang},
  journal = {Transactions of Machine Learning Research (TMLR)},
  title = {Evaluating Human-Language Model Interaction},
  year = {2023},
}

@article{bommasani2023trustworthy,
  author = {Rishi Bommasani and Percy Liang},
  journal = {arXiv},
  title = {Trustworthy Social Bias Measurement},
  year = {2023},
}

@article{zhang2023benchmarking,
  author = {Tianyi Zhang and Faisal Ladhak and Esin Durmus and Percy Liang and K. McKeown and Tatsunori Hashimoto},
  journal = {arXiv},
  title = {Benchmarking Large Language Models for News Summarization},
  year = {2023},
}

@article{khattab2023dsp,
  author = {Omar Khattab and Keshav Santhanam and Xiang Lisa Li and David Hall and Percy Liang and Christopher Potts and Matei Zaharia},
  journal = {arXiv},
  title = {{Demonstrate-Search-Predict}: Composing retrieval and language models for knowledge-intensive {NLP}},
  year = {2023},
}

@inproceedings{park2023generative,
  author = {Joon Sung Park and Joseph C. O'Brien and Carrie J. Cai and Meredith Ringel Morris and Percy Liang and Michael S. Bernstein},
  booktitle = {User Interface Software and Technology (UIST)},
  title = {Generative Agents: Interactive Simulacra of Human Behavior},
  year = {2023},
}

@article{henderson2023fairuse,
  author = {Peter Henderson and Xuechen Li and Dan Jurafsky and Tatsunori Hashimoto and Mark A.
Lemley and Percy Liang},
  journal = {Journal of Machine Learning Research (JMLR)},
  title = {Foundation Models and Fair Use},
  year = {2023},
}

@article{bommasani2023ecosystem,
  author = {Rishi Bommasani and Dilara Soylu and Thomas Liao and Kathleen A. Creel and Percy Liang},
  journal = {arXiv},
  title = {Ecosystem Graphs: The Social Footprint of Foundation Models},
  year = {2023},
}

@inproceedings{karamcheti2023voltron,
  author = {Siddharth Karamcheti and Suraj Nair and Annie S. Chen and T. Kollar and Chelsea Finn and Dorsa Sadigh and Percy Liang},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Language-driven Representation Learning for Robotics},
  year = {2023},
}

% The accented surname uses a LaTeX escape, like the other accented names in this file.
@inproceedings{sheng2023flexgen,
  author = {Ying Sheng and Lianmin Zheng and Binhang Yuan and Zhuohan Li and Max Ryabinin and Daniel Y. Fu and Zhiqiang Xie and Beidi Chen and Clark W. Barrett and Joseph Gonzalez and Percy Liang and Christopher R{\'e} and I. Stoica and Ce Zhang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {High-throughput Generative Inference of Large Language Models with a Single {GPU}},
  year = {2023},
}

@inproceedings{yasunaga2023retrieval,
  author = {Michihiro Yasunaga and Armen Aghajanyan and Weijia Shi and Rich James and Jure Leskovec and Percy Liang and Mike Lewis and Luke Zettlemoyer and Wen-tau Yih},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Retrieval-Augmented Multimodal Language Modeling},
  year = {2023},
}

@inproceedings{santurkar2023opinions,
  author = {Shibani Santurkar and Esin Durmus and Faisal Ladhak and Cinoo Lee and Percy Liang and Tatsunori Hashimoto},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Whose Opinions Do Language Models Reflect?},
  year = {2023},
}

@inproceedings{dubois2023evaluating,
  author = {Yann Dubois and Tatsunori Hashimoto and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Evaluating Self-Supervised
Learning via Risk Decomposition},
  year = {2023},
}

@inproceedings{gao2023targeted,
  author = {Irena Gao and Shiori Sagawa and Pang Wei Koh and Tatsunori Hashimoto and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Out-of-Domain Robustness via Targeted Augmentations},
  year = {2023},
}

@inproceedings{liu2023sample,
  author = {Nelson F. Liu and Ananya Kumar and Percy Liang and Robin Jia},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Are Sample-Efficient {NLP} Models More Robust?},
  year = {2023},
}

@inproceedings{liu2023concurrence,
  author = {Nelson F. Liu and Tony Lee and Robin Jia and Percy Liang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Do Question Answering Modeling Improvements Hold Across Benchmarks?},
  year = {2023},
}

@inproceedings{zhang2023beyond,
  author = {Yuhui Zhang and Michihiro Yasunaga and Zhengping Zhou and Jeff Z. HaoChen and James Zou and Percy Liang and Serena Yeung},
  booktitle = {Findings of the Association for Computational Linguistics (Findings of ACL)},
  title = {Beyond Positive Scaling: How Negation Impacts Scaling Trends of Language Models},
  year = {2023},
}

% Given names are written in full, as in the other entry for the same author.
@inproceedings{li2023contrastive,
  author = {Xiang Lisa Li and Ari Holtzman and Daniel Fried and Percy Liang and Jason Eisner and Tatsunori Hashimoto and Luke Zettlemoyer and Mike Lewis},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Contrastive Decoding: Open-ended Text Generation as Optimization},
  year = {2023},
}

@inproceedings{hewitt2023backpack,
  author = {John Hewitt and John Thickstun and Christopher D.
Manning and Percy Liang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Backpack Language Models},
  year = {2023},
}

% The quoted phrase uses TeX opening and closing quotes, and the dash is set off by spaces.
@inproceedings{cui2023corrections,
  author = {Yuchen Cui and Siddharth Karamcheti and Raj Palleti and Nidhya Shivakumar and Percy Liang and Dorsa Sadigh},
  booktitle = {ACM/IEEE International Conference on Human Robot Interaction (HRI)},
  title = {``No, to the Right'' -- Online Language Corrections for Robotic Manipulation via Shared Autonomy},
  year = {2023},
}

@inproceedings{santurkar2023captions,
  author = {Shibani Santurkar and Yann Dubois and Rohan Taori and Percy Liang and Tatsunori Hashimoto},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Is a Caption Worth a Thousand Images? A Controlled Study for Representation Learning},
  year = {2023},
}

@inproceedings{lee2023surgical,
  author = {Yoonho Lee and Annie S. Chen and Fahim Tajwar and Ananya Kumar and Huaxiu Yao and Percy Liang and Chelsea Finn},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Surgical Fine-Tuning Improves Adaptation to Distribution Shifts},
  year = {2023},
}

@article{liang2022helm,
  author = {Percy Liang and Rishi Bommasani and Tony Lee and Dimitris Tsipras and Dilara Soylu and Michihiro Yasunaga and Yian Zhang and Deepak Narayanan and Yuhuai Wu and Ananya Kumar and Benjamin Newman and Binhang Yuan and Bobby Yan and Ce Zhang and Christian Cosgrove and Christopher D. Manning and Christopher R{\'e} and Diana Acosta-Navas and Drew A. Hudson and E. Zelikman and Esin Durmus and Faisal Ladhak and Frieda Rong and Hongyu Ren and Huaxiu Yao and Jue Wang and Keshav Santhanam and Laurel J. Orr and Lucia Zheng and Mert Yuksekgonul and Mirac Suzgun and Nathan S. Kim and Neel Guha and Niladri S. Chatterji and Omar Khattab and Peter Henderson and Qian Huang and Ryan Chi and Sang Michael Xie and Shibani Santurkar and S. Ganguli and Tatsunori Hashimoto and Thomas F.
Icard and Tianyi Zhang and Vishrav Chaudhary and William Wang and Xuechen Li and Yifan Mai and Yuhui Zhang and Yuta Koreeda},
  journal = {arXiv preprint arXiv:2211.09110},
  title = {Holistic Evaluation of Language Models},
  year = {2022},
}

@inproceedings{hewitt2022truncation,
  author = {John Hewitt and Christopher D. Manning and Percy Liang},
  booktitle = {Findings of Empirical Methods in Natural Language Processing (Findings of EMNLP)},
  title = {Truncation Sampling as Language Model Desmoothing},
  year = {2022},
}

@inproceedings{wu2022synthetic,
  author = {Yuhuai Wu and Felix Li and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Insights into Pre-training via Simpler Synthetic Tasks},
  year = {2022},
}

% Given names are written in full, as in the other entry for the same author.
@inproceedings{dubois2022issl,
  author = {Yann Dubois and Tatsunori Hashimoto and Stefano Ermon and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Improving Self-Supervised Learning by Characterizing Idealized Representations},
  year = {2022},
}

% The accented surname uses a LaTeX escape, like the other accented names in this file.
@inproceedings{yuan2022decentralized,
  author = {Binhang Yuan and Yongjun He and Jared Quincy Davis and Tianyi Zhang and Tri Dao and Beidi Chen and Percy Liang and Christopher R{\'e} and Ce Zhang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Decentralized Training of Foundation Models in Heterogeneous Environments},
  year = {2022},
}

@inproceedings{li2022diffusion,
  author = {Xiang Lisa Li and John Thickstun and Ishaan Gulrajani and Percy Liang and Tatsunori Hashimoto},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Diffusion-{LM} Improves Controllable Text Generation},
  year = {2022},
}

@inproceedings{garg2022incontext,
  author = {Shivam Garg and Dimitris Tsipras and Percy Liang and G. Valiant},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {What Can Transformers Learn In-Context?
A Case Study of Simple Function Classes},
  year = {2022},
}

@inproceedings{yasunaga2022dragon,
  author = {Michihiro Yasunaga and Antoine Bosselut and Hongyu Ren and Xikun Zhang and Christopher D. Manning and Percy Liang and Jure Leskovec},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Deep Bidirectional Language-Knowledge Graph Pretraining},
  year = {2022},
}

@inproceedings{bommasani2022homogenization,
  author = {Rishi Bommasani and Kathleen A. Creel and Ananya Kumar and Dan Jurafsky and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Picking on the Same Person: Does Algorithmic Monoculture lead to Outcome Homogenization?},
  year = {2022},
}

@inproceedings{donahue2022melody,
  author = {Chris Donahue and John Thickstun and Percy Liang},
  booktitle = {International Society for Music Information Retrieval (ISMIR)},
  title = {Melody transcription via generative pre-training},
  year = {2022},
}

% First author's given name is spelled out as it appears elsewhere in this file.
@inproceedings{park2022social,
  author = {Joon Sung Park and Lindsay Popowski and Carrie J. Cai and M. Morris and Percy Liang and Michael S.
Bernstein},
  booktitle = {User Interface Software and Technology (UIST)},
  title = {Social Simulacra: Creating Populated Prototypes for Social Computing Systems},
  year = {2022},
}

% No volume field: the journal name is spelled out in full and a placeholder
% volume of zero would otherwise be printed in the reference.
@article{wei2022emergent,
  author = {Jason Wei and Yi Tay and Rishi Bommasani and Colin Raffel and Barret Zoph and Sebastian Borgeaud and Dani Yogatama and Maarten Bosma and Denny Zhou and Donald Metzler and Ed Chi and Tatsunori Hashimoto and Oriol Vinyals and Percy Liang and Jeff Dean and William Fedus},
  journal = {Transactions on Machine Learning Research (TMLR)},
  title = {Emergent Abilities of Large Language Models},
  year = {2022},
}

@inproceedings{kumar2022calibrated,
  author = {Ananya Kumar and Tengyu Ma and Percy Liang and Aditi Raghunathan},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  title = {Calibrated ensembles can mitigate accuracy tradeoffs under distribution shift},
  year = {2022},
}

@inproceedings{karamcheti2022lilac,
  author = {Siddharth Karamcheti and Raj Palleti and Yuchen Cui and Percy Liang and Dorsa Sadigh},
  booktitle = {ACL Workshop for Learning with Natural Language Supervision (NL Supervision)},
  title = {Shared Autonomy for Robotic Manipulation with Language Corrections},
  year = {2022},
}

@inproceedings{shen2022connect,
  author = {Kendrick Shen and Robbie Jones and Ananya Kumar and Sang Michael Xie and Jeff Z.
HaoChen and Tengyu Ma and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Connect, Not Collapse: Explaining Contrastive Learning for Unsupervised Domain Adaptation},
  year = {2022},
}

@inproceedings{yasunaga2022linkbert,
  author = {Michihiro Yasunaga and Jure Leskovec and Percy Liang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {{LinkBERT}: Pretraining Language Models with Document Links},
  year = {2022},
}

% Given names are spelled out where another entry in this file shows the full form.
@inproceedings{sagawa2022uwilds,
  author = {Shiori Sagawa and Pang Wei Koh and Tony Lee and Irena Gao and Sang Michael Xie and Kendrick Shen and Ananya Kumar and Weihua Hu and Michihiro Yasunaga and Henrik Marklund and Sara Beery and Etienne David and Ian Stavness and Wei Guo and Jure Leskovec and Kate Saenko and Tatsunori B. Hashimoto and Sergey Levine and Chelsea Finn and Percy Liang},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Extending the {WILDS} Benchmark for Unsupervised Adaptation},
  year = {2022},
}

@inproceedings{kumar2022finetuning,
  author = {Ananya Kumar and Aditi Raghunathan and Robbie Jones and Tengyu Ma and Percy Liang},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Fine-tuning can Distort Pretrained Features and Underperform Out-of-Distribution},
  year = {2022},
}

% The proper noun in the next title is protected as a whole word.
@inproceedings{xie2022incontext,
  author = {Sang Michael Xie and Aditi Raghunathan and Percy Liang and Tengyu Ma},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {An Explanation of In-context Learning as Implicit {Bayesian} Inference},
  year = {2022},
}

@inproceedings{li2022privacy,
  author = {Xuechen Li and Florian Tram{\`e}r and Percy Liang and Tatsunori B.
Hashimoto},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Large Language Models Can Be Strong Differentially Private Learners},
  year = {2022},
}

% Mixed-case coined words in the titles below are brace-protected so that
% sentence-casing bibliography styles keep their capitalization.
@inproceedings{zhang2022greaselm,
  author = {Xikun Zhang and Antoine Bosselut and Michihiro Yasunaga and Hongyu Ren and Percy Liang and Christopher D. Manning and Jure Leskovec},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {{GreaseLM}: Graph {REASoning} Enhanced Language Models for Question Answering},
  year = {2022},
}

@inproceedings{lee2022coauthor,
  author = {Mina Lee and Percy Liang and Qian Yang},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {{CoAuthor}: Designing a Human-{AI} Collaborative Writing Dataset for Exploring Language Model Capabilities},
  year = {2022},
}

@inproceedings{karamcheti2021lila,
  author = {Siddharth Karamcheti and Megha Srivastava and Percy Liang and Dorsa Sadigh},
  booktitle = {Conference on Robot Learning (CoRL)},
  title = {{LILA}: Language-Informed Latent Actions},
  year = {2021},
}

@article{bommasani2021opportunities,
  author = {Rishi Bommasani and Drew A. Hudson and Ehsan Adeli and Russ Altman and Simran Arora and Sydney von Arx and Michael S. Bernstein and Jeannette Bohg and Antoine Bosselut and Emma Brunskill and Erik Brynjolfsson and Shyamal Buch and Dallas Card and Rodrigo Castellon and Niladri Chatterji and Annie Chen and Kathleen Creel and Jared Quincy Davis and Dorottya Demszky and Chris Donahue and Moussa Doumbouya and Esin Durmus and Stefano Ermon and John Etchemendy and Kawin Ethayarajh and Li Fei-Fei and Chelsea Finn and Trevor Gale and Lauren Gillespie and Karan Goel and Noah Goodman and Shelby Grossman and Neel Guha and Tatsunori Hashimoto and Peter Henderson and John Hewitt and Daniel E.
Ho and Jenny Hong and Kyle Hsu and Jing Huang and Thomas Icard and Saahil Jain and Dan Jurafsky and Pratyusha Kalluri and Siddharth Karamcheti and Geoff Keeling and Fereshte Khani and Omar Khattab and Pang Wei Koh and Mark Krass and Ranjay Krishna and Rohith Kuditipudi and Ananya Kumar and Faisal Ladhak and Mina Lee and Tony Lee and Jure Leskovec and Isabelle Levent and Xiang Lisa Li and Xuechen Li and Tengyu Ma and Ali Malik and Christopher D. Manning and Suvir Mirchandani and Eric Mitchell and Zanele Munyikwa and Suraj Nair and Avanika Narayan and Deepak Narayanan and Ben Newman and Allen Nie and Juan Carlos Niebles and Hamed Nilforoshan and Julian Nyarko and Giray Ogut and Laurel Orr and Isabel Papadimitriou and Joon Sung Park and Chris Piech and Eva Portelance and Christopher Potts and Aditi Raghunathan and Rob Reich and Hongyu Ren and Frieda Rong and Yusuf Roohani and Camilo Ruiz and Jack Ryan and Christopher R{\'e} and Dorsa Sadigh and Shiori Sagawa and Keshav Santhanam and Andy Shih and Krishnan Srinivasan and Alex Tamkin and Rohan Taori and Armin W. Thomas and Florian Tram{\`e}r and Rose E. Wang and William Wang and Bohan Wu and Jiajun Wu and Yuhuai Wu and Sang Michael Xie and Michihiro Yasunaga and Jiaxuan You and Matei Zaharia and Michael Zhang and Tianyi Zhang and Xikun Zhang and Yuhui Zhang and Lucia Zheng and Kaitlyn Zhou and Percy Liang},
  journal = {arXiv preprint arXiv:2108.07258},
  title = {On the Opportunities and Risks of Foundation Models},
  year = {2021},
}

% Accented letters in the author list above use the brace-group escape form,
% which classic BibTeX treats as a single letter when sorting and labelling.
@inproceedings{yasunaga2021language,
  author = {Michihiro Yasunaga and Jure Leskovec and Percy Liang},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{LM-Critic}: Language Models for Unsupervised Grammatical Error Correction},
  year = {2021},
}

@inproceedings{hewitt2021conditional,
  author = {John Hewitt and Kawin Ethayarajh and Percy Liang and Christopher D.
Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Conditional probing: measuring usable information beyond a baseline},
  year = {2021},
}

@inproceedings{castellon2021calm,
  author = {Rodrigo Castellon and Chris Donahue and Percy Liang},
  booktitle = {International Society for Music Information Retrieval (ISMIR)},
  title = {Codified audio language modeling learns useful representations for music information retrieval},
  year = {2021},
}

@inproceedings{yasunaga2021break,
  author = {Michihiro Yasunaga and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {{Break-It-Fix-It}: Unsupervised Learning for Program Repair},
  year = {2021},
}

% The accented surname below uses the brace-group escape form so that it is
% spelled the same way as the accented spellings of this author in the file.
@inproceedings{davis2021catformer,
  author = {Jared Quincy Davis and Albert Gu and Krzysztof Choromanski and Tri Dao and Christopher R{\'e} and Chelsea Finn and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Catformer: Designing Stable Transformers via Sensitivity Analysis},
  year = {2021},
}

@inproceedings{liu2021jtt,
  author = {Evan Zheran Liu and Behzad Haghgoo and Annie S.
Chen and Aditi Raghunathan and Pang Wei Koh and Shiori Sagawa and Percy Liang and Chelsea Finn},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Just Train Twice: Improving Group Robustness without Training Group Information},
  year = {2021},
}

@inproceedings{liu2021dream,
  author = {Evan Zheran Liu and Aditi Raghunathan and Percy Liang and Chelsea Finn},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Decoupling Exploration and Exploitation for Meta-Reinforcement Learning without Sacrifices},
  year = {2021},
}

@inproceedings{xie2021composed,
  author = {Sang Michael Xie and Tengyu Ma and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Composed Fine-Tuning: Freezing Pre-Trained Denoising Autoencoders for Improved Generalization},
  year = {2021},
}

@inproceedings{koh2021wilds,
  author = {Pang Wei Koh and Shiori Sagawa and Henrik Marklund and Sang Michael Xie and Marvin Zhang and Akshay Balsubramani and Weihua Hu and Michihiro Yasunaga and Richard Lanas Phillips and Irena Gao and Tony Lee and Etienne David and Ian Stavness and Wei Guo and Berton A. Earnshaw and Imran S. Haque and Sara Beery and Jure Leskovec and Anshul Kundaje and Emma Pierson and Sergey Levine and Chelsea Finn and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {{WILDS}: A Benchmark of in-the-Wild Distribution Shifts},
  year = {2021},
}

@inproceedings{miller2021line,
  author = {John Miller and Rohan Taori and Aditi Raghunathan and Shiori Sagawa and Pang Wei Koh and Vaishaal Shankar and Percy Liang and Yair Carmon and Ludwig Schmidt},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Accuracy on the Line: on the Strong Correlation Between Out-of-Distribution and In-Distribution Generalization},
  year = {2021},
}

% Second author's given name is spelled out as it appears elsewhere in this file.
@inproceedings{lee2021swords,
  author = {Mina Lee and Chris
Donahue and Robin Jia and Alexander Iyabor and Percy Liang},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Swords: A Benchmark for Lexical Substitution with Improved Data Coverage and Quality},
  year = {2021},
}

@inproceedings{yasunaga2021qagnn,
  author = {Michihiro Yasunaga and Hongyu Ren and Antoine Bosselut and Percy Liang and Jure Leskovec},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {{QA-GNN}: Reasoning with Language Models and Knowledge Graphs for Question Answering},
  year = {2021},
}

@inproceedings{li2021prefix,
  author = {Xiang Lisa Li and Percy Liang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Prefix-Tuning: Optimizing Continuous Prompts for Generation},
  year = {2021},
}

@inproceedings{jones2021selective,
  author = {Erik Jones and Shiori Sagawa and Pang Wei Koh and Ananya Kumar and Percy Liang},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Selective Classification Can Magnify Disparities Across Groups},
  year = {2021},
}

@inproceedings{xie2021innout,
  author = {Sang Michael Xie and Ananya Kumar and Robbie Jones and Fereshte Khani and Tengyu Ma and Percy Liang},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {In-{N}-Out: Pre-Training and Self-Training using Auxiliary Information for Out-of-Distribution Robustness},
  year = {2021},
}

@inproceedings{khani2021removing,
  author = {Fereshte Khani and Percy Liang},
  booktitle = {ACM Conference on Fairness, Accountability, and Transparency (FAccT)},
  title = {Removing Spurious Features can Hurt Accuracy and Affect Groups Disproportionately},
  year = {2021},
}

@inproceedings{gu2021beyond,
  author = {Yu Gu and Sue Kase and Michelle T. Vanni and Brian M.
Sadler and Percy Liang and Xifeng Yan and Yu Su},
  booktitle = {World Wide Web (WWW)},
  title = {Beyond {I.I.D.}: Three Levels of Generalization for Question Answering on Knowledge Bases},
  year = {2021},
}

% The abbreviation in the title above is brace-protected so that sentence-casing
% bibliography styles do not lowercase it.
@article{koh2021stronger,
  author = {Pang Wei Koh and Jacob Steinhardt and Percy Liang},
  journal = {Machine Learning},
  title = {Stronger Data Poisoning Attacks Break Data Sanitization Defenses},
  volume = {1},
  year = {2021},
}

@inproceedings{karamcheti2020decomposition,
  author = {Siddharth Karamcheti and Dorsa Sadigh and Percy Liang},
  booktitle = {EMNLP Workshop for Interactive and Executable Semantic Parsing (IntEx-SemPar)},
  title = {Learning Adaptive Language Interfaces through Decomposition},
  year = {2020},
}

@article{liu2020explore,
  author = {Evan Zheran Liu and Aditi Raghunathan and Percy Liang and Chelsea Finn},
  journal = {arXiv preprint arXiv:2008.02790},
  title = {Explore then Execute: Adapting without Rewards via Factorized Meta-Reinforcement Learning},
  year = {2020},
}

@article{liu2020learning,
  author = {Evan Zheran Liu and Ramtin Keramati and Sudarshan Seshadri and Kelvin Guu and Panupong Pasupat and Emma Brunskill and Percy Liang},
  journal = {arXiv preprint arXiv:2007.05896},
  title = {Learning Abstract Models for Strategic Exploration and Fast Reward Transfer},
  year = {2020},
}

@inproceedings{mussmann2020pairwise,
  author = {Stephen Mussmann and Robin Jia and Percy Liang},
  booktitle = {Findings of Empirical Methods in Natural Language Processing (Findings of EMNLP)},
  title = {On the Importance of Adaptive Data Collection for Extremely Imbalanced Pairwise Tasks},
  year = {2020},
}

@inproceedings{hewitt2020rnn,
  author = {John Hewitt and Michael Hahn and Surya Ganguli and Percy Liang and Christopher D.
Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{RNN}s can generate bounded hierarchical languages with optimal memory},
  year = {2020},
}

@inproceedings{newman2020eos,
  author = {Benjamin Newman and John Hewitt and Percy Liang and Christopher D. Manning},
  booktitle = {Proceedings of the Third BlackboxNLP Workshop on Analyzing and Interpreting Neural Networks for NLP},
  title = {The {EOS} Decision and Length Extrapolation},
  year = {2020},
}

@inproceedings{dathathri2020sdp,
  author = {Sumanth Dathathri and Krishnamurthy Dvijotham and Alexey Kurakin and Aditi Raghunathan and Jonathan Uesato and Rudy Bunel and Shreya Shankar and Jacob Steinhardt and Ian Goodfellow and Percy Liang and Pushmeet Kohli},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Enabling certification of verification-agnostic networks via memory-efficient semidefinite programming},
  year = {2020},
}

% The first author is an organization: the extra brace pair makes BibTeX treat
% the whole name as one unit instead of splitting it into first and last name.
@article{semanticmachines2020dataflow,
  author = {{Semantic Machines} and Jacob Andreas and John Bufe and David Burkett and Charles Chen and Josh Clausman and Jean Crawford and Kate Crim and Jordan DeLoach and Leah Dorner and Jason Eisner and Hao Fang and Alan Guo and David Hall and Kristin Hayes and Kellie Hill and Diana Ho and Wendy Iwaszuk and Smriti Jha and Dan Klein and Jayant Krishnamurthy and Theo Lanman and Percy Liang and Christopher H.
Lin and Ilya Lintsbakh and Andy McGovern and Aleksandr Nisnevich and Adam Pauls and Dmitrij Petters and Brent Read and Dan Roth and Subhro Roy and Jesse Rusak and Beth Short and Div Slomin and Ben Snyder and Stephon Striplin and Yu Su and Zachary Tellman and Sam Thomson and Andrei Vorobev and Izabela Witoszko and Jason Wolfe and Abby Wray and Yuchen Zhang and Alexander Zotov},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Task-Oriented Dialogue as Dataflow Synthesis},
  volume = {8},
  year = {2020},
}

@inproceedings{sagawa2020overparameterization,
  author = {Shiori Sagawa and Aditi Raghunathan and Pang Wei Koh and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {An investigation of why overparameterization exacerbates spurious correlations},
  year = {2020},
}

@inproceedings{koh2020bottleneck,
  author = {Pang Wei Koh and Thao Nguyen and Yew Siang Tang and Stephen Mussmann and Emma Pierson and Been Kim and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Concept Bottleneck Models},
  year = {2020},
}

@inproceedings{khani2020noise,
  author = {Fereshte Khani and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Feature Noise Induces Loss Discrepancy Across Groups},
  year = {2020},
}

@inproceedings{yasunaga2020repair,
  author = {Michihiro Yasunaga and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Graph-based, Self-Supervised Program Repair from Diagnostic Feedback},
  year = {2020},
}

@inproceedings{raghunathan2020understanding,
  author = {Aditi Raghunathan and Sang Michael Xie and Fanny Yang and John C.
Duchi and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Understanding and Mitigating the Tradeoff Between Robustness and Accuracy},
  year = {2020},
}

@inproceedings{kumar2020gradual,
  author = {Ananya Kumar and Tengyu Ma and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Understanding Self-Training for Gradual Domain Adaptation},
  year = {2020},
}

@inproceedings{srivasta2020human,
  author = {Megha Srivastava and Tatsunori Hashimoto and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Robustness to Spurious Correlations via Human Annotations},
  year = {2020},
}

@inproceedings{jones2020roben,
  author = {Erik Jones and Robin Jia and Aditi Raghunathan and Percy Liang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Robust Encodings: A Framework for Combating Adversarial Typos},
  year = {2020},
}

@inproceedings{kamath2020squads,
  author = {Amita Kamath and Robin Jia and Percy Liang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Selective Question Answering under Domain Shift},
  year = {2020},
}

@inproceedings{mu2020shaping,
  author = {Jesse Mu and Percy Liang and Noah Goodman},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Shaping Visual Representations with Language for Few-shot Classification},
  year = {2020},
}

@inproceedings{murty2020expbert,
  author = {Shikhar Murty and Pang Wei Koh and Percy Liang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {{ExpBERT}: Representation Engineering with Natural Language Explanations},
  year = {2020},
}

@inproceedings{donahue2020infilling,
  author = {Chris Donahue and Mina Lee and Percy Liang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Enabling Language Models to Fill in the Blanks},
  year = {2020},
}

@inproceedings{sagawa2020group,
  author = {Shiori Sagawa and Pang Wei Koh and Tatsunori B.
Hashimoto and Percy Liang},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Distributionally Robust Neural Networks for Group Shifts: On the Importance of Regularization for Worst-Case Generalization},
  year = {2020},
}

@inproceedings{hu2020pretraining,
  author = {Weihua Hu and Bowen Liu and Joseph Gomes and Marinka Zitnik and Percy Liang and Vijay Pande and Jure Leskovec},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Strategies for Pre-training Graph Neural Networks},
  year = {2020},
}

@inproceedings{coleman2020selection,
  author = {Cody Coleman and Christopher Yeh and Stephen Mussmann and Baharan Mirzasoleiman and Peter Bailis and Percy Liang and Jure Leskovec and Matei Zaharia},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Selection via Proxy: Efficient Data Selection for Deep Learning},
  year = {2020},
}

@inproceedings{li2020greedy,
  author = {Ray Li and Percy Liang and Stephen Mussmann},
  booktitle = {Symposium on Discrete Algorithms (SODA)},
  title = {A Tight Analysis of Greedy Yields Subexponential Time Approximation for Uniform Decision Tree},
  year = {2020},
}

% The umlaut in the author list below uses the brace-group escape form, which
% classic BibTeX treats as a single letter when sorting and labelling.
@inproceedings{jia2019certified,
  author = {Robin Jia and Aditi Raghunathan and Kerem G{\"o}ksel and Percy Liang},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Certified Robustness to Adversarial Word Substitutions},
  year = {2019},
}

@inproceedings{oren2019drolm,
  author = {Yonatan Oren and Shiori Sagawa and Tatsunori Hashimoto and Percy Liang},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Distributionally Robust Language Modeling},
  year = {2019},
}

@inproceedings{hewitt2019control,
  author = {John Hewitt and Percy Liang},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Designing and Interpreting Probes with Control Tasks},
  year = {2019},
}

@inproceedings{kulal2019spoc,
  author = {Sumith Kulal and
Panupong Pasupat and Kartik Chandra and Mina Lee and Oded Padon and Alex Aiken and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{SPoC}: Search-based Pseudocode to Code},
  year = {2019},
}

% The mixed-case acronym in the title above is brace-protected so that
% sentence-casing bibliography styles keep its capitalization.
@inproceedings{carmon2019unlabeled,
  author = {Yair Carmon and Aditi Raghunathan and Ludwig Schmidt and Percy Liang and John C. Duchi},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Unlabeled Data Improves Adversarial Robustness},
  year = {2019},
}

@inproceedings{kumar2019calibration,
  author = {Ananya Kumar and Percy Liang and Tengyu Ma},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Verified Uncertainty Calibration},
  year = {2019},
}

@inproceedings{koh2019influence,
  author = {Pang Wei Koh and Kai-Siang Ang and Hubert H. K. Teo and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {On the Accuracy of Influence Functions for Measuring Group Effects},
  year = {2019},
}

@inproceedings{lee2019autocomplete,
  author = {Mina Lee and Tatsunori Hashimoto and Percy Liang},
  booktitle = {Emergent Communication Workshop at Neural Information Processing Systems (NeurIPS)},
  title = {Learning Autocomplete Systems as a Communication Game},
  year = {2019},
}

@article{raghunathan2019hurt,
  author = {Aditi Raghunathan and Sang Michael Xie and Fanny Yang and John C. Duchi and Percy Liang},
  journal = {arXiv preprint arXiv:1906.06032},
  title = {Adversarial Training Can Hurt Generalization},
  year = {2019},
}

@article{khani2019mwld,
  author = {Fereshte Khani and Aditi Raghunathan and Percy Liang},
  journal = {arXiv preprint arXiv:1906.03518},
  title = {Maximum Weighted Loss Discrepancy},
  year = {2019},
}

@article{monajemi2019painless,
  author = {Hatef Monajemi and Riccardo Murri and Eric Jonas and Percy Liang and Victoria Stodden and David L.
Donoho},
  journal = {Harvard Data Science Review},
  title = {Ambitious Data Science Can Be Painless},
  volume = {1},
  year = {2019},
}

@inproceedings{hashimoto2019huse,
  author = {Tatsunori Hashimoto and Hugh Zhang and Percy Liang},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Unifying Human and Statistical Evaluation for Natural Language Generation},
  year = {2019},
}

@inproceedings{peng2019pun,
  author = {Nanyun Peng and He He and Percy Liang},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Pun Generation with Surprise},
  year = {2019},
}

% The umlaut in the author list below uses the brace-group escape form, which
% classic BibTeX treats as a single letter when sorting and labelling.
@inproceedings{selsam2019sat,
  author = {Daniel Selsam and Matthew Lamm and Benedikt B{\"u}nz and Percy Liang and Leonardo de Moura and David L. Dill},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Learning a {SAT} Solver from Single-Bit Supervision},
  year = {2019},
}

@inproceedings{zhang2019discretization,
  author = {Yuchen Zhang and Percy Liang},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  title = {Defending against Whitebox Adversarial Attacks via Randomized Discretization},
  year = {2019},
}

@inproceedings{pierson2019aging,
  author = {Emma Pierson and Pang Wei Koh and Tatsunori Hashimoto and Daphne Koller and Jure Leskovec and Nick Eriksson and Percy Liang},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  title = {Inferring Multidimensional Rates of Aging from Cross-Sectional Data},
  year = {2019},
}

% The system name in the next title is protected as one whole word.
@inproceedings{shi2019frangel,
  author = {Kensen Shi and Jacob Steinhardt and Percy Liang},
  booktitle = {Principles of Programming Languages (POPL)},
  title = {{FrAngel}: Component-Based Synthesis with Control Structures},
  year = {2019},
}

@inproceedings{raghunathan2018sdp,
  author = {Aditi Raghunathan and Jacob Steinhardt and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Semidefinite relaxations for certifying robustness to adversarial
examples},
  year = {2018},
}

@inproceedings{mussmann2018sgd,
  author = {Stephen Mussmann and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Uncertainty Sampling is Preconditioned Stochastic Gradient Descent on Zero-One Loss},
  year = {2018},
}

@inproceedings{hashimoto2018edit,
  author = {Tatsunori Hashimoto and Kelvin Guu and Yonatan Oren and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {A Retrieve-and-Edit Framework for Predicting Structured Outputs},
  year = {2018},
}

@inproceedings{choi2018quac,
  author = {Eunsol Choi and He He and Mohit Iyyer and Mark Yatskar and Wen-tau Yih and Yejin Choi and Percy Liang and Luke Zettlemoyer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{QuAC}: Question Answering in Context},
  year = {2018},
}

@inproceedings{he2018negotiation,
  author = {He He and Derek Chen and Anusha Balakrishnan and Percy Liang},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Decoupling Strategy and Generation in Negotiation Dialogues},
  year = {2018},
}

@inproceedings{pasupat2018elements,
  author = {Panupong Pasupat and Tian-Shun Jiang and Evan Zheran Liu and Kelvin Guu and Percy Liang},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Mapping Natural Language Commands to Web Elements},
  year = {2018},
}

@inproceedings{lamm2018tap,
  author = {Matthew Lamm and Arun Chaganty and Christopher D.
Manning and Dan Jurafsky and Percy Liang},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Textual Analogy Parsing: What's Shared and What's Compared among Analogous Facts},
  year = {2018},
}

@inproceedings{mussmann2018accuracy,
  author = {Stephen Mussmann and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {On the Relationship between Data Efficiency and Error in Active Learning},
  year = {2018},
}

@inproceedings{hashimoto2018repeated,
  author = {Tatsunori B. Hashimoto and Megha Srivastava and Hongseok Namkoong and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Fairness Without Demographics in Repeated Loss Minimization},
  year = {2018},
}

% The accent in the last author's surname is written as a brace group that
% starts with the accent command, so BibTeX handles it as a single letter.
@inproceedings{hancock2018babble,
  author = {Braden Hancock and Paroma Varma and Stephanie Wang and Martin Bringmann and Percy Liang and Christopher R{\'e}},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Training Classifiers with Natural Language Explanations},
  year = {2018},
}

@inproceedings{chaganty2018evaluation,
  author = {Arun Chaganty and Stephen Mussmann and Percy Liang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {The price of debiasing automatic metrics in natural language evaluation},
  year = {2018},
}

@inproceedings{rajpurkar2018squadrun,
  author = {Pranav Rajpurkar and Robin Jia and Percy Liang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Know What You Don't Know: Unanswerable Questions for {SQuAD}},
  year = {2018},
}

@inproceedings{mussmann2018gbs,
  author = {Stephen Mussmann and Percy Liang},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  title = {Generalized Binary Search For Split-Neighborly Problems},
  year = {2018},
}

@article{khani2018pip,
  author = {Fereshte Khani and Noah D.
Goodman and Percy Liang},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Planning, Inference and Pragmatics in Sequential Language Games},
  volume = {6},
  year = {2018},
}

% Same journal and year as the entry above, hence the same volume number.
@article{guu2018edit,
  author = {Kelvin Guu and Tatsunori B. Hashimoto and Yonatan Oren and Percy Liang},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Generating Sentences by Editing Prototypes},
  volume = {6},
  year = {2018},
}

@inproceedings{li2018style,
  author = {Juncen Li and Robin Jia and He He and Percy Liang},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Delete, Retrieve, Generate: A Simple Approach to Sentiment and Style Transfer},
  year = {2018},
}

@inproceedings{liu2018workflow,
  author = {Evan Zheran Liu and Kelvin Guu and Panupong Pasupat and Tianlin Shi and Percy Liang},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Reinforcement Learning on Web Interfaces using Workflow-Guided Exploration},
  year = {2018},
}

@inproceedings{raghunathan2018certified,
  author = {Aditi Raghunathan and Jacob Steinhardt and Percy Liang},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Certified defenses against adversarial examples},
  year = {2018},
}

@inproceedings{bastani2018active,
  author = {Osbert Bastani and Rahul Sharma and Alex Aiken and Percy Liang},
  booktitle = {Programming Language Design and Implementation (PLDI)},
  title = {Active Learning of Points-To Specifications},
  year = {2018},
}

@inproceedings{sharan2018prediction,
  author = {Vatsal Sharan and Sham Kakade and Percy Liang and Gregory Valiant},
  booktitle = {Symposium on Theory of Computing (STOC)},
  title = {Prediction with a Short Memory},
  year = {2018},
}

@article{demszky2018transforming,
  author = {Dorottya Demszky and Kelvin Guu and Percy Liang},
  journal = {arXiv preprint arXiv:1809.02922},
  title = {Transforming Question Answering Datasets Into
Natural Language Inference Datasets},
  year = {2018},
}

@inproceedings{steinhardt2017certified,
  author = {Jacob Steinhardt and Pang Wei Koh and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Certified Defenses for Data Poisoning Attacks},
  year = {2017},
}

@inproceedings{hashimoto2017transformation,
  author = {Tatsunori B. Hashimoto and John Duchi and Percy Liang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Unsupervised Transformation Learning via Convex Relaxations},
  year = {2017},
}

@inproceedings{sharan2017overcomplete,
  author = {Vatsal Sharan and Sham Kakade and Percy Liang and Gregory Valiant},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Learning Overcomplete {HMM}s},
  year = {2017},
}

@inproceedings{jia2017adversarial,
  author = {Robin Jia and Percy Liang},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Adversarial Examples for Evaluating Reading Comprehension Systems},
  year = {2017},
}

@inproceedings{zhang2017macro,
  author = {Yuchen Zhang and Panupong Pasupat and Percy Liang},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Macro Grammars and Holistic Triggering for Efficient Semantic Parsing},
  year = {2017},
}

% The last author's name is written in the same form as in the other entries of
% this file, so one person is not listed under two different spellings.
@inproceedings{chaganty2017unbiased,
  author = {Arun Chaganty and Ashwin Paranjape and Percy Liang and Christopher D. Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Importance sampling for unbiased on-demand evaluation of knowledge base population},
  year = {2017},
}

@inproceedings{koh2017understanding,
  author = {Pang Wei Koh and Percy Liang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Understanding Black-box Predictions via Influence Functions},
  year = {2017},
}

@inproceedings{zhang2017convexified,
  author = {Yuchen Zhang and Percy Liang and Martin J.
Wainwright}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Convexified Convolutional Neural Networks}, year = {2017}, } @inproceedings{selsam2017bugfree, author = {Daniel Selsam and Percy Liang and David Dill}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Developing Bug-Free Machine Learning Systems With Formal Mathematics}, year = {2017}, } @inproceedings{shi2017wob, author = {Tianlin Shi and Andrej Karpathy and Linxi Fan and Jonathan Hernandez and Percy Liang}, booktitle = {International Conference on Machine Learning (ICML)}, title = {World of Bits: An Open-Domain Platform for Web-Based Agents}, year = {2017}, } @inproceedings{zhang2017hitting, author = {Yuchen Zhang and Percy Liang and Moses Charikar}, booktitle = {Conference on Learning Theory (COLT)}, title = {A Hitting Time Analysis of Stochastic Gradient {L}angevin Dynamics}, year = {2017}, } @inproceedings{bastani2017synthesizing, author = {Osbert Bastani and Rahul Sharma and Alex Aiken and Percy Liang}, booktitle = {Programming Language Design and Implementation (PLDI)}, title = {Synthesizing Program Input Grammars}, year = {2017}, } @inproceedings{wang2017naturalizing, author = {Sida I. Wang and Sam Ginn and Percy Liang and Christopher D. 
Manning}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Naturalizing a Programming Language via Interactive Learning}, year = {2017}, } @inproceedings{he2017symmetric, author = {He He and Anusha Balakrishnan and Mihail Eric and Percy Liang}, booktitle = {Association for Computational Linguistics (ACL)}, pages = {1766--1776}, title = {Learning Symmetric Collaborative Dialogue Agents with Dynamic Knowledge Graph Embeddings}, year = {2017}, } @inproceedings{guu2017bridging, author = {Kelvin Guu and Panupong Pasupat and Evan Zheran Liu and Percy Liang}, booktitle = {Association for Computational Linguistics (ACL)}, title = {From Language to Programs: Bridging Reinforcement Learning and Maximum Marginal Likelihood}, year = {2017}, } @inproceedings{steinhardt2016risk, author = {Jacob Steinhardt and Percy Liang}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Unsupervised Risk Estimation Using Only Conditional Independence Structure}, year = {2016}, } @inproceedings{rajpurkar2016squad, author = {Pranav Rajpurkar and Jian Zhang and Konstantin Lopyrev and Percy Liang}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {{SQuAD}: 100,000+ Questions for Machine Comprehension of Text}, year = {2016}, } @inproceedings{wang2016games, author = {Sida I. 
Wang and Percy Liang and Chris Manning}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Learning Language Games through Interaction}, year = {2016}, } @inproceedings{jia2016recombination, author = {Robin Jia and Percy Liang}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Data Recombination for Neural Semantic Parsing}, year = {2016}, } @inproceedings{long2016projections, author = {Reginald Long and Panupong Pasupat and Percy Liang}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Simpler Context-Dependent Logical Forms via Model Projections}, year = {2016}, } @inproceedings{pasupat2016inferring, author = {Panupong Pasupat and Percy Liang}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Inferring Logical Forms From Denotations}, year = {2016}, } @inproceedings{khani2016unanimity, author = {Fereshte Khani and Martin Rinard and Percy Liang}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Unanimous Prediction for 100\% Precision with Application to Learning Semantic Mappings}, year = {2016}, } @inproceedings{chaganty2016perspectives, author = {Arun Tejasvi Chaganty and Percy Liang}, booktitle = {Association for Computational Linguistics (ACL)}, title = {How Much is 131 Million Dollars? 
{P}utting Numbers in Perspective with Compositional Descriptions}, year = {2016}, } @inproceedings{raghunathan2016linear, author = {Aditi Raghunathan and Roy Frostig and John Duchi and Percy Liang}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Estimation from Indirect Supervision with Linear Moments}, year = {2016}, } @incollection{wager2016levy, author = {Stefan Wager and Will Fithian and Percy Liang}, booktitle = {Perturbations, Optimization and Statistics}, title = {Data Augmentation via {L}\'evy Processes}, year = {2016}, } @article{liang2016executable, author = {Percy Liang}, journal = {Communications of the ACM}, title = {Learning Executable Semantic Parsers for Natural Language Understanding}, volume = {59}, year = {2016}, } @inproceedings{wang2015overnight, author = {Yushi Wang and Jonathan Berant and Percy Liang}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Building a Semantic Parser Overnight}, year = {2015}, } @article{berant2015agenda, author = {Jonathan Berant and Percy Liang}, journal = {Transactions of the Association for Computational Linguistics (TACL)}, pages = {545--558}, title = {Imitation Learning of Agenda-Based Semantic Parsers}, volume = {3}, year = {2015}, } @inproceedings{steinhardt2015relaxed, author = {Jacob Steinhardt and Percy Liang}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Learning with Relaxed Supervision}, year = {2015}, } @inproceedings{wang2015polynomial, author = {Sida I. 
Wang and Arun Chaganty and Percy Liang}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Estimating Mixture Models via Mixture of Polynomials}, year = {2015}, } @inproceedings{werling2015onthejob, author = {Keenon Werling and Arun Chaganty and Percy Liang and Chris Manning}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {On-the-Job Learning with {B}ayesian Decision Theory}, year = {2015}, } @inproceedings{kuleshov2015calibrated, author = {Volodymyr Kuleshov and Percy Liang}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Calibrated Structured Prediction}, year = {2015}, } @article{kuleshov2015simultaneous, author = {Volodymyr Kuleshov and Arun Chaganty and Percy Liang}, journal = {arXiv}, title = {Simultaneous diagonalization: the asymmetric, low-rank, and noisy settings}, year = {2015}, } @inproceedings{guu2015traversing, author = {Kelvin Guu and John Miller and Percy Liang}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Traversing Knowledge Graphs in Vector Space}, year = {2015}, } @inproceedings{pasupat2015compositional, author = {Panupong Pasupat and Percy Liang}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Compositional Semantic Parsing on Semi-Structured Tables}, year = {2015}, } @inproceedings{misra2015environment, author = {Dipendra K. 
Misra and Kejia Tao and Percy Liang and Ashutosh Saxena}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Environment-Driven Lexicon Induction for High-Level Instructions}, year = {2015}, } @inproceedings{steinhardt2015rcm, author = {Jacob Steinhardt and Percy Liang}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Reified Context Models}, year = {2015}, } @inproceedings{steinhardt2015fast, author = {Jacob Steinhardt and Percy Liang}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {1063--1072}, title = {Learning Fast-Mixing Models for Structured Prediction}, year = {2015}, } @inproceedings{shi2015sample, author = {Tianlin Shi and Jacob Steinhardt and Percy Liang}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, pages = {875--884}, title = {Learning Where To Sample in Structured Prediction}, year = {2015}, } @inproceedings{kuleshov2015tensor, author = {Volodymyr Kuleshov and Arun Chaganty and Percy Liang}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, title = {Tensor factorization via matrix factorization}, year = {2015}, } @article{liang2015semantics, author = {Percy Liang and Christopher Potts}, journal = {Annual Review of Linguistics}, number = {1}, pages = {355--376}, title = {Bringing machine learning and compositional semantics together}, volume = {1}, year = {2015}, } @article{steinhardt2014sparse, author = {Jacob Steinhardt and Stefan Wager and Percy Liang}, journal = {arXiv preprint arXiv:1412.4182}, title = {The Statistics of Streaming Sparse Regression}, year = {2014}, } @inproceedings{ramanathan2014linking, author = {Vignesh Ramanathan and Armand Joulin and Percy Liang and Li Fei-Fei}, booktitle = {European Conference on Computer Vision (ECCV)}, title = {Linking people in videos with ``their'' names using coreference resolution}, year = {2014}, } @article{liang2014talking, author = {Percy Liang}, journal = {XRDS: Crossroads, The ACM Magazine for 
Students}, number = {1}, pages = {18--21}, title = {Talking to computers in natural language}, volume = {21}, year = {2014}, } @inproceedings{berant2014paraphrasing, author = {Jonathan Berant and Percy Liang}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Semantic Parsing via Paraphrasing}, year = {2014}, } @inproceedings{pasupat2014extraction, author = {Panupong Pasupat and Percy Liang}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Zero-shot Entity Extraction from Web Pages}, year = {2014}, } @inproceedings{chaganty2014graphical, author = {Arun Chaganty and Percy Liang}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Estimating Latent-Variable Graphical Models using Moments and Likelihoods}, year = {2014}, } @inproceedings{steinhardt2014eg, author = {Jacob Steinhardt and Percy Liang}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Adaptivity and Optimism: An Improved Exponentiated Gradient Algorithm}, year = {2014}, } @inproceedings{steinhardt2014filtering, author = {Jacob Steinhardt and Percy Liang}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {727--735}, title = {Filtering with Abstract Particles}, year = {2014}, } @article{frostig2014subconstant, author = {Roy Frostig and Sida I. Wang}, journal = {arXiv preprint arXiv:1408.2270}, title = {A sub-constant improvement in approximating the positive semidefinite {G}rothendieck problem}, year = {2014}, } @inproceedings{wager2014altitude, author = {Stefan Wager and Will Fithian and Sida I. Wang and Percy Liang}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Altitude Training: Strong Bounds for Single-Layer Dropout}, year = {2014}, } @inproceedings{frostig2014lowrank, author = {Roy Frostig and Sida I. 
Wang and Percy Liang and Chris Manning}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Simple {MAP} inference via low-rank relaxations}, year = {2014}, } @inproceedings{wang2014iqp, author = {Sida I. Wang and Roy Frostig and Percy Liang and Chris Manning}, booktitle = {International Conference on Learning Representations Workshop (ICLR)}, title = {Relaxations for inference in restricted {B}oltzmann machines}, year = {2014}, } @article{liang2013lambdadcs, author = {Percy Liang}, journal = {arXiv preprint arXiv:1309.4408}, title = {Lambda Dependency-Based Compositional Semantics}, year = {2013}, } @inproceedings{berant2013freebase, author = {Jonathan Berant and Andrew Chou and Roy Frostig and Percy Liang}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Semantic Parsing on {F}reebase from Question-Answer Pairs}, year = {2013}, } @inproceedings{wang2013noising, author = {Sida I. Wang and Mengqiu Wang and Stefan Wager and Percy Liang and Chris Manning}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Feature Noising for Log-linear Structured Prediction}, year = {2013}, } @inproceedings{wager2013dropout, author = {Stefan Wager and Sida I. 
Wang and Percy Liang}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Dropout Training as Adaptive Regularization}, year = {2013}, } @inproceedings{chaganty13regression, author = {Arun Chaganty and Percy Liang}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Spectral Experts for Estimating Mixtures of Linear Regressions}, year = {2013}, } @inproceedings{ramanathan2013event, author = {Vignesh Ramanathan and Percy Liang and Li Fei-Fei}, booktitle = {International Conference on Computer Vision (ICCV)}, title = {Video Event Understanding using Natural Language Descriptions}, year = {2013}, } @inproceedings{sharma13algebraic, author = {Rahul Sharma and Saurabh Gupta and Bharath Hariharan and Alex Aiken and Percy Liang and Aditya V. Nori}, booktitle = {European Symposium on Programming (ESOP)}, title = {A Data Driven Approach for Algebraic Loop Invariants}, year = {2013}, } @inproceedings{hsu12identifiability, author = {Daniel Hsu and Sham M. Kakade and Percy Liang}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Identifiability and Unmixing of Latent Parse Trees}, year = {2012}, } @article{liang13cl, author = {Percy Liang and Michael I. Jordan and Dan Klein}, journal = {Computational Linguistics}, pages = {389--446}, title = {Learning Dependency-Based Compositional Semantics}, volume = {39}, year = {2013}, } @phdthesis{liang11thesis, author = {Percy Liang}, school = {University of California at Berkeley}, title = {Learning Dependency-Based Compositional Semantics}, year = {2011}, } @inproceedings{liang11dcs, author = {Percy Liang and Michael I. 
Jordan and Dan Klein}, booktitle = {Association for Computational Linguistics (ACL)}, pages = {590--599}, title = {Learning Dependency-Based Compositional Semantics}, year = {2011}, } @inproceedings{liang11pruning, author = {Percy Liang and Mayur Naik}, booktitle = {Programming Language Design and Implementation (PLDI)}, title = {Scaling up Abstraction Refinement via Pruning}, year = {2011}, } @inproceedings{liang11minimal, author = {Percy Liang and Omer Tripp and Mayur Naik}, booktitle = {Principles of Programming Languages (POPL)}, title = {Learning Minimal Abstractions}, year = {2011}, } @inproceedings{golland2010pragmatics, author = {Dave Golland and Percy Liang and Dan Klein}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, pages = {410--419}, title = {A Game-theoretic Approach to Generating Spatial Descriptions}, year = {2010}, } @inproceedings{angeli10generation, author = {Gabor Angeli and Percy Liang and Dan Klein}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {A Simple Domain-Independent Probabilistic Approach to Generation}, year = {2010}, } @inproceedings{liang10abstraction, author = {Percy Liang and Omer Tripp and Mayur Naik and Mooly Sagiv}, booktitle = {Object-Oriented Programming, Systems, Languages, and Applications (OOPSLA)}, title = {A Dynamic Evaluation of Static Heap Abstractions}, year = {2010}, } @inproceedings{liang10programs, author = {Percy Liang and Michael I. Jordan and Dan Klein}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {639--646}, title = {Learning Programs: A Hierarchical {B}ayesian Approach}, year = {2010}, } @inproceedings{liang10regimes, author = {Percy Liang and Nati Srebro}, booktitle = {International Conference on Machine Learning (ICML)}, title = {On the Interaction between Norm and Dimensionality: Multiple Regimes in Learning}, year = {2010}, } @inproceedings{liang10type, author = {Percy Liang and Michael I. 
Jordan and Dan Klein}, booktitle = {North American Association for Computational Linguistics (NAACL)}, title = {Type-Based {MCMC}}, year = {2010}, } @article{liang10regularizationTR, author = {Percy Liang and Francis Bach and Guillaume Bouchard and Michael I. Jordan}, journal = {arXiv}, title = {Asymptotically Optimal Regularization in Smooth Parametric Models}, year = {2010}, } @inproceedings{liang09regularization, author = {Percy Liang and Francis Bach and Guillaume Bouchard and Michael I. Jordan}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Asymptotically Optimal Regularization in Smooth Parametric Models}, year = {2009}, } @incollection{liang09hdppcfg, author = {Percy Liang and Michael I. Jordan and Dan Klein}, booktitle = {The Oxford Handbook of Applied Bayesian Analysis}, title = {Probabilistic grammars and hierarchical {D}irichlet processes}, year = {2009}, } @inproceedings{liang09semantics, author = {Percy Liang and Michael I. Jordan and Dan Klein}, booktitle = {Association for Computational Linguistics and International Joint Conference on Natural Language Processing (ACL-IJCNLP)}, pages = {91--99}, title = {Learning Semantic Correspondences with Less Supervision}, year = {2009}, } @inproceedings{liang09measurements, author = {Percy Liang and Michael I. Jordan and Dan Klein}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Learning from Measurements in Exponential Families}, year = {2009}, } @inproceedings{liang09online, author = {Percy Liang and Dan Klein}, booktitle = {North American Association for Computational Linguistics (NAACL)}, pages = {611--619}, title = {Online {EM} for Unsupervised Models}, year = {2009}, } @inproceedings{liang08asymptotics, author = {Percy Liang and Michael I. 
Jordan}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {584--591}, title = {An Asymptotic Analysis of Generative, Discriminative, and Pseudolikelihood Estimators}, year = {2008}, } @inproceedings{liang08structure, author = {Percy Liang and Hal {Daum{\'e} III} and Dan Klein}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Structure Compilation: Trading Structure for Features}, year = {2008}, } @inproceedings{liang08errors, author = {Percy Liang and Dan Klein}, booktitle = {Human Language Technology and Association for Computational Linguistics (HLT/ACL)}, title = {Analyzing the Errors of Unsupervised Learning}, year = {2008}, } @inproceedings{haghighi08lexicon, author = {Aria Haghighi and Percy Liang and Taylor Berg-Kirkpatrick and Dan Klein}, booktitle = {Human Language Technology and Association for Computational Linguistics (HLT/ACL)}, title = {Learning Bilingual Lexicons from Monolingual Corpora}, year = {2008}, } @inproceedings{liang08agreement, author = {Percy Liang and Dan Klein and Michael I. Jordan}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Agreement-Based Learning}, year = {2008}, } @inproceedings{bouchard08language, author = {Alexandre Bouchard-C\^ot\'e and Percy Liang and Tom Griffiths and Dan Klein}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {A Probabilistic Approach to Language Change}, year = {2008}, } @inproceedings{liang07tutorial, author = {Percy Liang and Dan Klein}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Structured {B}ayesian Nonparametric Models with Variational Inference (tutorial)}, year = {2007}, } @inproceedings{liang07permdp, author = {Percy Liang and Michael I. 
Jordan and Ben Taskar}, booktitle = {International Conference on Machine Learning (ICML)}, title = {A permutation-augmented sampler for {D}irichlet process mixture models}, year = {2007}, } @inproceedings{liang07infpcfg, author = {Percy Liang and Slav Petrov and Michael I. Jordan and Dan Klein}, booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)}, title = {The Infinite {PCFG} using Hierarchical {D}irichlet Processes}, year = {2007}, } @inproceedings{bouchard07diachronic, author = {Alexandre Bouchard-C\^ot\'e and Percy Liang and Tom Griffiths and Dan Klein}, booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)}, title = {A Probabilistic Approach to Diachronic Phonology}, year = {2007}, } @inproceedings{liang06discrimative, author = {Percy Liang and Alexandre Bouchard-C\^ot\'e and Dan Klein and Ben Taskar}, booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)}, title = {An End-to-End Discriminative Approach to Machine Translation}, year = {2006}, } @inproceedings{liang06alignment, author = {Percy Liang and Ben Taskar and Dan Klein}, booktitle = {North American Association for Computational Linguistics (NAACL)}, pages = {104--111}, title = {Alignment by Agreement}, year = {2006}, } @mastersthesis{liang05meng, author = {Percy Liang}, school = {Massachusetts Institute of Technology}, title = {Semi-Supervised Learning for Natural Language}, year = {2005}, } @techreport{liang05hypercycle, author = {Percy Liang and Nathan Srebro}, institution = {Massachusetts Institute of Technology}, title = {A Data Structure for Maintaining Acyclicity in Hypergraphs}, year = {2005}, } @techreport{liang04markov, author = {Percy Liang and Nathan Srebro}, institution = {Massachusetts Institute of Technology}, title = {Methods and Experiments With Bounded Tree-width {M}arkov Networks}, 
year = {2004}, } @techreport{liang03maxwmfarm, author = {Percy Liang and Nathan Srebro}, institution = {Massachusetts Institute of Technology}, title = {How Much Of A Hypertree Can Be Captured By Windmills?}, year = {2003}, } @inproceedings{liang05mcmaster, author = {Percy Liang and Nathan Srebro}, booktitle = {Mathematical Programming for Data Mining and Machine Learning Workshop at McMaster University}, title = {Linear Programming in Bounded Tree-width {M}arkov Networks}, year = {2005}, } @inproceedings{liang05geometric, author = {Percy Liang and Mukund Narasimhan and Michael Shilman and Paul Viola}, booktitle = {International Conference on Document Analysis and Recognition (ICDAR)}, title = {Efficient Geometric Algorithms for Parsing in Two Dimensions}, year = {2005}, } @article{ferguson73dp, author = {T. S. Ferguson}, journal = {Annals of Statistics}, pages = {209--230}, title = {A {B}ayesian Analysis of Some Nonparametric Problems}, volume = {1}, year = {1973}, } @article{ferguson74prior, author = {T. S. Ferguson}, journal = {Annals of Statistics}, pages = {615--629}, title = {Prior distributions on spaces of probability measures}, volume = {2}, year = {1974}, } @article{blackwell73urn, author = {D. Blackwell and J. B. MacQueen}, journal = {Annals of Statistics}, pages = {353--355}, title = {{F}erguson Distributions via {P}\'olya Urn Schemes}, volume = {1}, year = {1973}, } @article{aldous85exch, author = {D. Aldous}, journal = {Springer Lecture Notes in Math}, pages = {1--198}, title = {Exchangeability and related topics}, volume = {1117}, year = {1985}, } @article{antoniak74dpmix, author = {C. E. Antoniak}, journal = {Annals of Statistics}, pages = {1152--1174}, title = {Mixtures of {D}irichlet Processes with Applications to {B}ayesian Nonparametric Problems}, volume = {2}, year = {1974}, } @article{sethuraman94stick, author = {J. 
Sethuraman}, journal = {Statistica Sinica}, pages = {639--650}, title = {A Constructive Definition of {D}irichlet Priors}, volume = {4}, year = {1994}, } @article{escobar95mixture, author = {M. D. Escobar and M. West}, journal = {Journal of the American Statistical Association (JASA)}, pages = {577--588}, title = {{B}ayesian Density Estimation and Inference Using Mixtures}, volume = {90}, year = {1995}, } @article{bergstra12hyper, author = {James Bergstra and Yoshua Bengio}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {281--305}, title = {Random Search for Hyper-Parameter Optimization}, volume = {13}, year = {2012}, } @inproceedings{snoek12hyper, author = {Jasper Snoek and Hugo Larochelle and Ryan P. Adams}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Practical {B}ayesian Optimization of Machine Learning Algorithms}, year = {2012}, } @techreport{west95hyper, author = {M. West}, institution = {Department of Statistics, Duke University (Duke University)}, title = {Hyperparameter estimation in {D}irichlet process mixture models}, year = {1995}, } @article{pitman97yor, author = {J. Pitman and M. Yor}, journal = {Annals of Probability}, pages = {855--900}, title = {The two-parameter {P}oisson-{D}irichlet distribution derived from a stable subordinator}, volume = {25}, year = {1997}, } @article{ishwaran02exact, author = {H. Ishwaran and M. Zarepour}, journal = {Canadian Journal of Statistics}, pages = {269--284}, title = {Exact and approximate sum-representations for the {D}irichlet process}, volume = {30}, year = {2002}, } @inproceedings{griffiths06ibp, author = {Tom Griffiths and Zoubin Ghahramani}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Infinite Latent Feature Models and the {I}ndian Buffet Process}, year = {2006}, } @inproceedings{thibaux07hbp, author = {Romain Thibaux and Michael I. 
Jordan}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, title = {Hierarchical {B}eta Processes and the {I}ndian Buffet Process}, year = {2007}, } @inproceedings{xing08haplotype, author = {Jurgen {Van Gael} and Yunus Saatci and Yee Whye Teh and Zoubin Ghahramani}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {1088--1095}, title = {Beam Sampling for the Infinite Hidden {M}arkov Model}, year = {2008}, } @inproceedings{xing04haplotype, author = {E. P. Xing and R. Sharan and M. I. Jordan}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {111--118}, title = {{B}ayesian Haplotype Inference via the {D}irichlet Process}, year = {2004}, } @article{teh06hdp, author = {Y. W. Teh and M. I. Jordan and M. Beal and D. Blei}, journal = {Journal of the American Statistical Association (JASA)}, pages = {1566--1581}, title = {Hierarchical {D}irichlet processes}, volume = {101}, year = {2006}, } @article{rodriguez08ndp, author = {Abel Rodriguez and David B. Dunson and Alan E. Gelfand}, journal = {Journal of the American Statistical Association (JASA)}, pages = {1131--1144}, title = {The nested {D}irichlet process}, volume = {103}, year = {2008}, } @inproceedings{beal02ihmm, author = {M. Beal and Z. Ghahramani and C. Rasmussen}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {577--584}, title = {The infinite hidden {M}arkov model}, year = {2002}, } @inproceedings{sohn07ihmm, author = {K. Sohn and E. P. Xing}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {A Hidden {M}arkov {D}irichlet Process Model for Genetic Recombination in Open Ancestral Space}, year = {2007}, } @inproceedings{teh06pitmanyor, author = {Y. W. 
Teh}, booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)}, pages = {985--992}, title = {A Hierarchical {B}ayesian Language Model Based On {P}itman-{Y}or Processes}, year = {2006}, } @inproceedings{goldwater06segmentation, author = {Sharon Goldwater and Tom Griffiths and Mark Johnson}, booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)}, title = {Contextual Dependencies in Unsupervised Word Segmentation}, year = {2006}, } @inproceedings{sudderth06transformed, author = {E. B. Sudderth and A. B. Torralba and W. T. Freeman and A. S. Willsky}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {1297--1304}, title = {Describing Visual Scenes using Transformed {D}irichlet Processes}, year = {2006}, } @article{daume05clustering, author = {Hal {Daum{\'e} III} and Daniel Marcu}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {1--48}, title = {A {B}ayesian Model for Supervised Clustering with the {D}irichlet Process Prior}, volume = {1}, year = {2005}, } @article{blei05variational, author = {D. Blei and M. I. Jordan}, journal = {Bayesian Analysis}, pages = {121--144}, title = {Variational Inference for {D}irichlet Process Mixtures}, volume = {1}, year = {2005}, } @inproceedings{teh07collapsed, author = {Y. W. Teh and D. Newman and M. Welling}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {1353--1360}, title = {A Collapsed Variational {B}ayesian Inference Algorithm for {L}atent {D}irichlet {A}llocation}, year = {2007}, } @inproceedings{kurihara07accelerated, author = {K. Kurihara and M. Welling and N. Vlassis}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Accelerated Variational {D}irichlet Mixture Models}, year = {2007}, } @inproceedings{kurihara07collapsed, author = {K. Kurihara and M. Welling and Y. W. 
Teh}, booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)}, title = {Collapsed Variational {D}irichlet Process Mixture Models}, year = {2007}, } @inproceedings{daume07astar, author = {Hal {Daum{\'e} III}}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, title = {Fast search for {D}irichlet process mixture models}, year = {2007}, } @inproceedings{heller05hierarchical, author = {K. A. Heller and Z. Ghahramani}, booktitle = {International Conference on Machine Learning (ICML)}, title = {{B}ayesian Hierarchical Clustering}, year = {2005}, } @article{ishwaran01gibbs, author = {H. Ishwaran and L. F. James}, journal = {Journal of the American Statistical Association (JASA)}, pages = {161--173}, title = {{G}ibbs Sampling Methods for Stick-Breaking Priors}, volume = {96}, year = {2001}, } @article{papaspiliopoulos08retro, author = {Omiros Papaspiliopoulos and Gareth O. Roberts}, journal = {Biometrika}, pages = {169--186}, title = {Retrospective {MCMC} for {D}irichlet process hierarchical models}, volume = {95}, year = {2008}, } @article{walker04slice, author = {Stephen G. Walker}, journal = {Communications in Statistics - Simulation and Computation}, pages = {45--54}, title = {Sampling the {D}irichlet Mixture Model with Slices}, volume = {36}, year = {2007}, } @techreport{dahl03splitmerge, author = {D. B. Dahl}, institution = {Department of Statistics, University of Wisconsin (U. Wisconsin)}, title = {An Improved Merge-Split Sampler for Conjugate {D}irichlet Process Mixture Models}, year = {2003}, } @techreport{dahl03univariate, author = {D. B. Dahl}, institution = {Department of Statistics, University of Wisconsin (U. Wisconsin)}, title = {Modal Clustering in a Univariate Class of Product Partition Models}, year = {2003}, } @techreport{neal00dp, author = {R. Neal}, institution = {Department of Statistics, University of Toronto (U. 
Toronto)}, title = {{M}arkov Chain Sampling Methods for {D}irichlet Process Mixture Models}, year = {2000}, } @techreport{jain00splitmerge, author = {S. Jain and R. Neal}, institution = {Department of Statistics, University of Toronto (U. Toronto)}, title = {A Split-Merge {M}arkov Chain {M}onte {C}arlo Procedure for the {D}irichlet Process Mixture Model}, year = {2000}, } @techreport{jain05splitmerge, author = {S. Jain and R. Neal}, institution = {Department of Statistics, University of Toronto (U. Toronto)}, title = {Splitting and merging components of a nonconjugate {D}irichlet process mixture model}, year = {2005}, } @article{blei03lda, author = {D. Blei and Andrew Ng and M. I. Jordan}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {993--1022}, title = {Latent {D}irichlet Allocation}, volume = {3}, year = {2003}, } @inproceedings{hamze04fields, author = {F. Hamze and N. de Freitas}, booktitle = {Uncertainty in Artificial Intelligence (UAI)}, title = {From Fields to Trees}, year = {2004}, } @inproceedings{welling06flexible, author = {M. Welling}, booktitle = {International Conference on Machine Learning Workshop on Nonparametric Bayesian Methods}, title = {Flexible Priors for Infinite Mixture Models}, year = {2006}, } @article{johnson84randproj, author = {W. Johnson and J. Lindenstrauss}, journal = {Contemporary Mathematics}, pages = {189--206}, title = {Extensions of {L}ipschitz maps into a {H}ilbert space}, volume = {26}, year = {1984}, } @inproceedings{dasgupta99mixgauss, author = {S. Dasgupta}, booktitle = {Foundations of Computer Science (FOCS)}, title = {Learning mixtures of {G}aussians}, year = {1999}, } @article{kannan97convex, author = {R. Kannan and L. Lov{\'a}sz and M. Simonovits}, journal = {Random Structures and Algorithms}, pages = {1--50}, title = {Random walks and an ${O}^*(n^5)$ volume algorithm for convex bodies}, volume = {11}, year = {1997}, } @inproceedings{friedman00bayesian, author = {N. Friedman and D. 
Koller}, booktitle = {Uncertainty in Artificial Intelligence (UAI)}, pages = {201--210}, title = {Being {B}ayesian about {B}ayesian Network Structure: A {B}ayesian Approach to Structure Discovery in {B}ayesian Networks}, year = {2000}, }

% The journal name is Physical Review Letters.
@article{swendsen87,
  author = {R. H. Swendsen and J. S. Wang},
  journal = {Physical Review Letters},
  pages = {86--88},
  title = {Nonuniversal critical dynamics in {MC} simulations},
  volume = {58},
  year = {1987},
}

@article{barbu05swendsen,
  author = {A. Barbu and S. C. Zhu},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)},
  pages = {1239--1253},
  title = {Generalizing {S}wendsen-{W}ang to sampling arbitrary posterior probabilities},
  volume = {27},
  year = {2005},
}

@article{tanner87da,
  author = {M. A. Tanner and W. H. Wong},
  journal = {Journal of the American Statistical Association (JASA)},
  pages = {528--540},
  title = {The calculation of posterior distributions by data augmentation},
  volume = {82},
  year = {1987},
}

@article{liu98pxem,
  author = {C. Liu and D. Rubin and Y. N. Wu},
  journal = {Biometrika},
  pages = {755--770},
  title = {Parameter expansion to accelerate {EM}: the {PX-EM} algorithm},
  volume = {85},
  year = {1998},
}

@article{liu99pxda,
  author = {J. Liu and Y. Wu},
  journal = {Journal of the American Statistical Association (JASA)},
  pages = {1264--1274},
  title = {Parameter expansion for data augmentation},
  volume = {94},
  year = {1999},
}

@techreport{pitman02process,
  author = {J. Pitman},
  institution = {Department of Statistics, University of California at Berkeley (UC Berkeley)},
  number = {621},
  title = {Combinatorial Stochastic Processes},
  year = {2002},
}

@book{bertsekas99nlp,
  author = {D. Bertsekas},
  publisher = {Athena Scientific},
  title = {Nonlinear Programming},
  year = {1999},
}

@book{tsybakov2009introduction, author = {Alexandre B.
Tsybakov}, publisher = {Springer}, title = {Introduction to Nonparametric Estimation}, year = {2009}, }

@techreport{mackay97hmm,
  author = {David MacKay},
  institution = {University of Cambridge},
  title = {Ensemble Learning for Hidden {M}arkov Models},
  year = {1997},
}

@techreport{bernholt2006robust,
  author = {Thorsten Bernholt},
  institution = {Universit\"{a}t Dortmund},
  title = {Robust estimators are hard to compute},
  year = {2006},
}

@techreport{wang2014qa,
  author = {Zhenghao Wang and Shengquan Yan and Huaming Wang and Xuedong Huang},
  institution = {Microsoft Research},
  title = {An Overview of Microsoft Deep {QA} System on Stanford WebQuestions Benchmark},
  year = {2014},
}

@inproceedings{hermjakob01parsing,
  author = {Ulf Hermjakob},
  booktitle = {Workshop on Open-domain question answering, ACL},
  pages = {1--6},
  title = {Parsing and Question Classification for Question Answering},
  year = {2001},
}

@article{gildea02semantic,
  author = {D. Gildea and D. Jurafsky},
  journal = {Computational Linguistics},
  pages = {245--288},
  title = {Automatic Labeling of Semantic Roles},
  volume = {28},
  year = {2002},
}

@inproceedings{galley04translation,
  author = {Michel Galley and Mark Hopkins and Kevin Knight and Daniel Marcu},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages = {273--280},
  title = {What's in a translation rule?},
  year = {2004},
}

@inproceedings{melamed04smt, author = {I.
Dan Melamed}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Statistical Machine Translation by Parsing}, year = {2004}, }

@article{chomsky56models,
  author = {Noam Chomsky},
  journal = {IRE Transactions on Information Theory},
  pages = {113--124},
  title = {Three models for the description of language},
  volume = {2},
  year = {1956},
}

% The umlaut is written as a braced LaTeX escape so the entry stays pure ASCII,
% matching the escaped accents used by other entries in this file.
@book{manning99nlp,
  author = {Chris Manning and Hinrich Sch{\"u}tze},
  publisher = {MIT Press},
  title = {Foundations of Statistical Natural Language Processing},
  year = {1999},
}

@article{marcus93treebank,
  author = {M. P. Marcus and M. A. Marcinkiewicz and B. Santorini},
  journal = {Computational Linguistics},
  pages = {313--330},
  title = {Building a large annotated corpus of {E}nglish: the {P}enn {T}reebank},
  volume = {19},
  year = {1993},
}

@inproceedings{charniak96treebank,
  author = {E. Charniak},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {1031--1036},
  title = {Tree-bank Grammars},
  year = {1996},
}

@inproceedings{kurihara04varpcfg,
  author = {K. Kurihara and T. Sato},
  booktitle = {International Joint Conference on Natural Language Processing Workshop Beyond Shallow Analyses},
  title = {An Application of the Variational {B}ayesian Approach to Probabilistic Context-Free Grammars},
  year = {2004},
}

@inproceedings{kurihara06varinduct,
  author = {K. Kurihara and T. Sato},
  booktitle = {International Colloquium on Grammatical Inference},
  title = {Variational {B}ayesian Grammar Induction for Natural Language},
  year = {2006},
}

@inproceedings{petrov06latent,
  author = {S. Petrov and L. Barrett and R. Thibaux and D. Klein},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  pages = {433--440},
  title = {Learning Accurate, Compact, and Interpretable Tree Annotation},
  year = {2006},
}

@inproceedings{stolcke94merge, author = {A. Stolcke and S.
Omohundro}, booktitle = {International Colloquium on Grammatical Inference and Applications}, pages = {106--118}, title = {Inducing Probabilistic Grammars by {B}ayesian Model Merging}, year = {1994}, }

@inproceedings{wolff88syntax,
  author = {J. G. Wolff},
  booktitle = {Categories and processes in language acquisition},
  pages = {179--215},
  title = {Learning syntax and meanings through optimization and distributional analysis},
  year = {1988},
}

@phdthesis{collins99thesis,
  author = {M. Collins},
  school = {University of Pennsylvania},
  title = {Head-Driven Statistical Models for Natural Language Parsing},
  year = {1999},
}

@inproceedings{eisner96dependency,
  author = {Jason Eisner},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages = {340--345},
  title = {Three New Probabilistic Models for Dependency Parsing: An Exploration},
  year = {1996},
}

@inproceedings{charniak00maxent,
  author = {E. Charniak},
  booktitle = {Applied Natural Language Processing and North American Association for Computational Linguistics (ANLP/NAACL)},
  pages = {132--139},
  title = {A maximum-entropy-inspired parser},
  year = {2000},
}

@inproceedings{klein03unlexicalized,
  author = {D. Klein and C. Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {423--430},
  title = {Accurate Unlexicalized Parsing},
  year = {2003},
}

@article{johnson98parent,
  author = {Mark Johnson},
  journal = {Computational Linguistics},
  pages = {613--632},
  title = {{PCFG} Models of Linguistic Tree Representations},
  volume = {24},
  year = {1998},
}

@inproceedings{matsuzaki05latent, author = {T. Matsuzaki and Y. Miyao and J.
Tsujii}, booktitle = {Association for Computational Linguistics (ACL)}, pages = {75--82}, title = {Probabilistic {CFG} with Latent Annotations}, year = {2005}, }

@inproceedings{johnson06adaptor,
  author = {Mark Johnson and Tom Griffiths and Sharon Goldwater},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {641--648},
  title = {Adaptor Grammars: A Framework for Specifying Compositional Nonparametric {B}ayesian Models},
  year = {2006},
}

@inproceedings{blei04nested,
  author = {D. Blei and T. Griffiths and M. I. Jordan and J. Tenenbaum},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Hierarchical topic models and the nested {C}hinese restaurant process},
  year = {2004},
}

@inproceedings{goldwater05interpolate,
  author = {Sharon Goldwater and Tom Griffiths and Mark Johnson},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Interpolating Between Types and Tokens by Estimating Power-Law Generators},
  year = {2005},
}

@inproceedings{johnson07mcmc,
  author = {Mark Johnson and Tom Griffiths and Sharon Goldwater},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages = {139--146},
  title = {{B}ayesian Inference for {PCFG}s via {M}arkov Chain {M}onte {C}arlo},
  year = {2007},
}

@inproceedings{haghighi07coref,
  author = {Aria Haghighi and Dan Klein},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Unsupervised Coreference Resolution in a Nonparametric {B}ayesian Model},
  year = {2007},
}

@inproceedings{daume06sum,
  author = {Hal {Daum{\'e} III} and Daniel Marcu},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  title = {{B}ayesian Query-Focused Summarization},
  year = {2006},
}

@inproceedings{finkel07inftree, author = {J. R. Finkel and T. Grenager and C.
Manning}, booktitle = {Association for Computational Linguistics (ACL)}, pages = {272--279}, title = {The Infinite Tree}, year = {2007}, }

@inproceedings{petrov07split,
  author = {S. Petrov and D. Klein},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages = {404--411},
  title = {Learning and Inference for Hierarchically Split {PCFG}s},
  year = {2007},
}

@inproceedings{mcclosky06self,
  author = {David McClosky and Eugene Charniak and Mark Johnson},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  title = {Reranking and Self-Training for Parser Adaptation},
  year = {2006},
}

@article{lari90scfg,
  author = {K. Lari and S. J. Young},
  journal = {Computer Speech and Language},
  pages = {35--56},
  title = {The estimation of stochastic context-free grammars using the inside-outside algorithm},
  volume = {4},
  year = {1990},
}

% The two-word surname is braced so BibTeX treats it as one unit. Unbraced, a
% capitalised "Della" is parsed as a given name and the surname becomes "Pietra".
@article{brown93mt,
  author = {Peter F. Brown and Stephen A. {Della Pietra} and Vincent J. {Della Pietra} and Robert L. Mercer},
  journal = {Computational Linguistics},
  pages = {263--311},
  title = {The Mathematics of Statistical Machine Translation: Parameter Estimation},
  volume = {19},
  year = {1993},
}

% NOTE(review): this looks like the same chapter as the neal98incremental entry
% elsewhere in this file (titles differ slightly); confirm before consolidating.
@inproceedings{neal98gem,
  author = {R. M. Neal and G. E. Hinton},
  booktitle = {Learning in Graphical Models},
  pages = {355--368},
  title = {A new view of the {EM} algorithm that justifies incremental, sparse and other variants},
  year = {1998},
}

@inproceedings{collins99unsupervised,
  author = {Michael Collins and Yoram Singer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Unsupervised Models for Named Entity Classification},
  year = {1999},
}

@inproceedings{chen96smoothing, author = {Stanley F.
Chen and Joshua Goodman}, booktitle = {Association for Computational Linguistics (ACL)}, title = {An Empirical Study of Smoothing Techniques for Language Modeling}, year = {1996}, }

@inproceedings{ney96hmm,
  author = {Hermann Ney and Stephan Vogel},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages = {836--841},
  title = {{HMM}-Based Word Alignment in Statistical Translation},
  year = {1996},
}

@inproceedings{blum98cotraining,
  author = {Avrim Blum and Tom Mitchell},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Combining Labeled and Unlabeled Data with Co-training},
  year = {1998},
}

@inproceedings{carroll92dependency,
  author = {Glenn Carroll and Eugene Charniak},
  booktitle = {Workshop Notes for Statistically-Based NLP Techniques, AAAI},
  pages = {1--13},
  title = {Two Experiments on Learning Probabilistic Dependency Grammars from Corpora},
  year = {1992},
}

@inproceedings{haghighi06induction,
  author = {Aria Haghighi and Dan Klein},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  title = {Prototype-based Grammar Induction},
  year = {2006},
}

% The second author's surname is spelled Schabes.
@inproceedings{pereira92bracket,
  author = {Fernando Pereira and Yves Schabes},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {128--135},
  title = {Inside-outside reestimation from partially bracketed corpora},
  year = {1992},
}

@article{merialdo94tagging,
  author = {Bernard Merialdo},
  journal = {Computational Linguistics},
  pages = {155--171},
  title = {Tagging {E}nglish text with a probabilistic model},
  volume = {20},
  year = {1994},
}

@inproceedings{clark01induction,
  author = {Alexander Clark},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  title = {Unsupervised induction of stochastic context free grammars with distributional clustering},
  year = {2001},
}

@inproceedings{paskin02bigrams, author = {Mark A.
Paskin}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Grammatical Bigrams}, year = {2002}, }

@inproceedings{klein04induction,
  author = {Dan Klein and Christopher D. Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {478--485},
  title = {Corpus-Based Induction of Syntactic Structure: Models of Dependency and Constituency},
  year = {2004},
}

@inproceedings{smith05contrastive,
  author = {Noah Smith and Jason Eisner},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {354--362},
  title = {Contrastive Estimation: Training Log-Linear Models on Unlabeled Data},
  year = {2005},
}

@inproceedings{smith06anneal,
  author = {Noah Smith and Jason Eisner},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  title = {Annealing Structural Bias in Multilingual Weighted Grammar Induction},
  year = {2006},
}

@inproceedings{goldwater07pos, author = {S. Goldwater and T.
Griffiths}, booktitle = {Association for Computational Linguistics (ACL)}, title = {A Fully {B}ayesian Approach to Unsupervised Part-of-Speech Tagging}, year = {2007}, }

@inproceedings{johnson08synergy,
  author = {Mark Johnson},
  booktitle = {Human Language Technology and Association for Computational Linguistics (HLT/ACL)},
  pages = {398--406},
  title = {Using Adaptor Grammars to Identify Synergies in the Unsupervised Acquisition of Linguistic Structure},
  year = {2008},
}

@inproceedings{johnson07pos,
  author = {Mark Johnson},
  booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)},
  title = {Why doesn't {EM} find good {HMM} {POS}-taggers?},
  year = {2007},
}

@article{goldwater09segmentation,
  author = {Sharon Goldwater and Tom Griffiths and Mark Johnson},
  journal = {Cognition},
  pages = {21--54},
  title = {A {B}ayesian Framework for Word Segmentation: Exploring the Effects of Context},
  volume = {112},
  year = {2009},
}

% NOTE(review): the spelling "nonparameteric" is kept as-is; it may match the
% published title, so confirm against the proceedings before correcting it.
@inproceedings{johnson09segmentation,
  author = {Mark Johnson and Sharon Goldwater},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {317--325},
  title = {Improving nonparameteric {B}ayesian inference: experiments on unsupervised word segmentation with adaptor grammars},
  year = {2009},
}

@inproceedings{cohn09ptsg,
  author = {Trevor Cohn and Sharon Goldwater and Phil Blunsom},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {548--556},
  title = {Inducing Compact but Accurate Tree-Substitution Grammars},
  year = {2009},
}

@inproceedings{post09ptsg,
  author = {Matt Post and Daniel Gildea},
  booktitle = {Association for Computational Linguistics and International Joint Conference on Natural Language Processing (ACL-IJCNLP)},
  title = {{B}ayesian learning of a tree substitution grammar},
  year = {2009},
}

@inproceedings{gao08comparison, author = {Jianfeng Gao and Mark Johnson}, booktitle = {Empirical Methods in Natural Language
Processing (EMNLP)}, pages = {344--352}, title = {A comparison of {B}ayesian estimators for unsupervised Hidden {M}arkov Model {POS} taggers}, year = {2008}, }

@inproceedings{grenager05segmentation,
  author = {Trond Grenager and Dan Klein and Christopher D. Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {371--378},
  title = {Unsupervised learning of field segmentation models for information extraction},
  year = {2005},
}

@article{dasgupta07em,
  author = {Sanjoy Dasgupta and Leonard Schulman},
  journal = {Journal of Machine Learning Research (JMLR)},
  title = {A Probabilistic Analysis of {EM} for Mixtures of Separated, Spherical {G}aussians},
  volume = {8},
  year = {2007},
}

@article{ron98pfa,
  author = {Dana Ron and Yoram Singer and Naftali Tishby},
  journal = {Journal of Computer and System Sciences},
  pages = {133--152},
  title = {On the Learnability and Usage of Acyclic Probabilistic Finite Automata},
  volume = {56},
  year = {1998},
}

@inproceedings{srebro06mixture,
  author = {Nathan Srebro and Gregory Shakhnarovich and Sam Roweis},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {865--872},
  title = {An investigation of computational and informational limits in {G}aussian mixture clustering},
  year = {2006},
}

@inproceedings{feldman05product, author = {Jon Feldman and Ryan O'Donnell and Rocco A.
Servedio}, booktitle = {Foundations of Computer Science (FOCS)}, pages = {501--510}, title = {Learning mixtures of product distributions over discrete domains}, year = {2005}, }

@article{clark05fsa,
  author = {Alexander Clark and Franck Thollard},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {473--497},
  title = {{PAC}-learnability of Probabilistic Deterministic Finite State Automata},
  volume = {5},
  year = {2005},
}

@article{blackwell57identifiable,
  author = {David Blackwell and Lambert Koopmans},
  journal = {Annals of Mathematical Statistics},
  pages = {1011--1015},
  title = {On the Identifiability Problem for Functions of Finite {M}arkov Chains},
  volume = {28},
  year = {1957},
}

@techreport{adriaans99shallow,
  author = {Pieter W. Adriaans},
  institution = {Stanford University},
  title = {Learning Shallow Context-Free Languages under Simple Distributions},
  year = {1999},
}

% The journal name is Naval Research Logistics Quarterly.
@article{kuhn55hungarian,
  author = {H. W. Kuhn},
  journal = {Naval Research Logistics Quarterly},
  pages = {83--97},
  title = {The {H}ungarian method for the assignment problem},
  volume = {2},
  year = {1955},
}

@phdthesis{ratnaparkhi98thesis,
  author = {Adwait Ratnaparkhi},
  school = {University of Pennsylvania},
  title = {Maximum entropy models for natural language ambiguity resolution},
  year = {1998},
}

@inproceedings{mccallum00memm,
  author = {Andrew McCallum and Dayne Freitag and Fernando Pereira},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Maximum Entropy {M}arkov Models for Information Extraction and Segmentation},
  year = {2000},
}

@inproceedings{lafferty01crf,
  author = {John Lafferty and Andrew McCallum and Fernando Pereira},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {282--289},
  title = {Conditional Random Fields: Probabilistic Models for Segmenting and Labeling Data},
  year = {2001},
}

@inproceedings{kakade02objective, author = {Sham Kakade and Yee Whye Teh and Sam Roweis}, booktitle = {International Conference on Machine
Learning (ICML)}, title = {An Alternate Objective Function for {M}arkovian Fields}, year = {2002}, }

@inproceedings{klein02conditional,
  author = {Dan Klein and Christopher D. Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Conditional structure versus conditional estimation in {NLP} models},
  year = {2002},
}

@inproceedings{ng02compare,
  author = {Andrew Y. Ng and Michael I. Jordan},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {On Discriminative vs. Generative classifiers: A comparison of logistic regression and naive {B}ayes},
  year = {2002},
}

@article{white82mis,
  author = {Halbert White},
  journal = {Econometrica},
  title = {Maximum likelihood estimation of misspecified models},
  volume = {50},
  year = {1982},
}

@article{godambe87quasi,
  author = {V. P. Godambe and C. C. Heyde},
  journal = {International Statistical Review},
  pages = {231--244},
  title = {Quasi-likelihood and Optimal estimation},
  volume = {55},
  year = {1987},
}

% The last author's given name is spelled Xuerui.
@inproceedings{pal06mcl,
  author = {Andrew McCallum and Chris Pal and Greg Druck and Xuerui Wang},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Multi-Conditional Learning: Generative/Discriminative Training for Clustering and Classification},
  year = {2006},
}

@inproceedings{lasserre06hybrid,
  author = {Julia A. Lasserre and Christopher M. Bishop and Thomas P. Minka},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {87--94},
  title = {Principled Hybrids of Generative and Discriminative Models},
  year = {2006},
}

@inproceedings{raina04hybrid, author = {R. Raina and Y. Shen and A. Ng and A.
McCallum}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Classification with hybrid generative/discriminative models}, year = {2004}, }

@inproceedings{suzuki07hybrid,
  author = {Jun Suzuki and Akinori Fujino and Hideki Isozaki},
  booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)},
  title = {Semi-Supervised Structured Output Learning based on a Hybrid Generative and Discriminative Approach},
  year = {2007},
}

@inproceedings{bouchard04tradeoff,
  author = {Guillaume Bouchard and Bill Triggs},
  booktitle = {International Conference on Computational Statistics},
  pages = {721--728},
  title = {The Trade-Off Between Generative and Discriminative Classifiers},
  year = {2004},
}

@book{vaart98asymptotic,
  author = {A. W. van der Vaart},
  publisher = {Cambridge University Press},
  title = {Asymptotic statistics},
  year = {1998},
}

% The published title of this paper begins with "Statistical analysis".
@article{besag75pseudo,
  author = {J. Besag},
  journal = {The Statistician},
  pages = {179--195},
  title = {Statistical analysis of non-lattice data},
  volume = {24},
  year = {1975},
}

@article{lindsay88composite,
  author = {B. Lindsay},
  journal = {Contemporary Mathematics},
  pages = {221--239},
  title = {Composite likelihood methods},
  volume = {80},
  year = {1988},
}

@inproceedings{sutton05piecewise,
  author = {Charles Sutton and Andrew McCallum},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  title = {Piecewise Training of Undirected Models},
  year = {2005},
}

@inproceedings{sutton07pwpl,
  author = {Charles Sutton and Andrew McCallum},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Piecewise Pseudolikelihood for Efficient {CRF} Training},
  year = {2007},
}

@article{cox04pseudo, author = {David R.
Cox and Nancy Reid}, journal = {Biometrika}, pages = {729--737}, title = {A note on pseudolikelihood constructed from marginal densities}, volume = {91}, year = {2004}, }

@article{varin08composite,
  author = {Cristiano Varin},
  journal = {Advances in Statistical Analysis},
  pages = {1--28},
  title = {On composite marginal likelihoods},
  volume = {92},
  year = {2008},
}

@article{wainwright06wrong,
  author = {Martin Wainwright},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {1829--1859},
  title = {Estimating the ``wrong'' graphical model: Benefits in the computation-limited setting},
  volume = {7},
  year = {2006},
}

@inproceedings{wainwright03trw,
  author = {Martin Wainwright and Tommi Jaakkola and Alan Willsky},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  title = {Tree-reweighted belief propagation algorithms and approximate {ML} estimation by pseudo-moment matching},
  year = {2003},
}

@article{hyvarinen06pseudolikelihood,
  author = {Aapo Hyv\"arinen},
  journal = {Neural Computation},
  pages = {2283--2292},
  title = {Consistency of pseudolikelihood estimation of fully visible {B}oltzmann machines},
  volume = {18},
  year = {2006},
}

% The author's given name is spelled Geoffrey.
@inproceedings{hinton99poe,
  author = {Geoffrey Hinton},
  booktitle = {International Conference on Artificial Neural Networks (ICANN)},
  title = {Products of Experts},
  year = {1999},
}

@book{robert04mc,
  author = {Christian P. Robert and George Casella},
  publisher = {Springer},
  title = {{M}onte {C}arlo Statistical Methods},
  year = {2004},
}

@article{wainwright08varinf, author = {Martin Wainwright and Michael I.
Jordan}, journal = {Foundations and Trends in Machine Learning}, pages = {1--307}, title = {Graphical models, exponential families, and variational inference}, volume = {1}, year = {2008}, }

@article{siepel04phylohmm,
  author = {Adam Siepel and David Haussler},
  journal = {Journal of Computational Biology},
  pages = {413--428},
  title = {Combining phylogenetic and hidden {M}arkov models in biosequence analysis},
  volume = {11},
  year = {2004},
}

@article{felsenstein96phylohmm,
  author = {J. Felsenstein and G. A. Churchill},
  journal = {Molecular Biology and Evolution},
  pages = {93--104},
  title = {A hidden {M}arkov model approach to variation among sites in rate of evolution},
  volume = {13},
  year = {1996},
}

@article{jojic04phylohmm,
  author = {V. Jojic and N. Jojic and C. Meek and D. Geiger and A. Siepel and D. Haussler and D. Heckerman},
  journal = {Bioinformatics},
  pages = {161--168},
  title = {Efficient approximations for learning phylogenetic {HMM} models from data},
  volume = {20},
  year = {2004},
}

@inproceedings{geiger05structured,
  author = {Dan Geiger and Christopher Meek},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  title = {Structured Variational Inference Procedures and their Realizations},
  year = {2005},
}

% The system name is braced so sentence-casing styles keep its internal capital.
@inproceedings{shotton06textonboost,
  author = {J. Shotton and J. Winn and C. Rother and A. Criminisi},
  booktitle = {European Conference on Computer Vision (ECCV)},
  title = {{TextonBoost}: Joint Appearance, Shape and Context Modeling for Multi-Class Object Recognition and Segmentation},
  year = {2006},
}

@article{zhu06grammar, author = {S. C. Zhu and D.
Mumford}, journal = {Foundations and Trends in Computer Graphics and Vision}, pages = {259--362}, title = {A Stochastic Grammar of Images}, volume = {2}, year = {2006}, }

@article{sakakibara05grammar,
  author = {Yasubumi Sakakibara},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)},
  pages = {1051--1062},
  title = {Grammatical Inference in Bioinformatics},
  volume = {27},
  year = {2005},
}

@inproceedings{denero08phrase,
  author = {John DeNero and Alexandre Bouchard-C\^ot\'e and Dan Klein},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {314--323},
  title = {Sampling Alignment Structure under a {B}ayesian Translation Model},
  year = {2008},
}

@inproceedings{wallach08dependency,
  author = {Hanna Wallach and Charles Sutton and Andrew McCallum},
  booktitle = {Workshop on Prior Knowledge for Text and Language},
  pages = {15--20},
  title = {{B}ayesian Modeling of Dependency Trees Using Hierarchical {P}itman-{Y}or Priors},
  year = {2008},
}

@inproceedings{blunsom09synchronous,
  author = {Phil Blunsom and Trevor Cohn and Miles Osborne},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{B}ayesian Synchronous Grammar Induction},
  year = {2009},
}

@article{wu97itg,
  author = {Dekai Wu},
  journal = {Computational Linguistics},
  pages = {377--404},
  title = {Stochastic inversion transduction grammars and bilingual parsing of parallel corpora},
  volume = {23},
  year = {1997},
}

@article{dyrka07pcfg,
  author = {Witold Dyrka and Jean-Christophe Nebel},
  journal = {Systems Biology, Bioinformatics and Synthetic Biology},
  pages = {78--79},
  title = {A probabilistic context-free grammar for the detection of binding sites from a protein sequence},
  volume = {1},
  year = {2007},
}

@inproceedings{saxena07scene, author = {Ashutosh Saxena and Min Sun and Andrew Y.
Ng}, booktitle = {International Conference on Computer Vision (ICCV)}, title = {Learning 3-{D} Scene Structure from a Single Still Image}, year = {2007}, }

@inproceedings{delage06dbn,
  author = {Erick Delage and Honglak Lee and Andrew Y. Ng},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {A dynamic {B}ayesian network model for autonomous 3d reconstruction},
  year = {2006},
}

% The last author's surname is spelled Hebert.
@inproceedings{hoiem05geometric,
  author = {Derek Hoiem and Alexei A. Efros and Martial Hebert},
  booktitle = {International Conference on Computer Vision (ICCV)},
  title = {Geometric Context from a Single Image},
  year = {2005},
}

% The last author's surname is spelled Hebert.
@inproceedings{hoiem07occlusion,
  author = {Derek Hoiem and Andrew N. Stein and Alexei A. Efros and Martial Hebert},
  booktitle = {International Conference on Computer Vision (ICCV)},
  title = {Recovering Occlusion Boundaries from a Single Image},
  year = {2007},
}

@inproceedings{leung96repeat,
  author = {Thomas Leung and Jitendra Malik},
  booktitle = {European Conference on Computer Vision (ECCV)},
  title = {Detecting, Localizing and Grouping Repeated Scene Elements from an Image},
  year = {1996},
}

@inproceedings{ren06figure, author = {Xiaofeng Ren and Charless C.
Fowlkes and Jitendra Malik}, booktitle = {European Conference on Computer Vision (ECCV)}, title = {Figure/Ground Assignment in Natural Images}, year = {2006}, }

@book{pollard84convergence,
  author = {David Pollard},
  publisher = {Springer-Verlag},
  title = {Convergence of Stochastic Processes},
  year = {1984},
}

@article{zhang02covering,
  author = {Tong Zhang},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {527--550},
  title = {Covering number bounds of certain regularized linear function classes},
  volume = {2},
  year = {2002},
}

@inproceedings{collins01theory,
  author = {Michael Collins},
  booktitle = {International Workshop on Parsing Technologies},
  title = {Parameter Estimation for Statistical Parsing Models: Theory and Practice of Distribution-Free Methods},
  year = {2001},
}

@article{csiszar04info,
  author = {Imre Csisz\'ar and Paul Shields},
  journal = {Foundations and Trends in Communications and Information Theory},
  pages = {417--528},
  title = {Information Theory and Statistics: A Tutorial},
  volume = {1},
  year = {2004},
}

@inproceedings{bartlett01rademacher, author = {P. L. Bartlett and S.
Mendelson}, booktitle = {Conference on Learning Theory (COLT)}, pages = {224--240}, title = {{R}ademacher and {G}aussian complexities: Risk bounds and structural results}, year = {2001}, }

@book{shawetaylor04kernel,
  author = {John Shawe-Taylor and Nello Cristianini},
  publisher = {Cambridge University Press},
  title = {Kernel Methods for Pattern Analysis},
  year = {2004},
}

% The first author's surname is spelled Crammer. The citation key keeps its
% original spelling so that existing citations continue to resolve.
@inproceedings{crammar07multiple,
  author = {Koby Crammer and Michael Kearns and Jennifer Wortman},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Learning from Multiple Sources},
  year = {2007},
}

@inproceedings{punyakanok05constrained,
  author = {Vasin Punyakanok and Dan Roth and Wen-tau Yih and Dav Zimak},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {Learning and Inference over Constrained Output},
  year = {2005},
}

@inproceedings{bucila06compress,
  author = {Cristian Bucil\u{a} and Rich Caruana and Alexandru Niculescu-Mizil},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  title = {Model Compression},
  year = {2006},
}

@phdthesis{craven96trepan,
  author = {Mark W. Craven},
  school = {University of Wisconsin at Madison},
  title = {Extracting comprehensible models from trained neural networks},
  year = {1996},
}

@book{krishnamurthi06pl,
  author = {Shriram Krishnamurthi},
  publisher = {Creative Commons},
  title = {Programming Languages: Application and Interpretation},
  year = {2006},
}

@article{wand87simple,
  author = {Mitchell Wand},
  journal = {Fundamenta Informaticae},
  pages = {115--122},
  title = {A Simple Algorithm and Proof for Type Inference},
  volume = {10},
  year = {1987},
}

@inproceedings{kothari08polylet, author = {Sunil Kothari and James L.
Caldwell}, booktitle = {Fourth Conference on Computability}, title = {On Extending {W}and's Type Reconstruction Algorithm to Handle Polymorphic Let}, year = {2008}, }

@techreport{kothari07survey,
  author = {Sunil Kothari},
  institution = {University of Wyoming},
  title = {Type Reconstruction Algorithms - A Survey},
  year = {2007},
}

% The cedilla is written as a braced LaTeX escape so the entry stays pure ASCII,
% matching the escaped accents used by other entries in this file.
@techreport{pottier05modern,
  author = {Fran{\c{c}}ois Pottier},
  institution = {INRIA},
  title = {A Modern Eye on {ML} Type Inference: Old Techniques and Recent Developments},
  year = {2005},
}

@article{collins08exponentiated,
  author = {M. Collins and Amir Globerson and Terry Koo and Xavier Carreras and Peter Bartlett},
  journal = {Journal of Machine Learning Research (JMLR)},
  title = {Exponentiated Gradient Algorithms for Conditional Random Fields and Max-Margin {M}arkov Networks},
  volume = {9},
  year = {2008},
}

@inproceedings{finkel08crf,
  author = {J. R. Finkel and A. Kleeman and C. Manning},
  booktitle = {Human Language Technology and Association for Computational Linguistics (HLT/ACL)},
  title = {Efficient, Feature-based, Conditional Random Field Parsing},
  year = {2008},
}

@inproceedings{neal98incremental, author = {R. Neal and G.
Hinton},
  booktitle = {Learning in Graphical Models},
  title     = {A view of the {EM} algorithm that justifies incremental, sparse, and other variants},
  year      = {1998},
}

% Journal name corrected to "Royal Statistical Society"; the accent in the
% author's surname sits in its own brace group so BibTeX handles it as a
% single special character.
@article{cappe09online,
  author  = {Olivier Capp{\'e} and Eric Moulines},
  journal = {Journal of the Royal Statistical Society: Series B (Statistical Methodology)},
  pages   = {593--613},
  title   = {Online Expectation-Maximization Algorithm for Latent Data Models},
  volume  = {71},
  year    = {2009},
}

@inproceedings{collins02perceptron,
  author    = {Michael Collins},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title     = {Discriminative Training Methods for Hidden {M}arkov Models: Theory and Experiments with {P}erceptron Algorithms},
  year      = {2002},
}

@article{och03systematic,
  author  = {Franz Josef Och and Hermann Ney},
  journal = {Computational Linguistics},
  pages   = {19--51},
  title   = {A Systematic Comparison of Various Statistical Alignment Models},
  volume  = {29},
  year    = {2003},
}

@article{sato00online,
  author  = {Masa-aki Sato and Shin Ishii},
  journal = {Neural Computation},
  pages   = {407--432},
  title   = {On-line {EM} Algorithm for the Normalized {G}aussian Network},
  volume  = {12},
  year    = {2000},
}

@inproceedings{mcdonald05online,
  author    = {Ryan McDonald and Koby Crammer and Fernando Pereira},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {91--98},
  title     = {Online Large-Margin Training of Dependency Parsers},
  year      = {2005},
}

@inproceedings{bottou08large,
  author    = {Léon Bottou and Olivier Bousquet},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {The Tradeoffs of Large Scale Learning},
  year      = {2008},
}

@inproceedings{shalev08inverse,
  author    = {Shai Shalev-Shwartz and Nathan Srebro},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {{SVM} Optimization: Inverse Dependence on Training Set Size},
  year      = {2008},
}

@inproceedings{seginer07fast,
  author    = {Yoav Seginer},
  booktitle = {Association for Computational
Linguistics (ACL)},
  title     = {Fast Unsupervised Incremental Parsing},
  year      = {2007},
}

@inproceedings{yarowsky95unsupervised,
  author    = {David Yarowsky},
  booktitle = {Association for Computational Linguistics (ACL)},
  title     = {Unsupervised word sense disambiguation rivaling supervised methods},
  year      = {1995},
}

@inproceedings{salakhutdinov03ecg,
  author    = {Ruslan Salakhutdinov and Sam Roweis and Zoubin Ghahramani},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Optimization with {EM} and expectation-conjugate-gradient},
  year      = {2003},
}

@inproceedings{gildea99topic,
  author    = {Dan Gildea and Thomas Hofmann},
  booktitle = {Eurospeech},
  title     = {Topic-based language models using {EM}},
  year      = {1999},
}

@inproceedings{kuo08transliterations,
  author    = {Jin-Shea Kuo and Haizhou Li and Chih-Lung Lin},
  booktitle = {Sixth SIGHAN Workshop on Chinese Language Processing},
  title     = {Mining Transliterations from Web Query Results: An Incremental Approach},
  year      = {2008},
}

@article{venkataraman01word,
  author  = {A. Venkataraman},
  journal = {Computational Linguistics},
  pages   = {351--372},
  title   = {A statistical model for word discovery in transcribed speech},
  volume  = {27},
  year    = {2001},
}

@inproceedings{quadrianto08labels,
  author    = {Novi Quadrianto and Alex J. Smola and Tiberio S. Caetano and Quoc V.
Le},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {776--783},
  title     = {Estimating labels from label proportions},
  year      = {2008},
}

@inproceedings{ganchev08multi,
  author    = {Kuzman Ganchev and João Graça and John Blitzer and Ben Taskar},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  title     = {Multi-View Learning over Structured and Non-Identical Outputs},
  year      = {2008},
}

@inproceedings{graca08em,
  author    = {João Graça and Kuzman Ganchev and Ben Taskar},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {569--576},
  title     = {Expectation Maximization and Posterior Constraints},
  year      = {2008},
}

% Venue spelling corrected: "Retrieval".
@inproceedings{druck08ge,
  author    = {Gregory Druck and Gideon Mann and Andrew McCallum},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  pages     = {595--602},
  title     = {Learning from Labeled Features using Generalized Expectation Criteria},
  year      = {2008},
}

@inproceedings{mann07expectation,
  author    = {Gideon Mann and Andrew McCallum},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {593--600},
  title     = {Simple, Robust, Scalable Semi-supervised Learning via Expectation Regularization},
  year      = {2007},
}

@inproceedings{mann08ge,
  author    = {Gideon Mann and Andrew McCallum},
  booktitle = {Human Language Technology and Association for Computational Linguistics (HLT/ACL)},
  pages     = {870--878},
  title     = {Generalized Expectation Criteria for Semi-Supervised Learning of Conditional Random Fields},
  year      = {2008},
}

@inproceedings{chang07constraint,
  author    = {Ming-Wei Chang and Lev Ratinov and Dan Roth},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {280--287},
  title     = {Guiding Semi-Supervision with Constraint-Driven Learning},
  year      = {2007},
}

@inproceedings{haghighi06prototype,
  author    = {Aria Haghighi and Dan Klein},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages     = {320--327},
  title     = {Prototype-Driven
Learning for Sequence Models},
  year      = {2006},
}

@inproceedings{zaidan08annotator,
  author    = {Omar F. Zaidan and Jason Eisner},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title     = {Modeling Annotators: A Generative Approach to Learning from Annotator Rationales},
  year      = {2008},
}

% The quoted phrase uses TeX opening and closing quotes; straight double quotes
% typeset as two closing quotes and can clash with babel shorthands.
@inproceedings{zaidan07annotator,
  author    = {Omar F. Zaidan and Jason Eisner and Christine D. Piatko},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  title     = {Using ``Annotator Rationales'' to Improve Machine Learning for Text Categorization},
  year      = {2007},
}

@inproceedings{moore04improving,
  author    = {Robert C. Moore},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {518--525},
  title     = {Improving {IBM} Word Alignment Model 1},
  year      = {2004},
}

@inproceedings{daume04alignment,
  author    = {Hal {Daum{\'e} III} and Daniel Marcu},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title     = {Phrase-Based {HMM} Approach to Document/Abstract Alignment},
  year      = {2004},
}

@inproceedings{barzilay05content,
  author    = {Regina Barzilay and Mirella Lapata},
  booktitle = {Human Language Technology and Empirical Methods in Natural Language Processing (HLT/EMNLP)},
  pages     = {331--338},
  title     = {Collective Content Selection for Concept-To-Text Generation},
  year      = {2005},
}

@inproceedings{snyder07database,
  author    = {Benjamin Snyder and Regina Barzilay},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  pages     = {1713--1718},
  title     = {Database-Text Alignment via Structured Multilabel Classification},
  year      = {2007},
}

@inproceedings{zettlemoyer05ccg,
  author    = {Luke S.
Zettlemoyer and Michael Collins},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  pages     = {658--666},
  title     = {Learning to Map Sentences to Logical Form: Structured Classification with Probabilistic Categorial Grammars},
  year      = {2005},
}

@inproceedings{zettlemoyer07relaxed,
  author    = {Luke S. Zettlemoyer and Michael Collins},
  booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)},
  pages     = {678--687},
  title     = {Online Learning of Relaxed {CCG} Grammars for Parsing to Logical Form},
  year      = {2007},
}

@inproceedings{lu08generative,
  author    = {Wei Lu and Hwee Tou Ng and Wee Sun Lee and Luke S. Zettlemoyer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages     = {783--792},
  title     = {A Generative Model for Parsing Natural Language to Meaning Representations},
  year      = {2008},
}

@inproceedings{ge05scissor,
  author    = {Ruifang Ge and Raymond J. Mooney},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  pages     = {9--16},
  title     = {A Statistical Semantic Parser that Integrates Syntax and Semantics},
  year      = {2005},
}

@inproceedings{kate06krisp,
  author    = {Rohit J. Kate and Raymond J. Mooney},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  pages     = {913--920},
  title     = {Using String-Kernels for Learning Semantic Parsers},
  year      = {2006},
}

@inproceedings{kate07krisper,
  author    = {Rohit J. Kate and Raymond J. Mooney},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages     = {895--900},
  title     = {Learning Language Semantics from Ambiguous Supervision},
  year      = {2007},
}

@inproceedings{wong06mt,
  author    = {Yuk Wah Wong and Raymond J.
Mooney},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages     = {439--446},
  title     = {Learning for semantic parsing with statistical machine translation},
  year      = {2006},
}

@inproceedings{wong07synchronous,
  author    = {Yuk Wah Wong and Raymond J. Mooney},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {960--967},
  title     = {Learning Synchronous Grammars for Semantic Parsing with Lambda Calculus},
  year      = {2007},
}

@inproceedings{wong07generation,
  author    = {Yuk Wah Wong and Raymond J. Mooney},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages     = {172--179},
  title     = {Generation by Inverting a Semantic Parser That Uses Statistical Machine Translation},
  year      = {2007},
}

@inproceedings{chen08sportscast,
  author    = {David L. Chen and Raymond J. Mooney},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {128--135},
  title     = {Learning to Sportscast: A Test of Grounded Language Acquisition},
  year      = {2008},
}

@article{feldman04embodied,
  author  = {J. Feldman and S. Narayanan},
  journal = {Brain and Language},
  pages   = {385--392},
  title   = {Embodied Meaning in a Neural Theory of Language},
  volume  = {89},
  year    = {2004},
}

% Initials are separated by spaces so BibTeX sees three given-name tokens
% rather than one glued token.
@inproceedings{branavan08annotation,
  author    = {S. R. K.
Branavan and Harr Chen and Jacob Eisenstein and Regina Barzilay},
  booktitle = {Association for Computational Linguistics (ACL)},
  title     = {Learning Document-Level Semantic Properties from Free-text Annotations},
  year      = {2008},
}

@article{barzilay08coherence,
  author  = {Regina Barzilay and Mirella Lapata},
  journal = {Computational Linguistics},
  pages   = {1--34},
  title   = {Modeling Local Coherence: An Entity-based Approach},
  volume  = {34},
  year    = {2008},
}

@inproceedings{eisenstein08topic,
  author    = {Jacob Eisenstein and Regina Barzilay},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages     = {334--343},
  title     = {{B}ayesian Unsupervised Topic Segmentation},
  year      = {2008},
}

@inproceedings{barzilay06aggregation,
  author    = {Regina Barzilay and Mirella Lapata},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title     = {Aggregation via Set Partitioning for Natural Language Generation},
  year      = {2006},
}

@inproceedings{barzilay04content,
  author    = {Regina Barzilay and Lillian Lee},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  title     = {Catching the Drift: Probabilistic Content Models, with Applications to Generation and Summarization},
  year      = {2004},
}

@article{siskind96cross,
  author  = {J. M. Siskind},
  journal = {Cognition},
  pages   = {1--38},
  title   = {A computational study of cross-situational techniques for learning word-to-meaning mappings},
  volume  = {61},
  year    = {1996},
}

@article{gorniak07situated,
  author  = {P. Gorniak and D. Roy},
  journal = {Cognitive Science},
  pages   = {197--231},
  title   = {Situated Language Understanding as Filtering Perceived Affordances},
  volume  = {31},
  year    = {2007},
}

@inproceedings{yu04grounding,
  author    = {C. Yu and D. H.
Ballard},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages     = {488--493},
  title     = {On the integration of grounding language and learning objects},
  year      = {2004},
}

@inproceedings{grenager06verb,
  author    = {Trond Grenager and Christopher D. Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title     = {Unsupervised discovery of a statistical verb lexicon},
  year      = {2006},
}

@inproceedings{poon09semantic,
  author    = {Hoifung Poon and Pedro Domingos},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title     = {Unsupervised Semantic Parsing},
  year      = {2009},
}

@inproceedings{zettlemoyer09context,
  author    = {Luke S. Zettlemoyer and Michael Collins},
  booktitle = {Association for Computational Linguistics and International Joint Conference on Natural Language Processing (ACL-IJCNLP)},
  title     = {Learning Context-dependent Mappings from Sentences to Logical Form},
  year      = {2009},
}

% Initials are separated by spaces so BibTeX sees three given-name tokens
% rather than one glued token.
@inproceedings{branavan09reinforcement,
  author    = {S. R. K. Branavan and Harr Chen and Luke S. Zettlemoyer and Regina Barzilay},
  booktitle = {Association for Computational Linguistics and International Joint Conference on Natural Language Processing (ACL-IJCNLP)},
  pages     = {82--90},
  title     = {Reinforcement Learning for Mapping Instructions to Actions},
  year      = {2009},
}

@article{yu07unified,
  author  = {C. Yu and D. H. Ballard},
  journal = {Neurocomputing},
  number  = {13},
  pages   = {2149--2165},
  title   = {A Unified Model of Early Word Learning: Integrating Statistical and Social Cues},
  volume  = {70},
  year    = {2007},
}

@article{frank09intentions,
  author  = {Michael C. Frank and Noah D. Goodman and Joshua B.
Tenenbaum},
  journal = {Psychological Science},
  number  = {5},
  pages   = {578--585},
  title   = {Using Speakers' Referential Intentions to Model Early Cross-Situational Word Learning},
  volume  = {20},
  year    = {2009},
}

@article{chaloner95bayesian,
  author  = {Kathryn Chaloner and Isabella Verdinelli},
  journal = {Statistical Science},
  pages   = {273--304},
  title   = {{B}ayesian Experimental Design: A Review},
  volume  = {10},
  year    = {1995},
}

@inproceedings{seeger08cs,
  author    = {Matthias Seeger and Hannes Nickisch},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {912--919},
  title     = {Compressed Sensing and {B}ayesian Experimental Design},
  year      = {2008},
}

@article{nemirovski02saddle,
  author  = {A. Nemirovski and R. Y. Rubinstein},
  journal = {International Series in Operations Research and Management Science},
  pages   = {155--184},
  title   = {An Efficient Stochastic Approximation Algorithm for Stochastic Saddle Point Problems},
  volume  = {46},
  year    = {2002},
}

@phdthesis{schein05active,
  author = {Andrew I. Schein},
  school = {Carnegie Mellon University},
  title  = {Active Learning for Logistic Regression},
  year   = {2005},
}

@inproceedings{jaakkola97logistic,
  author    = {Tommi Jaakkola and Michael I. Jordan},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  title     = {A variational approach to {B}ayesian logistic regression models and their extensions},
  year      = {1997},
}

@article{dudik07maxent,
  author  = {Miroslav Dudík and Steven J. Phillips and Robert E. Schapire},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages   = {1217--1260},
  title   = {Maximum Entropy Density Estimation},
  volume  = {8},
  year    = {2007},
}

@book{borwein05variational,
  author    = {Jonathan M.
Borwein and Qiji Jim Zhu},
  publisher = {Springer},
  title     = {Techniques of Variational Analysis},
  year      = {2005},
}

@inproceedings{roy01active,
  author    = {Nicholas Roy and Andrew McCallum},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {441--448},
  title     = {Toward Optimal Active Learning through Sampling Estimation of Error Reduction},
  year      = {2001},
}

% The two-word surname is braced so BibTeX keeps it together as the last name;
% unbraced, "Della" would be parsed as part of the given names.
@article{brown92class,
  author  = {P. F. Brown and V. J. {Della Pietra} and P. V. deSouza and J. C. Lai and R. L. Mercer},
  journal = {Computational Linguistics},
  pages   = {467--479},
  title   = {Class-Based n-gram Models of Natural Language},
  volume  = {18},
  year    = {1992},
}

@inproceedings{grandvalet05entropy,
  author    = {Yves Grandvalet and Yoshua Bengio},
  booktitle = {Semi-Supervised Learning},
  title     = {Entropy Regularization},
  year      = {2005},
}

@inproceedings{stein61quadratic,
  author    = {W. James and C. Stein},
  booktitle = {Fourth Berkeley Symposium in Mathematics, Statistics, and Probability},
  pages     = {361--380},
  title     = {Estimation with Quadratic Loss},
  year      = {1961},
}

@inproceedings{bouchard07tradeoff,
  author    = {Guillaume Bouchard},
  booktitle = {Sixth International Conference on Machine Learning and Applications (ICMLA)},
  pages     = {124--129},
  title     = {Bias-Variance Tradeoff in Hybrid Generative-Discriminative Models},
  year      = {2007},
}

@article{akaike74aic,
  author  = {Hirotugu Akaike},
  journal = {IEEE Transactions on Automatic Control},
  pages   = {716--723},
  title   = {A new look at the statistical model identification},
  volume  = {19},
  year    = {1974},
}

@article{bakker03task,
  author  = {B. Bakker and T. Heskes},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages   = {83--99},
  title   = {Task clustering and gating for {B}ayesian multitask learning},
  volume  = {4},
  year    = {2003},
}

@article{evgeniou05task,
  author  = {T. Evgeniou and C. Micchelli and M.
Pontil},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages   = {615--637},
  title   = {Learning multiple tasks with kernel methods},
  volume  = {6},
  year    = {2005},
}

@inproceedings{argyriou07feature,
  author    = {A. Argyriou and T. Evgeniou and M. Pontil},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {41--48},
  title     = {Multi-task feature learning},
  year      = {2007},
}

@inproceedings{jacob09cluster,
  author    = {Laurent Jacob and Francis Bach and Jean-Philippe Vert},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {745--752},
  title     = {Clustered Multi-Task Learning: A Convex Formulation},
  year      = {2009},
}

@article{bickel06regularization,
  author  = {Peter Bickel and Bo Li},
  journal = {Sociedad de Estadística e Investigación Operativa Test},
  pages   = {271--344},
  title   = {Regularization in Statistics},
  volume  = {15},
  year    = {2006},
}

% Journal name corrected to "Royal Statistical Society".
@article{bernardo79reference,
  author  = {J. M. Bernardo},
  journal = {Journal of the Royal Statistical Society: Series B (Statistical Methodology)},
  pages   = {113--147},
  title   = {Reference posterior distributions for {B}ayesian inference},
  volume  = {41},
  year    = {1979},
}

% Journal spelling corrected to "Computational"; missing periods added after
% the initials of Bui and Wilson; surname "Nielsen" corrected.
@article{peters06bindingprediction,
  author  = {B. Peters and H.-H. Bui and S. Frankild and M. Nielsen and C. Lundegaard and E. Kostem and D. Basch and K. Lamberth and M. Harndahl and W. Fleri and S. S. Wilson and J. Sidney and O. Lund and S. Buus and A. Sette},
  journal = {PLoS Computational Biology},
  title   = {A community resource benchmarking predictions of peptide binding to {MHC-I} molecules},
  volume  = {2},
  year    = {2006},
}

@article{craven78gcv,
  author  = {P. Craven and G. Wahba},
  journal = {Numerische Mathematik},
  number  = {4},
  pages   = {377--403},
  title   = {Smoothing noisy data with spline functions. Estimating the correct degree of smoothing by the method of generalized cross-validation},
  volume  = {31},
  year    = {1978},
}

@article{eldar09sure,
  author  = {Yonina C.
Eldar},
  journal = {IEEE Transactions on Signal Processing},
  number  = {2},
  pages   = {471--481},
  title   = {Generalized {SURE} for Exponential Families: Applications to Regularization},
  volume  = {57},
  year    = {2009},
}

@article{stein81sure,
  author  = {C. M. Stein},
  journal = {Annals of Statistics},
  number  = {6},
  pages   = {1135--1151},
  title   = {Estimation of the mean of a multivariate normal distribution},
  volume  = {9},
  year    = {1981},
}

@article{bartlett05local,
  author  = {Peter L. Bartlett and Olivier Bousquet and Shahar Mendelson},
  journal = {Annals of Statistics},
  number  = {4},
  pages   = {1497--1537},
  title   = {Local {R}ademacher complexities},
  volume  = {33},
  year    = {2005},
}

@article{bousquet02stability,
  author  = {O. Bousquet and A. Elisseeff},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages   = {499--526},
  title   = {Stability and Generalization},
  volume  = {2},
  year    = {2002},
}

@book{cesabianchi06prediction,
  author    = {Nicolò Cesa-Bianchi and Gábor Lugosi},
  publisher = {Cambridge University Press},
  title     = {Prediction, learning, and games},
  year      = {2006},
}

@article{bartlett53approximate,
  author  = {M. S. Bartlett},
  journal = {Biometrika},
  pages   = {306--317},
  title   = {Approximate confidence intervals. {II}. {M}ore than one unknown parameter},
  volume  = {40},
  year    = {1953},
}

% The proper noun in the title is braced so sentence-casing styles do not
% lowercase it.
@article{levit85second,
  author  = {B. Ya. Levit},
  journal = {Theory of Probability and its Applications},
  pages   = {333--363},
  title   = {Second-order asymptotic optimality and positive solutions of the {Schrödinger} equation},
  volume  = {30},
  year    = {1985},
}

@article{berkhin80second,
  author  = {P. E. Berkhin and B. Ya. Levit},
  journal = {Problemy Peredachi Informatsii},
  pages   = {60--79},
  title   = {Second-order asymptotically minimax estimates for the mean of a normal population},
  volume  = {16},
  year    = {1980},
}

@article{dalalyan06second,
  author  = {A. S. Dalalyan and G. K. Golubev and A. B.
Tsybakov},
  journal = {Annals of Statistics},
  number  = {1},
  pages   = {169--201},
  title   = {Penalized maximum likelihood and semiparametric second-order efficiency},
  volume  = {34},
  year    = {2006},
}

@incollection{shibata89model,
  author    = {R. Shibata},
  booktitle = {From Data to Model},
  pages     = {215--240},
  title     = {Statistical Aspects of Model Selection},
  year      = {1989},
}

@article{murata94neural,
  author  = {N. Murata and S. Yoshizawa and S. Amari},
  journal = {IEEE Transactions on Neural Networks},
  number  = {6},
  pages   = {865--872},
  title   = {Network Information Criterion---Determining the Number of Hidden Units for an Artificial Neural Network Model},
  volume  = {5},
  year    = {1994},
}

@article{konishi96gic,
  author  = {S. Konishi and G. Kitagawa},
  journal = {Biometrika},
  number  = {4},
  pages   = {875--890},
  title   = {Generalized Information Criteria in Model Selection},
  volume  = {83},
  year    = {1996},
}

@article{ishiguro97bootstrapping,
  author  = {M. Ishiguro and Y. Sakamoto and G. Kitagawa},
  journal = {Annals of the Institute of Statistical Mathematics},
  pages   = {411--434},
  title   = {Bootstrapping Log Likelihood and {EIC}, an Extension of {AIC}},
  volume  = {49},
  year    = {1997},
}

% The camel-case tool name is braced so sentence-casing styles keep its
% capitalisation, as is already done for DECKARD below.
@inproceedings{sahavechaphan06xsnippet,
  author    = {Naiyana Sahavechaphan and Kajal Claypool},
  booktitle = {Object-Oriented Programming, Systems, Languages, and Applications (OOPSLA)},
  title     = {{XSnippet}: Mining For Sample Code},
  volume    = {41},
  year      = {2006},
}

@inproceedings{jiang07deckard,
  author    = {Lingxiao Jiang and Ghassan Misherghi and Zhendong Su and Stephane Glondu},
  booktitle = {International Conference on Software Engineering (ICSE)},
  pages     = {96--105},
  title     = {{DECKARD}: Scalable and Accurate Tree-Based Detection of Code Clones},
  year      = {2007},
}

@inproceedings{lu09generation,
  author    = {Wei Lu and Hwee Tou Ng and Wee Sun Lee},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages     = {400--409},
  title     = {Natural Language Generation with Tree Conditional Random Fields},
  year      =
{2009},
}

@inproceedings{lu12probabilistic,
  author    = {Wei Lu and Hwee Tou Ng},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages     = {1611--1622},
  title     = {A Probabilistic Forest-to-String Model for Language Generation from Typed Lambda Calculus Expressions},
  year      = {2012},
}

% Journal name has no comma: "Computer Speech and Language".
@article{ratnaparkhi02surface,
  author  = {Adwait Ratnaparkhi},
  journal = {Computer Speech \& Language},
  pages   = {435--455},
  title   = {Trainable approaches to surface natural language generation and their application to conversational dialog systems},
  volume  = {16},
  year    = {2002},
}

@inproceedings{mellish00dependencies,
  author    = {C. Mellish and R. Evans and L. Cahill and C. Doran and D. Paiva and M. Reape and D. Scott and N. Tipper},
  booktitle = {Applied Natural Language Processing and North American Association for Computational Linguistics (ANLP/NAACL)},
  pages     = {119--126},
  title     = {A Representation for Complex and Evolving Data Dependencies in Generation},
  year      = {2000},
}

@inproceedings{koller02generation,
  author    = {Alexander Koller and Kristina Striegnitz},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {17--24},
  title     = {Generation as Dependency Parsing},
  year      = {2002},
}

@inproceedings{paiva05control,
  author    = {Daniel S.
Paiva and Roger Evans},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {58--65},
  title     = {Empirically-based Control of Natural Language Generation},
  year      = {2005},
}

@inproceedings{soricut06widl,
  author    = {Radu Soricut and Daniel Marcu},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {1105--1112},
  title     = {Stochastic Language Generation Using {WIDL}-Expressions and its Application in Machine Translation and Summarization},
  year      = {2006},
}

@inproceedings{soricut06discourse,
  author    = {Radu Soricut and Daniel Marcu},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {803--810},
  title     = {Discourse Generation Using Utility-Trained Coherence Models},
  year      = {2006},
}

@inproceedings{denero09efficient,
  author    = {John DeNero and Mohit Bansal and Adam Pauls and Dan Klein},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages     = {227--235},
  title     = {Efficient Parsing for Transducer Grammars},
  year      = {2009},
}

@inproceedings{agarwal09hybrid,
  author    = {Arvind Agarwal and Hal {Daum{\'e} III}},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title     = {Exponential Family Hybrid Learning},
  year      = {2009},
}

@article{belz08sumtime,
  author  = {Anja Belz},
  journal = {Natural Language Engineering},
  number  = {4},
  pages   = {1--26},
  title   = {Automatic generation of weather forecast texts using comprehensive probabilistic generation-space models},
  volume  = {14},
  year    = {2008},
}

@article{reiter05sumtime,
  author  = {Ehud Reiter and Somayajulu Sripada and Jim Hunter and Jin Yu and Ian Davy},
  journal = {Artificial Intelligence},
  pages   = {137--169},
  title   = {Choosing words in computer-generated weather forecasts},
  volume  = {167},
  year    = {2005},
}

@inproceedings{belz09sumtime,
  author    = {Anja Belz and Eric Kow},
  booktitle = {European Workshop on Natural Language Generation},
  pages     = {16--24},
  title     = {System building cost vs.
output quality in data-to-text generation},
  year      = {2009},
}

@inproceedings{green06biomedical,
  author    = {Nancy Green},
  booktitle = {International Natural Language Generation Conference},
  pages     = {114--121},
  title     = {Generation of biomedical arguments for lay readers},
  year      = {2006},
}

@inproceedings{turner09geo,
  author    = {Ross Turner and Yaji Sripada and Ehud Reiter},
  booktitle = {European Workshop on Natural Language Generation},
  pages     = {42--49},
  title     = {Generating approximate geographic descriptions},
  year      = {2009},
}

% The acronym in the title is braced so sentence-casing styles keep it
% upper-case; the venue name is capitalised like the other booktitles.
@inproceedings{dale03navigation,
  author    = {Robert Dale and Sabine Geldof and Jean-Philippe Prost},
  booktitle = {Australasian Computer Science Conference},
  pages     = {35--44},
  title     = {{CORAL}: using natural language generation for navigational assistance},
  year      = {2003},
}

@inproceedings{foster04xslt,
  author    = {Mary Ellen Foster and Michael White},
  booktitle = {Workshop on NLP and XML: RDF/RDFS and OWL in Language Technology},
  pages     = {1--8},
  title     = {Techniques for text planning with {XSLT}},
  year      = {2004},
}

% The method name BFGS was missing from the title; it is restored and braced.
@article{liu89lbfgs,
  author  = {D. C. Liu and J. Nocedal},
  journal = {Mathematical Programming B},
  number  = {3},
  pages   = {503--528},
  title   = {On the Limited Memory {BFGS} Method for Large Scale Optimization},
  volume  = {45},
  year    = {1989},
}

@inproceedings{papineni02bleu,
  author    = {Kishore Papineni and Salim Roukos and Todd Ward and Wei-Jing Zhu},
  booktitle = {Association for Computational Linguistics (ACL)},
  title     = {{BLEU}: A Method for Automatic Evaluation of Machine Translation},
  year      = {2002},
}

@inproceedings{piantadosi08compositional,
  author    = {S. T. Piantadosi and N. D. Goodman and B. A. Ellis and J. B. Tenenbaum},
  booktitle = {Proceedings of the Thirtieth Annual Conference of the Cognitive Science Society},
  pages     = {1620--1625},
  title     = {A {B}ayesian Model of the Acquisition of Compositional Semantics},
  year      = {2008},
}

% Second author's surname corrected to "Mansinghka".
@inproceedings{goodman08church,
  author    = {N. D. Goodman and V. K. Mansinghka and D. Roy and K. Bonawitz and J. B.
Tenenbaum},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  title     = {{Church}: a language for generative models},
  year      = {2008},
}
% In the entry closed just above, the language name Church is braced so
% sentence-casing styles keep it capitalised.

@article{lau03programming,
  author  = {T. Lau and S. Wolfman and P. Domingos and D. S. Weld},
  journal = {Machine Learning},
  pages   = {111--156},
  title   = {Programming by demonstration using version space algebra},
  volume  = {53},
  year    = {2003},
}

% Venue name: the preposition "on" is lower-case, as in the other booktitles.
@inproceedings{lau03traces,
  author    = {T. Lau and P. Domingos and D. S. Weld},
  booktitle = {International Conference on Knowledge Capture},
  pages     = {36--43},
  title     = {Learning Programs from Traces using Version Space Algebra},
  year      = {2003},
}

@inproceedings{briggs06functional,
  author    = {Forrest Briggs and Melissa O'Neill},
  booktitle = {Third Asian-Pacific workshop on Genetic Programming},
  pages     = {110--127},
  title     = {Functional genetic programming with combinators},
  year      = {2006},
}

@inproceedings{blunsom09note,
  author    = {Phil Blunsom and Trevor Cohn and Sharon Goldwater and Mark Johnson},
  booktitle = {Association for Computational Linguistics (ACL)},
  title     = {A note on the implementation of Hierarchical {D}irichlet Processes},
  year      = {2009},
}

@book{cypher93pbd,
  author    = {A. Cypher},
  publisher = {MIT Press},
  title     = {Watch what {I} do: Programming by demonstration},
  year      = {1993},
}

@article{caruana97multitask,
  author  = {Rich Caruana},
  journal = {Machine Learning},
  pages   = {41--75},
  title   = {Multitask learning},
  volume  = {28},
  year    = {1997},
}

@article{xue07multitask,
  author  = {Y. Xue and X. Liao and L. Carin and B. Krishnapuram},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages   = {35--63},
  title   = {Multi-task learning for classification with {D}irichlet process priors},
  volume  = {8},
  year    = {2007},
}

@book{hankin04lambda,
  author    = {Chris Hankin},
  publisher = {Lightning Source},
  title     = {An Introduction to Lambda Calculi for Computer Scientists},
  year      = {2004},
}

@inproceedings{ariola97cyclic,
  author    = {Zena M.
Ariola and Stefan Blom},
  booktitle = {Theoretical Aspects of Computer Software},
  pages     = {77--106},
  title     = {Cyclic lambda calculi},
  year      = {1997},
}

@book{vapnik00nature,
  author    = {Vladimir N. Vapnik},
  publisher = {Springer-Verlag},
  title     = {The Nature of Statistical Learning Theory},
  year      = {2000},
}

@inproceedings{haussler94rigorous,
  author    = {David Haussler and Michael Kearns and H. Sebastian Seung and Naftali Tishby},
  booktitle = {Conference on Learning Theory (COLT)},
  pages     = {76--87},
  title     = {Rigorous Learning Curve Bounds from Statistical Mechanics},
  year      = {1994},
}

% The math and the method name in the title are braced so case-changing styles
% leave them untouched. The citation key keeps its historical spelling so
% existing citations still resolve.
@article{wanwright09sharp,
  author  = {M. J. Wainwright},
  journal = {IEEE Transactions on Information Theory},
  pages   = {2183--2202},
  title   = {Sharp thresholds for noisy and high-dimensional recovery of sparsity using {$\ell_1$}-constrained quadratic programming ({Lasso})},
  volume  = {55},
  year    = {2009},
}

% German nouns in the title are braced so sentence-casing styles do not
% lowercase them.
@article{schoenfinkel24combinatory,
  author  = {Moses Schönfinkel},
  journal = {Mathematische Annalen},
  pages   = {305--316},
  title   = {Über die {Bausteine} der mathematischen {Logik}},
  volume  = {92},
  year    = {1924},
}

@phdthesis{shalev07online,
  author = {Shai Shalev-Shwartz},
  school = {The Hebrew University of Jerusalem},
  title  = {Online Learning: Theory, Algorithms, and Applications},
  year   = {2007},
}

@inproceedings{eisenstein09read,
  author    = {J. Eisenstein and J. Clarke and D. Goldwasser and D. Roth},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages     = {958--967},
  title     = {Reading to Learn: Constructing Features from Semantic Abstracts},
  year      = {2009},
}

@article{culy96null,
  author  = {Christopher Culy},
  journal = {Language Variation and Change},
  pages   = {91--124},
  title   = {Null objects in {E}nglish recipes},
  volume  = {8},
  year    = {1996},
}

@inproceedings{fleischman07intention,
  author    = {M. Fleischman and D.
Roy},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title     = {Representing Intentions in a Cognitive Model of Language Acquisition: Effects of Phrase Structure on Situated Verb Learning},
  year      = {2007},
}

@inproceedings{solar05sketching,
  author    = {Armando Solar-Lezama and Rodric Rabbah and Rastislav Bodík and Kemal Ebcioglu},
  booktitle = {Programming Language Design and Implementation (PLDI)},
  title     = {Programming by Sketching for Bit-Streaming Programs},
  year      = {2005},
}

@article{crammer06passive,
  author  = {Koby Crammer and Ofer Dekel and Joseph Keshet and Shai Shalev-Shwartz and Yoram Singer},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages   = {551--585},
  title   = {Online Passive-Aggressive Algorithms},
  volume  = {7},
  year    = {2006},
}

% The proper noun Kaczmarz is braced so sentence-casing styles keep the capital.
@article{strohmer09kaczmarz,
  author  = {Thomas Strohmer and Roman Vershynin},
  journal = {Journal of Fourier Analysis and Applications},
  pages   = {262--278},
  title   = {A randomized {Kaczmarz} algorithm with exponential convergence},
  volume  = {15},
  year    = {2009},
}

% The proper noun Kaczmarz is braced so sentence-casing styles keep the capital.
@inproceedings{needell2014kaczmarz,
  author    = {Deanna Needell and Nathan Srebro and Rachel Ward},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Stochastic Gradient Descent, Weighted Sampling, and the Randomized {Kaczmarz} algorithm},
  year      = {2014},
}

% Given name written as "Nathan", matching this author's other entries in the
% file, so the same person is not listed under two spellings.
@techreport{srebro10stochastic,
  author      = {Nathan Srebro and Karthik Sridharan and Ambuj Tewari},
  institution = {TTI Chicago},
  title       = {Stochastic optimization and online learning with smooth loss functions},
  year        = {2010},
}

% Given name written as "Nathan", matching this author's other entries in the file.
@inproceedings{srebro10tutorial,
  author    = {Nathan Srebro and Ambuj Tewari},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Stochastic optimization for machine learning (tutorial)},
  year      = {2010},
}

@inproceedings{hazan11beyond,
  author    = {Elad Hazan and Satyen Kale},
  booktitle = {Conference on Learning Theory (COLT)},
  title     = {Beyond the regret minimization barrier: an optimal algorithm for stochastic
strongly-convex optimization},
  year = {2011},
}

@inproceedings{rakhlin12making,
  author = {Alexander Rakhlin and Ohad Shamir and Karthik Sridharan},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Making Gradient Descent Optimal for Strongly Convex Stochastic Optimization},
  year = {2012},
}

% Three single-author Nesterov references: journal article, book, journal article.
@article{nesterov1983acceleration,
  author = {Y. Nesterov},
  journal = {Soviet Mathematics Doklady},
  number = {2},
  pages = {372--376},
  title = {A method of solving a convex programming problem with convergence rate ${O}(1/k^2)$},
  volume = {27},
  year = {1983},
}

@book{nesterov2004introductory,
  author = {Y. Nesterov},
  publisher = {Springer},
  title = {Introductory Lectures on Convex Optimization: A Basic Course},
  year = {2004},
}

@article{nesterov2005smooth,
  author = {Y. Nesterov},
  journal = {Mathematical Programming},
  number = {1},
  pages = {127--152},
  title = {Smooth minimization of non-smooth functions},
  volume = {103},
  year = {2005},
}

@inproceedings{lee13coordinate,
  author = {Yin Tat Lee and Aaron Sidford},
  booktitle = {Foundations of Computer Science (FOCS)},
  title = {Efficient Accelerated Coordinate Descent Methods and Faster Algorithms for Solving Linear Systems},
  year = {2013},
}

@inproceedings{cohen2015sampling,
  author = {Michael B. Cohen and Yin Tat Lee and Cameron Musco and Christopher Musco and Richard Peng and Aaron Sidford},
  booktitle = {Innovations in Theoretical Computer Science (ITCS)},
  title = {Uniform Sampling for Matrix Approximation},
  year = {2015},
}

@inproceedings{nelson2013osnap,
  author = {Jelani Nelson and Huy L. Nguyen},
  booktitle = {Foundations of Computer Science (FOCS)},
  title = {{OSNAP}: Faster numerical linear algebra algorithms via sparser subspace embeddings},
  year = {2013},
}

@inproceedings{li2013sampling,
  author = {Mu Li and Gary L.
Miller and Richard Peng},
  booktitle = {Foundations of Computer Science (FOCS)},
  title = {Iterative Row Sampling},
  year = {2013},
}

@inproceedings{williams2012omega,
  author = {Virginia Vassilevska Williams},
  booktitle = {Symposium on Theory of Computing (STOC)},
  title = {Multiplying matrices faster than {C}oppersmith-{W}inograd},
  year = {2012},
}

% The two-word surname is braced; unbraced, BibTeX treats the first word as a given name.
@inproceedings{leroux2012sag,
  author = {N. {Le Roux} and M. Schmidt and F. Bach},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {A Stochastic Gradient Method with an Exponential Convergence Rate for Finite Training Sets},
  year = {2012},
}

@article{shalev13stochastic,
  author = {Shai Shalev-Shwartz and Tong Zhang},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {567--599},
  title = {Stochastic Dual Coordinate Ascent Methods for Regularized Loss Minimization},
  volume = {14},
  year = {2013},
}

@article{shalev2014accelerated,
  author = {Shai Shalev-Shwartz and Tong Zhang},
  journal = {Mathematical Programming},
  pages = {1--41},
  title = {Accelerated proximal stochastic dual coordinate ascent for regularized loss minimization},
  year = {2014},
}

@article{shalev15dualfree,
  author = {Shai Shalev-Shwartz},
  journal = {arXiv},
  title = {{SDCA} without Duality},
  year = {2015},
}

@inproceedings{lin2014accelerated,
  author = {Qihang Lin and Zhaosong Lu and Lin Xiao},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {An Accelerated Proximal Coordinate Gradient Method},
  year = {2014},
}

@article{xiao2014proximal,
  author = {Lin Xiao and Tong Zhang},
  journal = {SIAM Journal on Optimization},
  number = {4},
  pages = {2057--2075},
  title = {A proximal stochastic gradient method with progressive variance reduction},
  volume = {24},
  year = {2014},
}

% The acronym is braced, matching the other protected acronyms in this file.
@inproceedings{defazio2014saga,
  author = {Aaron Defazio and Francis Bach and Simon Lacoste-Julien},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{SAGA}: A Fast Incremental Gradient Method
With Support for Non-Strongly Convex Composite Objectives},
  year = {2014},
}

@inproceedings{johnson13svrg,
  author = {Rie Johnson and Tong Zhang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Accelerating Stochastic Gradient Descent using Predictive Variance Reduction},
  year = {2013},
}

@inproceedings{schaul14unittests,
  author = {Tom Schaul and Ioannis Antonoglou and David Silver},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Unit Tests for Stochastic Optimization},
  year = {2014},
}

@inproceedings{orabona14simultaneous,
  author = {Francesco Orabona},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Simultaneous Model Selection and Optimization through Parameter-free Stochastic Learning},
  year = {2014},
}

% Two 2015 papers with the same author list, at different venues.
@inproceedings{frostig15competing,
  author = {Roy Frostig and Rong Ge and Sham M. Kakade and Aaron Sidford},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Competing with the empirical risk minimizer in a single pass},
  year = {2015},
}

@inproceedings{frostig15unregularizing,
  author = {Roy Frostig and Rong Ge and Sham M. Kakade and Aaron Sidford},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Un-regularizing: approximate proximal point and faster stochastic algorithms for empirical risk minimization},
  year = {2015},
}

@article{lin15catalyst,
  author = {Hongzhou Lin and Julien Mairal and Zaid Harchaoui},
  journal = {arXiv},
  title = {A Universal Catalyst for First-Order Optimization},
  year = {2015},
}

@phdthesis{mansinghka09thesis,
  author = {Vikash Mansinghka},
  school = {Massachusetts Institute of Technology},
  title = {Natively Probabilistic Computation},
  year = {2009},
}

@article{goodman08rule,
  author = {N. D. Goodman and J. B. Tenenbaum and J. Feldman and T. L.
Griffiths},
  journal = {Cognitive Science},
  pages = {108--154},
  title = {A rational analysis of rule-based concept learning},
  volume = {32},
  year = {2008},
}

@inproceedings{arlot10penalty,
  author = {Sylvain Arlot and Francis Bach},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {46--54},
  title = {Data-driven calibration of linear estimators with minimal penalties},
  year = {2010},
}

@inproceedings{kollar10directions,
  author = {Thomas Kollar and Stefanie Tellex and Deb Roy and Nicholas Roy},
  booktitle = {Human-Robot Interaction},
  pages = {259--266},
  title = {Toward Understanding Natural Language Directions},
  year = {2010},
}

% Umlauts are written as LaTeX escapes so the entries are safe under classic BibTeX.
@techreport{jaeger08game,
  author = {Gerhard J{\"a}ger},
  institution = {University of T{\"u}bingen},
  title = {Game Theory in Semantics and Pragmatics},
  year = {2008},
}

@article{jaeger08applications,
  author = {Gerhard J{\"a}ger},
  journal = {Language and Linguistics Compass},
  pages = {406--421},
  title = {Applications of Game Theory in Linguistics},
  volume = {2},
  year = {2008},
}

@book{austin62do,
  author = {John Langshaw Austin},
  publisher = {Oxford},
  title = {How to do Things with Words: The {W}illiam {J}ames Lectures delivered at {H}arvard University in 1955},
  year = {1962},
}

@article{valiant84learnable,
  author = {Leslie Valiant},
  journal = {Communications of the ACM},
  number = {11},
  pages = {1134--1142},
  title = {A theory of the learnable},
  volume = {27},
  year = {1984},
}

@article{jackson97dnf,
  author = {J. Jackson},
  journal = {Journal of Computer and System Sciences},
  number = {3},
  pages = {414--440},
  title = {An efficient membership-query algorithm for learning {DNF} with respect to the uniform distribution},
  volume = {55},
  year = {1997},
}

@article{angluin88queries,
  author = {D. Angluin},
  journal = {Machine Learning},
  number = {4},
  pages = {319--342},
  title = {Queries and concept learning},
  volume = {2},
  year = {1988},
}

% The journal name is spelled out in full, matching the other entries for this journal.
@article{donoho06compressed,
  author = {David Donoho},
  journal = {IEEE Transactions
on Information Theory},
  number = {4},
  pages = {1289--1306},
  title = {Compressed sensing},
  volume = {52},
  year = {2006},
}

% The year field holds a single four-digit year.
@inproceedings{hamlet94random,
  author = {D. Hamlet},
  booktitle = {Encyclopedia of Software Engineering},
  pages = {970--978},
  title = {Random testing},
  year = {1994},
}

% A CAV proceedings paper (volume 1254 of the LNCS series), so it is typed as a
% proceedings paper and uses the same booktitle as the other CAV entry in this file.
@inproceedings{graf97predicate,
  author = {Susanne Graf and Hassen Saidi},
  booktitle = {Computer Aided Verification (CAV)},
  pages = {72--83},
  series = {Lecture Notes in Computer Science},
  title = {Construction of abstract state graphs with {PVS}},
  volume = {1254},
  year = {1997},
}

% The key names the second author; it is kept unchanged so existing citations keep resolving.
@article{monro51stochastic,
  author = {Herbert Robbins and Sutton Monro},
  journal = {Annals of Mathematical Statistics},
  number = {3},
  pages = {400--407},
  title = {A Stochastic Approximation Method},
  volume = {22},
  year = {1951},
}

@inproceedings{smaragdakis11context,
  author = {Yannis Smaragdakis and Martin Bravenboer and Ondrej Lhotak},
  booktitle = {Principles of Programming Languages (POPL)},
  title = {Pick Your Contexts Well: Understanding Object-Sensitivity},
  year = {2011},
}

@inproceedings{spoon04ddp,
  author = {S. Alexander Spoon and Olin Shivers},
  booktitle = {European Conference on Object-Oriented Programming (ECOOP)},
  title = {Demand-Driven Type Inference with Subgoal Pruning: Trading Precision for Scalability},
  year = {2004},
}

@inproceedings{henzinger02lazy,
  author = {Thomas A. Henzinger and Ranjit Jhala and Rupak Majumdar and Gr{\'e}goire Sutre},
  booktitle = {Principles of Programming Languages (POPL)},
  title = {Lazy Abstraction},
  year = {2002},
}

@inproceedings{mcmillan06lazy,
  author = {Ken McMillan},
  booktitle = {Computer Aided Verification (CAV)},
  pages = {123--136},
  title = {Lazy Abstraction with Interpolants},
  year = {2006},
}

@inproceedings{vipindeep05pruning,
  author = {V. Vipindeep and Pankaj Jalote},
  booktitle = {International Workshop on Dynamic Analysis (WODA)},
  title = {Efficient static analysis with path pruning using coverage data},
  year = {2005},
}

@book{kamp93drt,
  author = {H. Kamp and U.
Reyle},
  address = {Dordrecht},
  publisher = {Kluwer},
  title = {From Discourse to Logic: An Introduction to the Model-theoretic Semantics of Natural Language, Formal Logic and Discourse Representation Theory},
  year = {1993},
}

% The proper noun in the title is braced so sentence-casing styles do not lowercase it.
@article{muskens96combine,
  author = {Reinhard Muskens},
  journal = {Linguistics and Philosophy},
  number = {2},
  pages = {143--186},
  title = {Combining {Montague} semantics and discourse representation},
  volume = {19},
  year = {1996},
}

@inproceedings{kwiatkowski10ccg,
  author = {T. Kwiatkowski and L. Zettlemoyer and S. Goldwater and M. Steedman},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1223--1233},
  title = {Inducing Probabilistic {CCG} Grammars from Logical Form with Higher-Order Unification},
  year = {2010},
}

@inproceedings{clarke10world,
  author = {James Clarke and Dan Goldwasser and Ming-Wei Chang and Dan Roth},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  pages = {18--27},
  title = {Driving Semantic Parsing from the World's Response},
  year = {2010},
}

@phdthesis{pross09grounded,
  author = {Tillmann Pross},
  school = {University of Stuttgart},
  title = {Grounded Discourse Representation Theory: Towards a Semantics-Pragmatics Interface for Human-Machine Collaboration},
  year = {2009},
}

@techreport{bos94drs,
  author = {Johan Bos and Elsbeth Mastenbroek and Scott McGlashan and Sebastian Millies and Manfred Pinkal},
  institution = {Universit{\"a}t des Saarlandes},
  title = {A Compositional {DRS}-based formalism for {NLP} applications},
  year = {1994},
}

@incollection{kamp05drt,
  author = {Hans Kamp and Josef van Genabith and Uwe Reyle},
  booktitle = {Handbook of Philosophical Logic},
  title = {Discourse Representation Theory},
  year = {2005},
}

% Author order follows the published paper, with Bos first, as the key also indicates.
@inproceedings{bos06superlatives,
  author = {Johan Bos and Malvina Nissim},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {An Empirical Approach to the Interpretation of Superlatives},
  year = {2006},
}

@inproceedings{bos09economical,
  author = {J.
Bos},
  booktitle = {Workshop on Controlled Natural Language},
  pages = {1--5},
  title = {A Controlled Fragment of {DRT}},
  year = {2009},
}

@inproceedings{bos04wide,
  author = {Johan Bos and Stephen Clark and Mark Steedman and James R. Curran and Julia Hockenmaier},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages = {1240--1246},
  title = {Wide-coverage semantic representations from a {CCG} parser},
  year = {2004},
}

@article{barker02continuations,
  author = {Chris Barker},
  journal = {Natural Language Semantics},
  pages = {211--242},
  title = {Continuations and the nature of quantification},
  volume = {10},
  year = {2002},
}

@article{shan04continuations,
  author = {Chung-chieh Shan},
  journal = {arXiv},
  title = {Delimited continuations in natural language},
  year = {2004},
}

@book{heim98semantics,
  author = {Irene Heim and Angelika Kratzer},
  publisher = {Wiley-Blackwell},
  title = {Semantics in Generative Grammar},
  year = {1998},
}

@article{white06hlds,
  author = {Michael White},
  journal = {Research on Language and Computation},
  pages = {39--75},
  title = {Efficient Realization of Coordinate Structures in Combinatory Categorial Grammar},
  volume = {4},
  year = {2006},
}

% The mixed-case resource name is braced so sentence-casing styles keep its capitals.
@inproceedings{bos08framenet,
  author = {J. Bos and M. Nissim},
  booktitle = {Frames, Corpora, and Knowledge Representation},
  pages = {169--183},
  title = {Combining Discourse Representation Theory with {FrameNet}},
  year = {2008},
}

@inproceedings{chaves07model,
  author = {Rui Pedro Chaves},
  booktitle = {International Workshop on Computational Semantics},
  title = {Dynamic Model Checking of Discourse Representation Structures with Pluralities},
  year = {2007},
}

@book{blackburn05semantics,
  author = {Patrick Blackburn and Johan Bos},
  publisher = {CSLI Publishers},
  title = {Representation and Inference for Natural Language: A First Course in Computational Semantics},
  year = {2005},
}

@inproceedings{thompson97parse,
  author = {Cynthia A. Thompson and Raymond J. Mooney and Lappoon R.
Tang},
  booktitle = {ML-97 Workshop on Automata Induction, Grammatical Inference, and Language Acquisition},
  title = {Learning to Parse Natural Language Database Queries into Logical Form},
  year = {1997},
}

@inproceedings{montague73ptq,
  author = {Richard Montague},
  booktitle = {Approaches to Natural Language},
  pages = {221--242},
  title = {The proper treatment of quantification in ordinary {E}nglish},
  year = {1973},
}

% The proper noun in the title is braced so sentence-casing styles do not lowercase it.
@phdthesis{cooper75thesis,
  author = {Robin Cooper},
  school = {University of Massachusetts at Amherst},
  title = {{Montague's} semantic theory and transformational syntax},
  year = {1975},
}

@book{steedman00ccg,
  author = {Mark Steedman},
  publisher = {MIT Press},
  title = {The Syntactic Process},
  year = {2000},
}

@book{carpenter98type,
  author = {Bob Carpenter},
  publisher = {MIT Press},
  title = {Type-Logical Semantics},
  year = {1998},
}

% The first author is John M. Zelle; both initials are given.
@inproceedings{zelle96geoquery,
  author = {J. M. Zelle and R. J. Mooney},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {1050--1055},
  title = {Learning to parse database queries using inductive logic programming},
  year = {1996},
}

% Initials are space-separated so BibTeX reads them as three separate name tokens.
@inproceedings{branavan10high,
  author = {S. R. K.
Branavan and Luke Zettlemoyer and Regina Barzilay},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {1268--1277},
  title = {Reading Between the Lines: Learning to Map High-level Instructions to Commands},
  year = {2010},
}

@inproceedings{duchi10adagrad,
  author = {John Duchi and Elad Hazan and Yoram Singer},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Adaptive Subgradient Methods for Online Learning and Stochastic Optimization},
  year = {2010},
}

@book{dechter03constraint,
  author = {Rina Dechter},
  publisher = {Morgan Kaufmann},
  title = {Constraint Processing},
  year = {2003},
}

@article{richardson06mln,
  author = {Matthew Richardson and Pedro Domingos},
  journal = {Machine Learning},
  pages = {107--136},
  title = {{M}arkov Logic Networks},
  volume = {62},
  year = {2006},
}

@inproceedings{tang01ilp,
  author = {L. R. Tang and R. J. Mooney},
  booktitle = {European Conference on Machine Learning (ECML)},
  pages = {466--477},
  title = {Using multiple clause constructors in inductive logic programming for semantic parsing},
  year = {2001},
}

@inproceedings{kate05funql,
  author = {Rohit J. Kate and Yuk Wah Wong and Raymond J.
Mooney},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {1062--1068},
  title = {Learning to Transform Natural to Formal Languages},
  year = {2005},
}

@techreport{nivre05dependency,
  author = {Joakim Nivre},
  institution = {V{\"a}xj{\"o} University: School of Mathematics and Systems Engineering},
  title = {Dependency Grammar and Dependency Parsing},
  year = {2005},
}

@inproceedings{popescu03precise,
  author = {Ana-Maria Popescu and Oren Etzioni and Henry Kautz},
  booktitle = {International Conference on Intelligent User Interfaces (IUI)},
  pages = {149--157},
  title = {Towards a Theory of Natural Language Interfaces to Databases},
  year = {2003},
}

@inproceedings{schuler03interpretation,
  author = {William Schuler},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {529--536},
  title = {Using model-theoretic semantic interpretation to guide statistical parsing and word recognition in a spoken language interface},
  year = {2003},
}

% The journal name matches the spelling used by the other entry for this journal.
@article{copestake05mrs,
  author = {Ann Copestake and Dan Flickinger and Ivan Sag and Carl Pollard},
  journal = {Research on Language and Computation},
  pages = {281--332},
  title = {Minimal Recursion Semantics: An introduction},
  volume = {3},
  year = {2005},
}

@article{androutsopoulos95nlidb,
  author = {I. Androutsopoulos and G. D. Ritchie and P. Thanisch},
  journal = {Journal of Natural Language Engineering},
  pages = {29--81},
  title = {Natural Language Interfaces to Databases -- An Introduction},
  volume = {1},
  year = {1995},
}

% Report label and number live in their own fields; the institution holds only the organisation name.
@techreport{woods72lunar,
  author = {W. A. Woods and R. M. Kaplan and B. N. Webber},
  institution = {Bolt Beranek and Newman Inc.},
  number = {2378},
  title = {The Lunar Sciences Natural Language Information System: Final Report},
  type = {BBN Report},
  year = {1972},
}

@article{warren82chat80,
  author = {D. Warren and F.
Pereira},
  journal = {Computational Linguistics},
  pages = {110--122},
  title = {An Efficient Easily Adaptable System for Interpreting Natural Language Queries},
  volume = {8},
  year = {1982},
}

@inproceedings{baldridge02ccg,
  author = {Jason Baldridge and Geert-Jan M. Kruijff},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {319--326},
  title = {Coupling {CCG} with Hybrid Logic Dependency Semantics},
  year = {2002},
}

% Initials are space-separated so BibTeX reads them as three separate name tokens.
@inproceedings{branavan11win,
  author = {S. R. K. Branavan and David Silver and Regina Barzilay},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {268--277},
  title = {Learning to Win by Reading Manuals in a {M}onte-{C}arlo Framework},
  year = {2011},
}

@inproceedings{goldwasser11confidence,
  author = {Dan Goldwasser and Roi Reichart and James Clarke and Dan Roth},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {1486--1495},
  title = {Confidence Driven Unsupervised Semantic Parsing},
  year = {2011},
}

@inproceedings{goldwasser11instructions,
  author = {Dan Goldwasser and Dan Roth},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  pages = {1794--1800},
  title = {Learning From Natural Instructions},
  year = {2011},
}

% IWCS is the conference on Computational Semantics.
@inproceedings{alshawi11nlf,
  author = {Hiyan Alshawi and Pi-Chuan Chang and Michael Ringgaard},
  booktitle = {International Conference on Computational Semantics (IWCS)},
  pages = {15--24},
  title = {Deterministic Statistical Mapping of Sentences to Underspecified Semantics},
  year = {2011},
}

@inproceedings{giordani09sql,
  author = {Alessandra Giordani and Alessandro Moschitti},
  booktitle = {International Conference on Applications of Natural Language to Information Systems},
  pages = {207--221},
  title = {Semantic Mapping Between Natural Language Questions and {SQL} Queries via Syntactic Pairing},
  year = {2009},
}

@inproceedings{miller96statistical,
  author = {Scott Miller and David Stallard and Robert Bobrow and Richard Schwartz},
  booktitle = {Association for
Computational Linguistics (ACL)},
  pages = {55--61},
  title = {A Fully Statistical Approach to Natural Language Interfaces},
  year = {1996},
}

@inproceedings{kwiatkowski11lex,
  author = {T. Kwiatkowski and L. Zettlemoyer and S. Goldwater and M. Steedman},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1512--1523},
  title = {Lexical Generalization in {CCG} Grammar Induction for Semantic Parsing},
  year = {2011},
}

@inproceedings{artzi11conversations,
  author = {Yoav Artzi and Luke Zettlemoyer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {421--432},
  title = {Bootstrapping Semantic Parsers from Conversations},
  year = {2011},
}

@inproceedings{cousot77abstract,
  author = {Patrick Cousot and Radhia Cousot},
  booktitle = {Principles of Programming Languages (POPL)},
  pages = {238--252},
  title = {Abstract interpretation: a unified lattice model for static analysis of programs by construction or approximation of fixpoints},
  year = {1977},
}

% The proper noun in the title is braced so sentence-casing styles do not lowercase it.
@article{nocedal80lbfgs,
  author = {J. Nocedal},
  journal = {Mathematics of Computation},
  pages = {773--782},
  title = {Updating Quasi-{Newton} Matrices with Limited Storage},
  volume = {35},
  year = {1980},
}

@article{daume09searn,
  author = {Hal {Daum{\'e} III} and John Langford and Daniel Marcu},
  journal = {Machine Learning},
  pages = {297--325},
  title = {Search-based Structured Prediction},
  volume = {75},
  year = {2009},
}

% The name particle is written out in full, as in the other entry by this author.
@inproceedings{judge06qtb,
  author = {J. Judge and A. Cahill and J. van Genabith},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  pages = {497--504},
  title = {Question-Bank: creating a corpus of parse-annotated questions},
  year = {2006},
}

@article{porter80stem,
  author = {M. F.
Porter},
  journal = {Program: electronic library and information systems},
  pages = {130--137},
  title = {An algorithm for suffix stripping},
  volume = {14},
  year = {1980},
}

@inproceedings{vogel10navigate,
  author = {Adam Vogel and Dan Jurafsky},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {806--814},
  title = {Learning to Follow Navigational Directions},
  year = {2010},
}

@inproceedings{chen11navigate,
  author = {David L. Chen and Raymond J. Mooney},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {859--865},
  title = {Learning to Interpret Natural Language Navigation Instructions from Observations},
  year = {2011},
}

@article{grice75maxims,
  author = {H. P. Grice},
  journal = {Syntax and Semantics},
  pages = {41--58},
  title = {Logic and Conversation},
  volume = {3},
  year = {1975},
}

@phdthesis{potts03thesis,
  author = {Christopher Potts},
  school = {UC Santa Cruz},
  title = {The Logic of Conventional Implicatures},
  year = {2003},
}

@inproceedings{lev04logic,
  author = {Iddo Lev and Bill MacCartney and Christopher D. Manning and Roger Levy},
  booktitle = {ACL Workshop on Text Meaning and Interpretation},
  title = {Solving Logic Puzzles: From Robust Processing to Precise Semantics},
  year = {2004},
}

@phdthesis{hockenmaier03ccg,
  author = {Julia Hockenmaier},
  school = {University of Edinburgh},
  title = {Data and Models for Statistical Parsing with Combinatory Categorial Grammar},
  year = {2003},
}

@inproceedings{holland99proofs,
  author = {Amanda M. Holland-Minkley and Regina Barzilay and Robert L.
Constable},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Verbalization of High-Level Formal Proofs},
  year = {1999},
}

@inproceedings{dinesh11regulatory,
  author = {Nikhil Dinesh and Aravind Joshi and Insup Lee},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Computing Logical Form on Regulatory Texts},
  year = {2011},
}

@inproceedings{miller04ner,
  author = {S. Miller and J. Guinness and A. Zamanian},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages = {337--342},
  title = {Name Tagging with Word Clusters and Discriminative Training},
  year = {2004},
}

@inproceedings{koo08simple,
  author = {Terry Koo and Xavier Carreras and Michael Collins},
  booktitle = {Human Language Technology and Association for Computational Linguistics (HLT/ACL)},
  title = {Simple Semi-Supervised Dependency Parsing},
  year = {2008},
}

@inproceedings{anandkumar12moments,
  author = {Animashree Anandkumar and Daniel Hsu and Sham M. Kakade},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {A Method of Moments for Mixture Models and Hidden {M}arkov Models},
  year = {2012},
}

@inproceedings{anandkumar11tree,
  author = {Animashree Anandkumar and Kamalika Chaudhuri and Daniel Hsu and Sham M. Kakade and Le Song and Tong Zhang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Spectral Methods for Learning Multivariate Latent Tree Structure},
  year = {2011},
}

% The second author's surname ends in an accented c, written as a LaTeX escape.
@article{allman11identifiability,
  author = {Elizabeth S. Allman and Sonja Petrovi{\'c} and John A. Rhodes and Seth Sullivant},
  journal = {Transactions on Computational Biology and Bioinformatics},
  pages = {710--722},
  title = {Identifiability of 2-tree mixtures for group-based models},
  volume = {8},
  year = {2011},
}

@article{allman09identifiability,
  author = {E. S. Allman and C. Matias and J. A.
Rhodes},
  journal = {Annals of Statistics},
  pages = {3099--3132},
  title = {Identifiability of parameters in latent structure models with many observed variables},
  volume = {37},
  year = {2009},
}

% The journal's full name is given.
@article{kruskal77three,
  author = {J. B. Kruskal},
  journal = {Linear Algebra and its Applications},
  pages = {95--138},
  title = {Three-way arrays: Rank and uniqueness of trilinear decompositions, with application to arithmetic complexity and statistics},
  volume = {18},
  year = {1977},
}

@inproceedings{hsu09spectral,
  author = {Daniel Hsu and Sham M. Kakade and Tong Zhang},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {A spectral algorithm for learning hidden {M}arkov models},
  year = {2009},
}

@article{geiger01stratified,
  author = {Dan Geiger and David Heckerman and Henry King and Christopher Meek},
  journal = {Annals of Statistics},
  pages = {505--529},
  title = {Stratified exponential families: graphical models and model selection},
  volume = {29},
  year = {2001},
}

@article{chi99pcfg,
  author = {Zhiyi Chi},
  journal = {Computational Linguistics},
  title = {Statistical Properties of Probabilistic Context-Free Grammars},
  volume = {25},
  year = {1999},
}

@inproceedings{eisner00cubic,
  author = {Jason Eisner},
  booktitle = {Advances in Probabilistic and Other Parsing Technologies},
  pages = {29--62},
  title = {Bilexical grammars and their cubic-time parsing algorithms},
  year = {2000},
}

@inproceedings{etzioni11openie,
  author = {Oren Etzioni and Anthony Fader and Janara Christensen and Stephen Soderland and Mausam},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {Open Information Extraction: the Second Generation},
  year = {2011},
}

@inproceedings{poon10ontology,
  author = {Hoifung Poon and Pedro Domingos},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Unsupervised Ontology Induction from Text},
  year = {2010},
}

@inproceedings{zhang12smoothing,
  author = {Congle Zhang and Raphael Hoffmann and Daniel S.
Weld},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Ontological Smoothing for Relation Extraction with Minimal Supervision},
  year = {2012},
}

@inproceedings{schoenmackers10horn,
  author = {Stefan Schoenmackers and Oren Etzioni and Daniel S. Weld and Jesse Davis},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Learning First-Order Horn Clauses from Web Text},
  year = {2010},
}

@article{jacobs91experts,
  author = {R. A. Jacobs and M. I. Jordan and S. J. Nowlan and G. E. Hinton},
  journal = {Neural Computation},
  pages = {79--87},
  title = {Adaptive mixtures of local experts},
  volume = {3},
  year = {1991},
}

@inproceedings{quattoni04crf,
  author = {A. Quattoni and M. Collins and T. Darrell},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Conditional Random Fields for Object Recognition},
  year = {2004},
}

@inproceedings{petrov08discriminative,
  author = {Slav Petrov and Dan Klein},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Discriminative Log-Linear Grammars with Latent Variables},
  year = {2008},
}

@inproceedings{wang09crf,
  author = {Yang Wang and Greg Mori},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Max-Margin Hidden Conditional Random Fields for Human Action Recognition},
  year = {2009},
}

@inproceedings{anandkumar12lda,
  author = {Animashree Anandkumar and Dean P. Foster and Daniel Hsu and Sham M. Kakade and Yi-Kai Liu},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Two {SVD}s Suffice: Spectral decompositions for probabilistic topic modeling and latent {D}irichlet allocation},
  year = {2012},
}

@inproceedings{hsu13spherical,
  author = {Daniel Hsu and Sham M.
Kakade},
  booktitle = {Innovations in Theoretical Computer Science (ITCS)},
  title = {Learning Mixtures of Spherical {G}aussians: Moment Methods and Spectral Decompositions},
  year = {2013},
}

% The mixed-case method name is braced so sentence-casing styles keep its capitals.
@article{candes11phaselift,
  author = {Emmanuel J. Candes and Thomas Strohmer and Vladislav Voroninski},
  journal = {arXiv},
  title = {{PhaseLift}: Exact and Stable Signal Recovery from Magnitude Measurements via Convex Programming},
  year = {2011},
}

@inproceedings{ohlsson12phase,
  author = {Henrik Ohlsson and Allen Yang and Roy Dong and Shankar Sastry},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{CPRL} -- An Extension of Compressive Sensing to the Phase Retrieval Problem},
  year = {2012},
}

@article{donoho95soft,
  author = {D. L. Donoho},
  journal = {IEEE Transactions on Information Theory},
  pages = {613--627},
  title = {De-noising by soft-thresholding},
  volume = {41},
  year = {1995},
}

@article{cai10soft,
  author = {J.-F. Cai and E. J. Candes and Z. Shen},
  journal = {SIAM Journal on Optimization},
  pages = {1956--1982},
  title = {A singular value thresholding algorithm for matrix completion},
  volume = {20},
  year = {2010},
}

% The key spelling (grpah) is kept unchanged so existing citations keep resolving.
@inproceedings{barcelo11grpah,
  author = {Pablo Barcelo and Leonid Libkin and Juan Reutter},
  booktitle = {Symposium on Principles of Database Systems},
  title = {Querying Graph Patterns},
  year = {2011},
}

@inproceedings{chen12lexicon,
  author = {David L. Chen},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Fast Online Lexicon Learning for Grounded Language Acquisition},
  year = {2012},
}

@inproceedings{riedel13universal,
  author = {Sebastian Riedel and Limin Yao and Andrew McCallum},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Relation Extraction with Matrix Factorization and Universal Schemas},
  year = {2013},
}

% The two-word surname is braced; unbraced, BibTeX treats the first word as a given name.
@inproceedings{jenatton12latent,
  author = {R. Jenatton and N. {Le Roux} and A. Bordes and G.
Obozinski},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {A latent factor model for highly multi-relational data},
  year = {2012},
}

@inproceedings{nickel12yago,
  author = {Maximilian Nickel and Volker Tresp and Hans-Peter Kriegel},
  booktitle = {World Wide Web (WWW)},
  title = {Factorizing {YAGO}},
  year = {2012},
}

@inproceedings{fader11reverb,
  author = {Anthony Fader and Stephen Soderland and Oren Etzioni},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Identifying Relations for Open Information Extraction},
  year = {2011},
}

@article{collobert11scratch,
  author = {Ronan Collobert and Jason Weston and Leon Bottou and Michael Karlen and Koray Kavukcuoglu and Pavel Kuksa},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {2493--2537},
  title = {Natural Language Processing (almost) from Scratch},
  volume = {12},
  year = {2011},
}

@phdthesis{odonnell11fragment,
  author = {Timothy J. O'Donnell},
  school = {Massachusetts Institute of Technology},
  title = {Productivity and Reuse in Language},
  year = {2011},
}

@inproceedings{song10kernel,
  author = {L. Song and B. Boots and S. Siddiqi and G. Gordon and A. Smola},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {{H}ilbert Space Embeddings of Hidden {M}arkov Models},
  year = {2010},
}

@inproceedings{parikh12spectral,
  author = {A. Parikh and L. Song and M. Ishteva and G. Teodoru and E. Xing},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  title = {A Spectral Algorithm for Latent Junction Trees},
  year = {2012},
}

@inproceedings{cohen12pcfg,
  author = {Shay B. Cohen and Karl Stratos and Michael Collins and Dean P. Foster and Lyle Ungar},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Spectral Learning of Latent-Variable {PCFG}s},
  year = {2012},
}

@inproceedings{balle12automata,
  author = {B. Balle and M.
Mohri},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Spectral Learning of General Weighted Automata via Constrained Matrix Completion},
  year = {2012},
}

@inproceedings{balle11transducer,
  author = {B. Balle and A. Quattoni and X. Carreras},
  booktitle = {European Conference on Machine Learning and Principles and Practice of Knowledge Discovery in Databases (ECML-PKDD)},
  title = {A Spectral Learning Algorithm for Finite State Transducers},
  year = {2011},
}

@inproceedings{anandkumar13linear,
  author = {Animashree Anandkumar and Daniel Hsu and Adel Javanmard and Sham M. Kakade},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Learning Linear {B}ayesian Networks with Latent Variables},
  year = {2013},
}

@article{ghahramani97fhmm,
  author = {Zoubin Ghahramani and Michael Jordan},
  journal = {Machine Learning},
  pages = {245--273},
  title = {Factorial Hidden {M}arkov Models},
  volume = {29},
  year = {1997},
}

@article{anandkumar13tensor,
  author = {Anima Anandkumar and Rong Ge and Daniel Hsu and Sham M.
Kakade and Matus Telgarsky},
  journal = {arXiv},
  title = {Tensor decompositions for learning latent variable models},
  year = {2013},
}

@inproceedings{salakhutdinov09softmax,
  author = {Ruslan Salakhutdinov and Geoff Hinton},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Replicated Softmax: an Undirected Topic Model},
  year = {2009},
}

@inproceedings{kirkpatrick10painless,
  author = {Taylor Berg-Kirkpatrick and Alexandre Bouchard-C{\^o}t{\'e} and John DeNero and Dan Klein},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Painless Unsupervised Learning with Features},
  year = {2010},
}

@article{deselaers12latent,
  author = {Thomas Deselaers and Tobias Gass and Georg Heigold and Hermann Ney},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)},
  pages = {1105--1117},
  title = {Latent log-linear models for handwritten digit classification},
  volume = {34},
  year = {2012},
}

@article{saul96sigmoid,
  author = {L. Saul and T. Jaakkola and M. I. Jordan},
  journal = {Journal of Artificial Intelligence Research (JAIR)},
  pages = {61--76},
  title = {Mean Field Theory for Sigmoid Belief Networks},
  volume = {4},
  year = {1996},
}

@book{smolensky86rbm,
  author = {P. Smolensky},
  pages = {194--281},
  publisher = {MIT Press},
  title = {Parallel Distributed Processing: Volume 1: Foundations},
  year = {1986},
}

@article{anandkumar2013overcomplete,
  author = {Animashree Anandkumar and Daniel Hsu and Majid Janzamin and Sham Kakade},
  journal = {arXiv},
  title = {When are Overcomplete Representations Identifiable?
Uniqueness of Tensor Decompositions Under Expansion Constraints},
  year = {2013},
}

@inproceedings{manshadi2013integrating,
  author = {Mehdi Manshadi and Daniel Gildea and James Allen},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Integrating Programming by Example and Natural Language Programming},
  year = {2013},
}

@inproceedings{halpern2013unsupervised,
  author = {Yoni Halpern and David Sontag},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  title = {Unsupervised Learning of Noisy-Or {B}ayesian Networks},
  year = {2013},
}

@inproceedings{huang2005better,
  author = {Liang Huang and David Chiang},
  booktitle = {Proceedings of the Ninth International Workshop on Parsing Technology},
  pages = {53--64},
  title = {Better k-best parsing},
  year = {2005},
}

@inproceedings{globerson2007fixing,
  author = {Amir Globerson and Tommi Jaakkola},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Fixing max-product: Convergent message passing algorithms for {MAP} {LP}-relaxations},
  year = {2007},
}

@article{kolda2009tensor,
  author = {Tamara G Kolda and Brett W Bader},
  journal = {SIAM Review},
  number = {3},
  pages = {455--500},
  title = {Tensor decompositions and applications},
  volume = {51},
  year = {2009},
}

@inproceedings{fader2013paraphrase,
  author = {Anthony Fader and Luke Zettlemoyer and Oren Etzioni},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Paraphrase-Driven Learning for Open Question Answering},
  year = {2013},
}

@inproceedings{lei2013natural,
  author = {Tao Lei and Fan Long and Regina Barzilay and Martin Rinard},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {From Natural Language Specifications to Program Input Parsers},
  year = {2013},
}

@inproceedings{menon2013machine,
  author = {A Menon and Omer Tamuz and Sumit Gulwani and Butler Lampson and A Kalai},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {A
machine learning framework for programming by example},
  year = {2013},
}

@inproceedings{miller2008inky,
  author = {Robert C Miller and Victoria H Chou and Michael Bernstein and Greg Little and Max {Van Kleek} and David Karger and mc schraefel},
  booktitle = {User Interface Software and Technology (UIST)},
  pages = {131--140},
  title = {{I}nky: a sloppy command line for the web with rich visual feedback},
  year = {2008},
}

@inproceedings{cai2013large,
  author = {Qingqing Cai and Alexander Yates},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Large-scale Semantic Parsing via Schema Matching and Lexicon Extension},
  year = {2013},
}

@inproceedings{yahya2012natural,
  author = {Mohamed Yahya and Klaus Berberich and Shady Elbassuoni and Maya Ramanath and Volker Tresp and Gerhard Weikum},
  booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)},
  pages = {379--390},
  title = {Natural language questions for the web of data},
  year = {2012},
}

@inproceedings{surdeanu2012multi,
  author = {Mihai Surdeanu and Julie Tibshirani and Ramesh Nallapati and Christopher D Manning},
  booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)},
  pages = {455--465},
  title = {Multi-instance multi-label learning for relation extraction},
  year = {2012},
}

@inproceedings{riedel2010modeling,
  author = {Sebastian Riedel and Limin Yao and Andrew McCallum},
  booktitle = {Machine Learning and Knowledge Discovery in Databases (ECML PKDD)},
  pages = {148--163},
  title = {Modeling relations and their mentions without labeled text},
  year = {2010},
}

@inproceedings{carlson2010toward,
  author = {Andrew Carlson and Justin Betteridge and Bryan Kisiel and Burr Settles and Hruschka, Jr., Estevam R and Tom M Mitchell},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Toward an architecture for never-ending language learning},
  year = {2010},
}
@misc{freebase2013dump,
  author = {Google},
  howpublished = {\url{https://developers.google.com/freebase/data}},
  title = {{F}reebase Data Dumps (2013-06-09)},
  year = {2013},
}

@inproceedings{krishnamurthy2012weakly,
  author = {Jayant Krishnamurthy and Tom Mitchell},
  booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)},
  pages = {754--765},
  title = {Weakly supervised training of semantic parsers},
  year = {2012},
}

@inproceedings{masaum2012open,
  author = {Mausam and Michael Schmitz and Robert Bart and Stephen Soderland and Oren Etzioni},
  booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)},
  pages = {523--534},
  title = {Open language learning for information extraction},
  year = {2012},
}

@inproceedings{banko2007open,
  author = {Michele Banko and Michael J Cafarella and Stephen Soderland and Matthew Broadhead and Oren Etzioni},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  pages = {2670--2676},
  title = {Open Information Extraction from the Web},
  year = {2007},
}

@article{lacoste2012sigma,
  author = {Simon Lacoste-Julien and Konstantina Palla and Alex Davies and Gjergji Kasneci and Thore Graepel and Zoubin Ghahramani},
  journal = {arXiv},
  title = {{SiGMa}: Simple Greedy Matching for Aligning Large Knowledge Bases},
  year = {2012},
}

@inproceedings{auer2007dbpedia,
  author = {S{\"o}ren Auer and Christian Bizer and Georgi Kobilarov and Jens Lehmann and Richard Cyganiak and Zachary G.
Ives},
  booktitle = {International Semantic Web Conference and Asian Semantic Web Conference (ISWC/ASWC)},
  pages = {722--735},
  title = {{DB}pedia: A nucleus for a web of open data},
  year = {2007},
}

@inproceedings{lin2012linking,
  author = {Thomas Lin and Mausam and Oren Etzioni},
  booktitle = {Knowledge Extraction Workshop (AKBC-WEKEX)},
  title = {Entity linking at web scale},
  year = {2012},
}

@inproceedings{hearst1992automatic,
  author = {Marti A Hearst},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages = {539--545},
  title = {Automatic acquisition of hyponyms from large text corpora},
  year = {1992},
}

@inproceedings{chang2012sutime,
  author = {Angel X Chang and Christopher Manning},
  booktitle = {Language Resources and Evaluation (LREC)},
  pages = {3735--3740},
  title = {{SUT}ime: A library for recognizing and normalizing time expressions},
  year = {2012},
}

@inproceedings{suchanek2007yago,
  author = {Fabian M Suchanek and Gjergji Kasneci and Gerhard Weikum},
  booktitle = {World Wide Web (WWW)},
  pages = {697--706},
  title = {{YAGO}: a core of semantic knowledge},
  year = {2007},
}

@inproceedings{kushman2013regex,
  author = {Nate Kushman and Regina Barzilay},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages = {826--836},
  title = {Using Semantic Unification to Generate Regular Expressions from Natural Language},
  year = {2013},
}

@article{krishnamurthy2013jointly,
  author = {Jayant Krishnamurthy and Thomas Kollar},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  pages = {193--206},
  title = {Jointly Learning to Parse and Perceive: Connecting Natural Language to the Physical World},
  volume = {1},
  year = {2013},
}

@article{artzi2013weakly,
  author = {Yoav Artzi and Luke Zettlemoyer},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  pages = {49--62},
  title = {Weakly supervised learning of semantic parsers for mapping
instructions to actions},
  volume = {1},
  year = {2013},
}

@book{baader2003description,
  author = {Franz Baader},
  publisher = {Cambridge University Press},
  title = {The description logic handbook: theory, implementation, and applications},
  year = {2003},
}

@inproceedings{hoffmann2011knowledge,
  author = {Raphael Hoffmann and Congle Zhang and Xiao Ling and Luke S Zettlemoyer and Daniel S Weld},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {541--550},
  title = {Knowledge-Based Weak Supervision for Information Extraction of Overlapping Relations},
  year = {2011},
}

@inproceedings{finkel2005incorporating,
  author = {Jenny Rose Finkel and Trond Grenager and Christopher Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {363--370},
  title = {Incorporating non-local information into information extraction systems by {G}ibbs sampling},
  year = {2005},
}

@inproceedings{doan2003learning,
  author = {AnHai Doan and Jayant Madhavan and Robin Dhamankar and Pedro Domingos and Alon Halevy},
  booktitle = {Very Large Data Bases (VLDB)},
  pages = {303--320},
  title = {Learning to match ontologies on the semantic web},
  year = {2003},
}

@inproceedings{poon2013gusp,
  author = {Hoifung Poon},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Grounded Unsupervised Semantic Parsing},
  year = {2013},
}

@inproceedings{tellex2011understanding,
  author = {Stefanie Tellex and Thomas Kollar and Steven Dickerson and Matthew R Walter and Ashis Gopal Banerjee and Seth J Teller and Nicholas Roy},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Understanding Natural Language Commands for Robotic Navigation and Mobile Manipulation},
  year = {2011},
}

@inproceedings{matuszek2012grounded,
  author = {Cynthia Matuszek and Nicholas FitzGerald and Luke Zettlemoyer and Liefeng Bo and Dieter Fox},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1671--1678},
  title = {A joint model
of language and perception for grounded attribute learning},
  year = {2012},
}

@inproceedings{socher2012mvrnn,
  author = {Richard Socher and Brody Huval and Christopher D Manning and Andrew Y Ng},
  booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)},
  pages = {1201--1211},
  title = {Semantic compositionality through recursive matrix-vector spaces},
  year = {2012},
}

@article{yates2009unsupervised,
  author = {Alexander Yates and Oren Etzioni},
  journal = {Journal of Artificial Intelligence Research (JAIR)},
  number = {1},
  title = {Unsupervised methods for determining object and relation synonyms on the web},
  volume = {34},
  year = {2009},
}

@inproceedings{unger2012template,
  author = {Christina Unger and Lorenz B{\"u}hmann and Jens Lehmann and Axel-Cyrille Ngonga and Daniel Gerber and Philipp Cimiano},
  booktitle = {World Wide Web (WWW)},
  pages = {639--648},
  title = {Template-based question answering over {RDF} data},
  year = {2012},
}

@inproceedings{branavan2012learning,
  author = {SRK Branavan and Nate Kushman and Tao Lei and Regina Barzilay},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {126--135},
  title = {Learning high-level planning from text},
  year = {2012},
}

@inproceedings{huang2012wordrep,
  author = {Eric H. Huang and Richard Socher and Christopher D. Manning and Andrew Y.
Ng},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Improving Word Representations via Global Context and Multiple Word Prototypes},
  year = {2012},
}

@phdthesis{kushmerick1997wrapper,
  author = {Nicholas Kushmerick},
  school = {University of Washington},
  title = {Wrapper induction for information extraction},
  year = {1997},
}

@inproceedings{cafarella2008webtables,
  author = {Michael J Cafarella and Alon Halevy and Daisy Zhe Wang and Eugene Wu and Yang Zhang},
  booktitle = {Very Large Data Bases (VLDB)},
  pages = {538--549},
  title = {Web{T}ables: exploring the power of tables on the web},
  year = {2008},
}

@article{ferrucci2013watson,
  author = {David Ferrucci and Eric Brown and Jennifer Chu-Carroll and James Fan and David Gondek and Aditya A. Kalyanpur and Adam Lally and J. William Murdock and Eric Nyberg and John Prager and Nico Schlaefer and Chris Welty},
  journal = {AI Magazine},
  number = {3},
  pages = {59--79},
  title = {Building {W}atson: An Overview of the {D}eep{QA} Project},
  volume = {31},
  year = {2010},
}

@inproceedings{harris2011sparql,
  author = {S. Harris and A.
Seaborne},
  booktitle = {W3C Working Draft, 12 May},
  title = {{SPARQL} 1.1 Query Language},
  year = {2011},
}

@inproceedings{clark1975bridging,
  author = {Herbert H Clark},
  booktitle = {Workshop on theoretical issues in natural language processing},
  pages = {169--174},
  title = {Bridging},
  year = {1975},
}

@inproceedings{bollacker2008freebase,
  author = {Kurt Bollacker and Colin Evans and Praveen Paritosh and Tim Sturge and Jamie Taylor},
  booktitle = {International Conference on Management of Data (SIGMOD)},
  pages = {1247--1250},
  title = {{F}reebase: a collaboratively created graph database for structuring human knowledge},
  year = {2008},
}

@inproceedings{weiss2010cascades,
  author = {David Weiss and Ben Taskar},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  title = {Structured Prediction Cascades},
  year = {2010},
}

@inproceedings{kiddon2011coarse,
  author = {Chlo{\'e} Kiddon and Pedro Domingos},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Coarse-to-Fine Inference and Learning for First-Order Probabilistic Models},
  year = {2011},
}

@inproceedings{mccallum2003efficiently,
  author = {Andrew McCallum},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  pages = {403--410},
  title = {Efficiently inducing features of conditional random fields},
  year = {2003},
}

@article{della1997inducing,
  author = {Stephen {Della Pietra} and Vincent {Della Pietra} and John Lafferty},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)},
  number = {4},
  pages = {380--393},
  title = {Inducing features of random fields},
  volume = {19},
  year = {1997},
}

@inproceedings{ram2011density,
  author = {Parikshit Ram and Alexander G Gray},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {627--635},
  title = {Density estimation trees},
  year = {2011},
}

@inproceedings{kwiatkowski2013scaling,
  author = {Tom Kwiatkowski and Eunsol Choi and Yoav Artzi and Luke Zettlemoyer},
booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Scaling Semantic Parsers with On-the-fly Ontology Matching}, year = {2013}, } @inproceedings{mintz2009distant, author = {Mike Mintz and Steven Bills and Rion Snow and Dan Jurafsky}, booktitle = {Association for Computational Linguistics (ACL)}, pages = {1003--1011}, title = {Distant supervision for relation extraction without labeled data}, year = {2009}, } @book{manning2008ir, author = {Christopher Manning and Prabhakar Raghavan and Hinrich Sch{\"u}tze}, publisher = {Cambridge University Press}, title = {Introduction to information retrieval}, volume = {1}, year = {2008}, } @book{winograd1972language, author = {Terry Winograd}, publisher = {Academic Press}, title = {Understanding Natural Language}, year = {1972}, } @inproceedings{dalvi2012websets, author = {Bhavana Dalvi and William Cohen and Jamie Callan}, booktitle = {Web Search and Data Mining (WSDM)}, pages = {243--252}, title = {WebSets: Extracting sets of entities from the web using unsupervised information extraction}, year = {2012}, } @inproceedings{wang2009character, author = {Richard C Wang and William W Cohen}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, pages = {1503--1512}, title = {Character-level analysis of semi-structured documents for set expansion}, year = {2009}, } @article{etzioni2005unsupervised, author = {Oren Etzioni and Michael Cafarella and Doug Downey and Ana-Maria Popescu and Tal Shaked and Stephen Soderland and Daniel S Weld and Alexander Yates}, journal = {Artificial Intelligence}, number = {1}, pages = {91--134}, title = {Unsupervised named-entity extraction from the web: An experimental study}, volume = {165}, year = {2005}, } @inproceedings{cohen2002flexible, author = {William W Cohen and Matthew Hurst and Lee S Jensen}, booktitle = {World Wide Web (WWW)}, pages = {232--241}, title = {A flexible learning system for wrapping tables and lists in {HTML} documents}, year = 
{2002},
}

@inproceedings{baroni2010nouns,
  author = {Marco Baroni and Roberto Zamparelli},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1183--1193},
  title = {Nouns are vectors, adjectives are matrices: Representing adjective-noun constructions in semantic space},
  year = {2010},
}

@inproceedings{ganitkevitch2013ppdb,
  author = {Juri Ganitkevitch and Benjamin {Van Durme} and Chris Callison-Burch},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages = {758--764},
  title = {{PPDB}: The paraphrase database},
  year = {2013},
}

@article{madnani2010generating,
  author = {Nitin Madnani and Bonnie J Dorr},
  journal = {Computational Linguistics},
  number = {3},
  pages = {341--387},
  title = {Generating phrasal and sentential paraphrases: A survey of data-driven methods},
  volume = {36},
  year = {2010},
}

@article{androutsopoulos2010survey,
  author = {Ion Androutsopoulos and Prodromos Malakasiotis},
  journal = {Journal of Artificial Intelligence Research (JAIR)},
  pages = {135--187},
  title = {A survey of paraphrasing and textual entailment methods},
  volume = {38},
  year = {2010},
}

@inproceedings{heilman2010tree,
  author = {Michael Heilman and Noah A Smith},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages = {1011--1019},
  title = {Tree edit models for recognizing textual entailments, paraphrases, and answers to questions},
  year = {2010},
}

@inproceedings{barzilay2003learning,
  author = {Regina Barzilay and Lillian Lee},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages = {16--23},
  title = {Learning to paraphrase: An unsupervised approach using multiple-sequence alignment},
  year = {2003},
}

@inproceedings{chang2005toward,
  author = {Kevin Chen-Chuan Chang and Bin He and Zhen Zhang},
  booktitle = {Conference on Innovative Data Systems Research (CIDR)},
  pages
= {44--55},
  title = {Toward Large Scale Integration: Building a {M}eta{Q}uerier over Databases on the Web},
  year = {2005},
}

@inproceedings{socher2011paraphrase,
  author = {Richard Socher and Eric H Huang and Jeffrey Pennington and Christopher D Manning and Andrew Ng},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {801--809},
  title = {Dynamic pooling and unfolding recursive autoencoders for paraphrase detection},
  year = {2011},
}

@article{lin2001discovery,
  author = {Dekang Lin and Patrick Pantel},
  journal = {Natural Language Engineering},
  pages = {343--360},
  title = {Discovery of inference rules for question-answering},
  volume = {7},
  year = {2001},
}

@inproceedings{das2009paraphrase,
  author = {Dipanjan Das and Noah A Smith},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {468--476},
  title = {Paraphrase identification as probabilistic quasi-synchronous recognition},
  year = {2009},
}

@inproceedings{duclaye2003learning,
  author = {Florence Duclaye and Fran{\c{c}}ois Yvon and Olivier Collin},
  booktitle = {Workshop on Natural Language Processing for Question Answering},
  pages = {35--41},
  title = {Learning paraphrases to improve a question-answering system},
  year = {2003},
}

@inproceedings{stern2011transformation,
  author = {Asher Stern and Ido Dagan},
  booktitle = {Recent Advances in Natural Language Processing},
  pages = {455--462},
  title = {A Confidence Model for Syntactically-Motivated Entailment Proofs},
  year = {2011},
}

@inproceedings{wang2010paraphrasing,
  author = {Mengqiu Wang and Christopher D.
Manning},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages = {1164--1172},
  title = {Probabilistic Tree-Edit Models with Structured Latent Variables for Textual Entailment and Question Answering},
  year = {2010},
}

@inproceedings{malakasiotis2011generate,
  author = {Prodromos Malakasiotis and Ion Androutsopoulos},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {96--106},
  title = {A generate and rank approach to sentence paraphrasing},
  year = {2011},
}

@inproceedings{marton2009improved,
  author = {Yuval Marton and Chris Callison-Burch and Philip Resnik},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {381--390},
  title = {Improved statistical machine translation using monolingually-derived paraphrases},
  year = {2009},
}

@inproceedings{zukerman2002lexical,
  author = {Ingrid Zukerman and Bhavani Raskutti},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages = {1--7},
  title = {Lexical query paraphrasing for document retrieval},
  year = {2002},
}

@inproceedings{jones2006generating,
  author = {Rosie Jones and Benjamin Rey and Omid Madani and Wiley Greiner},
  booktitle = {World Wide Web (WWW)},
  pages = {387--396},
  title = {Generating query substitutions},
  year = {2006},
}

@inproceedings{wan2006dependency,
  author = {Stephen Wan and Mark Dras and Robert Dale and C{\'e}cile Paris},
  booktitle = {Australasian Language Technology Workshop},
  title = {Using dependency-based features to take the ``para-farce'' out of paraphrase},
  year = {2006},
}

@inproceedings{dolan2004unsupervised,
  author = {Bill Dolan and Chris Quirk and Chris Brockett},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  title = {Unsupervised construction of large paraphrase corpora: Exploiting massively parallel news sources},
  year = {2004},
}

@inproceedings{bannard2005paraphrasing,
  author = {Colin Bannard and Chris Callison-Burch},
  booktitle = {Association for
Computational Linguistics (ACL)},
  pages = {597--604},
  title = {Paraphrasing with bilingual parallel corpora},
  year = {2005},
}

@article{och2004alignment,
  author = {Franz Josef Och and Hermann Ney},
  journal = {Computational Linguistics},
  pages = {417--449},
  title = {The Alignment Template Approach to Statistical Machine Translation},
  volume = {30},
  year = {2004},
}

@book{fellbaum1998wordnet,
  author = {Christiane Fellbaum},
  publisher = {MIT Press},
  title = {{WordNet}: An Electronic Lexical Database},
  year = {1998},
}

@article{mikolov2013efficient,
  author = {Tomas Mikolov and Kai Chen and Greg Corrado and Jeffrey Dean},
  journal = {arXiv preprint arXiv:1301.3781},
  title = {Efficient Estimation of Word Representations in Vector Space},
  year = {2013},
}

@inproceedings{chang2010discriminative,
  author = {Ming-Wei Chang and Dan Goldwasser and Dan Roth and Vivek Srikumar},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Discriminative Learning over Constrained Latent Representations},
  year = {2010},
}

@inproceedings{larochelle2008zero,
  author = {Hugo Larochelle and Dumitru Erhan and Yoshua Bengio},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {646--651},
  title = {Zero-data Learning of New Tasks},
  volume = {8},
  year = {2008},
}

@inproceedings{palatucci2009zero,
  author = {Mark Palatucci and Dean Pomerleau and Geoffrey E Hinton and Tom M Mitchell},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1410--1418},
  title = {Zero-shot learning with semantic output codes},
  year = {2009},
}

@inproceedings{liu2000xwrap,
  author = {Ling Liu and Calton Pu and Wei Han},
  booktitle = {Data Engineering, 2000. Proceedings.
16th International Conference on},
  pages = {611--621},
  title = {{XWRAP}: An {XML}-enabled wrapper construction system for web information sources},
  year = {2000},
}

@inproceedings{crescenzi2001roadrunner,
  author = {Valter Crescenzi and Giansalvatore Mecca and Paolo Merialdo and others},
  booktitle = {Very Large Data Bases (VLDB)},
  pages = {109--118},
  title = {Roadrunner: Towards automatic data extraction from large web sites},
  volume = {1},
  year = {2001},
}

@article{dalvi2011automatic,
  author = {Nilesh Dalvi and Ravi Kumar and Mohamed Soliman},
  journal = {Proceedings of the VLDB Endowment},
  number = {4},
  pages = {219--230},
  title = {Automatic wrappers for large scale web extraction},
  volume = {4},
  year = {2011},
}

@inproceedings{freitag1998information,
  author = {Dayne Freitag},
  booktitle = {AAAI/IAAI},
  pages = {517--523},
  title = {Information extraction from {HTML}: Application of a general machine learning approach},
  year = {1998},
}

@inproceedings{wong2009scalable,
  author = {Yuk Wah Wong and Dominic Widdows and Tom Lokovic and Kamal Nigam},
  booktitle = {IEEE International Conference on Data Mining Workshops},
  pages = {302--307},
  title = {Scalable attribute-value extraction from semi-structured text},
  year = {2009},
}

@inproceedings{zhang2013automatic,
  author = {Zhixian Zhang and Kenny Q Zhu and Haixun Wang and Hongsong Li},
  booktitle = {International Conference on Data Engineering},
  title = {Automatic Extraction of Top-k Lists from the Web},
  year = {2013},
}

@book{fumarola2011extracting,
  author = {Fabio Fumarola and Tim Weninger and Rick Barber and Donato Malerba and Jiawei Han},
  pages = {285--294},
  publisher = {Modern Approaches in Applied Intelligence Springer},
  title = {Extracting general lists from web documents: A hybrid approach},
  year = {2011},
}

@inproceedings{liu2003mining,
  author = {Bing Liu and Robert Grossman and Yanhong Zhai},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {601--606},
  title = {Mining
data records in Web pages},
  year = {2003},
}

@inproceedings{zheng2007template,
  author = {Shuyi Zheng and Ruihua Song and Ji-Rong Wen},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {1507--1513},
  title = {Template-independent news extraction based on visual consistency},
  volume = {7},
  year = {2007},
}

@inproceedings{zheng2009efficient,
  author = {Shuyi Zheng and Ruihua Song and Ji-Rong Wen and C Lee Giles},
  booktitle = {Proceedings of the 18th ACM conference on Information and knowledge management},
  pages = {47--56},
  title = {Efficient record-level wrapper induction},
  year = {2009},
}

@inproceedings{sahuguet1999wysiwyg,
  author = {Arnaud Sahuguet and Fabien Azavant},
  booktitle = {World Wide Web (WWW)},
  title = {{WysiWyg} Web Wrapper Factory ({W4F})},
  year = {1999},
}

@inproceedings{toutanova2003tagger,
  author = {Kristina Toutanova and Christopher D. Manning},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  title = {Feature-Rich Part-of-Speech Tagging with a Cyclic Dependency Network},
  year = {2003},
}

@book{dagan2013rte,
  author = {Ido Dagan and Dan Roth and Mark Sammons and Fabio Massimo Zanzotto},
  publisher = {Morgan and Claypool Publishers},
  title = {Recognizing Textual Entailment: Models and Applications},
  year = {2013},
}

@inproceedings{harabagiu06methodsfor,
  author = {Sanda Harabagiu and Andrew Hickl},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Methods for Using Textual Entailment in Open-Domain Question Answering},
  year = {2006},
}

@inproceedings{romano2006investigating,
  author = {Lorenzo Romano and Milen Kouylekov and Idan Szpektor and Ido Dagan and Alberto Lavelli},
  booktitle = {European Association for Computational Linguistics (EACL)},
  title = {Investigating a Generic Paraphrase-based Approach for Relation Extraction},
  year = {2006},
}

@article{piwek2012varieties,
  author = {Paul Piwek and Kristy Elizabeth Boyer},
  journal = {Dialogue and Discourse},
  pages = {1--9},
  title = {Varieties of
Question Generation: Introduction to this Special Issue},
  volume = {3},
  year = {2012},
}

@article{yao2012semantics,
  author = {Xuchen Yao and Gosse Bouma and Yi Zhang},
  journal = {Dialogue and Discourse},
  pages = {11--42},
  title = {Semantics-based Question Generation and Implementation},
  volume = {3},
  year = {2012},
}

@article{olney2012question,
  author = {Andrew M. Olney and Arthur C. Graesser and Natalie K. Person},
  journal = {Dialogue and Discourse},
  pages = {75--99},
  title = {Question Generation from Concept Maps},
  volume = {3},
  year = {2012},
}

@article{muslea2001hierarchical,
  author = {Ion Muslea and Steven Minton and Craig A Knoblock},
  journal = {Autonomous Agents and Multi-Agent Systems},
  number = {1},
  pages = {93--114},
  title = {Hierarchical wrapper induction for semistructured information sources},
  volume = {4},
  year = {2001},
}

@inproceedings{haghighi05robust,
  author = {Aria Haghighi and Andrew Y. Ng and Christopher D. Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Robust Textual Inference via Graph Matching},
  year = {2005},
}

@inproceedings{spitkovsky2012cross,
  author = {Valentin I Spitkovsky and Angel X Chang},
  booktitle = {Language Resources and Evaluation (LREC)},
  pages = {3168--3175},
  title = {A Cross-Lingual Dictionary for {E}nglish {W}ikipedia Concepts},
  year = {2012},
}

@inproceedings{bergsma2008discriminative,
  author = {Shane Bergsma and Dekang Lin and Randy Goebel},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {59--68},
  title = {Discriminative learning of selectional preference from unlabeled text},
  year = {2008},
}

@article{recasens2010paraphrase,
  author = {Marta Recasens and Marta Vila},
  journal = {Computational Linguistics},
  number = {4},
  pages = {639--647},
  title = {On paraphrase and coreference},
  volume = {36},
  year = {2010},
}

@inproceedings{singh2011large,
  author = {Sameer Singh and Amarnag Subramanya and Fernando Pereira and Andrew McCallum},
  booktitle =
{Association for Computational Linguistics (ACL)},
  pages = {793--803},
  title = {Large-scale cross-document coreference using distributed inference and hierarchical models},
  year = {2011},
}

@inproceedings{snow2004learning,
  author = {Rion Snow and Daniel Jurafsky and Andrew Y Ng},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Learning syntactic patterns for automatic hypernym discovery},
  year = {2004},
}

@inproceedings{pauls2009kbest,
  author = {Adam Pauls and Dan Klein},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {958--966},
  title = {{K}-best {A*} parsing},
  year = {2009},
}

@inproceedings{klein2002fast,
  author = {Dan Klein and Christopher D Manning},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Fast exact inference with a factored model for natural language parsing},
  year = {2002},
}

@inproceedings{song2011kernel,
  author = {Le Song and Eric P Xing and Ankur P Parikh},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2708--2716},
  title = {Kernel embeddings of latent tree graphical models},
  year = {2011},
}

@mastersthesis{anca2009math,
  author = {Stefan Anca},
  school = {Jacobs University Bremen},
  title = {Natural Language and Mathematics Processing for Applicable Theorem Search},
  year = {2009},
}

@book{ganesalingam2013math,
  author = {Mohan Ganesalingam},
  publisher = {Springer-Verlag},
  title = {The Language of Mathematics},
  year = {2013},
}

@inproceedings{klein2003fast,
  author = {Dan Klein and Christopher Manning},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  title = {{A*} Parsing: Fast Exact Viterbi Parse Selection},
  year = {2003},
}

@inproceedings{zhu2005twod,
  author = {Jun Zhu and Zaiqing Nie and Ji-Rong Wen and Bo Zhang and Wei-Ying Ma},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1044--1051},
  title = {2{D} conditional random
fields for web information extraction}, year = {2005}, } @inproceedings{song2004learning, author = {Ruihua Song and Haifeng Liu and Ji-Rong Wen and Wei-Ying Ma}, booktitle = {World Wide Web (WWW)}, pages = {203--211}, title = {Learning block importance models for web pages}, year = {2004}, } @inproceedings{arasu2003extracting, author = {Arvind Arasu and Hector Garcia-Molina}, booktitle = {ACM SIGMOD International Conference on Management of Data}, pages = {337--348}, title = {Extracting structured data from web pages}, year = {2003}, } @inproceedings{siefkes2005incremental, author = {Christian Siefkes}, booktitle = {Computational Linguistics and Intelligent Text Processing}, pages = {510--521}, publisher = {Springer}, title = {Incremental information extraction using tree-based context representations}, year = {2005}, } @article{andrieu2010particle, author = {Christophe Andrieu and Arnaud Doucet and Roman Holenstein}, journal = {Journal of the Royal Statistical Society: Series B (Statistical Methodology)}, number = {3}, pages = {269--342}, title = {Particle {M}arkov chain {M}onte {C}arlo methods}, volume = {72}, year = {2010}, } @book{bertot2004interactive, author = {Yves Bertot and Pierre Castéran}, publisher = {Springer}, title = {Interactive theorem proving and program development: {C}oq'{A}rt: the calculus of inductive constructions}, year = {2004}, } @inproceedings{taskar03maxmargin, author = {Ben Taskar and Carlos Guestrin and Daphne Koller}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Max-margin {M}arkov Networks}, year = {2003}, } @article{jaeger2000observable, author = {Herbert Jaeger}, journal = {Neural Computation}, number = {6}, pages = {1371--1398}, title = {Observable operator models for discrete stochastic time series}, volume = {12}, year = {2000}, } @inproceedings{ghahramani1999variational, author = {Z. Ghahramani and M. 
J Beal}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Variational Inference for {B}ayesian Mixtures of Factor Analysers}, year = {1999}, } @article{jaakkola1999variational, author = {T. S Jaakkola and M. I Jordan}, journal = {Journal of Artificial Intelligence Research (JAIR)}, pages = {291--322}, title = {Variational Probabilistic Inference and the {QMR-DT} Network}, volume = {10}, year = {1999}, } @inproceedings{mossel2005learning, author = {E. Mossel and S. Roch}, booktitle = {Symposium on Theory of Computing (STOC)}, pages = {366--375}, title = {Learning nonsingular phylogenies and hidden {M}arkov models}, year = {2005}, } @inproceedings{bailly2010spectral, author = {R. Bailly and A. Habrard and F. Denis}, booktitle = {Algorithmic Learning Theory}, pages = {74--88}, title = {A spectral approach for probabilistic grammatical inference on trees}, year = {2010}, } @inproceedings{song2011spectral, author = {Le Song and E. P Xing and A. P Parikh}, booktitle = {International Conference on Machine Learning (ICML)}, title = {A spectral algorithm for latent tree graphical models}, year = {2011}, } @book{koller2009probabilistic, author = {D. Koller and N. 
Friedman}, publisher = {MIT Press}, title = {Probabilistic graphical models: principles and techniques}, year = {2009}, } @article{quattoni2007hidden, author = {Ariadna Quattoni and Sy Bor Wang and Louis-Philippe Morency and Michael Collins and Trevor Darrell}, journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)}, number = {10}, pages = {1848--1852}, title = {Hidden-state conditional random fields}, volume = {29}, year = {2007}, } @inproceedings{ross2011learning, author = {Stephane Ross and Daniel Munoz and Martial Hebert and J Andrew Bagnell}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {2737--2744}, title = {Learning message-passing inference machines for structured prediction}, year = {2011}, } @article{bunse1993numerical, author = {Angelika Bunse-Gerstner and Ralph Byers and Volker Mehrmann}, journal = {SIAM Journal on Matrix Analysis and Applications}, number = {4}, pages = {927--949}, title = {Numerical methods for simultaneous diagonalization}, volume = {14}, year = {1993}, } @inproceedings{bao2014qa, author = {J. 
Bao and Nan Duan and Ming Zhou and Tiejun Zhao}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Knowledge-based Question Answering as Machine Translation}, year = {2014}, } @article{chandrasekaran2013computational, author = {Venkat Chandrasekaran and Michael I Jordan}, journal = {Proceedings of the National Academy of Sciences}, number = {13}, pages = {1181--1190}, title = {Computational and statistical tradeoffs via convex relaxation}, volume = {110}, year = {2013}, } @article{shulaker2013carbon, author = {Max M Shulaker and Gage Hills and Nishant Patil and Hai Wei and Hong-Yu Chen and H-S Philip Wong and Subhasish Mitra}, journal = {Nature}, number = {7468}, pages = {526--530}, title = {Carbon nanotube computer}, volume = {501}, year = {2013}, } @article{choi2007low, author = {Jun Won Choi and Byonghyo Shim and Andrew C Singer and Nam Ik Cho}, journal = {IEEE Transactions on Signal Processing}, number = {10}, pages = {5084--5096}, title = {Low-power filtering via minimum power soft error cancellation}, volume = {55}, year = {2007}, } @article{schnaufer1997adaptive, author = {Bernard A Schnaufer and W Jenkins}, journal = {IEEE Transactions on Circuits and Systems}, number = {12}, pages = {1001--1014}, title = {Adaptive fault tolerance for reliable {LMS} adaptive filtering}, volume = {44}, year = {1997}, } @article{zhang2008bibliographical, author = {Youmin Zhang and Jin Jiang}, journal = {Annual Reviews in Control}, number = {2}, pages = {229--252}, title = {Bibliographical review on reconfigurable fault-tolerant control systems}, volume = {32}, year = {2008}, } @inproceedings{lin2010energy, author = {Kaisen Lin and Aman Kansal and Dimitrios Lymberopoulos and Feng Zhao}, booktitle = {International Conference on Mobile Systems, Applications, and Services}, pages = {285--298}, title = {Energy-accuracy trade-off for continuous mobile device location}, year = {2010}, } @article{shamir2013fundamental, author = {Ohad Shamir}, journal = {arXiv}, 
title = {Fundamental Limits of Online and Distributed Algorithms for Statistical Learning and Estimation}, year = {2013}, } @article{chen2014statistical, author = {Yudong Chen and Jiaming Xu}, journal = {arXiv}, title = {Statistical-Computational Tradeoffs in Planted Problems and Submatrix Localization with a Growing Number of Clusters and Submatrices}, year = {2014}, } @inproceedings{shivakumar2002modeling, author = {Premkishore Shivakumar and Michael Kistler and Stephen W Keckler and Doug Burger and Lorenzo Alvisi}, booktitle = {International Conference on Dependable Systems and Networks (DSN)}, pages = {389--398}, title = {Modeling the effect of technology trends on the soft error rate of combinational logic}, year = {2002}, } @article{sacks1958asymptotic, author = {Jerome Sacks}, journal = {Annals of Mathematical Statistics}, number = {2}, pages = {373--405}, title = {Asymptotic Distribution of Stochastic Approximation Procedures}, volume = {29}, year = {1958}, } @article{gladyshev1965stochastic, author = {G. E. Gladyshev}, journal = {Theory of Probability and its Applications}, number = {2}, pages = {275--278}, title = {On Stochastic Approximation}, volume = {10}, year = {1965}, } @article{fabian1968asymptotic, author = {Václav Fabian}, journal = {Annals of Mathematical Statistics}, number = {4}, pages = {1327--1332}, title = {On Asymptotic Normality in Stochastic Approximation}, volume = {39}, year = {1968}, } @article{chung1954stochastic, author = {K. L. Chung}, journal = {Annals of Mathematical Statistics}, number = {3}, pages = {463--483}, title = {On a Stochastic Approximation Method}, volume = {25}, year = {1954}, } @article{blum1954multidimensional, author = {Julius R. 
Blum}, journal = {Annals of Mathematical Statistics}, number = {4}, pages = {737--744}, title = {Multidimensional Stochastic Approximation Methods}, volume = {25}, year = {1954}, } @article{acar2009unsupervised, author = {Acar, Evrim and Yener, B{\"u}lent}, journal = {IEEE Transactions on Knowledge and Data Engineering}, number = {1}, pages = {6--20}, title = {Unsupervised multiway data analysis: A literature survey}, volume = {21}, year = {2009}, } @article{bader2008discussion, author = {Bader, Brett W and Berry, Michael W and Browne, Murray}, journal = {Survey of Text Mining II}, pages = {147--163}, title = {Discussion tracking in {E}nron email using {PARAFAC}}, volume = {1}, year = {2008}, } @techreport{hinton2010practical, author = {G. Hinton}, institution = {University of Toronto}, title = {A practical guide to training restricted {B}oltzmann machines}, year = {2010}, } @inproceedings{salakhutdinov2008ais, author = {R. Salakhutdinov and I. Murray}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {872--879}, title = {On the quantitative analysis of deep belief networks}, year = {2008}, } @inproceedings{long2010restricted, author = {P. Long and R. Servedio}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {703--710}, title = {Restricted {B}oltzmann machines are hard to approximately evaluate or simulate}, year = {2010}, } @inproceedings{ravikumar2006quadratic, author = {P. Ravikumar and J. Lafferty}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {737--744}, title = {Quadratic programming relaxations for metric labeling and {M}arkov random field {MAP} estimation}, year = {2006}, } @article{alon2006approximating, author = {N. Alon and A. Naor}, journal = {SIAM Journal on Computing}, number = {4}, pages = {787--803}, title = {Approximating the cut-norm via {G}rothendieck's inequality}, volume = {35}, year = {2006}, } @inproceedings{khot08approximate, author = {S. Khot and A. 
Naor}, booktitle = {Foundations of Computer Science (FOCS)}, title = {Approximate kernel clustering}, year = {2008}, } @inproceedings{khot10sharp, author = {S. Khot and A. Naor}, booktitle = {Symposium on Discrete Algorithms (SODA)}, title = {Sharp kernel clustering algorithms and their associated {G}rothendieck inequalities}, year = {2010}, } @article{goemans1995improved, author = {M. Goemans and D. Williamson}, journal = {Journal of the ACM (JACM)}, number = {6}, pages = {1115--1145}, title = {Improved approximation algorithms for maximum cut and satisfiability problems using semidefinite programming}, volume = {42}, year = {1995}, } @article{pataki1998rank, author = {G. Pataki}, journal = {Mathematics of Operations Research}, number = {2}, pages = {339--358}, title = {On the rank of extreme matrices in semidefinite programs and the multiplicity of optimal eigenvalues}, volume = {23}, year = {1998}, } @article{so2008unified, author = {A. So and Y. Ye and J. Zhang}, journal = {Mathematics of Operations Research}, number = {4}, pages = {910--920}, title = {A unified theorem on {SDP} rank reduction}, volume = {33}, year = {2008}, } @article{burer01anonlinear, author = {S. Burer and R. Monteiro}, journal = {Mathematical Programming}, number = {2}, pages = {329--357}, title = {A Nonlinear Programming Algorithm for Solving Semidefinite Programs via Low-rank Factorization}, volume = {95}, year = {2003}, } @article{burer2005local, author = {S. Burer and R. Monteiro}, journal = {Mathematical Programming}, number = {3}, pages = {427--444}, title = {Local minima and convergence in low-rank semidefinite programming}, volume = {103}, year = {2005}, } @article{nesterov1998semidefinite, author = {Y. Nesterov}, journal = {Optimization Methods and Software}, pages = {141--160}, title = {Semidefinite relaxation and nonconvex quadratic optimization}, volume = {9}, year = {1998}, } @article{rietz1974proof, author = {R. E. 
Rietz}, journal = {Israel Journal of Mathematics}, number = {3}, pages = {271--276}, title = {A proof of the {G}rothendieck inequality}, volume = {19}, year = {1974}, } @inproceedings{briet2010positive, author = {J. Bri{\"e}t and F. M. de Oliveira Filho and F. Vallentin}, booktitle = {Automata, Languages and Programming}, pages = {31--42}, title = {The positive semidefinite {G}rothendieck problem with rank constraint}, year = {2010}, } @article{briet2014groth, author = {J. Bri{\"e}t and F. M. de Oliveira Filho and F. Vallentin}, journal = {Theory of Computing}, pages = {77--105}, title = {{G}rothendieck inequalities for semidefinite programs with rank constraints}, volume = {10}, year = {2014}, } @article{malik06thegap, author = {U. Malik and Imad M. Jaimoukha and G. D. Halikias and S. K. Gungah}, journal = {Mathematical Programming}, number = {3}, pages = {505--515}, title = {On the gap between the quadratic integer programming problem and its semidefinite relaxation}, volume = {107}, year = {2006}, } @article{halikias07newbounds, author = {G. D. Halikias and Imad M. Jaimoukha and U. Malik and S. K. Gungah}, journal = {Journal of Global Optimization}, number = {4}, pages = {543--554}, title = {New bounds on the unconstrained quadratic integer programming problem}, volume = {39}, year = {2007}, } @article{barvinok95problems, author = {A. I. Barvinok}, journal = {Discrete \& Computational Geometry}, pages = {189--202}, title = {Problems of Distance Geometry and Convex Properties of Quadratic Maps}, volume = {13}, year = {1995}, } @techreport{alfakih98embeddability, author = {A. Alfakih and H. Wolkowicz}, institution = {University of Waterloo}, title = {On the embeddability of weighted graphs in {E}uclidean spaces}, year = {1998}, } @article{pisier12grothendieck, author = {G. 
Pisier}, journal = {Bulletin of the American Mathematical Society}, pages = {237--323}, title = {{G}rothendieck's Theorem, past and present}, volume = {49}, year = {2012}, } @inproceedings{riedel2012parse, author = {S. Riedel and D. Smith and A. McCallum}, booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)}, pages = {732--743}, title = {Parse, price and cut: delayed column and row generation for graph based parsers}, year = {2012}, } @article{shi2000normalized, author = {J. Shi and J. Malik}, journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)}, number = {8}, pages = {888--905}, title = {Normalized cuts and image segmentation}, volume = {22}, year = {2000}, } @inproceedings{kulis2007fast, author = {B. Kulis and A. C. Surendran and J. C. Platt}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, pages = {235--242}, title = {Fast low-rank semidefinite programming for embedding and clustering}, year = {2007}, } @article{kumar2009analysis, author = {M. P. Kumar and V. Kolmogorov and P. Torr}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {71--106}, title = {An analysis of convex relaxations for {MAP} estimation of discrete {MRF}s}, volume = {10}, year = {2009}, } @article{recht2013parallel, author = {B. Recht and C. Ré}, journal = {Mathematical Programming Computation}, pages = {1--26}, title = {Parallel stochastic gradient algorithms for large-scale matrix completion}, volume = {5}, year = {2013}, } @inproceedings{lee2010practical, author = {J. Lee and B. Recht and N. Srebro and J. Tropp and R. Salakhutdinov}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {1297--1305}, title = {Practical large-scale optimization for max-norm regularization}, year = {2010}, } @inproceedings{krahenbuhl2011efficient, author = {P. Kr{\"a}henb{\"u}hl and V. 
Koltun}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Efficient inference in fully connected {CRF}s with {G}aussian edge potentials}, year = {2011}, } @inproceedings{krahenbuhl2013learning, author = {P. Kr{\"a}henb{\"u}hl and V. Koltun}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {513--521}, title = {Parameter Learning and Convergent Inference for Dense Random Fields}, year = {2013}, } @inproceedings{rush2010dual, author = {A. Rush and D. Sontag and M. Collins and T. Jaakkola}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, pages = {1--11}, title = {On dual decomposition and linear programming relaxations for natural language processing}, year = {2010}, } @inproceedings{sontag2008outer, author = {D. Sontag and T. Jaakkola}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {1393--1400}, title = {New Outer Bounds on the Marginal Polytope}, year = {2008}, } @inproceedings{sontag2008tightening, author = {D. Sontag and T. Meltzer and A. Globerson and Y. Weiss and T. Jaakkola}, booktitle = {Uncertainty in Artificial Intelligence (UAI)}, pages = {503--510}, title = {Tightening {LP} Relaxations for {MAP} using Message-Passing}, year = {2008}, } @inproceedings{cour2007solving, author = {T. Cour and J. Shi}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, pages = {75--82}, title = {Solving {M}arkov random fields with spectral relaxation}, year = {2007}, } @article{winder66partition, author = {R. O. Winder}, journal = {SIAM Journal on Applied Mathematics}, number = {4}, pages = {811--818}, title = {Partitions of {N}-Space by Hyperplanes}, volume = {14}, year = {1966}, } @inproceedings{kappes2013benchmark, author = {J{\"o}rg H. Kappes and Bjoern Andres and Fred A. Hamprecht and Christoph Schn{\"o}rr and Sebastian Nowozin and Dhruv Batra and Sungwoong Kim and Bernhard X. 
Kausler and Jan Lellmann and Nikos Komodakis and Carsten Rother}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, title = {A Comparative Study of Modern Inference Techniques for Discrete Energy Minimization Problems}, year = {2013}, } @article{allemand2001polynomial, author = {Kim Allemand and Komei Fukuda and Thomas M Liebling and Erich Steiner}, journal = {Mathematical Programming}, number = {1}, pages = {49--52}, title = {A polynomial case of unconstrained zero-one quadratic optimization}, volume = {91}, year = {2001}, } @article{geman1984stochastic, author = {Stuart Geman and Donald Geman}, journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)}, pages = {721--741}, title = {Stochastic relaxation, {G}ibbs distributions, and the {B}ayesian restoration of images}, volume = {6}, year = {1984}, } @inproceedings{hills2013rapid, author = {Gage Hills and Jie Zhang and Charles Mackin and Max Shulaker and Hai Wei and Hon Sun Philip Wong and Subhasish Mitra}, booktitle = {Proceedings of the 50th Annual Design Automation Conference}, title = {Rapid Exploration of Processing and Design Guidelines to Overcome Carbon Nanotube Variations}, year = {2013}, } @article{lohstroh1983worst, author = {Jan Lohstroh and Evert Seevinck and Jan De Groot}, journal = {IEEE Journal of Solid-State Circuits}, number = {6}, pages = {803--807}, title = {Worst-case static noise margin criteria for logic circuits and their mathematical equivalence}, volume = {18}, year = {1983}, } @article{luo2013compact, author = {Jieying Luo and Lan Wei and Chi-Shuen Lee and Aaron D. 
Franklin and Ximeng Guan and Eric Pop and Dimitri Antoniadis and Hon Sun Philip Wong}, journal = {IEEE Transactions on Electron Devices}, number = {6}, pages = {1834--1843}, title = {Compact Model for Carbon Nanotube Field-Effect Transistors Including Nonidealities and Calibrated with Experimental Data Down to 9-nm Gate Length}, volume = {60}, year = {2013}, } @article{cardoso1996joint, author = {J. Cardoso and A. Souloumiac}, journal = {SIAM Journal on Matrix Analysis and Applications}, number = {1}, pages = {161--164}, title = {Jacobi angles for simultaneous diagonalization}, volume = {17}, year = {1996}, } @article{afsari2008sensitivity, author = {B. Afsari}, journal = {SIAM Journal on Matrix Analysis and Applications}, number = {3}, pages = {1148--1171}, title = {Sensitivity analysis for the problem of matrix joint diagonalization}, volume = {30}, year = {2008}, } @techreport{cardoso1994perturbation, author = {J. Cardoso}, institution = {Télécom Paris}, title = {Perturbation of Joint Diagonalizers}, year = {1994}, } @article{laurent2000adaptive, author = {B. Laurent and P. Massart}, journal = {Annals of Statistics}, number = {5}, pages = {1302--1338}, title = {Adaptive estimation of a quadratic functional by model selection}, volume = {28}, year = {2000}, } @article{hastad1990tensor, author = {J. H{\aa}stad}, journal = {Journal of Algorithms}, number = {4}, title = {Tensor rank is {NP}-complete}, volume = {11}, year = {1990}, } @inproceedings{souloumiac2009joint, author = {A. 
Souloumiac}, booktitle = {Computational Advances in Multi-Sensor Adaptive Processing}, pages = {305--308}, title = {Joint diagonalization: Is non-orthogonal always preferable to orthogonal?}, year = {2009}, } @article{delathauwer2006decomposition, author = {Lieven De Lathauwer}, journal = {SIAM Journal on Matrix Analysis and Applications}, number = {3}, pages = {642--666}, title = {A Link Between the Canonical Decomposition in Multilinear Algebra and Simultaneous Matrix Diagonalization}, volume = {28}, year = {2006}, } @inproceedings{vasilescu2005multilinear, author = {M Alex O Vasilescu and Demetri Terzopoulos}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {547--553}, title = {Multilinear independent components analysis}, volume = {1}, year = {2005}, } @article{beckmann2005tensorial, author = {Christian F Beckmann and Stephen M Smith}, journal = {NeuroImage}, number = {1}, pages = {294--311}, title = {Tensorial extensions of independent component analysis for multisubject {FMRI} analysis}, volume = {25}, year = {2005}, } @article{yeredor2002non, author = {Arie Yeredor}, journal = {IEEE Transactions on Signal Processing}, number = {7}, pages = {1545--1553}, title = {Non-orthogonal joint diagonalization in the least-squares sense with application in blind source separation}, volume = {50}, year = {2002}, } @article{ziehe2004fast, author = {Andreas Ziehe and Pavel Laskov and Guido Nolte and Klaus-Robert M{\"u}ller}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {777--800}, title = {A fast algorithm for joint diagonalization with non-orthogonal transformations and its application to blind source separation}, volume = {5}, year = {2004}, } @article{vollgraf2006quadratic, author = {Roland Vollgraf and Klaus Obermayer}, journal = {IEEE Transactions on Signal Processing}, number = {9}, pages = {3270--3278}, title = {Quadratic optimization for simultaneous matrix diagonalization}, volume = {54}, year = {2006}, } 
@inproceedings{afsari2006simple, author = {Bijan Afsari}, booktitle = {Independent Component Analysis and Blind Signal Separation}, pages = {1--7}, title = {Simple {LU} and {QR} based non-orthogonal matrix joint diagonalization}, year = {2006}, } @inproceedings{guo2010approximate, author = {Xijing Guo and Shihua Zhu and Sebastian Miron and David Brie}, booktitle = {International Conference on Acoustics, Speech, and Signal Processing (ICASSP)}, pages = {3774--3777}, title = {Approximate joint diagonalization by nonorthogonal nonparametric {J}acobi transformations}, year = {2010}, } @article{anandkumar2014guaranteed, author = {Animashree Anandkumar and Rong Ge and Majid Janzamin}, journal = {arXiv}, title = {Guaranteed Non-Orthogonal Tensor Decomposition via Alternating Rank-1 Updates}, year = {2014}, } @article{candes2006near, author = {Emmanuel J Candes and Terence Tao}, journal = {IEEE Transactions on Information Theory}, number = {12}, pages = {5406--5425}, title = {Near-optimal signal recovery from random projections: Universal encoding strategies?}, volume = {52}, year = {2006}, } @article{haupt2006signal, author = {Jarvis Haupt and Robert Nowak}, journal = {IEEE Transactions on Information Theory}, number = {9}, pages = {4036--4048}, title = {Signal reconstruction from noisy random projections}, volume = {52}, year = {2006}, } @inproceedings{sarlos2006improved, author = {Tamas Sarlos}, booktitle = {Foundations of Computer Science (FOCS)}, pages = {143--152}, title = {Improved approximation algorithms for large matrices via random projections}, year = {2006}, } @inproceedings{kleinberg1997two, author = {Jon M Kleinberg}, booktitle = {Symposium on Theory of Computing (STOC)}, pages = {599--608}, title = {Two algorithms for nearest-neighbor search in high dimensions}, year = {1997}, } @article{delathauwer2001independent, author = {Lieven De Lathauwer and Bart De Moor and Joos Vandewalle}, journal = {IEEE Transactions on Signal Processing}, number = {10}, pages = 
{2262--2271}, title = {Independent component analysis and (simultaneous) third-order tensor diagonalization}, volume = {49}, year = {2001}, } @inproceedings{sutskever2009modelling, author = {Ilya Sutskever and Ruslan Salakhutdinov and Joshua B Tenenbaum}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {1821--1828}, title = {Modelling Relational Data using {B}ayesian Clustered Tensor Factorization}, year = {2009}, } @inproceedings{nickel2011three, author = {Maximilian Nickel and Volker Tresp and Hans-Peter Kriegel}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {809--816}, title = {A three-way model for collective learning on multi-relational data}, year = {2011}, } @inproceedings{anandkumar2013community, author = {Animashree Anandkumar and Rong Ge and Daniel Hsu and Sham Kakade}, booktitle = {Conference on Learning Theory (COLT)}, pages = {867--881}, title = {A Tensor Spectral Approach to Learning Mixed Membership Community Models}, year = {2013}, } @article{boykov2004mincut, author = {Yuri Boykov and Vladimir Kolmogorov}, journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)}, pages = {1124--1137}, title = {An Experimental Comparison of Min-Cut/Max-Flow Algorithms for Energy Minimization in Vision}, volume = {26}, year = {2004}, } @article{boykov2004what, author = {Vladimir Kolmogorov and Ramin Zabih}, journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)}, pages = {147--159}, title = {What Energy Functions Can Be Minimized via Graph Cuts?}, volume = {26}, year = {2004}, } @article{boykov2001fast, author = {Yuri Boykov and Olga Veksler and Ramin Zabih}, journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)}, pages = {1222--1239}, title = {Fast Approximate Energy Minimization via Graph Cuts}, volume = {23}, year = {2001}, } @article{schoenberg1942positive, author = {Isaac J Schoenberg}, journal = {Duke Mathematical 
Journal}, pages = {96--108}, title = {Positive definite functions on spheres}, volume = {9}, year = {1942}, } @article{jordan1999variational, author = {Michael I. Jordan and Zoubin Ghahramani and Tommi S. Jaakkola and Lawrence K. Saul}, journal = {Machine Learning}, pages = {183--233}, title = {An Introduction to Variational Methods for Graphical Models}, volume = {37}, year = {1999}, } @inproceedings{wei2009non, author = {Wei, Lan and Frank, David J and Chang, Leland and Wong, H-S Philip}, booktitle = {IEEE International Electron Devices Meeting}, title = {A non-iterative compact model for carbon nanotube {FET}s incorporating source exhaustion effects}, year = {2009}, } @article{natori1998scaling, author = {Natori, Kenji and Sano, Nobuyuki}, journal = {Journal of Applied Physics}, number = {10}, pages = {5019--5024}, title = {Scaling limit of digital circuits due to thermal noise}, volume = {83}, year = {1998}, } @book{weste2010cmos, author = {Weste, Neil and Harris, David}, publisher = {Addison-Wesley Publishing Company}, title = {{CMOS} {VLSI} design: a circuits and systems perspective}, year = {2010}, } @article{brachat2010symmetric, author = {Jerome Brachat and Pierre Comon and Bernard Mourrain and Elias Tsigaridas}, journal = {Linear Algebra and its Applications}, number = {11}, pages = {1851--1872}, title = {Symmetric tensor decomposition}, volume = {433}, year = {2010}, } @article{comon2009tensor, author = {Pierre Comon and Xavier Luciani and André LF De Almeida}, journal = {Journal of Chemometrics}, number = {7}, pages = {393--405}, title = {Tensor decompositions, alternating least squares and other tales}, volume = {23}, year = {2009}, } @inproceedings{ross2011reduction, author = {Stéphane Ross and Geoffrey Gordon and Andrew Bagnell}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, title = {A reduction of imitation learning and structured prediction to no-regret online learning}, year = {2011}, } @article{goldberg2013training, author = {Yoav 
Goldberg and Joakim Nivre}, journal = {Transactions of the Association for Computational Linguistics (TACL)}, title = {Training Deterministic Parsers with Non-Deterministic Oracles}, volume = {1}, year = {2013}, } @inproceedings{shalit2014coordinate, author = {Uri Shalit and Gal Chechik}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Coordinate-descent for learning orthogonal matrices through {G}ivens rotations}, year = {2014}, } @article{yeredor2004approximate, author = {Arie Yeredor and Andreas Ziehe and Klaus-Robert Müller}, journal = {Independent Component Analysis and Blind Signal Separation}, pages = {86--96}, title = {Approximate Joint Diagonalization Using a Natural Gradient Approach}, volume = {1}, year = {2004}, } @article{halko2011structure, author = {N. Halko and {P.-G.} Martinsson and J. Tropp}, journal = {SIAM Review}, pages = {217--288}, title = {Finding Structure with Randomness: Probabilistic Algorithms for Constructing Approximate Matrix Decompositions}, volume = {53}, year = {2011}, } @article{huang2013fast, author = {Furong Huang and U N Niranjan and Mohammad Umar Hakeem and Animashree Anandkumar}, journal = {arXiv}, title = {Fast Detection of Overlapping Communities via Online Tensor Methods}, year = {2013}, } @inproceedings{liu2005vector, author = {Ning Liu and Benyu Zhang and Jun Yan and Zheng Chen and Wenyin Liu and Fengshan Bai and Leefeng Chien}, booktitle = {International Conference on Data Mining}, title = {Text representation: from vector to tensor}, year = {2005}, } @inproceedings{auli2011efficient, author = {Michael Auli and Adam Lopez}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Efficient {CCG} parsing: {A*} versus adaptive supertagging}, year = {2011}, } @inproceedings{manning2014stanford, author = {Christopher D. Manning and Mihai Surdeanu and John Bauer and Jenny Finkel and Steven J. 
Bethard and David McClosky}, booktitle = {ACL system demonstrations}, title = {The {S}tanford {C}ore{NLP} natural language processing toolkit}, year = {2014}, } @inproceedings{yao2014ie, author = {Xuchen Yao and Benjamin {Van Durme}}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Information extraction over structured data: Question answering with {F}reebase}, year = {2014}, } @inproceedings{bordes2014qa, author = {Antoine Bordes and Sumit Chopra and Jason Weston}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Question Answering with Subgraph Embeddings}, year = {2014}, } @inproceedings{chen2014nndep, author = {Danqi Chen and Christopher D. Manning}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {A Fast and Accurate Dependency Parser using Neural Networks}, year = {2014}, } @book{kay86algorithm, author = {Martin Kay}, pages = {35--70}, publisher = {Readings in Natural Language Processing}, title = {Algorithm Schemata and Data Structures in Syntactic Processing}, year = {1986}, } @article{caraballo1998new, author = {Sharon A. 
Caraballo and Eugene Charniak}, journal = {Computational Linguistics}, pages = {275--298}, title = {New figures of merit for best-first probabilistic chart parsing}, volume = {24}, year = {1998}, } @inproceedings{sutton1999policy, author = {Richard Sutton and David McAllester and Satinder Singh and Yishai Mansour}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Policy gradient methods for reinforcement learning with function approximation}, year = {1999}, } @inproceedings{yang2014joint, author = {Min-Chul Yang and Nan Duan and Ming Zhou and Hae-Chang Rim}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Joint Relational Embeddings for Knowledge-based Question Answering}, year = {2014}, } @inproceedings{abbeel2004apprenticeship, author = {Pieter Abbeel and Andrew Ng}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Apprenticeship learning via inverse reinforcement learning}, year = {2004}, } @inproceedings{vlachos2012investigation, author = {Andreas Vlachos}, booktitle = {European Workshop on Reinforcement Learning}, title = {An Investigation of Imitation Learning Algorithms for Structured Prediction}, year = {2012}, } @inproceedings{jiang2012learned, author = {Jiarong Jiang and Adam Teichert and Jason Eisner and Daum{\'e} III, Hal}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Learned prioritization for trading off accuracy and speed}, year = {2012}, } @inproceedings{huang2008forest, author = {Liang Huang}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Forest reranking: Discriminative parsing with non-local features}, year = {2008}, } @inproceedings{rush2012vine, author = {Alexander Rush and Slav Petrov}, booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)}, title = {Vine pruning for efficient multi-pass dependency parsing}, year = {2012}, } 
@inproceedings{lewis2014ccg,
  author = {Mike Lewis and Mark Steedman},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {A* {CCG} Parsing with a Supertag-factored Model},
  year = {2014},
}

@inproceedings{kummerfeld2010faster,
  author = {Jonathan Kummerfeld and Jessika Roesner and Tim Dawborn and James Haggerty and James Curran and Stephen Clark},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Faster parsing by supertagger adaptation},
  year = {2010},
}

% Initials are written separately so abbreviating styles keep both of them, and
% the dataset name is braced so sentence-casing styles do not lowercase it.
@inproceedings{richardson2013mctest,
  author = {Matthew Richardson and Christopher J. C. Burges and Erin Renshaw},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {193--203},
  title = {{MCTest}: A Challenge Dataset for the Open-Domain Machine Comprehension of Text},
  year = {2013},
}

@inproceedings{brill2002askmsr,
  author = {Eric Brill and Susan Dumais and Michele Banko},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {257--264},
  title = {An analysis of the {A}sk{MSR} question-answering system},
  year = {2002},
}

@inproceedings{moldovan2002lcc,
  author = {Dan I Moldovan and Sanda M Harabagiu and Roxana Girju and Paul Morarescu and V Finley Lacatusu and Adrian Novischi and Adriana Badulescu and Orest Bolohan},
  booktitle = {TREC},
  title = {{LCC} Tools for Question Answering},
  year = {2002},
}

% Venue spelling corrected ("Retrieval").
@inproceedings{cui2005dependency,
  author = {Hang Cui and Renxu Sun and Keya Li and Min-Yen Kan and Tat-Seng Chua},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  pages = {400--407},
  title = {Question answering passage retrieval using dependency relations},
  year = {2005},
}

@inproceedings{scaria2013biological,
  author = {Aju Thalappillil Scaria and Jonathan Berant and Mengqiu Wang and Christopher D Manning and Justin Lewis and Brittany Harding and Peter Clark},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Learning biological processes with global constraints},
  year =
{2013},
}

% The compound surname is braced; unbraced, BibTeX would take only "Linden" as
% the last name and treat "Vander" as a given name.
@inproceedings{berant2014biological,
  author = {Jonathan Berant and Vivek Srikumar and Pei-Chun Chen and Abby {Vander Linden} and Brittany Harding and Brad Huang and Peter Clark and Christopher D Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Modeling Biological Processes for Reading Comprehension},
  year = {2014},
}

@inproceedings{lao2012rules,
  author = {Ni Lao and Amarnag Subramanya and Fernando Pereira and William W Cohen},
  booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)},
  pages = {1017--1026},
  title = {Reading the web with learned syntactic-semantic inference rules},
  year = {2012},
}

@inproceedings{kushman2014algebra,
  author = {Nate Kushman and Yoav Artzi and Luke Zettlemoyer and Regina Barzilay},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Learning to Automatically Solve Algebra Word Problems},
  year = {2014},
}

@article{reddy2014large,
  author = {Siva Reddy and Mirella Lapata and Mark Steedman},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  number = {10},
  pages = {377--392},
  title = {Large-scale Semantic Parsing without Question-Answer Pairs},
  volume = {2},
  year = {2014},
}

@inproceedings{goldberg2010efficient,
  author = {Yoav Goldberg and Michael Elhadad},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {742--750},
  title = {An efficient algorithm for easy-first non-directional dependency parsing},
  year = {2010},
}

@inproceedings{zhang2014greed,
  author = {Yuan Zhang and Tao Lei and Regina Barzilay and Tommi Jaakkola},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Greed is Good if Randomized: New Inference for Dependency Parsing},
  year = {2014},
}

@inproceedings{wick2011query,
  author = {Michael L Wick and Andrew McCallum},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2564--2572},
  title
= {Query-Aware {MCMC}},
  year = {2011},
}

@article{andrieu2008tutorial,
  author = {Christophe Andrieu and Johannes Thoms},
  journal = {Statistics and Computing},
  number = {4},
  pages = {343--373},
  title = {A tutorial on adaptive {MCMC}},
  volume = {18},
  year = {2008},
}

@article{hillar2013tensor,
  author = {Christopher J Hillar and Lek-Heng Lim},
  journal = {Journal of the ACM (JACM)},
  title = {Most Tensor Problems Are {NP-Hard}},
  volume = {60},
  year = {2013},
}

% Given names are spelled out instead of bare initials, so Lek-Heng Lim is written
% the same way as in hillar2013tensor; the style decides whether to abbreviate.
@article{desilva2008tensor,
  author = {de Silva, Vin and Lim, Lek-Heng},
  journal = {SIAM Journal on Matrix Analysis and Applications},
  pages = {1084--1127},
  title = {Tensor Rank and the {Ill-Posedness} of the Best {Low-Rank} Approximation Problem},
  volume = {30},
  year = {2008},
}

@inproceedings{rahimi2007random,
  author = {Ali Rahimi and Ben Recht},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Random Features for Large-Scale Kernel Machines},
  year = {2007},
}

@article{guler1992ppa,
  author = {Osman Guler},
  journal = {SIAM Journal on Optimization},
  number = {4},
  pages = {649--664},
  title = {New Proximal Point Algorithms for Convex Minimization},
  volume = {2},
  year = {1992},
}

@article{rockafellar1976ppa,
  author = {R.
Tyrrell Rockafellar},
  journal = {SIAM Journal on Control and Optimization},
  number = {5},
  pages = {877--898},
  title = {Monotone operators and the proximal point algorithm},
  volume = {14},
  year = {1976},
}

@article{parikh2014proximal,
  author = {Neal Parikh and Stephen Boyd},
  journal = {Foundations and Trends in Optimization},
  number = {3},
  pages = {123--231},
  title = {Proximal Algorithms},
  volume = {1},
  year = {2014},
}

@article{boyd2011admm,
  author = {Stephen Boyd and Neal Parikh and Eric Chu and Borja Peleato and Jonathan Eckstein},
  journal = {Foundations and Trends in Machine Learning},
  number = {1},
  pages = {1--122},
  title = {Distributed Optimization and Statistical Learning via the Alternating Direction Method of Multipliers},
  volume = {3},
  year = {2011},
}

@inproceedings{syed2010exploiting,
  author = {Zareen Syed and Tim Finin and Varish Mulwad and Anupam Joshi},
  booktitle = {Proceedings of the Second Web Science Conference},
  title = {Exploiting a web of semantic data for interpreting tables},
  year = {2010},
}

@inproceedings{limaye2010annotating,
  author = {Girija Limaye and Sunita Sarawagi and Soumen Chakrabarti},
  booktitle = {Very Large Data Bases (VLDB)},
  pages = {1338--1347},
  title = {Annotating and searching web tables using entities, types and relationships},
  volume = {3},
  year = {2010},
}

@inproceedings{pimplikar2012answering,
  author = {Rakesh Pimplikar and Sunita Sarawagi},
  booktitle = {Very Large Data Bases (VLDB)},
  number = {10},
  pages = {908--919},
  title = {Answering table queries on the web using column keywords},
  volume = {5},
  year = {2012},
}

@inproceedings{gonzalez2010google,
  author = {Hector Gonzalez and Alon Y Halevy and Christian S Jensen and Anno Langen and Jayant Madhavan and Rebecca Shapley and Warren Shen and Jonathan Goldberg-Kidon},
  booktitle = {Proceedings of the 2010 ACM SIGMOD International Conference on Management of data},
  pages = {1061--1066},
  title = {Google fusion tables: web-centered data management and collaboration},
  year =
{2010},
}

@inproceedings{sarawagi2014open,
  author = {Sunita Sarawagi and Soumen Chakrabarti},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {711--720},
  title = {Open-domain quantity queries on web tables: annotation, response, and consensus models},
  year = {2014},
}

@inproceedings{venetis2011recovering,
  author = {Petros Venetis and Alon Halevy and Jayant Madhavan and Marius Pa{\c{s}}ca and Warren Shen and Fei Wu and Gengxin Miao and Chung Wu},
  booktitle = {Very Large Data Bases (VLDB)},
  pages = {528--538},
  title = {Recovering semantics of tables on the web},
  volume = {4},
  year = {2011},
}

@inproceedings{fader2014open,
  author = {Anthony Fader and Luke Zettlemoyer and Oren Etzioni},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {1156--1165},
  title = {Open question answering over curated and extracted knowledge bases},
  year = {2014},
}

@inproceedings{ji2011knowledge,
  author = {Heng Ji and Ralph Grishman},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {1148--1158},
  title = {Knowledge base population: Successful approaches and challenges},
  year = {2011},
}

@inproceedings{unger2011pythia,
  author = {Christina Unger and Philipp Cimiano},
  booktitle = {Proceedings of the 16th international conference on Natural language processing and information systems},
  pages = {153--160},
  title = {Pythia: compositional meaning construction for ontology-based question answering on the semantic web},
  year = {2011},
}

% Accented letters use LaTeX escapes, matching the other entries in this file
% (raw non-ASCII bytes sort and label incorrectly under classic BibTeX).
@inproceedings{rangel2014features,
  author = {Rodolfo A Pazos Rangel and Marco A Aguirre and Juan J Gonz{\'a}lez and Juan Mart{\'\i}n Carpio},
  booktitle = {Recent Advances on Hybrid Approaches for Designing Intelligent Systems},
  pages = {617--630},
  title = {Features and Pitfalls that Users Should Seek in Natural Language Interfaces to Databases},
  year = {2014},
}

@inproceedings{garrette2013learning,
  author = {Dan Garrette and Jason Baldridge},
  booktitle = {North
American Association for Computational Linguistics (NAACL)},
  pages = {138--147},
  title = {Learning a Part-of-Speech Tagger from Two Hours of Annotation},
  year = {2013},
}

@inproceedings{price1990atis,
  author = {Patti Price},
  booktitle = {Proceedings of the Third DARPA Speech and Natural Language Workshop},
  pages = {91--95},
  title = {Evaluation of spoken language systems: The {ATIS} domain},
  year = {1990},
}

@inproceedings{hosseini2014learning,
  author = {Mohammad Javad Hosseini and Hannaneh Hajishirzi and Oren Etzioni and Nate Kushman},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {523--533},
  title = {Learning to Solve Arithmetic Word Problems with Verb Categorization},
  year = {2014},
}

@inproceedings{schwitter2010controlled,
  author = {Rolf Schwitter},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages = {1113--1121},
  title = {Controlled natural languages for knowledge representation},
  year = {2010},
}

@article{wang2011semantic,
  author = {Ye-Yi Wang and Li Deng and Alex Acero},
  journal = {Spoken Language Understanding: Systems for Extracting Semantic Information from Speech},
  pages = {41--91},
  title = {Semantic Frame-Based Spoken Language Understanding},
  year = {2011},
}

@inproceedings{wu2010open,
  author = {Fei Wu and Daniel S Weld},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {118--127},
  title = {Open information extraction using {W}ikipedia},
  year = {2010},
}

@inproceedings{gupta2009answering,
  author = {Rahul Gupta and Sunita Sarawagi},
  booktitle = {Very Large Data Bases (VLDB)},
  number = {1},
  pages = {289--300},
  title = {Answering table augmentation queries from unstructured lists on the web},
  year = {2009},
}

% The surname is braced so BibTeX keeps "Van Durme" together as the last name
% (the hyphenated spelling used previously would be printed literally).
@inproceedings{yao2014freebase,
  author = {Xuchen Yao and Jonathan Berant and Benjamin {Van Durme}},
  booktitle = {Workshop on Semantic parsing},
  title = {{F}reebase {QA}: Information Extraction or Semantic Parsing},
  year = {2014},
}

@inproceedings{melamud2013context,
author = {Oren Melamud and Jonathan Berant and Ido Dagan and Jacob Goldberger and Idan Szpektor},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {A Two Level Model for Context Sensitive Inference Rules},
  year = {2013},
}

@inproceedings{berant2012efficient,
  author = {Jonathan Berant and Ido Dagan and Meni Adler and Jacob Goldberger},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Efficient Tree-based Approximation for Entailment Graph learning},
  year = {2012},
}

% The year field held the value twice ("2012 2012"); reduced to one four-digit year.
@inproceedings{adler2012textexploration,
  author = {Meni Adler and Jonathan Berant and Ido Dagan},
  booktitle = {ACL system demonstrations},
  title = {Entailment-based Text Exploration with Application to the Health-care Domain},
  year = {2012},
}

@inproceedings{zeichner2012crowdsourcing,
  author = {Naomi Zeichner and Jonathan Berant and Ido Dagan},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Crowdsourcing Inference-rule Evaluation},
  year = {2012},
}

@inproceedings{weisman2012learning,
  author = {Hila Weisman and Jonathan Berant and Idan Szpektor and Ido Dagan},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Learning Verb Inference Rules from Linguistically-motivated Evidence},
  year = {2012},
}

@inproceedings{berant2011global,
  author = {Jonathan Berant and Ido Dagan and Jacob Goldberger},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Global Learning of Typed Entailment Rules},
  year = {2011},
}

% The year field held the value twice ("2011 2011"); reduced to one four-digit year.
@inproceedings{stern2011knowledge,
  author = {Asher Stern and Amnon Lotan and Shachar Mirkin and Eyal Shnarch and Lili Kotlerman and Jonathan Berant and Ido Dagan},
  booktitle = {Text Analysis Conference},
  title = {Knowledge and Tree-Edits in Learnable Entailment Proofs},
  year = {2011},
}

@inproceedings{berant2010global,
  author = {Jonathan Berant and Ido Dagan and Jacob Goldberger},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Global Learning of Focused
Entailment Graphs},
  year = {2010},
}

@inproceedings{mirkin2010,
  author = {Shachar Mirkin and Jonathan Berant and Ido Dagan and Eyal Shnarch},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  title = {Recognising Entailment within Discourse},
  year = {2010},
}

@inproceedings{stern2010rulechaining,
  author = {Asher Stern and Eyal Shnarch and Amnon Lotan and Shachar Mirkin and Lili Kotlerman and Naomi Zeichner and Jonathan Berant and Ido Dagan},
  booktitle = {Text Analysis Conference},
  title = {Rule Chaining and Approximate Match in Textual Inference},
  year = {2010},
}

@inproceedings{barhaim2009forest,
  author = {Roy Bar-Haim and Jonathan Berant and Ido Dagan},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {A Compact Forest for Scalable Inference over Entailment and Paraphrase Rules},
  year = {2009},
}

% The year field held the value twice ("2009 2009"); reduced to one four-digit year.
@inproceedings{mirkin2009discourse,
  author = {Shachar Mirkin and Roy Bar-Haim and Jonathan Berant and Ido Dagan and Eyal Shnarch and Asher Stern and Idan Szpektor},
  booktitle = {Text Analysis Conference},
  title = {Addressing Discourse and Document Structure in the {RTE} Search Task},
  year = {2009},
}

% Duplicated year removed; the line-break artifact "Every- day" is rejoined, and the
% language name is brace-protected against sentence-casing styles.
@inproceedings{berant2008tracks,
  author = {Jonathan Berant and Catherine Caldwell-Harris and Shimon Edelman},
  booktitle = {Annual Meeting of the Cognitive Science Society},
  title = {Tracks in the Mind: Differential Entrenchment of Common and Rare Liturgical and Everyday Multiword Phrases in Religious and Secular {H}ebrew Speakers},
  year = {2008},
}

% The year field held the value twice ("2008 2008"); reduced to one four-digit year.
@inproceedings{barhaim2008,
  author = {Roy Bar-Haim and Jonathan Berant and Ido Dagan and Iddo Greental and Shachar Mirkin and Eyal Shnarch and Idan Szpektor},
  booktitle = {Text Analysis Conference},
  title = {Efficient Semantic Deduction and Approximate Matching over Compact Parse Forests},
  year = {2008},
}

@inproceedings{berant2007boosting,
  author = {Jonathan Berant and Yaron Gross and Matan Mussel and Ben Sandbank and Eytan Ruppin and Shimon Edelman},
booktitle = {Boston University Conference on Language Development},
  title = {Boosting Unsupervised Grammar Induction by Splitting Complex Sentences on Function Words},
  year = {2007},
}

@article{berant2012learning,
  author = {Jonathan Berant and Ido Dagan and Jacob Goldberger},
  journal = {Computational Linguistics},
  pages = {73--111},
  title = {Learning Entailment Relations by Global Graph Structure Optimization},
  volume = {38},
  year = {2012},
}

@inproceedings{harris2012measuring,
  author = {Catherine Caldwell-Harris and Jonathan Berant and Shimon Edelman},
  booktitle = {Frequency Effects in Cognitive Linguistics (Vol. 1): Statistical Effects in Learnability, Processing and Change},
  pages = {165--194},
  title = {Measuring Mental Entrenchment of Phrases with Perceptual Identification, Familiarity Ratings, and Corpus Frequency Statistics},
  year = {2012},
}

% The compound surname is braced; unbraced, BibTeX would take only "Wyk" as the
% last name and treat "Van" as a given name.
@inproceedings{zhang2010chart,
  author = {Yue Zhang and Byung-Gyu Ahn and Stephen Clark and Curt {Van Wyk} and James R. Curran and Laura Rimell},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  title = {Chart pruning for fast lexicalised-grammar parsing},
  year = {2010},
}

@inproceedings{bodenstab2011beam,
  author = {Nathan Bodenstab and Aaron Dunlop and Keith Hall and Brian Roark},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {440--449},
  title = {Beam-width prediction for efficient context-free parsing},
  year = {2011},
}

@inproceedings{fitzgerald2013learning,
  author = {Nicholas FitzGerald and Yoav Artzi and Luke S.
Zettlemoyer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1914--1925},
  title = {Learning Distributions over Logical Forms for Referring Expression Generation},
  year = {2013},
}

@article{chang2015learning,
  author = {Kai-Wei Chang and Akshay Krishnamurthy and Alekh Agarwal and Hal {Daum{\'e} III} and John Langford},
  journal = {arXiv},
  title = {Learning to search better than your teacher},
  year = {2015},
}

@inproceedings{chang2014scene,
  author = {Angel X Chang and Manolis Savva and Christopher D Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Learning Spatial Knowledge for Text to 3{D} Scene Generation},
  year = {2014},
}

@inproceedings{socher2011parsing,
  author = {Richard Socher and Cliff C Lin and Chris Manning and Andrew Y Ng},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {129--136},
  title = {Parsing natural scenes and natural language with recursive neural networks},
  year = {2011},
}

@article{weston2015towards,
  author = {Jason Weston and Antoine Bordes and Sumit Chopra and Tomas Mikolov},
  journal = {arXiv preprint arXiv:1502.05698},
  title = {Towards {AI}-Complete Question Answering: A Set of Prerequisite Toy Tasks},
  year = {2015},
}

@inproceedings{singh2015tensor,
  author = {Sameer Singh and Tim Rockt{\"{a}}schel and Sebastian Riedel},
  booktitle = {NAACL Workshop on Vector Space Modeling for NLP},
  title = {Towards Combined Matrix and Tensor Factorization for Universal Schema Relation Extraction},
  year = {2015},
}

@inproceedings{chang2014tensor,
  author = {Kai-Wei Chang and Wen-Tau Yih and Bishan Yang and Christopher Meek},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1568--1579},
  title = {Typed tensor decomposition of knowledge bases for relation extraction},
  year = {2014},
}

@inproceedings{lasecki2013realtime,
  author = {Walter S Lasecki and Young Chol Song and Henry Kautz and Jeffrey P.
Bigham},
  booktitle = {Conference on Computer Supported Cooperative Work},
  pages = {1203--1212},
  title = {Real-time Crowd Labeling for Deployable Activity Recognition},
  year = {2013},
}

@inproceedings{cheng2015flock,
  author = {Justin Cheng and Michael S Bernstein},
  booktitle = {Proceedings of the 18th {ACM} Conference on Computer Supported Cooperative Work \& Social Computing},
  pages = {600--611},
  title = {Flock: Hybrid {Crowd-Machine} Learning Classifiers},
  year = {2015},
}

@inproceedings{cohen2013pcfg,
  author = {Shay B Cohen and Giorgio Satta and Michael Collins},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages = {487--496},
  title = {Approximate {PCFG} Parsing Using Tensor Decomposition},
  year = {2013},
}

@article{bertsimas2011theory,
  author = {Dimitris Bertsimas and David B Brown and Constantine Caramanis},
  journal = {SIAM review},
  number = {3},
  pages = {464--501},
  title = {Theory and applications of robust optimization},
  volume = {53},
  year = {2011},
}

@article{chechik2008max,
  author = {Gal Chechik and Geremy Heitz and Gal Elidan and Pieter Abbeel and Daphne Koller},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {1--21},
  title = {Max-margin classification of data with absent features},
  volume = {9},
  year = {2008},
}

@article{buhlmann1999variable,
  author = {Peter B{\"u}hlmann and Abraham J Wyner},
  journal = {Annals of Statistics},
  number = {2},
  pages = {480--513},
  title = {Variable length {M}arkov chains},
  volume = {27},
  year = {1999},
}

@inproceedings{riedel2010relaxed,
  author = {Sebastian Riedel and David A Smith},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {760--768},
  title = {Relaxed marginal inference and its application to dependency parsing},
  year = {2010},
}

@inproceedings{stoyanov2012fast,
  author = {Veselin Stoyanov and Jason Eisner},
  booktitle = {ICML Workshop on Inferning: Interactions between Inference and Learning},
  title = {Fast and
Accurate Prediction via Evidence-Specific {MRF} Structure},
  year = {2012},
}

@article{barbu2009training,
  author = {Adrian Barbu},
  journal = {IEEE Transactions on Image Processing},
  number = {11},
  pages = {2451--2462},
  title = {Training an active random field for real-time image denoising},
  volume = {18},
  year = {2009},
}

@inproceedings{stoyanov2011empirical,
  author = {Veselin Stoyanov and Alexander Ropson and Jason Eisner},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  pages = {725--733},
  title = {Empirical risk minimization of graphical model parameters given approximate inference, decoding, and model structure},
  year = {2011},
}

@inproceedings{domke2011parameter,
  author = {Justin Domke},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {2937--2943},
  title = {Parameter learning with truncated message-passing},
  year = {2011},
}

@inproceedings{ravi2011deciphering,
  author = {Sujith Ravi and Kevin Knight},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {12--21},
  title = {Deciphering foreign language},
  year = {2011},
}

@article{ney1994structuring,
  author = {Hermann Ney and Ute Essen and Reinhard Kneser},
  journal = {Computer, Speech, and Language},
  number = {1},
  pages = {1--38},
  title = {On structuring probabilistic dependences in stochastic language modeling},
  volume = {8},
  year = {1994},
}

@inproceedings{kneser1995improved,
  author = {Reinhard Kneser and Hermann Ney},
  booktitle = {International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  pages = {181--184},
  title = {Improved backing-off for m-gram language modeling},
  volume = {1},
  year = {1995},
}

% The accented letter uses a LaTeX escape, matching the other entries in this file
% (raw non-ASCII bytes sort and label incorrectly under classic BibTeX).
@inproceedings{recht2011hogwild,
  author = {Benjamin Recht and Christopher R{\'e} and Stephen Wright and Feng Niu},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {693--701},
  title = {Hogwild: A lock-free approach to parallelizing stochastic gradient descent},
  year = {2011},
}

@inproceedings{wood2009stochastic,
author = {Frank Wood and C{\'e}dric Archambeau and Jan Gasthaus and Lancelot James and Yee Whye Teh},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1129--1136},
  title = {A stochastic memoizer for sequence data},
  year = {2009},
}

@inproceedings{milch2005approximate,
  author = {Brian Milch and Bhaskara Marthi and David Sontag and Stuart Russell and Daniel L Ong and Andrey Kolobov},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  pages = {238--245},
  title = {Approximate inference for infinite contingent {B}ayesian networks},
  year = {2005},
}

@article{li2014mean,
  author = {Yujia Li and Richard Zemel},
  journal = {arXiv preprint arXiv:1410.5884},
  title = {Mean-Field Networks},
  year = {2014},
}

@inproceedings{niepert2014exchangeable,
  author = {Mathias Niepert and Pedro Domingos},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Exchangeable variable models},
  year = {2014},
}

@inproceedings{poon2011sum,
  author = {Hoifung Poon and Pedro Domingos},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  pages = {337--346},
  title = {Sum-product networks: A new deep architecture},
  year = {2011},
}

@inproceedings{kulesza2007structured,
  author = {Alex Kulesza and Fernando Pereira},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {785--792},
  title = {Structured learning with approximate inference},
  year = {2007},
}

@inproceedings{finley2008training,
  author = {Thomas Finley and Thorsten Joachims},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {304--311},
  title = {Training structural {SVM}s when exact inference is intractable},
  year = {2008},
}

@inproceedings{zhang2013online,
  author = {Hao Zhang and Liang Huang and Kai Zhao and Ryan McDonald},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Online learning for inexact hypergraph search},
  year = {2013},
}

@inproceedings{huang2012structured,
  author = {Liang Huang and
Suphan Fayong and Yang Guo},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {142--151},
  title = {Structured {P}erceptron with inexact search},
  year = {2012},
}

@inproceedings{xing2002generalized,
  author = {Eric P Xing and Michael I Jordan and Stuart Russell},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  pages = {583--591},
  title = {A generalized mean field algorithm for variational inference in exponential families},
  year = {2002},
}

@article{wainwright2005new,
  author = {Martin J Wainwright and Tommi S Jaakkola and Alan S Willsky},
  journal = {IEEE Transactions on Information Theory},
  number = {7},
  pages = {2313--2335},
  title = {A new class of upper bounds on the log partition function},
  volume = {51},
  year = {2005},
}

@phdthesis{sontag2010approximate,
  author = {David Sontag},
  school = {Massachusetts Institute of Technology},
  title = {Approximate inference in graphical models using {LP} relaxations},
  year = {2010},
}

@inproceedings{weiss2010sidestepping,
  author = {David Weiss and Benjamin Sapp and Ben Taskar},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2415--2423},
  title = {Sidestepping intractable inference with structured ensemble cascades},
  year = {2010},
}

@inproceedings{yu2013max,
  author = {Heng Yu and Liang Huang and Haitao Mi and Kai Zhao},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1112--1123},
  title = {Max-Violation {P}erceptron and Forced Decoding for Scalable {MT} Training},
  year = {2013},
}

% The compound surname is braced; unbraced, BibTeX would take only "Thong" as the
% last name and treat "Van" as a given name.
@inproceedings{moreno1998recursive,
  author = {Pedro J Moreno and Christopher F Joerg and Jean-Manuel {Van Thong} and Oren Glickman},
  booktitle = {ICSLP},
  pages = {2711--2714},
  title = {A recursive algorithm for the forced alignment of very long audio segments},
  volume = {98},
  year = {1998},
}

@article{gorman2011prosodylab,
  author = {Kyle Gorman and Jonathan Howell and Michael Wagner},
  journal = {Canadian Acoustics},
  number = {3},
  pages = {192--193},
title = {Prosodylab-aligner: A tool for forced alignment of laboratory speech},
  volume = {39},
  year = {2011},
}

@inproceedings{pal2006sparse,
  author = {Chris Pal and Charles Sutton and Andrew McCallum},
  booktitle = {International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  title = {Sparse forward-backward using minimum divergence beams for fast training of conditional random fields},
  volume = {5},
  year = {2006},
}

@article{zhang2014face,
  author = {Liyan Zhang and Dmitri V. Kalashnikov and Sharad Mehrotra},
  journal = {International Journal of Multimedia Information Retrieval},
  number = {2},
  pages = {69--88},
  title = {Context-assisted face clustering framework with human-in-the-loop},
  volume = {3},
  year = {2014},
}

@book{brooks2011handbook,
  author = {Steve Brooks and Andrew Gelman and Galin Jones and Xiao-Li Meng},
  publisher = {CRC press},
  title = {Handbook of {M}arkov Chain {M}onte {C}arlo},
  year = {2011},
}

@manual{graff2003gigawords,
  author = {David Graff and Christopher Cieri},
  title = {{E}nglish {G}igaword LDC2003T05},
  year = {2003},
}

@inproceedings{greenberg1996insights,
  author = {Steven Greenberg and Joy Hollenback and Dan Ellis},
  booktitle = {International Conference on Spoken Language Processing (ICSLP)},
  title = {Insights into spoken language gleaned from phonetic transcription of the {S}witchboard corpus},
  year = {1996},
}

@phdthesis{kassel1995comparison,
  author = {Robert H Kassel},
  school = {Massachusetts Institute of Technology},
  title = {A comparison of approaches to on-line handwritten character recognition},
  year = {1995},
}

@article{hu1996hmm,
  author = {Jianying Hu and Michael K Brown and William Turin},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)},
  number = {10},
  pages = {1039--1045},
  title = {{HMM} based online handwriting recognition},
  volume = {18},
  year = {1996},
}

@inproceedings{agazzi1993connected,
  author = {Oscar E Agazzi and S-s Kuo and Esther Levin and Roberto Pieraccini},
booktitle = {International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  pages = {113--116},
  title = {Connected and degraded text recognition using planar hidden {M}arkov models},
  volume = {5},
  year = {1993},
}

@inproceedings{curran2003language,
  author = {James R Curran and Stephen Clark},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {164--167},
  title = {Language independent {NER} using a maximum entropy tagger},
  year = {2003},
}

@article{maas2014first,
  author = {Andrew L Maas and Awni Y Hannun and Daniel Jurafsky and Andrew Y Ng},
  journal = {arXiv preprint arXiv:1408.2873},
  title = {First-Pass Large Vocabulary Continuous Speech Recognition using Bi-Directional Recurrent {DNN}s},
  year = {2014},
}

@inproceedings{ney1992improvements,
  author = {Hermann Ney and Reinhold Haeb-Umbach and B-H Tran and Martin Oerder},
  booktitle = {International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  pages = {9--12},
  title = {Improvements in beam search for 10000-word continuous speech recognition},
  volume = {1},
  year = {1992},
}

@inproceedings{koehn2003statistical,
  author = {Philipp Koehn and Franz Josef Och and Daniel Marcu},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {48--54},
  title = {Statistical phrase-based translation},
  year = {2003},
}

@inproceedings{och2003minimum,
  author = {Franz Josef Och},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {160--167},
  title = {Minimum error rate training in statistical machine translation},
  year = {2003},
}

@inproceedings{rush2011exact,
  author = {Alexander M Rush and Michael Collins},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {72--82},
  title = {Exact decoding of syntactic translation models through {L}agrangian relaxation},
  year = {2011},
}

@inproceedings{nuhn2013beamdecipher,
  author = {Malte Nuhn and Julian Schamper and Hermann Ney},
  booktitle = {Association for Computational
Linguistics (ACL)},
  pages = {1569--1576},
  title = {Beam Search for Solving Substitution Ciphers},
  year = {2013},
}

@inproceedings{nuhn2014fastem,
  author = {Malte Nuhn and Hermann Ney},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {759--764},
  title = {{EM} Decipherment for Large Vocabularies},
  year = {2014},
}

@inproceedings{nuhn2014homophonics,
  author = {Malte Nuhn and Hermann Ney},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Improved Decipherment of Homophonic Ciphers},
  year = {2014},
}

% The accented letter uses a LaTeX escape, matching the other entries in this file.
@article{cappe2007overview,
  author = {Olivier Capp{\'e} and Simon J Godsill and Eric Moulines},
  journal = {Proceedings of the IEEE},
  number = {5},
  pages = {899--924},
  title = {An overview of existing methods and recent advances in sequential {M}onte {C}arlo},
  volume = {95},
  year = {2007},
}

@article{gelman1992single,
  author = {Andrew Gelman and Donald B Rubin},
  journal = {Bayesian statistics},
  pages = {625--631},
  title = {A single series from the {G}ibbs sampler provides a false sense of security},
  volume = {4},
  year = {1992},
}

@article{cowles1996markov,
  author = {Mary Kathryn Cowles and Bradley P Carlin},
  journal = {Journal of the American Statistical Association (JASA)},
  number = {434},
  pages = {883--904},
  title = {{M}arkov chain {M}onte {C}arlo convergence diagnostics: a comparative review},
  volume = {91},
  year = {1996},
}

% Accented letters in the venue use LaTeX escapes, and the proper noun in the title
% is brace-protected so sentence-casing styles keep its capital.
@inproceedings{doeblin1940elements,
  author = {W Doeblin},
  booktitle = {Annales scientifiques de l'{\'E}cole Normale Sup{\'e}rieure},
  pages = {61--111},
  title = {Elements d'une theorie generale des chaines simples constantes de {M}arkoff},
  volume = {57},
  year = {1940},
}

% Initials are written separately so abbreviating styles keep both of them.
@article{corcoran1998perfect,
  author = {J. N. Corcoran and R. L. Tweedie},
  journal = {preprint},
  title = {Perfect sampling of {H}arris recurrent {M}arkov chains},
  year = {1998},
}

@book{levin2008markov,
  author = {D. Levin and Y. Peres and E.
Wilmer}, publisher = {American Mathematical Society}, title = {{M}arkov Chains and Mixing Times}, year = {2008}, } @article{murray2008notes, author = {Ian Murray and Ruslan Salakhutdinov}, journal = {preprint}, title = {Notes on the {KL}-divergence between a {M}arkov chain and its equilibrium distribution}, year = {2008}, } @manual{sandhaus2008new, author = {Evan Sandhaus}, title = {The {N}ew {Y}ork {T}imes annotated corpus}, year = {2008}, } @article{gulwani2007program, author = {Sumit Gulwani and Nebojsa Jojic}, journal = {ACM SIGPLAN Notices}, number = {1}, pages = {277--289}, title = {Program verification as probabilistic inference}, volume = {42}, year = {2007}, } @article{gulwani2011automating, author = {Sumit Gulwani}, journal = {ACM SIGPLAN Notices}, number = {1}, pages = {317--330}, title = {Automating string processing in spreadsheets using input-output examples}, volume = {46}, year = {2011}, } @inproceedings{sharma2014invariant, author = {Rahul Sharma and Alex Aiken}, booktitle = {Computer Aided Verification (CAV)}, pages = {88--105}, title = {From invariant checking to invariant inference using randomized search}, year = {2014}, } @article{green1995reversible, author = {PJ Green}, journal = {Biometrika}, number = {4}, pages = {711--732}, title = {Reversible jump {M}arkov chain {M}onte {C}arlo computation and {B}ayesian model determination}, volume = {82}, year = {1995}, } @article{earl2005parallel, author = {David J Earl and Michael W Deem}, journal = {Physical Chemistry Chemical Physics}, number = {23}, pages = {3910--3916}, title = {Parallel tempering: Theory, applications, and new perspectives}, volume = {7}, year = {2005}, } @article{gelman1998simulating, author = {A Gelman and XL Meng}, journal = {Statistical science}, number = {2}, pages = {163--185}, title = {Simulating normalizing constants: From importance sampling to bridge sampling to path sampling}, volume = {13}, year = {1998}, } @article{viola2004robust, author = {Paul Viola and Michael J 
Jones}, journal = {International Journal of Computer Vision}, number = {2}, pages = {137--154}, title = {Robust real-time face detection}, volume = {57}, year = {2004}, } @inproceedings{shen2004discriminative, author = {Libin Shen and Anoop Sarkar and Franz Josef Och}, booktitle = {North American Association for Computational Linguistics (NAACL)}, pages = {177--184}, title = {Discriminative reranking for machine translation}, year = {2004}, } @article{collins2005discriminative, author = {Michael Collins and Terry Koo}, journal = {Computational Linguistics}, number = {1}, pages = {25--70}, title = {Discriminative reranking for natural language parsing}, volume = {31}, year = {2005}, } @inproceedings{gu2009recognition, author = {Chunhui Gu and Joseph J Lim and Pablo Arbeláez and Jitendra Malik}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {1030--1037}, title = {Recognition using regions}, year = {2009}, } @inproceedings{sapp2010cascaded, author = {B Sapp and A Toshev and B Taskar}, booktitle = {European Conference on Computer Vision (ECCV)}, pages = {406--420}, title = {Cascaded models for articulated pose estimation}, year = {2010}, } @inproceedings{yadollahpour2013discriminative, author = {Payman Yadollahpour and Dhruv Batra and Gregory Shakhnarovich}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {1923--1930}, title = {Discriminative re-ranking of diverse segmentations}, year = {2013}, } @article{roberts1999bounds, author = {GO Roberts and RL Tweedie}, journal = {Stochastic Processes and their applications}, number = {2}, pages = {211--229}, title = {Bounds on regeneration times and convergence rates for {M}arkov chains}, volume = {80}, year = {1999}, } @article{meyn1994computable, author = {SP Meyn and RL Tweedie}, journal = {The Annals of Applied Probability}, number = {4}, pages = {981--1011}, title = {Computable bounds for geometric convergence rates of {M}arkov chains}, volume = {4}, year = {1994}, } 
@article{athreya1978new,
  author = {Krishna B Athreya and P Ney},
  journal = {Transactions of the American Mathematical Society},
  pages = {493--501},
  title = {A new approach to the limit theory of recurrent {M}arkov chains},
  volume = {245},
  year = {1978},
}

@article{rosenthal1995minorization,
  author = {Jeffrey S Rosenthal},
  journal = {Journal of the American Statistical Association (JASA)},
  number = {430},
  pages = {558--566},
  title = {Minorization conditions and convergence rates for {M}arkov chain {M}onte {C}arlo},
  volume = {90},
  year = {1995},
}

@article{propp1996exact,
  author = {J. G. Propp and D. B. Wilson},
  journal = {Random Structures and Algorithms},
  pages = {223--252},
  title = {Exact sampling with coupled {M}arkov chains and applications to statistical mechanics},
  volume = {9},
  year = {1996},
}

@article{murdoch1998exact,
  author = {Duncan J Murdoch and Peter J Green},
  journal = {Scandinavian Journal of Statistics},
  number = {3},
  pages = {483--502},
  title = {Exact sampling from a continuous state space},
  volume = {25},
  year = {1998},
}

@inproceedings{banarescu2013amr,
  author = {Laura Banarescu and Claire Bonial and Shu Cai and Madalina Georgescu and Kira Griffitt and Ulf Hermjakob and Kevin Knight and Philipp Koehn and Martha Palmer and Nathan Schneider},
  booktitle = {7th Linguistic Annotation Workshop and Interoperability with Discourse},
  title = {Abstract Meaning Representation for Sembanking},
  year = {2013},
}

@inproceedings{neelakantan2015compositional,
  author = {Arvind Neelakantan and Benjamin Roth and Andrew McCallum},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Compositional Vector Space Models for Knowledge Base Completion},
  year = {2015},
}

@inproceedings{socher2013reasoning,
  author = {Richard Socher and Danqi Chen and Christopher D Manning and Andrew Ng},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {926--934},
  title = {Reasoning with neural tensor networks for knowledge base completion},
  year =
{2013}, } @inproceedings{min2013distant, author = {Bonan Min and Ralph Grishman and Li Wan and Chang Wang and David Gondek}, booktitle = {North American Association for Computational Linguistics (NAACL)}, pages = {777--782}, title = {Distant Supervision for Relation Extraction with an Incomplete Knowledge Base}, year = {2013}, } @inproceedings{bordes2013translating, author = {Antoine Bordes and Nicolas Usunier and Alberto Garcia-Duran and Jason Weston and Oksana Yakhnenko}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {2787--2795}, title = {Translating embeddings for modeling multi-relational data}, year = {2013}, } @inproceedings{grefenstette2011experimental, author = {Edward Grefenstette and Mehrnoosh Sadrzadeh}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, pages = {1394--1404}, title = {Experimental support for a categorical compositional distributional model of meaning}, year = {2011}, } @article{socher2014grounded, author = {Richard Socher and Andrej Karpathy and Quoc V Le and Christopher D Manning and Andrew Y Ng}, journal = {Transactions of the Association for Computational Linguistics (TACL)}, pages = {207--218}, title = {Grounded compositional semantics for finding and describing images with sentences}, volume = {2}, year = {2014}, } @article{browne2012monte, author = {Cameron B Browne and Edward Powley and Daniel Whitehouse and Simon M Lucas and Peter I Cowling and Philipp Rohlfshagen and Stephen Tavener and Diego Perez and Spyridon Samothrakis and Simon Colton}, journal = {IEEE Transactions on Computational Intelligence and AI in Games}, pages = {1--43}, title = {A survey of {M}onte {C}arlo tree search methods}, volume = {4}, year = {2012}, } @inproceedings{dai2010decision, author = {Peng Dai and Mausam and Daniel S Weld}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {Decision-theoretic control of crowd-sourced workflows}, year = {2010}, } 
@inproceedings{koutnik2014clockwork,
  author = {Jan Koutn{\'\i}k and Klaus Greff and Faustino Gomez and J{\"u}rgen Schmidhuber},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1863--1871},
  title = {A Clockwork {RNN}},
  year = {2014},
}

@article{hochreiter1997lstm,
  author = {Sepp Hochreiter and J{\"u}rgen Schmidhuber},
  journal = {Neural Computation},
  number = {8},
  pages = {1735--1780},
  title = {Long short-term memory},
  volume = {9},
  year = {1997},
}

@article{mikolov2014learning,
  author = {Tomas Mikolov and Armand Joulin and Sumit Chopra and Michael Mathieu and Marc'Aurelio Ranzato},
  journal = {arXiv preprint arXiv:1412.7753},
  title = {Learning Longer Memory in Recurrent Neural Networks},
  year = {2014},
}

@article{le2015simple,
  author = {Quoc V Le and Navdeep Jaitly and Geoffrey E Hinton},
  journal = {arXiv preprint arXiv:1504.00941},
  title = {A Simple Way to Initialize Recurrent Networks of Rectified Linear Units},
  year = {2015},
}

@inproceedings{livni2014computational,
  author = {Roi Livni and Shai Shalev-Shwartz and Ohad Shamir},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {855--863},
  title = {On the Computational Efficiency of Training Neural Networks},
  year = {2014},
}

@inproceedings{andoni2014learning,
  author = {Alexandr Andoni and Rina Panigrahy and Gregory Valiant and Li Zhang},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1908--1916},
  title = {Learning polynomials with neural networks},
  year = {2014},
}

@article{elman1990finding,
  author = {Jeffrey L Elman},
  journal = {Cognitive Science},
  number = {2},
  pages = {179--211},
  title = {Finding structure in time},
  volume = {14},
  year = {1990},
}

@inproceedings{arora2014provable,
  author = {Sanjeev Arora and Aditya Bhaskara and Rong Ge and Tengyu Ma},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {584--592},
  title = {Provable Bounds for Learning Some Deep Representations},
  year = {2014},
}
@article{hermans2012recurrent,
  author = {Michiel Hermans and Benjamin Schrauwen},
  journal = {Neural Computation},
  number = {1},
  pages = {104--133},
  title = {Recurrent kernel machines: Computing with infinite echo state networks},
  volume = {24},
  year = {2012},
}

@article{livni2013algorithm,
  author = {Roi Livni and Shai Shalev-Shwartz and Ohad Shamir},
  journal = {arXiv preprint arXiv:1304.7045},
  title = {An Algorithm for Training Polynomial Networks},
  year = {2013},
}

@article{lukovsevivcius2009reservoir,
  author = {Mantas Luko{\v{s}}evi{\v{c}}ius and Herbert Jaeger},
  journal = {Computer Science Review},
  number = {3},
  pages = {127--149},
  title = {Reservoir computing approaches to recurrent neural network training},
  volume = {3},
  year = {2009},
}

@article{schmidhuber2007evolino,
  author = {J{\"u}rgen Schmidhuber and Daan Wierstra and Matteo Gagliolo and Faustino Gomez},
  journal = {Neural Computation},
  number = {3},
  pages = {757--779},
  title = {Training recurrent networks by {E}volino},
  volume = {19},
  year = {2007},
}

@article{cho2014gru,
  author = {Kyunghyun Cho and Bart van Merri{\"e}nboer and Dzmitry Bahdanau and Yoshua Bengio},
  journal = {arXiv preprint arXiv:1409.1259},
  title = {On the properties of neural machine translation: Encoder-decoder approaches},
  year = {2014},
}

@article{stephenson08brier,
  author = {D. B. Stephenson and C. A. S. Coelho and I. T.
Jolliffe},
  journal = {Weather and Forecasting},
  pages = {752--757},
  title = {Two Extra Components in the {B}rier Score Decomposition},
  volume = {23},
  year = {2008},
}

@article{murphy1973vector,
  author = {Allan H Murphy},
  journal = {Journal of Applied Meteorology},
  number = {4},
  pages = {595--600},
  title = {A new vector partition of the probability score},
  volume = {12},
  year = {1973},
}

@article{brocker2009decomposition,
  author = {Jochen Br{\"o}cker},
  journal = {Quarterly Journal of the Royal Meteorological Society},
  number = {643},
  pages = {1512--1519},
  title = {Reliability, sufficiency, and the decomposition of proper scores},
  volume = {135},
  year = {2009},
}

@article{brocker2012empirical,
  author = {Jochen Br{\"o}cker},
  journal = {Climate Dynamics},
  pages = {655--667},
  title = {Estimating reliability and resolution of probability forecasts through decomposition of the empirical score},
  volume = {39},
  year = {2012},
}

@article{kroemer2010combining,
  author = {O. B. Kroemer and R. Detry and J. Piater and J. Peters},
  journal = {Robotics and Autonomous Systems (RAS)},
  number = {9},
  pages = {1105--1116},
  title = {Combining active learning and reactive control for robot grasping},
  volume = {58},
  year = {2010},
}

@article{argall2009survey,
  author = {B. Argall and S. Chernova and M. Veloso and B. Browning},
  journal = {Robotics and Autonomous Systems (RAS)},
  title = {A survey of robot learning from demonstration},
  volume = {57},
  year = {2009},
}

@inproceedings{alterovitz2011rapidly,
  author = {R. Alterovitz and S. Patil and A. Derbakova},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  title = {Rapidly-exploring roadmaps: Weighing exploration vs. refinement in optimal motion planning},
  year = {2011},
}

@inproceedings{hofer2014extracting,
  author = {S. H{\"o}fer and T. Lang and O. Brock},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  title = {Extracting Kinematic Background Knowledge from Interactions Using Task-Sensitive Relational Learning},
  year = {2014},
}

@inproceedings{kulick2013active,
  author = {J.
Kulick and M. Toussaint and T. Lang and M. Lopes}, booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)}, title = {Active Learning for Teaching a Robot Grounded Relational Symbols}, year = {2013}, } @inproceedings{endres2013learning, author = {F. Endres and J. Trinkle and W. Burgard}, booktitle = {International Conference on Intelligent Robots and Systems (IROS)}, title = {Learning the dynamics of doors for robotic manipulation}, year = {2013}, } @inproceedings{nothman2012event, author = {J. Nothman and M. Honnibal and B. Hachey and J. Curran}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Event linking: Grounding event reference in a news archive}, year = {2012}, } @inproceedings{wongpiromsarn2010receding, author = {Tichakorn Wongpiromsarn and Ufuk Topcu and Richard M Murray}, booktitle = {International Conference on Hybrid Systems: Computation and Control}, pages = {101--110}, title = {Receding horizon control for temporal logic specifications}, year = {2010}, } @inproceedings{niekum2013incremental, author = {S. Niekum and S. Chitta and A. Barto and B. Marthi and S. Osentoski}, booktitle = {Robotics: Science and Systems (RSS)}, title = {Incremental Semantically Grounded Learning from Demonstration}, year = {2013}, } @inproceedings{bollini2011bakebot, author = {M. Bollini and J. Barry and D. Rus}, booktitle = {The PR2 Workshop, IROS}, title = {Bakebot: Baking cookies with the {PR2}}, year = {2011}, } @inproceedings{kollar2010grounding, author = {T. Kollar and S. Tellex and D. Roy and N. Roy}, booktitle = {International Symposium on Experimental Robotics (ISER)}, title = {Grounding Verbs of Motion in Natural Language Commands to Robots}, year = {2010}, } @inproceedings{matuszek2012learning, author = {C. Matuszek and E. Herbst and L. Zettlemoyer and D. 
Fox},
  booktitle = {International Symposium on Experimental Robotics (ISER)},
  title = {Learning to parse natural language commands to a robot control system},
  year = {2012},
}

@inproceedings{walter2013learning,
  author = {M. Walter and S. Hemachandra and B. Homberg and S. Tellex and S. Teller},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Learning Semantic Maps from Natural Language Descriptions},
  year = {2013},
}

@inproceedings{ratliff2009chomp,
  author = {N. Ratliff and M. Zucker and D. Bagnell and S. Srinivasa},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  title = {{CHOMP}: Gradient Optimization Techniques for Efficient Motion Planning},
  year = {2009},
}

@article{srinivasa2010herb,
  author = {S. Srinivasa and D. Ferguson and C. Helfrich and D. Berenson and A. Collet and R. Diankov and G. Gallagher and G. Hollinger and J. Kuffner and M. {Vande Weghe}},
  journal = {Autonomous Robots},
  number = {1},
  pages = {5--20},
  title = {{HERB}: a home exploring robotic butler},
  volume = {28},
  year = {2010},
}

@article{jiang2012placing,
  author = {Y. Jiang and M. Lim and C. Zheng and A. Saxena},
  journal = {International Journal of Robotics Research (IJRR)},
  number = {9},
  title = {Learning to Place New Objects in a Scene},
  volume = {31},
  year = {2012},
}

@inproceedings{sung2014learning,
  author = {J. Sung and B. Selman and A. Saxena},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  title = {Synthesizing Manipulation Sequences for Under-Specified Tasks using Unrolled {M}arkov Random Fields},
  year = {2014},
}

@inproceedings{cakmak2007affordances,
  author = {Maya Cakmak and Mehmet R Dogar and Emre Ugur and Erol Sahin},
  booktitle = {International Conference on Epigenetic Robotics},
  title = {Affordances as a framework for robot control},
  year = {2007},
}

@inproceedings{finucane2010ltlmop,
  author = {C. Finucane and G. Jing and H.
Kress-Gazit},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  title = {{LTLMoP}: Experimenting with language, temporal logic and robot control},
  year = {2010},
}

@inproceedings{guadarrama2013grounding,
  author = {S. Guadarrama and L. Riano and D. Golland and D. G{\"o}hring and Y. Jia and D. Klein and P. Abbeel and T. Darrell},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  title = {Grounding spatial relations for human-robot interaction},
  year = {2013},
}

@inproceedings{fasola2013using,
  author = {J. Fasola and M. J. Matari{\'c}},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  title = {Using Semantic Fields to Model Dynamic Spatial Relations in a Robot Architecture for Natural Language Instruction of Service Robots},
  year = {2013},
}

@inproceedings{lenz2013deep,
  author = {I. Lenz and H. Lee and A. Saxena},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Deep Learning for Detecting Robotic Grasps},
  year = {2013},
}

@inproceedings{chu2013haptic,
  author = {V. Chu and I. McMahon and L. Riano and C. McDonald and Q. He and J. Perez-Tejada and M. Arrigo and N. Fitter and J. Nappo and T. Darrell and others},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  title = {Using Robotic Exploratory Procedures to Learn the Meaning of Haptic Adjectives},
  year = {2013},
}

@inproceedings{kunze2013acquiring,
  author = {L. Kunze and A. Haidu and M. Beetz},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  title = {Acquiring task models for imitation learning through games with a purpose},
  year = {2013},
}

@inproceedings{ias2012execution,
  author = {D Marco and M Tenorth and K H{\"a}ussermann and O Zweigle and P Levi},
  booktitle = {International Conference on Intelligent Autonomous Systems (IAS)},
  title = {{RoboEarth} Action Recipe Execution},
  year = {2012},
}

@inproceedings{bollini2012interpreting,
  author = {M. Bollini and S.
Tellex and T. Thompson and N. Roy and D. Rus}, booktitle = {International Symposium on Experimental Robotics (ISER)}, title = {Interpreting and executing recipes with a cooking robot}, year = {2012}, } @inproceedings{kress2007structured, author = {H. Kress-Gazit and G. Fainekos and G. Pappas}, booktitle = {International Conference on Intelligent Robots and Systems (IROS)}, title = {From structured {E}nglish to robot motion}, year = {2007}, } @article{maciel2011surgical, author = {A. Maciel and G. Sankaranarayanan and T. Halic and V. Arikatla and Z. Lu and S. De}, journal = {International Journal of Computer Assisted Radiology and Surgery}, number = {4}, pages = {457--471}, title = {Surgical model-view-controller simulation software framework for local and collaborative applications}, volume = {6}, year = {2011}, } @inproceedings{zickler2009efficient, author = {S. Zickler and M. Veloso}, booktitle = {International Conference on Autonomous Agents and Multiagent Systems (AAMAS)}, pages = {27--33}, title = {Efficient physics-based planning: sampling search via non-deterministic tactics and skills}, year = {2009}, } @inproceedings{beetz2011robotic, author = {M. Beetz and U. Klank and I. Kresse and A. Maldonado and L. Mosenlechner and D. Pangercic and T. Ruhr and M. Tenorth}, booktitle = {Humanoids}, title = {Robotic roommates making pancakes}, year = {2011}, } @article{miller2012geometric, author = {S. Miller and J. Van Den Berg and M. Fritz and T. Darrell and K. Goldberg and P. Abbeel}, journal = {International Journal of Robotics Research (IJRR)}, title = {A geometric approach to robotic laundry folding}, volume = {31}, year = {2012}, } @inproceedings{nguyen2013ros, author = {H. Nguyen and M. Ciocarlie and J. Hsiao and C. C. Kemp}, booktitle = {International Conference on Robotics and Automation (ICRA)}, title = {{ROS} Commander (ROSCo): Behavior Creation for Home Robots}, year = {2013}, } @inproceedings{barry2013manipulation, author = {J. Barry and K. Hsiao and L. P. 
Kaelbling and T. Lozano-P{\'e}rez},
  booktitle = {Experimental Robotics},
  pages = {531--545},
  title = {Manipulation with multiple action types},
  year = {2013},
}

@article{lemaignan2012grounding,
  author = {S. Lemaignan and R. Ros and E. A. Sisbot and R. Alami and M. Beetz},
  journal = {International Journal of Social Robotics (IJSR)},
  number = {2},
  pages = {181--199},
  title = {Grounding the interaction: Anchoring situated discourse in everyday human-robot interaction},
  volume = {4},
  year = {2012},
}

@inproceedings{ros2010one,
  author = {R. Ros and S. Lemaignan and E. A. Sisbot and R. Alami and J. Steinwender and K. Hamann and F. Warneken},
  booktitle = {RO-MAN},
  pages = {570--575},
  title = {Which one? grounding the referent based on efficient human-robot interaction},
  year = {2010},
}

@inproceedings{chao2011towards,
  author = {Crystal Chao and Maya Cakmak and Andrea L Thomaz},
  booktitle = {International Conference on Development and Learning (ICDL)},
  pages = {1--6},
  title = {Towards grounding concepts for transfer in goal learning from demonstration},
  year = {2011},
}

@inproceedings{kaelbling2011hierarchical,
  author = {L. P. Kaelbling and T. Lozano-P{\'e}rez},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  title = {Hierarchical task and motion planning in the now},
  year = {2011},
}

@article{rintanen2012planning,
  author = {J. Rintanen},
  journal = {Artificial Intelligence},
  title = {Planning as satisfiability: Heuristics},
  volume = {193},
  year = {2012},
}

@article{anand2012semantic,
  author = {A. Anand and H. Koppula and T. Joachims and A. Saxena},
  journal = {International Journal of Robotics Research (IJRR)},
  title = {Contextually Guided Semantic Labeling and Search for 3{D} Point Clouds},
  volume = {32},
  year = {2012},
}

@inproceedings{farhadi2010attribute,
  author = {A. Farhadi and I. Endres and D.
Hoiem}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, title = {Attribute-centric recognition for cross-category generalization}, year = {2010}, } @inproceedings{tenorth2010knowrob, author = {M. Tenorth and L. Kunze and D. Jain and M. Beetz}, booktitle = {Humanoids}, title = {{KNOWROB}-{MAP}-knowledge-linked semantic object maps}, year = {2010}, } @article{chen2010training, author = {D. L. Chen and J. Kim and R. J. Mooney}, journal = {Journal of Artificial Intelligence Research (JAIR)}, number = {1}, pages = {397--436}, title = {Training a multilingual sportscaster: Using perceptual context to learn language}, volume = {37}, year = {2010}, } @inproceedings{duvallet2014inferring, author = {F. Duvallet and M. R. Walter and T. Howard and S. Hemachandra and J. Oh and S. Teller and N. Roy and A. Stentz}, booktitle = {International Symposium on Experimental Robotics (ISER)}, title = {Inferring Maps and Behaviors from Natural Language Instructions}, year = {2014}, } @inproceedings{koppula2013anticipating, author = {H. Koppula and A. Saxena}, booktitle = {Robotics: Science and Systems (RSS)}, title = {Anticipating Human Activities using Object Affordances for Reactive Robotic Response}, year = {2013}, } @inproceedings{koppula2011semantic, author = {H.S. Koppula and A. Anand and T. Joachims and A. Saxena}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Semantic Labeling of 3{D} Point Clouds for Indoor Scenes}, year = {2011}, } @inproceedings{farhadi2010every, author = {A. Farhadi and M. Hejrati and M. A. Sadeghi and P. Young and C. Rashtchian and J. Hockenmaier and D. Forsyth}, booktitle = {European Conference on Computer Vision (ECCV)}, pages = {15--29}, title = {Every picture tells a story: Generating sentences from images}, year = {2010}, } @inproceedings{wulenzsaxena2014hierarchical, author = {C. Wu and I. Lenz and A. 
Saxena},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Hierarchical Semantic Labeling for Task-Relevant {RGB-D} Perception},
  year = {2014},
}

@inproceedings{jiang2013hallucinated,
  author = {Y. Jiang and H. Koppula and A. Saxena},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Hallucinated Humans as the Hidden Context for Labeling 3{D} Scenes},
  year = {2013},
}

@book{steedman1996surface,
  author = {M. Steedman},
  publisher = {MIT Press},
  title = {Surface structure and interpretation},
  year = {1996},
}

@inproceedings{mourao2012learning,
  author = {K. Mourao and L. Zettlemoyer and R. Petrick and M. Steedman},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  title = {Learning {STRIPS} operators from noisy and incomplete observations},
  year = {2012},
}

@inproceedings{guadarrama2014open,
  author = {S Guadarrama and E Rodner and K Saenko and N Zhang and R Farrell and J Donahue and T Darrell},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Open-vocabulary object retrieval},
  year = {2014},
}

@article{akgun2012keyframe,
  author = {B. Akgun and M. Cakmak and K. Jiang and A. Thomaz},
  journal = {International Journal of Social Robotics (IJSR)},
  number = {4},
  pages = {343--355},
  title = {Keyframe-based learning from demonstration},
  volume = {4},
  year = {2012},
}

@inproceedings{hsiao2010contact,
  author = {K. Hsiao and S. Chitta and M. Ciocarlie and E. Jones},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  title = {Contact-reactive grasping of objects with partial shape information},
  year = {2010},
}

@inproceedings{misra2014tell,
  author = {DK Misra and J Sung and K Lee and A Saxena},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Tell {M}e {D}ave: Context-sensitive grounding of natural language to mobile manipulation instructions},
  year = {2014},
}

@article{montesano2008learning,
  author = {L. Montesano and M. Lopes and A. Bernardino and J.
Santos-Victor},
  journal = {IEEE Transactions on Robotics},
  number = {1},
  pages = {15--26},
  title = {Learning Object Affordances: From Sensory--Motor Coordination to Imitation},
  volume = {24},
  year = {2008},
}

@article{kjellstrom2011visual,
  author = {H. Kjellstr{\"o}m and J. Romero and D. Kragi{\'c}},
  journal = {Computer Vision and Image Understanding},
  number = {1},
  pages = {81--90},
  title = {Visual object-action recognition: Inferring object affordances from human demonstration},
  volume = {115},
  year = {2011},
}

@article{koppula2013learning,
  author = {H. S. Koppula and R. Gupta and A. Saxena},
  journal = {International Journal of Robotics Research (IJRR)},
  number = {8},
  pages = {951--970},
  title = {Learning human activities and object affordances from {RGB-D} videos},
  volume = {32},
  year = {2013},
}

@inproceedings{aydemir2011search,
  author = {A. Aydemir and K. Sj{\"o}{\"o} and J. Folkesson and A. Pronobis and P. Jensfelt},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages = {2818--2824},
  title = {Search in the real world: Active visual object search based on spatial relations},
  year = {2011},
}

@inproceedings{malmaud2014cooking,
  author = {J. Malmaud and E. Wagner and N. Chang and K. Murphy},
  booktitle = {ACL Workshop on Semantic Parsing},
  pages = {33--38},
  title = {Cooking with Semantics},
  year = {2014},
}

@inproceedings{kirk2014controlled,
  author = {N. H. Kirk and D. Nyga and M. Beetz},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages = {6667--6672},
  title = {Controlled Natural Languages for language generation in artificial cognition},
  year = {2014},
}

@inproceedings{fasola2014interpreting,
  author = {J. Fasola and M.
J. Matari{\'c}},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages = {6667--6672},
  title = {Interpreting Instruction Sequences in Spatial Language Discourse with Pragmatics towards Natural Human-Robot Interaction},
  year = {2014},
}

@inproceedings{naim2014unsupervised,
  author = {I. Naim and Y. Song and Q. Liu and H. Kautz and J. Luo and D. Gildea},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Unsupervised Alignment of Natural Language Instructions with Video Segments},
  year = {2014},
}

@inproceedings{bruce2002real,
  author = {J. Bruce and M. Veloso},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  pages = {2383--2388},
  title = {Real-time randomized path planning for robot navigation},
  volume = {3},
  year = {2002},
}

@inproceedings{mooney2008learning,
  author = {R. Mooney},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {1598--1601},
  title = {Learning to Connect Language and Perception},
  year = {2008},
}

@inproceedings{fleischman2005intentional,
  author = {M. Fleischman and D. Roy},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  pages = {104--111},
  title = {Intentional context in situated natural language learning},
  year = {2005},
}

@inproceedings{yu2013grounded,
  author = {H. Yu and J. M. Siskind},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {53--63},
  title = {Grounded Language Learning from Video Described with Sentences},
  year = {2013},
}

@inproceedings{kim2012unsupervised,
  author = {J. Kim and R.
Mooney},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  pages = {433--444},
  title = {Unsupervised {PCFG} induction for grounded language learning with highly ambiguous supervision},
  year = {2012},
}

@article{sung2015robobarista,
  author = {Jaeyong Sung and Seok Hyun Jin and Ashutosh Saxena},
  journal = {arXiv preprint arXiv:1504.03071},
  title = {Robobarista: Object Part based Transfer of Manipulation Trajectories from Crowd-sourcing in 3{D} Pointclouds},
  year = {2015},
}

@article{saxena2014robobrain,
  author = {Ashutosh Saxena and Ashesh Jain and Ozan Sener and Aditya Jami and Dipendra Kumar Misra and Hema S Koppula},
  journal = {arXiv preprint arXiv:1412.0691},
  title = {{RoboBrain}: Large-Scale Knowledge Engine for Robots},
  year = {2014},
}

@inproceedings{ren2012rgb,
  author = {Xiaofeng Ren and Liefeng Bo and Dieter Fox},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {2759--2766},
  title = {{RGB-(D)} scene labeling: Features and algorithms},
  year = {2012},
}

@article{ullman1985implementation,
  author = {Jeffrey D Ullman},
  journal = {ACM Transactions on Database Systems (TODS)},
  number = {3},
  pages = {289--321},
  title = {Implementation of logical query languages for databases},
  volume = {10},
  year = {1985},
}

@inproceedings{lenz2015deepmpc,
  author = {Ian Lenz and Ross Knepper and Ashutosh Saxena},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {{DeepMPC}: Learning Deep Latent Features for Model Predictive Control},
  year = {2015},
}

@article{yang2015embeddings,
  author = {Bishan Yang and Wen-tau Yih and Xiaodong He and Jianfeng Gao and Li Deng},
  journal = {arXiv preprint arXiv:1412.6575},
  title = {Embedding Entities and Relations for Learning and Inference in Knowledge Bases},
  year = {2015},
}

@inproceedings{lao2011pathranking,
  author = {Ni Lao and Tom Mitchell and William W Cohen},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {529--539},
  title = {Random walk inference and learning in a large
scale knowledge base},
  year = {2011},
}

@article{grefenstette2013calculus,
  author = {Edward Grefenstette},
  journal = {arXiv preprint arXiv:1304.5823},
  title = {Towards a formal distributional semantics: Simulating logical calculi with tensors},
  year = {2013},
}

@article{vilnis2014gaussian,
  author = {Luke Vilnis and Andrew McCallum},
  journal = {arXiv preprint arXiv:1412.6623},
  title = {Word Representations via {G}aussian Embedding},
  year = {2014},
}

@inproceedings{gardner2014incorporating,
  author = {Matt Gardner and Partha Talukdar and Jayant Krishnamurthy and Tom Mitchell},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Incorporating vector space similarity in random walk inference over knowledge bases},
  year = {2014},
}

@inproceedings{nickel2014reducing,
  author = {Maximilian Nickel and Xueyan Jiang and Volker Tresp},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1179--1187},
  title = {Reducing the Rank in Relational Factorization Models by Including Observable Patterns},
  year = {2014},
}

@inproceedings{rocktaschel2014lowlogic,
  author = {Tim Rockt{\"a}schel and Matko Bosnjak and Sameer Singh and Sebastian Riedel},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Low-dimensional embeddings of logic},
  year = {2014},
}

@inproceedings{perozzi2014deepwalk,
  author = {Bryan Perozzi and Rami Al-Rfou and Steven Skiena},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {701--710},
  title = {{DeepWalk}: Online learning of social representations},
  year = {2014},
}

@inproceedings{bowman2014recursive,
  author = {Samuel R. Bowman and Christopher Potts and Christopher D.
Manning},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Can recursive neural tensor networks learn logical reasoning?},
  year = {2014},
}

@inproceedings{dong2014knowledge,
  author = {Xin Dong and Evgeniy Gabrilovich and Geremy Heitz and Wilko Horn and Ni Lao and Kevin Murphy and Thomas Strohmann and Shaohua Sun and Wei Zhang},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {601--610},
  title = {Knowledge {v}ault: A web-scale approach to probabilistic knowledge fusion},
  year = {2014},
}

@inproceedings{ng1999policy,
  author = {Andrew Y Ng and Daishi Harada and Stuart Russell},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {278--287},
  title = {Policy invariance under reward transformations: Theory and application to reward shaping},
  volume = {99},
  year = {1999},
}

@article{gill2002snopt,
  author = {Philip E Gill and Walter Murray and Michael A Saunders},
  journal = {SIAM Journal on Optimization},
  number = {4},
  pages = {979--1006},
  title = {{SNOPT}: An {SQP} algorithm for large-scale constrained optimization},
  volume = {12},
  year = {2002},
}

@inproceedings{pennington2014glove,
  author = {Jeffrey Pennington and Richard Socher and Christopher D Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1532--1543},
  title = {Glo{V}e: Global Vectors for word representation},
  year = {2014},
}

@inproceedings{niculescu2005predicting,
  author = {Alexandru Niculescu-Mizil and Rich Caruana},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {625--632},
  title = {Predicting good probabilities with supervised learning},
  year = {2005},
}

@article{platt1999probabilistic,
  author = {John Platt},
  journal = {Advances in Large Margin Classifiers},
  number = {3},
  pages = {61--74},
  title = {Probabilistic outputs for support vector machines and comparisons to regularized likelihood methods},
  volume = {10},
  year =
{1999},
}

@inproceedings{zadrozny2002transforming,
  author = {Bianca Zadrozny and Charles Elkan},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {694--699},
  title = {Transforming classifier scores into accurate multiclass probability estimates},
  year = {2002},
}

@article{gneiting2007probabilistic,
  author = {Tilmann Gneiting and Fadoua Balabdaoui and Adrian E Raftery},
  journal = {Journal of the Royal Statistical Society: Series B (Statistical Methodology)},
  number = {2},
  pages = {243--268},
  title = {Probabilistic forecasts, calibration and sharpness},
  volume = {69},
  year = {2007},
}

@article{reid2011information,
  author = {Mark D Reid and Robert C Williamson},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {731--817},
  title = {Information, divergence and risk for binary experiments},
  volume = {12},
  year = {2011},
}

@article{cesabianchi06regret,
  author = {Nicol{\`o} Cesa-Bianchi and G{\'a}bor Lugosi and Gilles Stoltz},
  journal = {Mathematics of Operations Research},
  pages = {562--580},
  title = {Regret Minimization Under Partial Monitoring},
  volume = {31},
  year = {2006},
}

@article{cesabianchi05minimizing,
  author = {Nicol{\`o} Cesa-Bianchi and G{\'a}bor Lugosi and Gilles Stoltz},
  journal = {IEEE Transactions on Information Theory},
  pages = {2152--2162},
  title = {Minimizing regret with label efficient prediction},
  volume = {51},
  year = {2005},
}

@inproceedings{chai2004test,
  author = {Xiaoyong Chai and Lin Deng and Qiang Yang and Charles X Ling},
  booktitle = {International Conference on Data Mining},
  pages = {51--58},
  title = {Test-cost sensitive naive {B}ayes classification},
  year = {2004},
}

@inproceedings{esmeir2007anytime,
  author = {Saher Esmeir and Shaul Markovitch},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {425--432},
  title = {Anytime induction of cost-sensitive trees},
  year = {2007},
}

@inproceedings{bernstein2011crowds,
  author = {Michael S Bernstein and Joel Brandt and Robert
C Miller and David R Karger},
  booktitle = {User Interface Software and Technology (UIST)},
  pages = {33--42},
  title = {Crowds in Two Seconds: Enabling Realtime Crowd-powered Interfaces},
  year = {2011},
}

@book{titterington1985statistical,
  author = {D Michael Titterington and Adrian F M Smith and Udi E Makov},
  publisher = {Wiley New York},
  title = {Statistical analysis of finite mixture distributions},
  volume = {7},
  year = {1985},
}

@inproceedings{dreesen2012roots,
  author = {Philippe Dreesen and Kim Batselier and Bart De Moor},
  booktitle = {IFAC Symposium on System Identification (SYSID)},
  pages = {1203--1208},
  title = {Back to the roots: Polynomial system solving, linear algebra, systems theory},
  year = {2012},
}

@inproceedings{cohen2013experiments,
  author = {Shay B Cohen and Karl Stratos and Michael Collins and Dean P Foster and Lyle H Ungar},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {148--157},
  title = {Experiments with Spectral Learning of Latent-Variable {PCFGs}},
  year = {2013},
}

@article{hansen1982gmm,
  author = {Lars Peter Hansen},
  journal = {Econometrica: Journal of the Econometric Society},
  pages = {1029--1054},
  title = {Large sample properties of generalized method of moments estimators},
  volume = {50},
  year = {1982},
}

@book{mclachlan2004finite,
  author = {Geoffrey McLachlan and David Peel},
  publisher = {John Wiley \& Sons},
  title = {Finite mixture models},
  year = {2004},
}

@article{lasserre2001global,
  author = {Jean B Lasserre},
  journal = {SIAM Journal on Optimization},
  number = {3},
  pages = {796--817},
  title = {Global optimization with polynomials and the problem of moments},
  volume = {11},
  year = {2001},
}

@book{lasserre2011moments,
  author = {Jean Bernard Lasserre},
  publisher = {Imperial College Press},
  title = {Moments, Positive Polynomials and Their Applications},
  year = {2011},
}

@article{lasserre2008semidefinite,
  author = {Jean B Lasserre},
  journal = {Mathematical Programming},
  number = {1},
  pages = {65--92},
title = {A semidefinite programming approach to the generalized problem of moments},
  volume = {112},
  year = {2008},
}

@book{stetter2004numerical,
  author = {Hans J Stetter},
  publisher = {SIAM},
  title = {Numerical polynomial algebra},
  year = {2004},
}

@article{stetter1993multivariate,
  author = {Hans J Stetter},
  journal = {WSSIA},
  pages = {355--371},
  title = {Multivariate polynomial equations as matrix eigenproblems},
  volume = {2},
  year = {1993},
}

@article{moller1995multivariate,
  author = {H Michael M{\"o}ller and Hans J Stetter},
  journal = {Numerische Mathematik},
  number = {3},
  pages = {311--329},
  title = {Multivariate polynomial equations with multiple zeros solved by matrix eigenproblems},
  volume = {70},
  year = {1995},
}

@inproceedings{henrion2005detecting,
  author = {Didier Henrion and Jean-Bernard Lasserre},
  booktitle = {Positive polynomials in control},
  pages = {293--310},
  title = {Detecting global optimality and extracting solutions in {G}lopti{P}oly},
  year = {2005},
}

@book{hall2005generalized,
  author = {Alastair R Hall},
  publisher = {Oxford University Press},
  title = {Generalized method of moments},
  year = {2005},
}

@book{sturmfels2008algorithms,
  author = {Bernd Sturmfels},
  publisher = {Springer Science \& Business Media},
  title = {Algorithms in invariant theory},
  year = {2008},
}

@inproceedings{corless1995singular,
  author = {Robert M Corless and Patrizia M Gianni and Barry M Trager and Stephen M Watt},
  booktitle = {International Symposium on Symbolic and Algebraic Computation},
  pages = {195--207},
  title = {The singular value decomposition for polynomial systems},
  year = {1995},
}

@inproceedings{laurent2009sums,
  author = {Monique Laurent},
  booktitle = {Emerging applications of algebraic geometry},
  pages = {157--270},
  title = {Sums of squares, moment matrices and optimization over polynomials},
  year = {2009},
}

@article{parrilo2003minimizing,
  author = {Pablo A Parrilo and Bernd Sturmfels},
  journal = {Algorithmic and quantitative real algebraic geometry, DIMACS
Series in Discrete Mathematics and Theoretical Computer Science},
  pages = {83--99},
  title = {Minimizing polynomial functions},
  volume = {60},
  year = {2003},
}

@article{parrilo2003semidefinite,
  author = {Pablo A Parrilo},
  journal = {Mathematical Programming},
  number = {2},
  pages = {293--320},
  title = {Semidefinite programming relaxations for semialgebraic problems},
  volume = {96},
  year = {2003},
}

@book{curto1996solution,
  author = {Ra{\'u}l E Curto and Lawrence A Fialkow},
  publisher = {American Mathematical Society},
  title = {Solution of the truncated complex moment problem for flat data},
  volume = {568},
  year = {1996},
}

@book{curto1998flat,
  author = {Ra{\'u}l E Curto and Lawrence A Fialkow},
  publisher = {American Mathematical Society},
  title = {Flat extensions of positive moment matrices: Recursively generated relations},
  volume = {648},
  year = {1998},
}

@article{curto2000truncated,
  author = {Ra{\'u}l Curto and Lawrence Fialkow},
  journal = {Transactions of the American Mathematical Society},
  number = {6},
  pages = {2825--2855},
  title = {The truncated complex {K}-moment problem},
  volume = {352},
  year = {2000},
}

@article{curto2005truncated,
  author = {Ra{\'u}l E Curto and Lawrence A Fialkow},
  journal = {arXiv preprint arXiv:math/0507067},
  title = {Truncated {K}-moment problems in several variables},
  year = {2005},
}

@article{laurent2008sparse,
  author = {Monique Laurent},
  journal = {arXiv preprint arXiv:0812.2563},
  title = {A Sparse Flat Extension Theorem for Moment Matrices},
  year = {2008},
}

@article{laurent2009generalized,
  author = {Monique Laurent and Bernard Mourrain},
  journal = {Archiv der Mathematik},
  number = {1},
  pages = {87--98},
  title = {A generalized flat extension theorem for moment matrices},
  volume = {93},
  year = {2009},
}

@article{nie2013certifying,
  author = {Jiawang Nie},
  journal = {Mathematical Programming},
  number = {1},
  pages = {485--510},
  title = {Certifying convergence of {Lasserre}'s hierarchy via flat truncation},
  volume = {142},
  year =
{2013},
}

@article{nie2014optimality,
  author = {Jiawang Nie},
  journal = {Mathematical Programming},
  number = {1},
  pages = {97--121},
  title = {Optimality conditions and finite convergence of {Lasserre}'s hierarchy},
  volume = {146},
  year = {2014},
}

@article{nie2014truncated,
  author = {Jiawang Nie},
  journal = {Foundations of Computational Mathematics},
  number = {6},
  pages = {1243--1276},
  title = {The {A}-Truncated {K}-Moment Problem},
  volume = {14},
  year = {2014},
}

@article{nie2013linear,
  author = {Jiawang Nie},
  journal = {Mathematical Programming},
  pages = {1--28},
  title = {Linear optimization with cones of moments and nonnegative polynomials},
  year = {2013},
}

@article{corless2009symmetries,
  author = {Robert M Corless and Karin Gatermann and Ilias S Kotsireas},
  journal = {Journal of Symbolic Computation},
  number = {11},
  pages = {1536--1550},
  title = {Using symmetries in the eigenvalue method for polynomial systems},
  volume = {44},
  year = {2009},
}

@article{anandkumar2014provable,
  author = {Animashree Anandkumar and Rong Ge and Majid Janzamin},
  journal = {arXiv preprint arXiv:1408.0553},
  title = {Provable Learning of Overcomplete Latent Variable Models: Semi-supervised and Unsupervised Settings},
  year = {2014},
}

@article{pearson1894contributions,
  author = {Karl Pearson},
  journal = {Philosophical Transactions of the Royal Society of London.
A},
  pages = {71--110},
  title = {Contributions to the mathematical theory of evolution},
  volume = {185},
  year = {1894},
}

@article{anandkumar2014sample,
  author = {Anima Anandkumar and Rong Ge and Majid Janzamin},
  journal = {arXiv preprint arXiv:1408.0553},
  title = {Sample Complexity Analysis for Learning Overcomplete Latent Variable Models through Tensor Methods},
  year = {2014},
}

@book{sturmfels2002solving,
  author = {Bernd Sturmfels},
  publisher = {American Mathematical Society},
  title = {Solving systems of polynomial equations},
  year = {2002},
}

@article{hardt2014sharp,
  author = {Moritz Hardt and Eric Price},
  journal = {arXiv preprint arXiv:1404.4997},
  title = {Sharp bounds for learning a mixture of two {G}aussians},
  year = {2014},
}

@inproceedings{kalai2010efficiently,
  author = {Adam Tauman Kalai and Ankur Moitra and Gregory Valiant},
  booktitle = {Symposium on Theory of Computing (STOC)},
  pages = {553--562},
  title = {Efficiently learning mixtures of two {G}aussians},
  year = {2010},
}

@article{day1969estimating,
  author = {N E Day},
  journal = {Biometrika},
  number = {3},
  pages = {463--474},
  title = {Estimating the Components of a Mixture of Normal Distributions},
  volume = {56},
  year = {1969},
}

@article{triantafyllopoulos2002moments,
  author = {Kostas Triantafyllopoulos},
  journal = {Department of Mathematics, University of Bristol},
  title = {Moments and cumulants of the multivariate real and complex {G}aussian distributions},
  volume = {12},
  year = {2002},
}

@article{choi2011inverse,
  author = {Jaedeug Choi and Kee-Eung Kim},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {691--730},
  title = {Inverse reinforcement learning in partially observable environments},
  volume = {12},
  year = {2011},
}

@inproceedings{mansinghka2013approximate,
  author = {Vikash Mansinghka and Tejas D. Kulkarni and Yura N.
Perov and Josh Tenenbaum},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1520--1528},
  title = {Approximate {B}ayesian image interpretation using generative probabilistic graphics programs},
  year = {2013},
}

@article{fisher2012example,
  author = {Matthew Fisher and Daniel Ritchie and Manolis Savva and Thomas Funkhouser and Pat Hanrahan},
  journal = {ACM SIGGRAPH Asia},
  title = {Example-based Synthesis of 3{D} Object Arrangements},
  volume = {12},
  year = {2012},
}

@article{dawid1984prequential,
  author = {A Philip Dawid},
  journal = {Journal of the Royal Statistical Society. Series A (General)},
  pages = {278--292},
  title = {Present position and potential developments: Some personal views: Statistical theory: The prequential approach},
  volume = {147},
  year = {1984},
}

@article{brier1950verification,
  author = {Glenn W Brier},
  journal = {Monthly Weather Review},
  number = {1},
  pages = {1--3},
  title = {Verification of forecasts expressed in terms of probability},
  volume = {78},
  year = {1950},
}

@inproceedings{socher2013recursive,
  author = {Richard Socher and Alex Perelygin and Jean Y Wu and Jason Chuang and Christopher D Manning and Andrew Y Ng and Christopher Potts},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Recursive Deep Models for Semantic Compositionality Over a Sentiment Treebank},
  year = {2013},
}

@inproceedings{krizhevsky2012imagenet,
  author = {Alex Krizhevsky and Ilya Sutskever and Geoffrey E Hinton},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1097--1105},
  title = {{ImageNet} classification with deep convolutional neural networks},
  year = {2012},
}

@article{viele2002regression,
  author = {Kert Viele and Barbara Tong},
  journal = {Statistics and Computing},
  number = {4},
  pages = {315--330},
  title = {Modeling with mixtures of linear regressions},
  volume = {12},
  year = {2002},
}

@article{salimans2013fixed,
  author = {Tim Salimans and David A.
Knowles},
  journal = {Bayesian Analysis},
  number = {4},
  pages = {837--882},
  title = {Fixed-form variational posterior approximation through stochastic linear regression},
  volume = {8},
  year = {2013},
}

@inproceedings{salimans2015markov,
  author = {Tim Salimans and Diederik Kingma and Max Welling},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {{M}arkov Chain {M}onte {C}arlo and Variational Inference: Bridging the Gap},
  year = {2015},
}

@book{petrov2011coarse,
  author = {Slav Petrov and Eugene Charniak},
  publisher = {Springer Science \& Business Media},
  title = {Coarse-to-fine natural language processing},
  year = {2011},
}

@inproceedings{gimpel2010softmax,
  author = {Kevin Gimpel and Noah A. Smith},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {733--736},
  title = {Softmax-margin {CRF}s: Training log-linear models with cost functions},
  year = {2010},
}

@inproceedings{li2012twiner,
  author = {Chenliang Li and Jianshu Weng and Qi He and Yuxia Yao and Anwitaman Datta and Aixin Sun and Bu-Sung Lee},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  pages = {721--730},
  title = {Twiner: named entity recognition in targeted twitter stream},
  year = {2012},
}

@inproceedings{deng2009imagenet,
  author = {Jia Deng and Wei Dong and Richard Socher and Li-Jia Li and Kai Li and Li Fei-Fei},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {248--255},
  title = {{I}mage{N}et: A large-scale hierarchical image database},
  year = {2009},
}

@inproceedings{kokkalis2013emailvalet,
  author = {Nicolas Kokkalis and Thomas K{\"o}hn and Carl Pfeiffer and Dima Chornyi and Michael S Bernstein and Scott R Klemmer},
  booktitle = {Conference on Computer Supported Cooperative Work},
  pages = {1291--1300},
  title = {EmailValet: Managing email overload through private, accountable crowdsourcing},
  year = {2013},
}

@inproceedings{bernstein2010soylent,
  author = {Michael S Bernstein and Greg Little and
Robert C Miller and Bj{\"o}rn Hartmann and Mark S Ackerman and David R Karger and David Crowell and Katrina Panovich},
  booktitle = {User Interface Software and Technology (UIST)},
  pages = {313--322},
  title = {Soylent: a word processor with a crowd inside},
  year = {2010},
}

@inproceedings{yan2011active,
  author = {Yan Yan and Glenn M Fung and R{\'o}mer Rosales and Jennifer G Dy},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1161--1168},
  title = {Active learning from crowds},
  year = {2011},
}

@inproceedings{donmez2008proactive,
  author = {Pinar Donmez and Jaime G Carbonell},
  booktitle = {Conference on Information and Knowledge Management (CIKM)},
  pages = {619--628},
  title = {Proactive learning: cost-sensitive active learning with multiple imperfect oracles},
  year = {2008},
}

@inproceedings{settles2008analysis,
  author = {Burr Settles and Mark Craven},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1070--1079},
  title = {An analysis of active learning strategies for sequence labeling tasks},
  year = {2008},
}

@article{greiner2002learning,
  author = {Russell Greiner and Adam J Grove and Dan Roth},
  journal = {Artificial Intelligence},
  number = {2},
  pages = {137--174},
  title = {Learning cost-sensitive active classifiers},
  volume = {139},
  year = {2002},
}

@inproceedings{cheng2013feedback,
  author = {Yu Cheng and Zhengzhang Chen and Lu Liu and Jiang Wang and Ankit Agrawal and Alok Choudhary},
  booktitle = {Conference on Information and Knowledge Management (CIKM)},
  pages = {1311--1320},
  title = {Feedback-driven multiclass active learning for data streams},
  year = {2013},
}

@inproceedings{helmbold1997some,
  author = {David Helmbold and Sandra Panizza},
  booktitle = {Conference on Learning Theory (COLT)},
  pages = {218--230},
  title = {Some label efficient learning results},
  year = {1997},
}

@inproceedings{agarwal2013selective,
  author = {Alekh Agarwal},
  booktitle = {International Conference on Machine Learning
(ICML)},
  pages = {1220--1228},
  title = {Selective sampling algorithms for cost-sensitive multiclass prediction},
  year = {2013},
}

@inproceedings{chu2011unbiased,
  author = {Wei Chu and Martin Zinkevich and Lihong Li and Achint Thomas and Belle Tseng},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {195--203},
  title = {Unbiased online active learning in data streams},
  year = {2011},
}

@inproceedings{golovin2010near,
  author = {Daniel Golovin and Andreas Krause and Debajyoti Ray},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {766--774},
  title = {Near-optimal {B}ayesian active learning with noisy observations},
  year = {2010},
}

@inproceedings{tong2000active,
  author = {Simon Tong and Daphne Koller},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {647--653},
  title = {Active learning for parameter estimation in {B}ayesian networks},
  volume = {13},
  year = {2000},
}

@inproceedings{roth2006active,
  author = {Dan Roth and Kevin Small},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Active learning with {P}erceptron for structured output},
  year = {2006},
}

@inproceedings{angeli2014combining,
  author = {Gabor Angeli and Julie Tibshirani and Jean Y Wu and Christopher D Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Combining distant and partial supervision for relation extraction},
  year = {2014},
}

@inproceedings{lasecki2013conversations,
  author = {Walter Stephen Lasecki and Ece Kamar and Dan Bohus},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Conversations in the crowd: Collecting data for task-oriented dialog learning},
  year = {2013},
}

@inproceedings{culotta2005reducing,
  author = {Aron Culotta and Andrew McCallum},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {746--751},
  title = {Reducing labeling
effort for structured prediction tasks},
  year = {2005},
}

@article{he2015delving,
  author = {Kaiming He and Xiangyu Zhang and Shaoqing Ren and Jian Sun},
  journal = {arXiv preprint arXiv:1502.01852},
  title = {Delving deep into rectifiers: Surpassing human-level performance on {ImageNet} classification},
  year = {2015},
}

@article{singla2014near,
  author = {Adish Singla and Ilija Bogunovic and G{\'a}bor Bart{\'o}k and Amin Karbasi and Andreas Krause},
  journal = {arXiv preprint arXiv:1402.2092},
  title = {Near-Optimally Teaching the Crowd to Classify},
  year = {2014},
}

@inproceedings{seung1992query,
  author = {H Sebastian Seung and Manfred Opper and Haim Sompolinsky},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Query by committee},
  year = {1992},
}

@inproceedings{lasecki2011realtime,
  author = {Walter S Lasecki and Kyle I Murray and Samuel White and Robert C Miller and Jeffrey P Bigham},
  booktitle = {User Interface Software and Technology (UIST)},
  pages = {23--32},
  title = {Real-time crowd control of existing interfaces},
  year = {2011},
}

@inproceedings{gao2011active,
  author = {Tianshi Gao and Daphne Koller},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1062--1070},
  title = {Active classification based on value of classifier},
  year = {2011},
}

@inproceedings{sculley2007online,
  author = {D Sculley},
  booktitle = {Conference on Email and Anti-spam (CEAS)},
  title = {Online Active Learning Methods for Fast Label-Efficient Spam Filtering},
  year = {2007},
}

@article{sutton1988learning,
  author = {Richard S Sutton},
  journal = {Machine Learning},
  number = {1},
  pages = {9--44},
  title = {Learning to predict by the methods of temporal differences},
  volume = {3},
  year = {1988},
}

@inproceedings{kocsis2006bandit,
  author = {Levente Kocsis and Csaba Szepesv{\'a}ri},
  booktitle = {European Conference on Machine Learning (ECML)},
  pages = {282--293},
  title = {Bandit based {M}onte-{C}arlo planning},
  year =
{2006},
}

@inproceedings{weiss2013adaptive,
  author = {David J Weiss and Ben Taskar},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {953--961},
  title = {Learning adaptive value of information for structured prediction},
  year = {2013},
}

@book{guo2009continuous,
  author = {Xianping Guo and On{\'e}simo Hern{\'a}ndez-Lerma},
  publisher = {Springer},
  title = {Continuous-time {M}arkov decision processes},
  year = {2009},
}

@book{dattorro05convexoptimization,
  author = {Jon Dattorro},
  publisher = {Meboo},
  title = {Convex Optimization and Euclidean Distance Geometry},
  year = {2005},
}

@inproceedings{zhang2014lower,
  author = {Yuchen Zhang and Martin J. Wainwright and Michael I. Jordan},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Lower bounds on the performance of polynomial-time algorithms for sparse linear regression},
  year = {2014},
}

@article{natarajan1995sparse,
  author = {Balas K. Natarajan},
  journal = {SIAM Journal on Computing},
  number = {2},
  pages = {227--234},
  title = {Sparse approximate solutions to linear systems},
  volume = {24},
  year = {1995},
}

@article{turing1950computing,
  author = {Alan M Turing},
  journal = {Mind},
  pages = {433--460},
  title = {Computing machinery and intelligence},
  volume = {59},
  year = {1950},
}

@phdthesis{bobrow1964student,
  author = {Daniel G Bobrow},
  school = {Massachusetts Institute of Technology},
  title = {Natural language input for a computer problem solving system},
  year = {1964},
}

@inproceedings{zhao2015type,
  author = {Kai Zhao and Liang Huang},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Type-Driven Incremental Semantic Parsing with Polymorphism},
  year = {2015},
}

@inproceedings{dahl1994expanding,
  author = {Deborah A Dahl and Madeleine Bates and Michael Brown and William Fisher and Kate Hunicke-Smith and David Pallett and Christine Pao and Alexander Rudnicky and Elizabeth Shriberg},
  booktitle = {Workshop on Human Language Technology},
pages = {43--48},
  title = {Expanding the scope of the {ATIS} task: The {ATIS-3} corpus},
  year = {1994},
}

@inproceedings{yih2015stagg,
  author = {Wen-tau Yih and Ming-Wei Chang and Xiaodong He and Jianfeng Gao},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Semantic Parsing via Staged Query Graph Generation: Question Answering with Knowledge Base},
  year = {2015},
}

@inproceedings{erk2008structured,
  author = {Katrin Erk and Sebastian Pad{\'o}},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {897--906},
  title = {A structured vector space model for word meaning in context},
  year = {2008},
}

@inproceedings{yang2015smart,
  author = {Yi Yang and Ming-Wei Chang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {{S-MART}: Novel Tree-based Structured Learning Algorithms Applied to Tweet Entity Linking},
  year = {2015},
}

@inproceedings{huang2007forest,
  author = {Liang Huang and David Chiang},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Forest Rescoring: Faster Decoding with Integrated Language Models},
  year = {2007},
}

@article{vinyals2014show,
  author = {Oriol Vinyals and Alexander Toshev and Samy Bengio and Dumitru Erhan},
  journal = {arXiv preprint arXiv:1411.4555},
  title = {Show and tell: A neural image caption generator},
  year = {2014},
}

@inproceedings{sutskever2014sequence,
  author = {Ilya Sutskever and Oriol Vinyals and Quoc V.
Le},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {3104--3112},
  title = {Sequence to sequence learning with neural networks},
  year = {2014},
}

@inproceedings{bahdanau2015neural,
  author = {Dzmitry Bahdanau and Kyunghyun Cho and Yoshua Bengio},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Neural machine translation by jointly learning to align and translate},
  year = {2015},
}

@article{joulin2015stack,
  author = {Armand Joulin and Tomas Mikolov},
  journal = {arXiv preprint arXiv:1503.01007},
  title = {Inferring Algorithmic Patterns with Stack-Augmented Recurrent Nets},
  year = {2015},
}

@article{xu2015attend,
  author = {Kelvin Xu and Jimmy Lei Ba and Ryan Kiros and Kyunghyun Cho and Aaron Courville and Ruslan Salakhutdinov and Richard S. Zemel and Yoshua Bengio},
  journal = {arXiv preprint arXiv:1502.03044},
  title = {Show, Attend and Tell: Neural Image Caption Generation with Visual Attention},
  year = {2015},
}

@article{coulom2007computing,
  author = {R{\'e}mi Coulom},
  journal = {Computer Games Workshop},
  title = {Computing {Elo} ratings of move patterns in the game of {Go}},
  year = {2007},
}

@inproceedings{yin2015convolutional,
  author = {Wenpeng Yin and Hinrich Sch{\"u}tze},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Convolutional neural network for paraphrase identification},
  year = {2015},
}

@inproceedings{hu2014convolutional,
  author = {Baotian Hu and Zhengdong Lu and Hang Li and Qingcai Chen},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Convolutional neural network architectures for matching natural language sentences},
  year = {2014},
}

@inproceedings{bowman2015large,
  author = {Samuel Bowman and Gabor Angeli and Christopher Potts and Christopher D.
Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {A large annotated corpus for learning natural language inference},
  year = {2015},
}

@inproceedings{tai2015improved,
  author = {Kai Sheng Tai and Richard Socher and Christopher D. Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Improved Semantic Representations From Tree-Structured Long Short-Term Memory Networks},
  year = {2015},
}

@inproceedings{he2015multi,
  author = {Hua He and Kevin Gimpel and Jimmy Lin},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Multi-Perspective Sentence Similarity Modeling with Convolutional Neural Networks},
  year = {2015},
}

@article{rochtaschel2015reasoning,
  author = {Tim Rockt{\"{a}}schel and Edward Grefenstette and Karl Moritz Hermann and Tom{\'{a}}s Kocisk{\'{y}} and Phil Blunsom},
  journal = {arXiv preprint arXiv:1509.06664},
  title = {Reasoning about Entailment with Neural Attention},
  year = {2015},
}

@article{mnih2015human,
  author = {Volodymyr Mnih and Koray Kavukcuoglu and David Silver and Andrei A. Rusu and Joel Veness and Marc G. Bellemare and Alex Graves and Martin Riedmiller and Andreas K.
Fidjeland and Georg Ostrovski and others},
  journal = {Nature},
  number = {7540},
  pages = {529--533},
  title = {Human-level control through deep reinforcement learning},
  volume = {518},
  year = {2015},
}

@article{nielsen2009statistical,
  author = {Frank Nielsen and Vincent Garcia},
  journal = {arXiv preprint arXiv:0911.4863},
  title = {Statistical exponential families: A digest with flash cards},
  year = {2009},
}

@article{ganchev10posterior,
  author = {Kuzman Ganchev and Jo{\~a}o Gra{\c{c}}a and Jennifer Gillenwater and Ben Taskar},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {2001--2049},
  title = {Posterior Regularization for Structured Latent Variable Models},
  volume = {11},
  year = {2010},
}

@inproceedings{he2012cost,
  author = {He He and Hal {Daum{\'e} III} and Jason Eisner},
  booktitle = {ICML Inferning Workshop},
  title = {Cost-sensitive dynamic feature selection},
  year = {2012},
}

@inproceedings{he2013dynamic,
  author = {He He and Hal {Daum{\'e} III} and Jason Eisner},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1455--1464},
  title = {Dynamic Feature Selection for Dependency Parsing},
  year = {2013},
}

@article{balle2014spectral,
  author = {Borja Balle and Xavier Carreras and Franco M. Luque and Ariadna Quattoni},
  journal = {Machine Learning},
  number = {1},
  pages = {33--63},
  title = {Spectral learning of weighted automata - a forward-backward perspective},
  volume = {96},
  year = {2014},
}

@inproceedings{ozay2010gpca,
  author = {Necmiye Ozay and Mario Sznaier and Constantino M. Lagoa and Octavia I.
Camps}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {3209--3216}, title = {{GPCA} with denoising: a moments-based convex approach}, year = {2010}, } @article{freund2004sensitivity, author = {Roland W Freund and Florian Jarre}, journal = {Operations Research Letters}, pages = {126--132}, title = {A sensitivity result for semidefinite programs}, volume = {32}, year = {2004}, } @misc{buja05lossfunctions, author = {Andreas Buja and Werner Stuetzle and Yi Shen}, title = {Loss Functions for Binary Class Probability Estimation and Classification: Structure and Applications}, year = {2005}, } @misc{foster98asymptoticcalibration, author = {Dean P. Foster and Rakesh V. Vohra}, title = {Asymptotic calibration}, year = {1998}, } @article{dawid1982well, author = {Dawid, A. Philip}, journal = {Journal of the American Statistical Association (JASA)}, number = {379}, pages = {605--610}, title = {The Well-Calibrated {B}ayesian}, volume = {77}, year = {1982}, } @inproceedings{menon2012ranking, author = {Aditya Krishna Menon and Xiaoqian Jiang and Shankar Vembu and Charles Elkan and Lucila Ohno{-}Machado}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Predicting accurate probabilities with a ranking loss}, year = {2012}, } @inproceedings{zhong2013accurate, author = {Leon Wenliang Zhong and James Kwok}, booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)}, pages = {1939--1945}, title = {Accurate Probability Calibration for Multiple Classifiers}, year = {2013}, } @phdthesis{seigel2013confidence, author = {Matthew Seigel}, school = {University of Cambridge}, title = {Confidence Estimation for Automatic Speech Recognition Hypotheses}, year = {2013}, } @article{jiang2012calibrating, author = {Xiaoqian Jiang and Melanie Osl and Jihoon Kim and Lucila Ohno{-}Machado}, journal = {Journal of the American Medical Informatics Association}, number = {2}, pages = {263--274}, title = {Calibrating predictive model 
estimates to support personalized medicine}, volume = {19}, year = {2012}, } @article{yu2011calibration, author = {Dong Yu and Jinyu Li and Li Deng}, journal = {Trans. Audio, Speech and Lang. Proc.}, number = {8}, pages = {2461--2473}, title = {Calibration of Confidence Measures in Speech Recognition}, volume = {19}, year = {2011}, } @inproceedings{nguyen2015posterior, author = {Khanh Nguyen and Brendan O'Connor}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, pages = {1587--1598}, title = {Posterior calibration and exploratory analysis for natural language processing models}, year = {2015}, } @article{heckerman92towardsnormative, author = {David E. Heckerman and Bharat N. Nathwani}, journal = {Methods Archive}, number = {2}, pages = {106--116}, title = {Towards normative expert systems: Probability-based representations for efficient knowledge acquisition and inference}, volume = {31}, year = {1992}, } @book{lichtenstein1982calibration, author = {Sarah Lichtenstein and Baruch Fischhoff and Lawrence D. Phillips}, publisher = {Cambridge University Press}, title = {Judgement under Uncertainty: Heuristics and Biases}, year = {1982}, } @phdthesis{mueller2013semantic, author = {Andreas Mueller}, school = {University of Bonn}, title = {Methods for Learning Structured Prediction in Semantic Segmentation of Natural Images}, year = {2013}, } @techreport{krizhevsky2009learningmultiple, author = {Alex Krizhevsky}, institution = {University of Toronto}, title = {Learning multiple layers of features from tiny images}, year = {2009}, } @article{coates2012features, author = {Adam Coates and Andrew Y. 
Ng}, journal = {Neural Networks: Tricks of the Trade - Second Edition}, number = {1}, pages = {561--580}, title = {Learning Feature Representations with {K}-Means}, volume = {2}, year = {2012}, } @inproceedings{artzi2015broad, author = {Yoav Artzi and Kenton Lee Luke Zettlemoyer}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Broad-coverage {CCG} Semantic Parsing with {AMR}}, year = {2015}, } @inproceedings{weston2015memory, author = {Jason Weston and Sumit Chopra and Antoine Bordes}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Memory Networks}, year = {2015}, } @article{hinton2012improving, author = {Geoffrey E Hinton and Nitish Srivastava and Alex Krizhevsky and Ilya Sutskever and Ruslan R Salakhutdinov}, journal = {arXiv preprint arXiv:1207.0580}, title = {Improving neural networks by preventing co-adaptation of feature detectors}, year = {2012}, } @inproceedings{ba2013adaptive, author = {Jimmy Ba and Brendan Frey}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {3084--3092}, title = {Adaptive dropout for training deep neural networks}, year = {2013}, } @inproceedings{baldi2013understanding, author = {Pierre Baldi and Peter J Sadowski}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {2814--2822}, title = {Understanding dropout}, year = {2013}, } @inproceedings{maaten2013learning, author = {Laurens van der Maaten and Minmin Chen and Stephen Tyree and Kilian Q Weinberger}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {410--418}, title = {Learning with marginalized corrupted features}, year = {2013}, } @inproceedings{wan2013regularization, author = {Li Wan and Matthew Zeiler and Sixin Zhang and Yann L Cun and Rob Fergus}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {1058--1066}, title = {Regularization of neural networks using dropconnect}, year = {2013}, } 
@inproceedings{goodfellow2013maxout,
  author = {Ian Goodfellow and David Warde-Farley and Mehdi Mirza and Aaron Courville and Yoshua Bengio},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1319--1327},
  title = {Maxout Networks},
  year = {2013},
}

@inproceedings{vinyals2015grammar,
  author = {Oriol Vinyals and Lukasz Kaiser and Terry Koo and Slav Petrov and Ilya Sutskever and Geoffrey Hinton},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2755--2763},
  title = {Grammar as a Foreign Language},
  year = {2015},
}

@inproceedings{vinyals2015pointer,
  author = {Oriol Vinyals and Meire Fortunato and Navdeep Jaitly},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2674--2682},
  title = {Pointer Networks},
  year = {2015},
}

@inproceedings{grefenstette2014deep,
  author = {Edward Grefenstette and Phil Blunsom and Nando de Freitas and Karl Moritz Hermann},
  booktitle = {ACL Workshop on Semantic Parsing},
  pages = {22--27},
  title = {A Deep Architecture for Semantic Parsing},
  year = {2014},
}

@inproceedings{luong2015translation,
  author = {Minh-Thang Luong and Hieu Pham and Christopher D. Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1412--1421},
  title = {Effective Approaches to Attention-based Neural Machine Translation},
  year = {2015},
}

@inproceedings{bergstra2010theano,
  author = {James Bergstra and Olivier Breuleux and Fr{\'{e}}d{\'{e}}ric Bastien and Pascal Lamblin and Razvan Pascanu and Guillaume Desjardins and Joseph Turian and David Warde-Farley and Yoshua Bengio},
  booktitle = {Python for Scientific Computing Conference},
  title = {Theano: a {CPU} and {GPU} Math Expression Compiler},
  year = {2010},
}

@article{yin2015enquirer,
  author = {Pengcheng Yin and Zhengdong Lu and Hang Li and Ben Kao},
  journal = {arXiv preprint arXiv:1512.00965},
  title = {Neural Enquirer: Learning to Query Tables},
  year = {2015},
}

@article{bordes2015simple,
  author = {Antoine Bordes and Nicolas Usunier and Sumit Chopra and Jason Weston},
  journal = {arXiv preprint arXiv:1506.02075},
  title = {Large-scale Simple Question Answering with Memory Networks},
  year = {2015},
}

@inproceedings{wang2013fast,
  author = {Sida I. Wang and Christopher Manning},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {118--126},
  title = {Fast dropout training},
  year = {2013},
}

@article{mcallester2013pac,
  author = {David McAllester},
  journal = {arXiv preprint arXiv:1307.2118},
  title = {A {PAC-Bayesian} tutorial with a dropout bound},
  year = {2013},
}

@article{josse2014stable,
  author = {Julie Josse and Stefan Wager},
  journal = {arXiv preprint arXiv:1410.8275},
  title = {Stable Autoencoding: A Flexible Framework for Regularized Low-Rank Matrix Estimation},
  year = {2014},
}

@article{baldi2014dropout,
  author = {Pierre Baldi and Peter Sadowski},
  journal = {Artificial Intelligence},
  pages = {78--122},
  title = {The dropout learning algorithm},
  volume = {210},
  year = {2014},
}

@article{srivastava2014dropout,
  author = {Nitish Srivastava and Geoffrey Hinton and Alex Krizhevsky and Ilya Sutskever and Ruslan Salakhutdinov},
  journal = {Journal of Machine Learning Research (JMLR)},
  number = {1},
  pages = {1929--1958},
  title = {Dropout: A simple way to prevent neural networks from overfitting},
  volume = {15},
  year = {2014},
}

@inproceedings{globerson2006nightmare,
  author = {Amir Globerson and Sam Roweis},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {353--360},
  title = {Nightmare at test time: Robust learning by feature deletion},
  year = {2006},
}

@article{bishop1995training,
  author = {Chris M Bishop},
  journal = {Neural Computation},
  number = {1},
  pages = {108--116},
  title = {Training with noise is equivalent to Tikhonov regularization},
  volume = {7},
  year = {1995},
}

% A chapter of an edited volume: the volume title goes in booktitle and the
% publisher field holds only the publisher.
@incollection{simard1998transformation,
  author = {Patrice Y Simard and Yann A LeCun and John S Denker and Bernard Victorri},
  booktitle = {Neural Networks: Tricks of the Trade},
  pages = {239--274},
  publisher = {Springer},
  title = {Transformation Invariance in Pattern Recognition---Tangent Distance and Tangent Propagation},
  year = {1998},
}

% NOTE(review): the first author's given name was garbled ("Simard P") and has been
% restored. The remaining author list may still not match this title and page range;
% please verify against the published proceedings before relying on it.
@inproceedings{scholkopf1997improving,
  author = {Bernhard Sch{\"o}lkopf and Patrice Simard and Vladimir Vapnik and A. J. Smola},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {375--381},
  title = {Improving the accuracy and speed of support vector machines},
  year = {1997},
}

@article{abu1990learning,
  author = {Yaser S Abu-Mostafa},
  journal = {Journal of Complexity},
  number = {2},
  pages = {192--198},
  title = {Learning from hints in neural networks},
  volume = {6},
  year = {1990},
}

@article{efron1975efficiency,
  author = {Bradley Efron},
  journal = {Journal of the American Statistical Association (JASA)},
  number = {352},
  pages = {892--898},
  title = {The efficiency of logistic regression compared to normal discriminant analysis},
  volume = {70},
  year = {1975},
}

@article{janzamin2015beating,
  author = {Majid Janzamin and Hanie Sedghi and Anima Anandkumar},
  journal = {arXiv preprint arXiv:1506.08473},
  title = {Beating the perils of non-convexity: Guaranteed training of neural networks using tensor methods},
  year = {2015},
}

@inproceedings{luong2015rare,
  author = {Minh-Thang Luong and Ilya Sutskever and Quoc V. Le and Oriol Vinyals and Wojciech Zaremba},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {11--19},
  title = {Addressing the Rare Word Problem in Neural Machine Translation},
  year = {2015},
}

@inproceedings{mei2016listen,
  author = {Hongyuan Mei and Mohit Bansal and Matthew R Walter},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Listen, attend, and walk: Neural mapping of navigational instructions to action sequences},
  year = {2016},
}

@article{artzi2013uw,
  author = {Yoav Artzi and Luke Zettlemoyer},
  journal = {arXiv preprint arXiv:1311.3011},
  title = {{UW} {SPF}: The {University} of {Washington} Semantic Parsing Framework},
  year = {2013},
}

@inproceedings{dyer2015transition,
  author = {Chris Dyer and Miguel Ballesteros and Wang Ling and Austin Matthews and Noah A Smith},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Transition-based dependency parsing with stack long short-term memory},
  year = {2015},
}

@inproceedings{mitchell1977version,
  author = {Tom M Mitchell},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  pages = {305--310},
  title = {Version spaces: A candidate elimination approach to rule learning},
  year = {1977},
}

@inproceedings{lau2000version,
  author = {Tessa A Lau and Pedro Domingos and Daniel S Weld},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {527--534},
  title = {Version Space Algebra and its Application to Programming by Demonstration},
  year = {2000},
}

@article{vanlehn1987version,
  author = {Kurt Vanlehn and William Ball},
  journal = {Machine Learning},
  number = {1},
  pages = {39--74},
  title = {A version space approach to learning context-free grammars},
  volume = {2},
  year = {1987},
}

@article{robins2000inference,
  author = {Robins, James M and Wang, Naisyin},
  journal = {Biometrika},
  number = {1},
  pages = {113--124},
  title = {Inference for imputation estimators},
  volume = {87},
  year = {2000},
}
@article{demp1977em, author = {A. P. Dempster and Laird N. M. and Rubin D. B.}, journal = {Journal of the Royal Statistical Society: Series B}, number = {1}, pages = {1--38}, title = {Maximum likelihood from incomplete data via the {EM} algorithm}, volume = {39}, year = {1977}, } @article{maron1998framework, author = {Maron, Oded and Lozano-P{\'e}rez, Tom{\'a}s}, journal = {Advances in neural information processing systems}, pages = {570--576}, title = {A framework for multiple-instance learning}, year = {1998}, } @inproceedings{auer1997multiple, author = {Peter Auer}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {21--29}, title = {On Learning From Multi-Instance Examples: Empirical Evaluation of a Theoretical Approach}, year = {1997}, } @mastersthesis{platanios2015estimating, author = {Emmanouil Antonios Platanios}, school = {Carnegie Mellon University}, title = {Estimating Accuracy from Unlabeled Data}, year = {2015}, } @inproceedings{platanios2014estimating, author = {Emmanouil Antonios Platanios and Avrim Blum and Tom M. Mitchell}, booktitle = {Uncertainty in Artificial Intelligence (UAI)}, title = {Estimating Accuracy from Unlabeled Data}, year = {2014}, } @article{bottou2013counterfactual, author = {L\'eon Bottou and Jonas Peters and Joaquin {Qui\~nonero-Candela} and Denis X. Charles and D. 
Max Chickering and Elon Portugaly and Dipankar Ray and Patrice Simard and Ed Snelson}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {3207--3260}, title = {Counterfactual Reasoning and Learning Systems: The Example of Computational Advertising}, volume = {14}, year = {2013}, } @inproceedings{gopalan2011domain, author = {Raghuraman Gopalan and Ruonan Li and Rama Chellappa}, booktitle = {International Conference on Computer Vision (ICCV)}, pages = {999--1006}, title = {Domain adaptation for object recognition: An unsupervised approach}, year = {2011}, } @article{shimodaira2000improving, author = {Hidetoshi Shimodaira}, journal = {Journal of Statistical Planning and Inference}, pages = {227--244}, title = {Improving predictive inference under covariate shift by weighting the log-likelihood function}, volume = {90}, year = {2000}, } @book{quinonero2009dataset, author = {Joaquin {Qui\~nonero-Candela} and Masashi Sugiyama and Anton Schwaighofer and Neil D. Lawrence}, publisher = {The MIT Press}, title = {Dataset shift in machine learning}, year = {2009}, } @phdthesis{klein2005thesis, author = {Dan Klein}, school = {Stanford University}, title = {The Unsupervised Learning of Natural Language Structure}, year = {2005}, } @inproceedings{nigam1998learning, author = {Kamal Nigam and Andrew McCallum and Sebastian Thrun and Tom Mitchell}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {Learning to classify text from labeled and unlabeled documents}, year = {1998}, } @article{dawid1979maximum, author = {Alexander Philip Dawid and Allan M. Skene}, journal = {Applied Statistics}, pages = {20--28}, title = {Maximum likelihood estimation of observer error-rates using the {EM} algorithm}, volume = {1}, year = {1979}, } @inproceedings{jaffe2015estimating, author = {A. Jaffe and B. Nadler and Y. 
Kluger}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, pages = {407--415}, title = {Estimating the accuracies of multiple classifiers without labeled data}, year = {2015}, } @inproceedings{sculley2015hidden, author = {D. Sculley and Gary Holt and Daniel Golovin and Eugene Davydov and Todd Phillips and Dietmar Ebner and Vinay Chaudhary and Michael Young and Jean-Fran{\c{c}}ois Crespo and Dan Dennison}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {2494--2502}, title = {Hidden Technical Debt in Machine Learning Systems}, year = {2015}, } @misc{bottou2015two, author = {L\'eon Bottou}, howpublished = {Invited talk at the 32nd International Conference on Machine Learning}, title = {Two high stakes challenges in machine learning}, year = {2015}, } @inproceedings{blitzer2011domain, author = {John Blitzer and Sham Kakade and Dean P. Foster}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, pages = {173--181}, title = {Domain adaptation with coupled subspaces}, year = {2011}, } @article{edmonds1972theoretical, author = {Jack Edmonds and Richard M. Karp}, journal = {Journal of the ACM (JACM)}, number = {2}, pages = {248--264}, title = {Theoretical improvements in algorithmic efficiency for network flow problems}, volume = {19}, year = {1972}, } @article{tomizawa1971techniques, author = {N. Tomizawa}, journal = {Networks}, number = {2}, pages = {173--194}, title = {On some techniques useful for solution of transportation network problems}, volume = {1}, year = {1971}, } @incollection{newey1994large, author = {Whitney K. Newey and Daniel McFadden}, booktitle = {Handbook of Econometrics}, pages = {2111--2245}, title = {Large sample estimation and hypothesis testing}, volume = {4}, year = {1994}, } @incollection{taylor2008medical, author = {Russell H. 
Taylor and Arianna Menciassi and Gabor Fichtinger and Paolo Dario}, booktitle = {Springer Handbook of Robotics}, pages = {1199--1222}, title = {Medical robotics and computer-integrated surgery}, year = {2008}, } @article{bousquet2004introduction, author = {Olivier Bousquet and St{\'e}phane Boucheron and G{\'a}bor Lugosi}, journal = {Advanced Lectures on Machine Learning}, pages = {169--207}, title = {Introduction to statistical learning theory}, year = {2004}, } @article{lorentz1966metric, author = {G. G. Lorentz}, journal = {Bulletin of the American Mathematical Society}, number = {6}, pages = {903--937}, title = {Metric entropy and approximation}, volume = {72}, year = {1966}, } @article{kolmogorov1959varepsilon, author = {Andrei Nikolaevich Kolmogorov and Vladimir Mikhailovich Tikhomirov}, journal = {Uspekhi Matematicheskikh Nauk}, number = {2}, pages = {3--86}, title = {$\varepsilon$-entropy and $\varepsilon$-capacity of sets in function spaces}, volume = {14}, year = {1959}, } @article{fan1953minimax, author = {Ky Fan}, journal = {Proceedings of the National Academy of Sciences of the United States of America}, pages = {42--47}, title = {Minimax theorems}, volume = {39}, year = {1953}, } @article{lovasz1975ratio, author = {L{\'a}szl{\'o} Lov{\'a}sz}, journal = {Discrete Mathematics}, number = {4}, pages = {383--390}, title = {On the ratio of optimal integral and fractional covers}, volume = {13}, year = {1975}, } @book{boucheron2013concentration, author = {St{\'e}phane Boucheron and G{\'a}bor Lugosi and Pascal Massart}, publisher = {Oxford University Press}, title = {Concentration inequalities: A nonasymptotic theory of independence}, year = {2013}, } @inproceedings{snyder2010climbing, author = {Benjamin Snyder and Regina Barzilay}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Climbing the tower of Babel: Unsupervised multilingual learning}, year = {2010}, } @article{talagrand1996majorizing, author = {Michel Talagrand}, journal = 
{The Annals of Probability}, pages = {1049--1103}, title = {Majorizing measures: the generic chaining}, year = {1996}, } @article{dudley1967sizes, author = {Richard M. Dudley}, journal = {Journal of Functional Analysis}, number = {3}, pages = {290--330}, title = {The sizes of compact subsets of {H}ilbert space and continuity of {G}aussian processes}, volume = {1}, year = {1967}, } @book{drton2009lectures, author = {Mathias Drton and Bernd Sturmfels and Seth Sullivant}, publisher = {Springer}, title = {Lectures on algebraic statistics}, year = {2009}, } @incollection{powell1994estimation, author = {James L. Powell}, booktitle = {Handbook of Econometrics}, pages = {2443--2521}, title = {Estimation of semiparametric models}, volume = {4}, year = {1994}, } @article{balasubramanian2011unsupervised, author = {Krishnakumar Balasubramanian and Pinar Donmez and Guy Lebanon}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {3119--3145}, title = {Unsupervised supervised learning {II}: Margin-based classification without labels}, volume = {12}, year = {2011}, } @article{donmez2010unsupervised, author = {Pinar Donmez and Guy Lebanon and Krishnakumar Balasubramanian}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {1323--1351}, title = {Unsupervised supervised learning {I}: Estimating classification and regression errors without labels}, volume = {11}, year = {2010}, } @incollection{cozman2006risks, author = {Fabio Cozman and Ira Cohen}, booktitle = {Semi-Supervised Learning}, title = {Risks of Semi-Supervised Learning: How Unlabeled Data Can Degrade Performance of Generative Classifiers}, year = {2006}, } @book{chapelle2006semisupervised, author = {O. Chapelle and A. Zien and B. 
Scholkopf}, publisher = {MIT Press}, title = {Semi-Supervised Learning}, year = {2006}, } @article{li2015towards, author = {Yu-Feng Li and Zhi-Hua Zhou}, journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence}, number = {1}, pages = {175--188}, title = {Towards making unlabeled data never hurt}, volume = {37}, year = {2015}, } @inproceedings{kakade2007multi, author = {Sham M. Kakade and Dean P. Foster}, booktitle = {Conference on Learning Theory (COLT)}, pages = {82--96}, title = {Multi-view regression via canonical correlation analysis}, year = {2007}, } @inproceedings{ando2007two, author = {Rie Kubota Ando and Tong Zhang}, booktitle = {Conference on Learning Theory (COLT)}, pages = {25--32}, title = {Two-view feature generation model for semi-supervised learning}, year = {2007}, } @article{rinott1994normal, author = {Yosef Rinott}, journal = {Journal of Computational and Applied Mathematics}, number = {2}, pages = {135--143}, title = {On normal approximation rates for certain sums of dependent random variables}, volume = {55}, year = {1994}, } @inproceedings{tsirelson1976norms, author = {B. S. Tsirelson and I. A. Ibragimov and V. N. Sudakov}, booktitle = {Proceedings of the Third Japan-USSR Symposium on Probability Theory}, pages = {20--41}, title = {Norms of {G}aussian sample functions}, year = {1976}, } @inproceedings{chang2010structured, author = {Ming-Wei Chang and Vivek Srikumar and Dan Goldwasser and Dan Roth}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {199--206}, title = {Structured output learning with indirect supervision}, year = {2010}, } @inproceedings{duchi2013local, author = {John C. Duchi and Michael I. Jordan and Martin J. Wainwright}, booktitle = {Foundations of Computer Science (FOCS)}, title = {Local Privacy and Statistical Minimax Rates}, year = {2013}, } @inproceedings{schapire2002prior, author = {Robert E. Schapire and Marie Rochery and Mazin G. 
Rahim and Narendra Gupta}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Incorporating Prior Knowledge into Boosting}, year = {2002}, } @inproceedings{joachims1999transductive, author = {Thorsten Joachims}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Transductive inference for text classification using support vector machines}, year = {1999}, } @article{nesterov2011random, author = {Yurii Nesterov and Vladimir Spokoiny}, journal = {Foundations of Computational Mathematics}, pages = {1--40}, title = {Random gradient-free minimization of convex functions}, year = {2011}, } @article{tropp2012user, author = {Joel A Tropp}, journal = {Foundations of computational mathematics}, number = {4}, pages = {389--434}, title = {User-friendly tail bounds for sums of random matrices}, volume = {12}, year = {2012}, } @article{sion1958minimax, author = {Maurice Sion}, journal = {Pacific journal of mathematics}, number = {1}, pages = {171--176}, title = {On general minimax theorems}, volume = {8}, year = {1958}, } @article{balcan2010discriminative, author = {Maria-Florina Balcan and Avrim Blum}, journal = {Journal of the ACM (JACM)}, number = {3}, title = {A discriminative model for semi-supervised learning}, volume = {57}, year = {2010}, } @article{tamhane1981randomized, author = {Ajit C Tamhane}, journal = {Journal of the American Statistical Association (JASA)}, number = {376}, pages = {916--923}, title = {Randomized response techniques for multiple sensitive attributes}, volume = {76}, year = {1981}, } @article{warner1965randomized, author = {Stanley L Warner}, journal = {Journal of the American Statistical Association (JASA)}, number = {309}, pages = {63--69}, title = {Randomized response: A survey technique for eliminating evasive answer bias}, volume = {60}, year = {1965}, } @inproceedings{dwork2006differential, author = {Cynthia Dwork}, booktitle = {Automata, languages and programming}, pages = {1--12}, title = 
{Differential privacy}, year = {2006}, } @inproceedings{vaish2014twitch, author = {Rajan Vaish and Keith Wyngarden and Jingshu Chen and Brandon Cheung and Michael S Bernstein}, booktitle = {Conference on Human Factors in Computing Systems (CHI)}, pages = {3645--3654}, title = {Twitch crowdsourcing: crowd contributions in short bursts of time}, year = {2014}, } @article{meyer1973inverse, author = {Carl D. Meyer}, journal = {SIAM Journal on Applied Mathematics}, number = {3}, pages = {315--323}, title = {Generalised Inversion of Modified Matrices}, volume = {24}, year = {1973}, } @inproceedings{dwork2006calibrating, author = {Cynthia Dwork and Frank McSherry and Kobbi Nissim and Adam Smith}, booktitle = {Proceedings of the 3rd Theory of Cryptography Conference}, pages = {265--284}, title = {Calibrating noise to sensitivity in private data analysis}, year = {2006}, } @article{evfimievski2004privacy, author = {Alexandre Evfimievski and Ramakrishnan Srikant and Rakesh Agrawal and Johannes Gehrke}, journal = {Information Systems}, number = {4}, pages = {343--364}, title = {Privacy preserving mining of association rules}, volume = {29}, year = {2004}, } @article{kasiviswanathan2011can, author = {Shiva Prasad Kasiviswanathan and Homin K Lee and Kobbi Nissim and Sofya Raskhodnikova and Adam Smith}, journal = {SIAM Journal on Computing}, number = {3}, pages = {793--826}, title = {What can we learn privately?}, volume = {40}, year = {2011}, } @article{matloff1984use, author = {Norman S Matloff}, journal = {Statistics \& Probability Letters}, number = {1}, pages = {31--34}, title = {Use of covariates in randomized response settings}, volume = {2}, year = {1984}, } @inproceedings{babenko2009visual, author = {Boris Babenko and Ming-Hsuan Yang and Serge Belongie}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {983--990}, title = {Visual tracking with online multiple instance learning}, year = {2009}, } @inproceedings{temizer2010collision, author = {Selim 
Temizer and Mykel J. Kochenderfer and Leslie P. Kaelbling and Tomas Lozano-P{\'e}rez and James K. Kuchar}, booktitle = {AIAA Guidance, Navigation, and Control Conference}, title = {Collision avoidance for unmanned aircraft using {M}arkov decision processes}, year = {2010}, } @inproceedings{mei2015teaching, author = {Shike Mei and Xiaojin Zhu}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {Using Machine Teaching to Identify Optimal Training-Set Attacks on Machine Learners}, year = {2015}, } @article{cook2011assessing, author = {Samantha Cook and Corrie Conrad and Ashley L. Fowlkes and Matthew H. Mohebbi}, journal = {{P}lo{S} one}, number = {8}, title = {Assessing {G}oogle flu trends performance in the {U}nited {S}tates during the 2009 influenza virus {A} ({H1N1}) pandemic}, volume = {6}, year = {2011}, } @book{nisan2007algorithmic, author = {Noam Nisan and Tim Roughgarden and Eva Tardos and Vijay V. Vazirani}, publisher = {Cambridge University Press}, title = {Algorithmic game theory}, volume = {1}, year = {2007}, } @article{blum2014learning, author = {Avrim Blum and Yishay Mansour and Jamie Morgenstern}, journal = {arXiv}, title = {Learning Valuation Distributions from Partial Observation}, year = {2014}, } @inproceedings{raina2007self, author = {Rajar Raina and Alexis Battle and Honglak Lee and Benjamin Packer and Andrew Y. Ng}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {759--766}, title = {Self-taught learning: transfer learning from unlabeled data}, year = {2007}, } @inproceedings{moldovan2012safe, author = {Teodor M. 
Moldovan and Pieter Abbeel}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {1711--1718}, title = {Safe Exploration in {M}arkov Decision Processes}, year = {2012}, } @article{hans2008safe, author = {Alexander Hans and Daniel Schneega{\ss} and Anton Maximilian Sch{\"a}fer and Steffen Udluft}, journal = {ESANN}, pages = {143--148}, title = {Safe exploration for reinforcement learning}, year = {2008}, } @article{basseville1988detecting, author = {Mich{\`e}le Basseville}, journal = {Automatica}, number = {3}, pages = {309--326}, title = {Detecting changes in signals and systems--A survey}, volume = {24}, year = {1988}, } @article{liu2013change, author = {Song Liu and Makoto Yamada and Nigel Collier and Masashi Sugiyama}, journal = {Neural Networks}, pages = {72--83}, title = {Change-point detection in time-series data by relative density-ratio estimation}, volume = {43}, year = {2013}, } @article{kawahara2009change, author = {Yoshinobu Kawahara and Masashi Sugiyama}, journal = {SDM}, pages = {389--400}, title = {Change-Point Detection in Time-Series Data by Direct Density-Ratio Estimation}, volume = {9}, year = {2009}, } @article{lygeros1999controllers, author = {John Lygeros and Claire Tomlin and Shankar Sastry}, journal = {Automatica}, number = {3}, pages = {349--370}, title = {Controllers for reachability specifications for hybrid systems}, volume = {35}, year = {1999}, } @article{mitchell2005time, author = {Ian M. Mitchell and Alexandre M. Bayen and Claire J. 
Tomlin}, journal = {IEEE Transactions on Automatic Control}, number = {7}, pages = {947--957}, title = {A time-dependent {H}amilton-{J}acobi formulation of reachable sets for continuous dynamic games}, volume = {50}, year = {2005}, } @book{bacsar2008optimal, author = {Tamer Ba{\c{s}}ar and Pierre Bernhard}, publisher = {Springer Science \& Business Media}, title = {{H}-infinity optimal control and related minimax design problems: a dynamic game approach}, year = {2008}, } @article{wager2015estimation, author = {Stefan Wager and Susan Athey}, journal = {arXiv}, title = {Estimation and Inference of Heterogeneous Treatment Effects using Random Forests}, year = {2015}, } @article{athey2015measure, author = {Susan Athey and Guido Imbens}, journal = {The American Economic Review}, number = {5}, pages = {476--480}, title = {A measure of robustness to misspecification}, volume = {105}, year = {2015}, } @misc{russell2015research, author = {Stuart Russell and Daniel Dewey and Max Tegmark and Janos Kramar and Richard Mallah}, title = {Research priorities for robust and beneficial artificial intelligence}, year = {2015}, } @inproceedings{geiger2012kitti, author = {Andreas Geiger and Philip Lenz and Raquel Urtasun}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {3354--3361}, title = {Are we ready for autonomous driving? {T}he {KITTI} vision benchmark suite}, year = {2012}, } @inproceedings{halpern2014anchors, author = {Yoni Halpern and Youngduck Choi and Steve Horng and David Sontag}, booktitle = {American Medical Informatics Association Annual Symposium}, pages = {606--615}, title = {Using Anchors to Estimate Clinical State without Labeled Data}, year = {2014}, } @article{xu2008satzilla, author = {Lin Xu and Frank Hutter and Holger H. 
Hoos and Kevin Leyton-Brown},
  journal = {Journal of Artificial Intelligence Research (JAIR)},
  pages = {565--606},
  title = {{SATzilla}: portfolio-based algorithm selection for {SAT}},
  volume = {32},
  year = {2008},
}

% Mixed-case acronym braced as one word rather than letter by letter.
@inproceedings{chow2015risk,
  author = {Yinlam Chow and Aviv Tamar and Shie Mannor and Marco Pavone},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1522--1530},
  title = {Risk-Sensitive and Robust Decision-Making: a {CVaR} Optimization Approach},
  year = {2015},
}

@article{shafer2008tutorial,
  author = {Glenn Shafer and Vladimir Vovk},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {371--421},
  title = {A tutorial on conformal prediction},
  volume = {9},
  year = {2008},
}

% Journal name capitalised to match the other Machine Learning entries in this file.
@article{li2011knows,
  author = {Lihong Li and Michael L. Littman and Thomas J. Walsh and Alexander L. Strehl},
  journal = {Machine Learning},
  number = {3},
  pages = {399--443},
  title = {Knows what it knows: a framework for self-aware learning},
  volume = {82},
  year = {2011},
}

@article{shalev2011online,
  author = {Shai Shalev-Shwartz},
  journal = {Foundations and Trends in Machine Learning},
  number = {2},
  pages = {107--194},
  title = {Online learning and online convex optimization},
  volume = {4},
  year = {2011},
}

@inproceedings{mei2015security,
  author = {Shike Mei and Xiaojin Zhu},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  title = {The Security of Latent {D}irichlet Allocation},
  year = {2015},
}

@inproceedings{rubinstein1997discriminative,
  author = {Y Dan Rubinstein and Trevor Hastie},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {49--53},
  title = {Discriminative vs Informative Learning},
  volume = {5},
  year = {1997},
}

@article{friedman2010regularization,
  author = {Jerome Friedman and Trevor Hastie and Rob Tibshirani},
  journal = {Journal of Statistical Software},
  number = {1},
  pages = {1--22},
  title = {Regularization paths for generalized linear models via coordinate
descent},
  volume = {33},
  year = {2010},
}

@book{paulos1988innumeracy,
  author = {John Allen Paulos},
  publisher = {Macmillan},
  title = {Innumeracy: Mathematical illiteracy and its consequences},
  year = {1988},
}

@book{seife2010proofiness,
  author = {Charles Seife},
  publisher = {Penguin},
  title = {Proofiness: How you're being fooled by the numbers},
  year = {2010},
}

% Third author's surname corrected (Agrawala).
@inproceedings{kim2016analogies,
  author = {Yea-seul Kim and Jessica Hullman and Maneesh Agrawala},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Generating Personalized Spatial Analogies for Distances and Areas},
  year = {2016},
}

@inproceedings{barrio2016comprehension,
  author = {Pablo J. Barrio and Daniel G. Goldstein and Jake M. Hofman},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Improving the Comprehension of Numbers in the News},
  year = {2016},
}

@article{chevalier2013composition,
  author = {Fanny Chevalier and Romain Vuillemot and Guia Gali},
  journal = {IEEE Transactions on Visualization and Computer Graphics},
  pages = {2426--2435},
  title = {Using concrete scales: A practical framework for effective visual depiction of complex measures},
  volume = {19},
  year = {2013},
}

@misc{chiachieri2013dictionary,
  author = {Glen Chiacchieri},
  howpublished = {\url{http://www.dictionaryofnumbers.com/}},
  title = {Dictionary of Numbers},
  year = {2013},
}

% Corporate author is double-braced so it is kept as one name instead of being
% split into first and last parts. The vertical bar uses \textbar because a raw
% bar character prints as a dash under the default OT1 font encoding.
@misc{wolfram2009alpha,
  author = {{Wolfram Alpha LLC}},
  howpublished = {\url{http://www.wolframalpha.com/}},
  title = {{Wolfram{\textbar}Alpha}},
  year = {2009},
}

@article{tretter2006accuracy,
  author = {Thomas R. Tretter and M.
Gail Jones and James Minogue},
  journal = {Journal of Research in Science Teaching},
  pages = {1061--1085},
  title = {Accuracy of scale conceptions in science: Mental maneuverings across many orders of spatial magnitude},
  volume = {43},
  year = {2006},
}

% Volume corrected from 1 to 3: this file lists TACL volume 2 under 2014
% (vlachos2014new), so a 2015 TACL article is volume 3.
@article{roy2015reasoning,
  author = {Subhro Roy and Tom Vieira and Dan Roth},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Reasoning about quantities in natural language},
  volume = {3},
  year = {2015},
}

% Initials are separated by a space so each one is parsed as its own name token.
@article{markman1990constraints,
  author = {E. M. Markman},
  journal = {Cognitive Science},
  pages = {57--77},
  title = {Constraints children place on word meanings},
  volume = {14},
  year = {1990},
}

% Typographic apostrophe replaced by the ASCII one, which LaTeX typesets correctly.
@article{markman1988exclusivity,
  author = {E. M. Markman and G. F. Wachtel},
  journal = {Cognitive Psychology},
  pages = {125--157},
  title = {Children's Use of Mutual Exclusivity to Constrain the Meanings of Words},
  volume = {20},
  year = {1988},
}

@inproceedings{smith2013pragmatics,
  author = {Nathaniel J. Smith and Noah D. Goodman and Michael C. Frank},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {3039--3047},
  title = {Learning and using language via recursive pragmatic reasoning about other agents},
  year = {2013},
}

% Single-page article: the degenerate range 998--998 is written as one page.
@article{frank2012pragmatics,
  author = {M. C. Frank and N. D. Goodman},
  journal = {Science},
  pages = {998},
  title = {Predicting Pragmatic Reasoning in Language Games},
  volume = {336},
  year = {2012},
}

@article{frank2014inferring,
  author = {M. C. Frank and N. D. Goodman},
  journal = {Cognitive Psychology},
  pages = {80--96},
  title = {Inferring word meanings by assuming that speakers are informative},
  volume = {75},
  year = {2014},
}

@book{wittgenstein1953philosophical,
  author = {L.
Wittgenstein},
  address = {Oxford},
  publisher = {Blackwell},
  title = {Philosophical Investigations},
  year = {1953},
}

@article{orabona2015generalized,
  author = {Francesco Orabona and Koby Crammer and Nicol{\`o} Cesa-Bianchi},
  journal = {Machine Learning},
  number = {3},
  pages = {411--435},
  title = {A generalized online mirror descent with applications to classification and regression},
  volume = {99},
  year = {2015},
}

@inproceedings{rakhlin2013online,
  author = {Alexander Rakhlin and Karthik Sridharan},
  booktitle = {Conference on Learning Theory (COLT)},
  pages = {993--1019},
  title = {Online Learning with Predictable Sequences},
  year = {2013},
}

@article{thompson1933likelihood,
  author = {William R Thompson},
  journal = {Biometrika},
  number = {3},
  pages = {285--294},
  title = {On the likelihood that one unknown probability exceeds another in view of the evidence of two samples},
  volume = {25},
  year = {1933},
}

% Journal names below are capitalised consistently with the rest of the file.
@article{lai1985asymptotically,
  author = {Tze Leung Lai and Herbert Robbins},
  journal = {Advances in Applied Mathematics},
  number = {1},
  pages = {4--22},
  title = {Asymptotically efficient adaptive allocation rules},
  volume = {6},
  year = {1985},
}

@article{auer2002finite,
  author = {Peter Auer and Nicol{\`o} Cesa-Bianchi and Paul Fischer},
  journal = {Machine Learning},
  number = {2},
  pages = {235--256},
  title = {Finite-time analysis of the multiarmed bandit problem},
  volume = {47},
  year = {2002},
}

@inproceedings{agrawal2012analysis,
  author = {Shipra Agrawal and Navin Goyal},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Analysis of Thompson Sampling for the Multi-armed Bandit Problem},
  year = {2012},
}

@inproceedings{flaxman2005online,
  author = {Abraham D Flaxman and Adam Tauman Kalai and H Brendan McMahan},
  booktitle = {Symposium on Discrete Algorithms (SODA)},
  pages = {385--394},
  title = {Online convex optimization in the bandit setting: gradient descent without a gradient},
  year = {2005},
}

% This is a chapter in an edited handbook. The generated entry had the handbook
% title, the edition and the publisher all packed into the publisher field of a
% book entry; they are split into booktitle, edition and publisher here.
% NOTE(review): the handbook editors are not present in the generated data; add an editor field if known.
@incollection{goodman2015prob,
  author = {Noah Goodman and Daniel Lassiter},
  booktitle = {The Handbook of Contemporary Semantic Theory},
  edition = {Second},
  publisher = {Wiley-Blackwell},
  title = {Probabilistic Semantics and Pragmatics: Uncertainty in Language and Thought},
  year = {2015},
}

@article{ireland2011language,
  author = {Molly E Ireland and Richard B Slatcher and Paul W Eastwick and Lauren E Scissors and Eli J Finkel and James W Pennebaker},
  journal = {Psychological Science},
  number = {1},
  pages = {39--44},
  title = {Language style matching predicts relationship initiation and stability},
  volume = {22},
  year = {2011},
}

@book{giles2008communication,
  author = {Howard Giles},
  publisher = {Sage Publications, Inc},
  title = {Communication accommodation theory},
  year = {2008},
}

% NOTE(review): venue changed from ACL to EACL, where this paper appeared in 2012; confirm against the proceedings.
@inproceedings{kwiatkowski2012probabilistic,
  author = {Tom Kwiatkowski and Sharon Goldwater and Luke Zettlemoyer and Mark Steedman},
  booktitle = {European Association for Computational Linguistics (EACL)},
  pages = {234--244},
  title = {A probabilistic model of syntactic and semantic acquisition from child-directed utterances and their meanings},
  year = {2012},
}

@article{jones2009scale,
  author = {M. Gail Jones and Amy R. Taylor},
  journal = {Journal of Research in Science Teaching},
  pages = {460--475},
  title = {Developing a sense of scale: Looking backward},
  volume = {46},
  year = {2009},
}

@article{helmbold2015inductive,
  author = {David P. Helmbold and Philip M.
Long},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {3403--3454},
  title = {On the Inductive Bias of Dropout},
  volume = {16},
  year = {2015},
}

@inproceedings{macmahon2006walk,
  author = {Matt MacMahon and Brian Stankiewicz and Benjamin Kuipers},
  booktitle = {National Conference on Artificial Intelligence},
  title = {Walk the talk: Connecting language, knowledge, and action in route instructions},
  year = {2006},
}

@article{vlachos2014new,
  author = {Andreas Vlachos and Stephen Clark},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  pages = {547--559},
  title = {A New Corpus and Imitation Learning Framework for Context-Dependent Semantic Parsing},
  volume = {2},
  year = {2014},
}

% Accented letters use LaTeX escapes, as elsewhere in this file, so classic
% 8-bit BibTeX sorts and labels the name correctly.
@inproceedings{hermann2015read,
  author = {Karl Moritz Hermann and Tom{\'a}{\v{s}} Ko{\v{c}}isk{\'y} and Edward Grefenstette and Lasse Espeholt and Will Kay and Mustafa Suleyman and Phil Blunsom},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Teaching Machines to Read and Comprehend},
  year = {2015},
}

% Last author given in "Last, First" form; written as "First Last III" the
% suffix III would be parsed as the surname.
@inproceedings{iyyer2014factoid,
  author = {Mohit Iyyer and Jordan Boyd-Graber and Leonardo Claudino and Daum{\'e} III, Hal},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {A Neural Network for Factoid Question Answering over Paragraphs},
  year = {2014},
}

% Title typo fixed: "Anaything" is now "Anything".
@inproceedings{kumar2016dmn,
  author = {Ankit Kumar and Ozan Irsoy and Peter Ondruska and Mohit Iyyer and James Bradbury and Ishaan Gulrajani and Victor Zhong and Romain Paulus and Richard Socher},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Ask Me Anything: Dynamic Memory Networks for Natural Language Processing},
  year = {2016},
}

@inproceedings{monroe2015pragmatics,
  author = {Will Monroe and Christopher Potts},
  booktitle = {Proceedings of 20th {A}msterdam {C}olloquium},
  title = {Learning in the {R}ational {S}peech {A}cts Model},
  year = {2015},
}

@inproceedings{chiang2005hierarchical,
  author = {David Chiang},
  booktitle =
{Association for Computational Linguistics (ACL)},
  pages = {263--270},
  title = {A Hierarchical Phrase-Based Model for Statistical Machine Translation},
  year = {2005},
}

% The acronym is braced so sentence-casing styles keep it upper case; the stray
% brace around the "s" of "speech" protected nothing and is removed.
@inproceedings{jaitly2013vocal,
  author = {Navdeep Jaitly and Geoffrey E. Hinton},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Vocal Tract Length Perturbation ({VTLP}) improves speech recognition},
  year = {2013},
}

@article{kingma2014variational,
  author = {Diederik P. Kingma and Max Welling},
  journal = {arXiv preprint arXiv:1312.6114},
  title = {Auto-Encoding Variational {B}ayes},
  year = {2014},
}

@inproceedings{zhang2015character,
  author = {Xiang Zhang and Junbo Zhao and Yann LeCun},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Character-level Convolutional Networks for Text Classification},
  year = {2015},
}

% Typographic apostrophe replaced by the ASCII one, which LaTeX typesets correctly.
@inproceedings{wang2015petpeeves,
  author = {William Y. Wang and Diyi Yang},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {That's So Annoying!!!: A Lexical and Frame-Semantic Embedding Based Data Augmentation Approach to Automatic Categorization of Annoying Behaviors using \#petpeeve Tweets},
  year = {2015},
}

@inproceedings{flanigan2014discriminative,
  author = {Jeffrey Flanigan and Sam Thomson and Jaime G Carbonell and Chris Dyer and Noah A Smith},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {A discriminative graph-based parser for the abstract meaning representation},
  year = {2014},
}

@inproceedings{neelakantan2016neural,
  author = {Arvind Neelakantan and Quoc V.
Le and Ilya Sutskever},
  title = {Neural Programmer: Inducing Latent Programs with Gradient Descent},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year = {2016}
}

% Fields below are listed as: author, title, venue, volume, number, pages, year.

@article{yin2016neural,
  author = {Pengcheng Yin and Zhengdong Lu and Hang Li and Ben Kao},
  title = {Neural Enquirer: Learning to Query Tables with Natural Language},
  journal = {arXiv},
  year = {2016}
}

@article{miller1990empirical,
  author = {Barton P Miller and Louis Fredriksen and Bryan So},
  title = {An empirical study of the reliability of {UNIX} utilities},
  journal = {Communications of the ACM},
  volume = {33},
  number = {12},
  pages = {32--44},
  year = {1990}
}

@inproceedings{reed2016neural,
  author = {Scott Reed and Nando de Freitas},
  title = {Neural Programmer-Interpreters},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year = {2016}
}

@inproceedings{tellex2014asking,
  author = {Stefanie Tellex and Ross Knepper and Adrian Li and Daniela Rus and Nicholas Roy},
  title = {Asking for help using inverse semantics},
  booktitle = {Robotics: Science and Systems (RSS)},
  year = {2014}
}

@inproceedings{vogel2013emergence,
  author = {Adam Vogel and Max Bodoia and Christopher Potts and Daniel Jurafsky},
  title = {Emergence of {Gricean} Maxims from Multi-Agent Decision Theory},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {1072--1081},
  year = {2013}
}

@inproceedings{lee2014time,
  author = {Kenton Lee and Yoav Artzi and Jesse Dodge and Luke Zettlemoyer},
  title = {Context-dependent Semantic Parsing for Time Expressions},
  booktitle = {Association for Computational Linguistics (ACL)},
  year = {2014}
}

@inproceedings{awasthi2013learning,
  author = {Pranjal Awasthi and Vitaly Feldman and Varun Kanade},
  title = {Learning Using Local Membership Queries},
  booktitle = {Conference on Learning Theory (COLT)},
  pages = {398--431},
  year = {2013}
}

@article{sedghi2014provable,
  author = {Hanie Sedghi and Anima Anandkumar},
  journal =
{arXiv preprint arXiv:1412.2693},
  title = {Provable methods for training neural networks with sparse connectivity},
  year = {2014},
}

% Accented letters in this block use LaTeX escapes, as elsewhere in this file,
% so classic 8-bit BibTeX sorts and labels the names correctly.
@inproceedings{bottou2012stochastic,
  author = {L{\'e}on Bottou},
  booktitle = {Neural Networks: Tricks of the Trade},
  pages = {421--436},
  title = {Stochastic gradient descent tricks},
  year = {2012},
}

% Leading math is braced so case-changing styles leave it untouched.
@article{zhang2015l1,
  author = {Yuchen Zhang and Jason D Lee and Michael I Jordan},
  journal = {arXiv preprint arXiv:1510.03528},
  title = {{$\ell_1$}-regularized Neural Networks are Improperly Learnable in Polynomial Time},
  year = {2015},
}

% Journal name put in its natural order (was "Signal Processing Magazine, IEEE").
@article{hinton2012speech,
  author = {Geoffrey Hinton and Li Deng and Dong Yu and George E Dahl and Abdel-rahman Mohamed and Navdeep Jaitly and Andrew Senior and Vincent Vanhoucke and Patrick Nguyen and Tara N Sainath and others},
  journal = {IEEE Signal Processing Magazine},
  number = {6},
  pages = {82--97},
  title = {Deep neural networks for acoustic modeling in speech recognition: The shared views of four research groups},
  volume = {29},
  year = {2012},
}

@inproceedings{klivans2006cryptographic,
  author = {Adam R Klivans and Alexander A Sherstov},
  booktitle = {Foundations of Computer Science (FOCS)},
  pages = {553--562},
  title = {Cryptographic hardness for learning intersections of halfspaces},
  year = {2006},
}

@article{fukumizu2000statistical,
  author = {Kenji Fukumizu},
  journal = {IEEE Transactions on Neural Networks},
  number = {1},
  pages = {17--26},
  title = {Statistical active learning in multilayer perceptrons},
  volume = {11},
  year = {2000},
}

@inproceedings{hasenjager2002active,
  author = {M Hasenj{\"a}ger and H Ritter},
  booktitle = {New learning paradigms in soft computing},
  pages = {137--169},
  title = {Active learning in neural networks},
  year = {2002},
}

% NOTE(review): author list, journal, volume and pages of this entry look like
% export junk for a multi-author conference paper; verify against the publication.
@article{wright2012sparse,
  author = {John Wright},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {1--35},
  title = {Exact Recovery of Sparsely-Used Dictionaries},
  volume = {1},
  year = {2012},
}

@article{cote2012chernoff,
  author = {Fran{\c{c}}ois D
C{\^o}t{\'e} and Ioannis N Psaromiligkos and Warren J Gross},
  journal = {arXiv preprint arXiv:1202.6483},
  title = {A Chernoff-type lower bound for the {G}aussian {Q}-function},
  year = {2012},
}

@inproceedings{maas2013rectifier,
  author = {Andrew L Maas and Awni Y Hannun and Andrew Y Ng},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Rectifier nonlinearities improve neural network acoustic models},
  year = {2013},
}

@inproceedings{janzamin2015score,
  author = {Majid Janzamin and Hanie Sedghi and Anima Anandkumar},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Score Function Features for Discriminative Learning},
  year = {2015},
}

@inproceedings{glorot2011deep,
  author = {Xavier Glorot and Antoine Bordes and Yoshua Bengio},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  pages = {315--323},
  title = {Deep sparse rectifier neural networks},
  year = {2011},
}

@article{vapnik1971uniform,
  author = {Vladimir N. Vapnik and Aleksei Y. Chervonenkis},
  journal = {Teoriya Veroyatnostei i ee Primeneniya},
  number = {2},
  pages = {264--279},
  title = {On uniform convergence of the frequencies of events to their probabilities},
  volume = {16},
  year = {1971},
}

% Second author's initial and given name were transposed; it is H. Sebastian Seung.
@inproceedings{lee2001algorithms,
  author = {Daniel D. Lee and H. Sebastian Seung},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {556--562},
  title = {Algorithms for non-negative matrix factorization},
  year = {2001},
}

@article{karger2014budget,
  author = {David R.
Karger and Sewoong Oh and Devavrat Shah},
  journal = {Operations Research},
  number = {1},
  pages = {1--24},
  title = {Budget-optimal task allocation for reliable crowdsourcing systems},
  volume = {62},
  year = {2014},
}

% Author names in this block are spelled one way throughout (Nihar B. Shah,
% Dengyong Zhou) so styles do not list the same person under two names.
@inproceedings{shah2015approval,
  author = {Nihar B. Shah and Dengyong Zhou and Yuval Peres},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Approval Voting and Incentives in Crowdsourcing},
  year = {2015},
}

@inproceedings{shah2015double,
  author = {Nihar B. Shah and Dengyong Zhou},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Double or nothing: Multiplicative incentive mechanisms for crowdsourcing},
  year = {2015},
}

@article{zhou2015regularized,
  author = {Dengyong Zhou and Qiang Liu and John C. Platt and Christopher Meek and Nihar B. Shah},
  journal = {arXiv},
  title = {Regularized minimax conditional entropy for crowdsourcing},
  year = {2015},
}

% Last author's surname corrected (Ramchandran).
@article{kamble2015truth,
  author = {Vijay Kamble and Nihar B. Shah and David Marn and Abhay Parekh and Kannan Ramchandran},
  journal = {arXiv},
  title = {Truth Serums for Massively Crowdsourced Evaluation Tasks},
  year = {2015},
}

@article{miller2005eliciting,
  author = {Nolan Miller and Paul Resnick and Richard Zeckhauser},
  journal = {Management Science},
  number = {9},
  pages = {1359--1373},
  title = {Eliciting informative feedback: The peer-prediction method},
  volume = {51},
  year = {2005},
}

@misc{shnayder2016strong,
  author = {Victor Shnayder and Rafael Frongillo and Arpit Agarwal and David C.
Parkes},
  title = {Strong Truthfulness in Multi-Task Peer Prediction},
  year = {2016},
}

@inproceedings{dasgupta2013crowdsourced,
  author = {Anirban Dasgupta and Arpita Ghosh},
  booktitle = {World Wide Web (WWW)},
  pages = {319--330},
  title = {Crowdsourced judgement elicitation with endogenous proficiency},
  year = {2013},
}

@article{harmon2004amazon,
  author = {Amy Harmon},
  journal = {New York Times},
  title = {Amazon Glitch Unmasks War Of Reviewers},
  year = {2004},
}

@article{white1999chatting,
  author = {Erin White},
  journal = {Wall Street Journal},
  title = {Chatting a singer up the pop charts},
  year = {1999},
}

@article{mayzlin2006promotional,
  author = {Dina Mayzlin},
  journal = {Marketing Science},
  number = {2},
  pages = {155--163},
  title = {Promotional chat on the Internet},
  volume = {25},
  year = {2006},
}

% Journal name capitalised to match the other Management Science entry in this file.
@article{dellarocas2006strategic,
  author = {Chrysanthos Dellarocas},
  journal = {Management Science},
  number = {10},
  pages = {1577--1593},
  title = {Strategic manipulation of internet opinion forums: Implications for consumers and firms},
  volume = {52},
  year = {2006},
}

@inproceedings{resnick2007influence,
  author = {Paul Resnick and Rahul Sami},
  booktitle = {ACM Conference on Recommender Systems},
  pages = {25--32},
  title = {The influence limiter: provably manipulation-resistant recommender systems},
  year = {2007},
}

@inproceedings{priedhorsky2007creating,
  author = {Reid Priedhorsky and Jilin Chen and Shyong T. K. Lam and Katherine Panciera and Loren Terveen and John Riedl},
  booktitle = {International {ACM} Conference on Supporting Group Work},
  pages = {259--268},
  title = {Creating, destroying, and restoring value in {W}ikipedia},
  year = {2007},
}

% Third author corrected from the duplicated "Huy Huy" to Huy Le.
% NOTE(review): confirm the author list against the published chapter.
@article{kulkarni2015peer,
  author = {Chinmay Kulkarni and Pang Wei Koh and Huy Le and Daniel Chia and Kathryn Papadopoulos and Justin Cheng and Daphne Koller and Scott R.
Klemmer},
  journal = {Design Thinking Research},
  pages = {131--168},
  title = {Peer and self assessment in massive online classes},
  year = {2015},
}

% Workshop paper: the venue is a booktitle of an inproceedings entry, not a journal.
@inproceedings{vuurens2011spam,
  author = {Jeroen Vuurens and Arjen P. de Vries and Carsten Eickhoff},
  booktitle = {ACM SIGIR Workshop on Crowdsourcing for Information Retrieval},
  title = {How much spam can you take? {A}n analysis of crowdsourcing results to increase accuracy},
  year = {2011},
}

@article{chen2014improved,
  author = {Yudong Chen and Sujay Sanghavi and Huan Xu},
  journal = {IEEE Transactions on Information Theory},
  number = {10},
  pages = {6440--6455},
  title = {Improved graph clustering},
  volume = {60},
  year = {2014},
}

@article{condon2001algorithms,
  author = {Anne Condon and Richard M. Karp},
  journal = {Random Structures and Algorithms},
  pages = {116--140},
  title = {Algorithms for graph partitioning on the planted partition model},
  year = {2001},
}

@article{holland1983stochastic,
  author = {Paul W. Holland and Kathryn B. Laskey and Samuel Leinhardt},
  journal = {Social Networks},
  pages = {109--137},
  title = {Stochastic blockmodels: Some first steps},
  volume = {5},
  year = {1983},
}

% "Automata, Languages and Programming" is the ICALP conference proceedings,
% so the venue is a booktitle of an inproceedings entry.
% NOTE(review): confirm the page range against the proceedings.
@inproceedings{coja2004coloring,
  author = {Amin Coja-Oghlan},
  booktitle = {International Colloquium on Automata, Languages and Programming (ICALP)},
  pages = {71--100},
  title = {Coloring semirandom graphs optimally},
  year = {2004},
}

@article{feige2001heuristics,
  author = {Uriel Feige and Joe Kilian},
  journal = {Journal of Computer and System Sciences},
  number = {4},
  pages = {639--671},
  title = {Heuristics for semirandom graph problems},
  volume = {63},
  year = {2001},
}

@article{feige2000finding,
  author = {Uriel Feige and Robert Krauthgamer},
  journal = {Random Structures and Algorithms},
  number = {2},
  pages = {195--208},
  title = {Finding and certifying a large hidden clique in a semirandom graph},
  volume = {16},
  year = {2000},
}

@inproceedings{makarychev2012approximation,
  author = {Konstantin Makarychev and Yury Makarychev and Aravindan Vijayaraghavan},
  booktitle = {Symposium on Theory of
Computing (STOC)},
  pages = {367--384},
  title = {Approximation algorithms for semi-random partitioning problems},
  year = {2012},
}

@inproceedings{krivelevich2006semirandom,
  author = {Michael Krivelevich and Dan Vilenchik},
  booktitle = {Meeting on Analytic Algorithmics and Combinatorics},
  pages = {211--221},
  title = {Semirandom models as benchmarks for coloring algorithms},
  year = {2006},
}

% The next two venues are conference proceedings (MFCS and RANDOM), so they are
% booktitles of inproceedings entries rather than journals.
% The variable k is set in math and braced so styles do not change its case.
@inproceedings{coja2002coloring,
  author = {Amin Coja-Oghlan},
  booktitle = {Mathematical Foundations of Computer Science (MFCS)},
  pages = {201--211},
  title = {Coloring {$k$}-colorable semirandom graphs in polynomial expected time via semidefinite programming},
  year = {2002},
}

@inproceedings{coja2002finding,
  author = {Amin Coja-Oghlan},
  booktitle = {Randomization and Approximation Techniques in Computer Science (RANDOM)},
  pages = {139--148},
  title = {Finding sparse induced subgraphs of semirandom graphs},
  year = {2002},
}

@article{coja2007solving,
  author = {Amin Coja-Oghlan},
  journal = {Journal of Algorithms},
  number = {1},
  pages = {19--46},
  title = {Solving {NP}-hard semirandom graph problems in polynomial expected time},
  volume = {62},
  year = {2007},
}

@inproceedings{kolla2011play,
  author = {Alexandra Kolla and Konstantin Makarychev and Yury Makarychev},
  booktitle = {Foundations of Computer Science (FOCS)},
  pages = {443--452},
  title = {How to play unique games against a semi-random adversary: Study of semi-random models of unique games},
  year = {2011},
}

@article{mossel2013proof,
  author = {Elchanan Mossel and Joe Neeman and Allan Sly},
  journal = {arXiv},
  title = {A proof of the block model threshold conjecture},
  year = {2013},
}

@inproceedings{massoulie2014community,
  author = {Laurent Massouli{\'e}},
  booktitle = {Symposium on Theory of Computing (STOC)},
  pages = {694--703},
  title = {Community detection thresholds and the weak {R}amanujan property},
  year = {2014},
}

@article{guedon2014community,
  author = {Olivier Gu{\'e}don and Roman Vershynin},
  journal = {arXiv},
  title = {Community detection in sparse networks
via {G}rothendieck's inequality},
  year = {2014}
}

% Fields below are listed as: author, title, venue, volume, number, pages, year.

@article{abbe2015community,
  author = {Emmanuel Abbe and Colin Sandon},
  title = {Community detection in general stochastic block models: fundamental limits and efficient recovery algorithms},
  journal = {arXiv},
  year = {2015}
}

@article{abbe2015detection,
  author = {Emmanuel Abbe and Colin Sandon},
  title = {Detection in the stochastic block model with multiple clusters: proof of the achievability conjectures, acyclic {BP}, and the information-computation gap},
  journal = {arXiv},
  year = {2015}
}

@inproceedings{chin2015stochastic,
  author = {Peter Chin and Anup Rao and Van Vu},
  title = {Stochastic block model and community detection in the sparse graphs: A spectral algorithm with optimal rate of recovery},
  booktitle = {Conference on Learning Theory (COLT)},
  year = {2015}
}

@article{decelle2011asymptotic,
  author = {Aurelien Decelle and Florent Krzakala and Cristopher Moore and Lenka Zdeborov{\'a}},
  title = {Asymptotic analysis of the stochastic block model for modular networks and its algorithmic applications},
  journal = {Physical Review E},
  volume = {84},
  number = {6},
  year = {2011}
}

@article{decelle2011inference,
  author = {Aurelien Decelle and Florent Krzakala and Cristopher Moore and Lenka Zdeborov{\'a}},
  title = {Inference and phase transitions in the detection of modules in sparse networks},
  journal = {Physical Review Letters},
  volume = {107},
  number = {6},
  year = {2011}
}

@article{mossel2012stochastic,
  author = {Elchanan Mossel and Joe Neeman and Allan Sly},
  title = {Stochastic block models and reconstruction},
  journal = {arXiv},
  year = {2012}
}

@article{mossel2013belief,
  author = {Elchanan Mossel and Joe Neeman and Allan Sly},
  title = {Belief propagation, robust reconstruction, and optimal recovery of block models},
  journal = {arXiv},
  year = {2013}
}

@inproceedings{mossel2015consistency,
  author = {Elchanan Mossel and Joe Neeman and Allan Sly},
  booktitle = {Symposium on Theory of Computing (STOC)},
  pages =
{69--75},
  title = {Consistency thresholds for the planted bisection model},
  year = {2015}
}

% Fields below are listed as: author, title, venue, volume, number, pages, year.

@article{moitra2015robust,
  author = {Ankur Moitra and William Perry and Alexander S. Wein},
  title = {How Robust are Reconstruction Thresholds for Community Detection?},
  journal = {arXiv},
  year = {2015}
}

@article{agarwal2015multisection,
  author = {Naman Agarwal and Afonso S. Bandeira and Konstantinos Koiliaris and Alexandra Kolla},
  title = {Multisection in the stochastic block model using semidefinite programming},
  journal = {arXiv},
  year = {2015}
}

@article{makarychev2015learning,
  author = {Konstantin Makarychev and Yury Makarychev and Aravindan Vijayaraghavan},
  title = {Learning Communities in the Presence of Errors},
  journal = {arXiv},
  year = {2015}
}

@article{cai2015robust,
  author = {T. Tony Cai and Xiaodong Li},
  title = {Robust and computationally feasible community detection in the presence of arbitrary outlier nodes},
  journal = {The Annals of Statistics},
  volume = {43},
  number = {3},
  pages = {1027--1059},
  year = {2015}
}

@article{christiano2014provably,
  author = {Paul Christiano},
  title = {Provably Manipulation-Resistant Reputation Systems},
  journal = {arXiv},
  year = {2014}
}

@article{christiano2016robust,
  author = {Paul Christiano},
  title = {Robust Collaborative Online Learning},
  journal = {arXiv},
  year = {2016}
}

@inproceedings{andreas2014grounding,
  author = {Jacob Andreas and Dan Klein},
  title = {Grounding Language with Points and Paths in Continuous Spaces},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  pages = {58--67},
  year = {2014}
}

@inproceedings{andreas2015alignment,
  author = {Jacob Andreas and Dan Klein},
  title = {Alignment-Based Compositional Semantics for Instruction Following},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2015}
}

@article{heider1944experimental,
  author = {Fritz Heider and Marianne Simmel},
  journal = {American Journal of Psychology},
  number = {2},
  pages = {243--259},
  title = {An
experimental study of apparent behavior},
  volume = {57},
  year = {1944},
}

% Journal names in the next two entries are capitalised as proper titles;
% standard styles print the journal field verbatim.
@article{dorazio2010review,
  author = {Tiziana D'Orazio and Marco Leo},
  journal = {Pattern Recognition},
  number = {8},
  pages = {2911--2926},
  title = {A review of vision-based systems for soccer video analysis},
  volume = {43},
  year = {2010},
}

@article{regier2001grounding,
  author = {Terry Regier and Laura A Carlson},
  journal = {Journal of Experimental Psychology: General},
  number = {2},
  title = {Grounding spatial language in perception: An empirical and computational investigation},
  volume = {130},
  year = {2001},
}

@article{gorniak2004grounded,
  author = {Peter Gorniak and Deb Roy},
  journal = {Journal of Artificial Intelligence Research (JAIR)},
  pages = {429--470},
  title = {Grounded semantic composition for visual scenes},
  volume = {21},
  year = {2004},
}

@inproceedings{tellex2009grounding,
  author = {Stefanie Tellex and Deb Roy},
  booktitle = {International Conference on Multimodal Interfaces (ICMI)},
  pages = {253--260},
  title = {Grounding spatial prepositions for video search},
  year = {2009},
}

@inproceedings{goodman2014concepts,
  author = {Noah D Goodman and Joshua B Tenenbaum and Tobias Gerstenberg},
  booktitle = {The Conceptual Mind: New Directions in the Study of Concepts},
  title = {Concepts in a probabilistic language of thought},
  year = {2014},
}

@inproceedings{kemp2007learning,
  author = {Charles Kemp and Noah Goodman and Joshua B Tenenbaum},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {753--760},
  title = {Learning and using relational theories},
  year = {2007},
}

@inproceedings{lake2013one,
  author = {Brenden M Lake and Ruslan R Salakhutdinov and Josh Tenenbaum},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2526--2534},
  title = {One-shot learning by inverting a compositional causal process},
  year = {2013},
}

@phdthesis{narayanan1997knowledge,
  author = {Srinivas Sankara Narayanan},
  school = {University of California
at Berkeley},
  title = {Knowledge-based Action Representations for Metaphor and Aspect ({KARMA})},
  year = {1997},
}

% In the entry that ends above, the school field no longer repeats "Berkeley",
% and the acronym in its title is braced to keep its capitals.

@article{hansen2014uncertainty,
  author = {Lars Peter Hansen},
  journal = {Journal of Political Economy},
  number = {5},
  pages = {945--987},
  title = {Uncertainty Outside and Inside Economic Models},
  volume = {122},
  year = {2014},
}

@article{anderson1949estimation,
  author = {Theodore W. Anderson and Herman Rubin},
  journal = {The Annals of Mathematical Statistics},
  pages = {46--63},
  title = {Estimation of the parameters of a single equation in a complete system of stochastic equations},
  year = {1949},
}

@article{anderson1950asymptotic,
  author = {Theodore W. Anderson and Herman Rubin},
  journal = {The Annals of Mathematical Statistics},
  pages = {570--582},
  title = {The asymptotic properties of estimates of the parameters of a single equation in a complete system of stochastic equations},
  year = {1950},
}

@article{sargan1958estimation,
  author = {John D. Sargan},
  journal = {Econometrica},
  pages = {393--415},
  title = {The estimation of economic relationships using instrumental variables},
  year = {1958},
}

@article{sargan1959estimation,
  author = {John D. Sargan},
  journal = {Journal of the Royal Statistical Society: Series B (Statistical Methodology)},
  pages = {91--105},
  title = {The estimation of relationships with autocorrelated residuals by the use of instrumental variables},
  year = {1959},
}

@article{chegireddy1987algorithms,
  author = {Chandra R. Chegireddy and Horst W.
Hamacher},
  journal = {Discrete applied mathematics},
  number = {2},
  pages = {155--165},
  title = {Algorithms for finding {k}-best perfect matchings},
  volume = {18},
  year = {1987},
}

@inproceedings{karpathy2015deep,
  author = {Andrej Karpathy and Li Fei-Fei},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {3128--3137},
  title = {Deep visual-semantic alignments for generating image descriptions},
  year = {2015},
}

% The acronym is braced so sentence-casing styles do not lowercase it.
@inproceedings{shirakawan2015ngramidf,
  author = {Masumi Shirakawa and Takahiro Hara and Shojiro Nishio},
  booktitle = {World Wide Web (WWW)},
  pages = {960--970},
  title = {{N}-gram {IDF}: A Global Term Weighting Scheme Based on Information Distance},
  year = {2015},
}

% In "First Last" form the final token is the surname, so the second
% author must end in "Gould" (not the initials).
@inproceedings{cartis2009finding,
  author = {Coralia Cartis and Nicholas I. M. Gould},
  booktitle = {SPARS'09-Signal Processing with Adaptive Sparse Structured Representations},
  title = {Finding a point in the relative interior of a polyhedron, with applications to compressed sensing},
  year = {2009},
}

@article{le2015concentration,
  author = {Can M.
Le and Elizaveta Levina and Roman Vershynin},
  journal = {arXiv},
  title = {Concentration and Regularization of Random Graphs},
  year = {2015},
}

@article{balsubramani2016learning,
  author = {Akshay Balsubramani},
  journal = {arXiv preprint arXiv:1602.08151},
  title = {Learning to Abstain from Binary Prediction},
  year = {2016},
}

@article{chow1970optimum,
  author = {Chao K Chow},
  journal = {IEEE Transactions on Information Theory},
  number = {1},
  pages = {41--46},
  title = {On optimum recognition error and reject tradeoff},
  volume = {16},
  year = {1970},
}

@inproceedings{tortorella2000optimal,
  author = {Francesco Tortorella},
  booktitle = {Advances in Pattern Recognition},
  pages = {611--620},
  title = {An optimal reject rule for binary classifiers},
  year = {2000},
}

@inproceedings{hanneke2007bound,
  author = {Steve Hanneke},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {353--360},
  title = {A bound on the label complexity of agnostic active learning},
  year = {2007},
}

% Initials are written separately ("I. P.", "J. D.") so that styles which
% abbreviate given names keep every initial.
@inproceedings{nelson2009misleading,
  author = {Blaine Nelson and Marco Barreno and Fuching Jack Chi and Anthony D Joseph and Benjamin I. P. Rubinstein and Udam Saini and Charles Sutton and J. D. Tygar and Kai Xia},
  booktitle = {Machine learning in cyber trust},
  pages = {17--51},
  title = {Misleading learners: Co-opting your spam filter},
  year = {2009},
}

@article{mannor2004sample,
  author = {Shie Mannor and John N.
Tsitsiklis},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {623--648},
  title = {The sample complexity of exploration in the multi-armed bandit problem},
  volume = {5},
  year = {2004},
}

@inproceedings{chandrasekaran2014finding,
  author = {Karthekeyan Chandrasekaran and Richard Karp},
  booktitle = {Conference on Learning Theory (COLT)},
  pages = {394--407},
  title = {Finding a most biased coin with fewest flips},
  year = {2014},
}

@article{banks2016information,
  author = {Jess Banks and Christopher Moore},
  journal = {arXiv},
  title = {Information-theoretic thresholds for community detection in sparse networks},
  year = {2016},
}

@techreport{mayzlin2012promotional,
  author = {Dina Mayzlin and Yaniv Dover and Judith A. Chevalier},
  institution = {National Bureau of Economic Research},
  title = {Promotional reviews: An empirical investigation of online review manipulation},
  year = {2012},
}

@article{young2000probabilistic,
  author = {Steve J Young},
  journal = {Philosophical Transactions of the Royal Society of London A: Mathematical, Physical and Engineering Sciences},
  number = {1769},
  pages = {1389--1402},
  title = {Probabilistic methods in spoken-dialogue systems},
  volume = {358},
  year = {2000},
}

@inproceedings{williams2013dialog,
  author = {Jason Williams and Antoine Raux and Deepak Ramachandran and Alan Black},
  booktitle = {Proceedings of the SIGDIAL 2013 Conference},
  pages = {404--413},
  title = {The dialog state tracking challenge},
  year = {2013},
}

@inproceedings{li2016persona,
  author = {Jiwei Li and Michel Galley and Chris Brockett and Jianfeng Gao and Bill Dolan},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {A Persona-Based Neural Conversation Model},
  year = {2016},
}

% Accented letters use brace-wrapped LaTeX escapes, matching the other
% accented names in this file and staying safe for 8-bit BibTeX.
@inproceedings{afantenos2012developing,
  author = {Stergos Afantenos and Nicholas Asher and Farah Benamara and Anais Cadilhac and C{\'e}dric D{\'e}gremont and Pascal Denis and Markus Guhe and Simon Keizer and Alex Lascarides and Oliver Lemon and Philippe Muller and Soumya
Paul and Verena Rieser and Laure Vieu},
  booktitle = {SeineDial 2012 - The 16th Workshop on the Semantics and Pragmatics of Dialogue},
  title = {Developing a corpus of strategic conversation in {The Settlers of Catan}},
  year = {2012},
}

@inproceedings{potts2012cards,
  author = {Christopher Potts},
  booktitle = {Proceedings of the 30th West Coast Conference on Formal Linguistics},
  pages = {1--20},
  title = {Goal-Driven Answers in the {C}ards Dialogue Corpus},
  year = {2012},
}

@article{serban2015survey,
  author = {Iulian Vlad Serban and Ryan Lowe and Laurent Charlin and Joelle Pineau},
  journal = {arXiv preprint arXiv:1512.05742},
  title = {A Survey of Available Corpora for Building Data-Driven Dialogue Systems},
  year = {2015},
}

@article{serban2015building,
  author = {Iulian V Serban and Alessandro Sordoni and Yoshua Bengio and Aaron Courville and Joelle Pineau},
  journal = {arXiv preprint arXiv:1507.04808},
  title = {Building End-To-End Dialogue Systems Using Generative Hierarchical Neural Network Models},
  year = {2015},
}

@article{lowe2015ubuntu,
  author = {Ryan Lowe and Nissan Pow and Iulian Serban and Joelle Pineau},
  journal = {arXiv preprint arXiv:1506.08909},
  title = {The {U}buntu dialogue corpus: A large dataset for research in unstructured multi-turn dialogue systems},
  year = {2015},
}

@inproceedings{shang2015neural,
  author = {Lifeng Shang and Zhengdong Lu and Hang Li},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Neural responding machine for short-text conversation},
  year = {2015},
}

@inproceedings{wen2015semantically,
  author = {Tsung-Hsien Wen and Milica Gasic and Nikola Mrksic and Pei-Hao Su and David Vandyke and Steve Young},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Semantically conditioned {LSTM}-based natural language generation for spoken dialogue systems},
  year = {2015},
}

@inproceedings{ritter2011data,
  author = {Alan Ritter and Colin Cherry and William B Dolan},
  booktitle = {Empirical Methods in
Natural Language Processing (EMNLP)},
  pages = {583--593},
  title = {Data-driven response generation in social media},
  year = {2011},
}

@inproceedings{oh2000stochastic,
  author = {Alice H Oh and Alexander I Rudnicky},
  booktitle = {ANLP/NAACL Workshop on Conversational systems - Volume 3},
  pages = {27--32},
  title = {Stochastic language generation for spoken dialogue systems},
  year = {2000},
}

% Accented letters use brace-wrapped LaTeX escapes so that 8-bit BibTeX
% sorts and labels these names correctly.
@inproceedings{mairesse2010phrase,
  author = {Fran{\c{c}}ois Mairesse and Milica Ga{\v{s}}i{\'c} and Filip Jur{\v{c}}{\'\i}{\v{c}}ek and Simon Keizer and Blaise Thomson and Kai Yu and Steve Young},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {1552--1561},
  title = {Phrase-based statistical language generation using graphical models and active learning},
  year = {2010},
}

@article{walker2002training,
  author = {Marilyn A Walker and Owen C Rambow and Monica Rogati},
  journal = {Computer Speech \& Language},
  number = {3},
  pages = {409--433},
  title = {Training a sentence planner for spoken dialogue using boosting},
  volume = {16},
  year = {2002},
}

@inproceedings{sordoni2015neural,
  author = {Alessandro Sordoni and Michel Galley and Michael Auli and Chris Brockett and Yangfeng Ji and Margaret Mitchell and Jian-Yun Nie and Jianfeng Gao and Bill Dolan},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {A neural network approach to context-sensitive generation of conversational responses},
  year = {2015},
}

@inproceedings{hirschman1999deep,
  author = {Lynette Hirschman and Marc Light and Eric Breck and John D Burger},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {325--332},
  title = {Deep read: A reading comprehension system},
  year = {1999},
}

@inproceedings{riloff2000rule,
  author = {Ellen Riloff and Michael Thelen},
  booktitle = {ANLP/NAACL Workshop on reading comprehension tests as evaluation for computer-based language understanding systems - Volume 6},
  pages = {13--19},
  title = {A rule-based question answering system for reading
comprehension tests},
  year = {2000},
}

@inproceedings{ng2000machine,
  author = {Hwee Tou Ng and Leong Hwee Teo and Jennifer Lai Pheng Kwan},
  booktitle = {Joint SIGDAT conference on empirical methods in natural language processing and very large corpora - Volume 13},
  pages = {124--132},
  title = {A machine learning approach to answering questions for reading comprehension tests},
  year = {2000},
}

@inproceedings{xu2006maximum,
  author = {Kui Xu and Helen Meng and Fuliang Weng},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {185--188},
  title = {A maximum entropy framework that integrates word dependencies and grammatical relations for reading comprehension},
  year = {2006},
}

@inproceedings{wang2015machine,
  author = {Hai Wang and Mohit Bansal and Kevin Gimpel and David McAllester},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Machine comprehension with syntax, frames, and semantics},
  year = {2015},
}

% The proper noun is braced so sentence-casing styles keep its capital.
@inproceedings{hill2015goldilocks,
  author = {Felix Hill and Antoine Bordes and Sumit Chopra and Jason Weston},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {The {Goldilocks} Principle: Reading Children's Books with Explicit Memory Representations},
  year = {2015},
}

@inproceedings{narasimhan2015machine,
  author = {Karthik Narasimhan and Regina Barzilay},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Machine comprehension with discourse relations},
  year = {2015},
}

@inproceedings{yang2015wikiqa,
  author = {Yi Yang and Wen-tau Yih and Christopher Meek},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {2013--2018},
  title = {{WikiQA}: A Challenge Dataset for Open-Domain Question Answering},
  year = {2015},
}

@inproceedings{chen2016thorough,
  author = {Danqi Chen and Jason Bolton and Christopher D.
Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {A Thorough Examination of the {CNN} / {D}aily {M}ail Reading Comprehension Task},
  year = {2016},
}

@inproceedings{sun2013answer,
  author = {Hong Sun and Nan Duan and Yajuan Duan and Ming Zhou},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {Answer Extraction from Passage Graph for Question Answering},
  year = {2013},
}

@inproceedings{shen2006exploring,
  author = {Dan Shen and Dietrich Klakow},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  pages = {889--896},
  title = {Exploring correlation of dependency relation paths for answer extraction},
  year = {2006},
}

@inproceedings{ravichandran2002learning,
  author = {Deepak Ravichandran and Eduard Hovy},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {41--47},
  title = {Learning surface text patterns for a question answering system},
  year = {2002},
}

@inproceedings{mostafazadeh2016corpus,
  author = {Nasrin Mostafazadeh and Nathanael Chambers and Xiaodong He and Devi Parikh and Dhruv Batra and Lucy Vanderwende and Pushmeet Kohli and James Allen},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {A corpus and cloze evaluation for deeper understanding of commonsense stories},
  year = {2016},
}

@inproceedings{wang2013simple,
  author = {Zhuoran Wang and Oliver Lemon},
  booktitle = {Proceedings of the SIGDIAL 2013 Conference},
  pages = {423--432},
  title = {A simple and generic belief tracking mechanism for the dialog state tracking challenge: On the believability of observed information},
  year = {2013},
}

@inproceedings{roy2000spoken,
  author = {Nicholas Roy and Joelle Pineau and Sebastian Thrun},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {93--100},
  title = {Spoken dialogue management using probabilistic reasoning},
  year = {2000},
}
@article{williams2007partially,
  author = {Jason D Williams and Steve Young},
  journal = {Computer Speech \& Language},
  number = {2},
  pages = {393--422},
  title = {Partially observable {M}arkov decision processes for spoken dialog systems},
  volume = {21},
  year = {2007},
}

@article{clark2016my,
  author = {Peter Clark and Oren Etzioni},
  journal = {AI Magazine},
  number = {1},
  pages = {5--12},
  title = {My Computer is an Honor Student but how Intelligent is it? Standardized Tests as a Measure of {AI}},
  volume = {37},
  year = {2016},
}

@article{schoenick2016moving,
  author = {Carissa Schoenick and Peter Clark and Oyvind Tafjord and Peter Turney and Oren Etzioni},
  journal = {arXiv preprint arXiv:1604.04315},
  title = {Moving Beyond the {T}uring Test with the {A}llen {AI} Science Challenge},
  year = {2016},
}

@inproceedings{gaikwad2015daemo,
  author = {Snehal Neil Gaikwad and Durim Morina and Rohit Nistala and Megha Agarwal and Alison Cossette and Radhika Bhanu and Saiph Savage and Vishwajeet Narwal and Karan Rajpal and Jeff Regino and others},
  booktitle = {Proceedings of the 28th Annual ACM Symposium on User Interface Software \& Technology},
  pages = {101--102},
  title = {Daemo: A Self-Governed Crowdsourcing Marketplace},
  year = {2015},
}

@inproceedings{voorhees2000building,
  author = {Ellen M Voorhees and Dawn M Tice},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  pages = {200--207},
  title = {Building a question answering test collection},
  year = {2000},
}

@inproceedings{sachan2015learning,
  author = {Mrinmaya Sachan and Avinava Dubey and Eric P Xing and Matthew Richardson},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Learning answer-entailing structures for machine comprehension},
  year = {2015},
}

% Initials are separated by a space so each one is treated as its own
% given-name token.
@inproceedings{gu2016copying,
  author = {Jiatao Gu and Zhengdong Lu and Hang Li and Victor O. K.
Li},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Incorporating Copying Mechanism in Sequence-to-Sequence Learning},
  year = {2016},
}

@inproceedings{gulcehre2016pointing,
  author = {Caglar Gulcehre and Sungjin Ahn and Ramesh Nallapati and Bowen Zhou and Yoshua Bengio},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Pointing the Unknown Words},
  year = {2016},
}

@inproceedings{liu2007oversampling,
  author = {Alexander Liu and Joydeep Ghosh and Cheryl Martin},
  booktitle = {International Conference on Data Mining (DMIN)},
  title = {Generative Oversampling for Mining Imbalanced Datasets},
  year = {2007},
}

@inproceedings{petrov2010uptraining,
  author = {Slav Petrov and Pi-Chuan Chang and Michael Ringgaard and Hiyan Alshawi},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Uptraining for accurate deterministic question parsing},
  year = {2010},
}

@inproceedings{reckman2010virtualgame,
  author = {Hilke Reckman and Jeff Orkin and Deb Roy},
  booktitle = {Conference on Natural Language Processing (KONVENS)},
  title = {Learning meanings of words and constructions, grounded in a virtual game},
  year = {2010},
}

@article{greenberg1996consistency,
  author = {Harvey J Greenberg},
  journal = {Annals of Mathematics and Artificial Intelligence},
  number = {1},
  pages = {37--83},
  title = {Consistency, redundancy, and implied equalities in linear systems},
  volume = {17},
  year = {1996},
}

@inproceedings{wen2017network,
  author = {Tsung-Hsien Wen and Milica Gasic and Nikola Mrksic and Lina M Rojas-Barahona and Pei-Hao Su and Stefan Ultes and David Vandyke and Steve Young},
  booktitle = {European Association for Computational Linguistics (EACL)},
  pages = {438--449},
  title = {A Network-based End-to-End Trainable Task-oriented Dialogue System},
  year = {2017},
}

@inproceedings{dong2016logical,
  author = {Li Dong and Mirella Lapata},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Language to Logical
Form with Neural Attention},
  year = {2016},
}

@article{teigen2015framing,
  author = {Karl Halvor Teigen},
  journal = {The Wiley Blackwell Handbook of Judgment and Decision Making},
  pages = {568--589},
  title = {Framing of Numeric Quantities},
  year = {2015},
}

@techreport{roundy1985identifying,
  author = {Robert M. Freund and Robin Roundy and Michael J Todd},
  institution = {Massachusetts Institute of Technology, Alfred P. Sloan School of Management},
  title = {Identifying the Set of Always-Active Constraints in a System of Linear Inequalities by a Single Linear Program},
  year = {1985},
}

@inproceedings{kirkpatrick2012significance,
  author = {Taylor Berg-Kirkpatrick and David Burkett and Dan Klein},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {995--1005},
  title = {An empirical investigation of statistical significance in {NLP}},
  year = {2012},
}

@inproceedings{maccartney2007natural,
  author = {Bill MacCartney and Christopher D. Manning},
  booktitle = {ACL-PASCAL Workshop on Textual Entailment and Paraphrasing},
  pages = {193--200},
  title = {Natural Logic for Textual Inference},
  year = {2007},
}

% The system name is braced so sentence-casing styles keep its internal
% capitals.
@inproceedings{angeli2014naturalli,
  author = {Gabor Angeli and Christopher D. Manning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{NaturalLI}: Natural Logic Inference for Common Sense Reasoning},
  year = {2014},
}

@inproceedings{angeli2016naturalli,
  author = {Gabor Angeli and Neha Nayak and Christopher D.
Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Combining Natural Logic and Shallow Reasoning for Question Answering},
  year = {2016},
}

% "Benjamin Van Durme" and "Chris Callison-Burch" are two separate authors,
% spelled as in pavlick2015domain.
@inproceedings{pavlick2015semantics,
  author = {Ellie Pavlick and Johan Bos and Malvina Nissim and Charley Beller and Benjamin Van Durme and Chris Callison-Burch},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Adding semantics to data-driven paraphrasing},
  year = {2015},
}

@inproceedings{zhang2013parallelparaphrase,
  author = {Congle Zhang and Daniel S. Weld},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Harvesting Parallel News Streams to Generate Paraphrases of Event Relations},
  year = {2013},
}

@article{zhang2015parallelevents,
  author = {Congle Zhang and Stephen Soderland and Daniel S. Weld},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Exploiting Parallel News Streams for Unsupervised Event Extraction},
  volume = {3},
  year = {2015},
}

@inproceedings{angeli2015openie,
  author = {Gabor Angeli and Melvin Johnson Premkumar and Christopher D. Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Leveraging Linguistic Structure for Open Domain Information Extraction},
  year = {2015},
}

@inproceedings{clark2015coref,
  author = {Kevin Clark and Christopher D. Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Entity-Centric Coreference Resolution with Model Stacking},
  year = {2015},
}

@article{horn1990analog,
  author = {Roger A. Horn and Roy Mathias},
  journal = {SIAM Journal on Matrix Analysis and Applications},
  number = {4},
  pages = {481--498},
  title = {An analog of the {C}auchy-{S}chwarz inequality for {H}adamard products and unitarily invariant norms},
  volume = {11},
  year = {1990},
}

@article{bandeira2014sharp,
  author = {Afonso S.
Bandeira and Ramon van Handel},
  journal = {arXiv},
  title = {Sharp nonasymptotic bounds on the norm of random matrices with independent entries},
  year = {2014},
}

@inproceedings{bach2010structured,
  author = {Francis R. Bach},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {118--126},
  title = {Structured sparsity-inducing norms through submodular functions},
  year = {2010},
}

@inproceedings{kumar2010clustering,
  author = {Amit Kumar and Ravindran Kannan},
  booktitle = {Foundations of Computer Science (FOCS)},
  pages = {299--308},
  title = {Clustering with spectral norm and the {k}-means algorithm},
  year = {2010},
}

@inproceedings{steinhardt2016memory,
  author = {Jacob Steinhardt and Gregory Valiant and Stefan Wager},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Memory, Communication, and Statistical Queries},
  year = {2016},
}

@inproceedings{fetaya2016unsupervised,
  author = {Ethan Fetaya and Boaz Nadler and Ariel Jaffe and Yuval Kluger and Tingting Jiang},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  pages = {351--360},
  title = {Unsupervised Ensemble Learning with Dependent Classifiers},
  year = {2016},
}

@inproceedings{arora2012learning,
  author = {Sanjeev Arora and Rong Ge and Ankur Moitra},
  booktitle = {Foundations of Computer Science (FOCS)},
  title = {Learning topic models--going beyond {SVD}},
  year = {2012},
}

@inproceedings{bansal2014provable,
  author = {Trapit Bansal and Chiranjib Bhattacharyya and Ravindran Kannan},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {A provable {SVD}-based algorithm for learning topics in dominant admixture corpus},
  year = {2014},
}

@inproceedings{diakonikolas2016robust,
  author = {Ilias Diakonikolas and Gautam Kamath and Daniel Kane and Jerry Li and Ankur Moitra and Alistair Stewart},
  booktitle = {Foundations of Computer Science (FOCS)},
  title = {Robust Estimators in High Dimensions without the Computational Intractability},
  year =
{2016},
}

@inproceedings{lai2016agnostic,
  author = {Kevin A. Lai and Anup B. Rao and Santosh Vempala},
  booktitle = {Foundations of Computer Science (FOCS)},
  title = {Agnostic Estimation of Mean and Covariance},
  year = {2016},
}

@inproceedings{wang2017machine,
  author = {Shuohang Wang and Jing Jiang},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Machine Comprehension Using Match-{LSTM} and Answer Pointer},
  year = {2017},
}

% The venue is a conference/workshop proceedings, so it is recorded as a
% booktitle on an inproceedings entry rather than as a journal.
@inproceedings{awasthi2012improved,
  author = {Pranjal Awasthi and Or Sheffet},
  booktitle = {Approximation, Randomization, and Combinatorial Optimization},
  pages = {37--49},
  title = {Improved spectral-norm bounds for clustering},
  year = {2012},
}

% Workshop paper: venue recorded as a booktitle, as above.
@inproceedings{mahajan2009planar,
  author = {Meena Mahajan and Prajakta Nimbhorkar and Kasturi Varadarajan},
  booktitle = {International Workshop on Algorithms and Computation},
  pages = {274--285},
  title = {The planar {k}-means problem is {NP}-hard},
  year = {2009},
}

@inproceedings{sontag2011complexity,
  author = {David Sontag and Dan Roy},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Complexity of Inference in Latent {D}irichlet Allocation},
  year = {2011},
}

@article{lei2015consistency,
  author = {Jing Lei and Alessandro Rinaldo},
  journal = {The Annals of Statistics},
  pages = {215--237},
  title = {Consistency of spectral clustering in stochastic block models},
  volume = {43},
  year = {2015},
}

@inproceedings{vempala2002spectral,
  author = {Santosh Vempala and Grant Wang},
  booktitle = {Foundations of Computer Science (FOCS)},
  title = {A spectral algorithm for learning mixture models},
  year = {2002},
}

@article{vershynin2010introduction,
  author = {Roman Vershynin},
  journal = {arXiv},
  title = {Introduction to the non-asymptotic analysis of random matrices},
  year = {2010},
}

@article{batson2012twice,
  author = {Joshua Batson and Daniel A.
Spielman and Nikhil Srivastava},
  journal = {SIAM Journal on Computing},
  number = {6},
  pages = {1704--1721},
  title = {Twice-{R}amanujan sparsifiers},
  volume = {41},
  year = {2012},
}

@inproceedings{fakcharoenphol2003tight,
  author = {Jittat Fakcharoenphol and Satish Rao and Kunal Talwar},
  booktitle = {Symposium on Theory of Computing (STOC)},
  pages = {448--455},
  title = {A tight bound on approximating arbitrary metrics by tree metrics},
  year = {2003},
}

@article{rudelson1999random,
  author = {Mark Rudelson},
  journal = {Journal of Functional Analysis},
  pages = {60--72},
  title = {Random vectors in the isotropic position},
  volume = {164},
  year = {1999},
}

@inproceedings{steinhardt2016avoiding,
  author = {Jacob Steinhardt and Gregory Valiant and Moses Charikar},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Avoiding Imposters and Delinquents: Adversarial Crowdsourcing and Peer Prediction},
  year = {2016},
}

@article{kearns1993learning,
  author = {Michael Kearns and Ming Li},
  journal = {SIAM Journal on Computing},
  number = {4},
  pages = {807--837},
  title = {Learning in the presence of malicious errors},
  volume = {22},
  year = {1993},
}

@article{tukey1960survey,
  author = {John W. Tukey},
  journal = {Contributions to probability and statistics},
  pages = {448--485},
  title = {A survey of sampling from contaminated distributions},
  volume = {2},
  year = {1960},
}

@book{maronna2006robust,
  author = {Ricardo A. Maronna and Douglas R. Martin and Victor J. Yohai},
  publisher = {Wiley},
  title = {Robust Statistics: Theory and Methods},
  year = {2006},
}

@book{hampel1986robust,
  author = {Frank R. Hampel and Elvezio M. Ronchetti and Peter J. Rousseeuw and Werner A. Stahel},
  publisher = {Wiley},
  title = {Robust Statistics: The Approach Based on Influence Functions},
  year = {1986},
}

@book{huber2009robust,
  author = {Peter J. Huber and Elvezio M.
Ronchetti},
  publisher = {Wiley},
  title = {Robust Statistics},
  year = {2009},
}

@inproceedings{bhatia2015robust,
  author = {Kush Bhatia and Prateek Jain and Purushottam Kar},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {721--729},
  title = {Robust regression via hard thresholding},
  year = {2015},
}

@article{chandrasekaran2011rank,
  author = {Venkat Chandrasekaran and Sujay Sanghavi and Pablo A. Parrilo and Alan S. Willsky},
  journal = {SIAM Journal on Optimization},
  number = {2},
  pages = {572--596},
  title = {Rank-sparsity incoherence for matrix decomposition},
  volume = {21},
  year = {2011},
}

@article{candes2011robust,
  author = {Emmanuel J. Cand{\`e}s and Xiaodong Li and Yi Ma and John Wright},
  journal = {Journal of the ACM},
  number = {3},
  title = {Robust principal component analysis?},
  volume = {58},
  year = {2011},
}

@article{xu2010principal,
  author = {Huan Xu and Constantine Caramanis and Shie Mannor},
  journal = {arXiv},
  title = {Principal component analysis with contaminated data: The high dimensional case},
  year = {2010},
}

@article{chen2013robust,
  author = {Yudong Chen and Constantine Caramanis and Shie Mannor},
  journal = {arXiv},
  title = {Robust High Dimensional Sparse Regression and Matching Pursuit},
  year = {2013},
}

@article{guruswami2009hardness,
  author = {Venkatesan Guruswami and Prasad Raghavendra},
  journal = {SIAM Journal on Computing},
  number = {2},
  pages = {742--765},
  title = {Hardness of learning halfspaces with noise},
  volume = {39},
  year = {2009},
}

@inproceedings{hardt2013algorithms,
  author = {Moritz Hardt and Ankur Moitra},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Algorithms and Hardness for Robust Subspace Recovery},
  year = {2013},
}

@inproceedings{achlioptas2005spectral,
  author = {Dimitris Achlioptas and Frank McSherry},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {On spectral learning of mixtures of distributions},
  year = {2005},
}

@article{lowner1934monotone,
  author = {Karl
L{\"o}wner},
  journal = {Mathematische Zeitschrift},
  number = {1},
  pages = {177--216},
  title = {{\"U}ber monotone {Matrixfunktionen}},
  volume = {38},
  year = {1934},
}

@inproceedings{mansour2009domain,
  author = {Yishay Mansour and Mehryar Mohri and Afshin Rostamizadeh},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Domain adaptation: Learning bounds and algorithms},
  year = {2009},
}

@inproceedings{bendavid2006analysis,
  author = {Shai Ben-David and John Blitzer and Koby Crammer and Fernando Pereira},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {137--144},
  title = {Analysis of representations for domain adaptation},
  year = {2006},
}

@inproceedings{johansson2016learning,
  author = {Fredrik Johansson and Uri Shalit and David Sontag},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Learning Representations for Counterfactual Inference},
  year = {2016},
}

@inproceedings{ghosh2011moderates,
  author = {Arpita Ghosh and Satyen Kale and Preston McAfee},
  booktitle = {12th ACM conference on Electronic commerce},
  pages = {167--176},
  title = {Who moderates the moderators?: crowdsourcing abuse detection in user-generated content},
  year = {2011},
}

@article{chen2016enhancing,
  author = {Chen, Qian and Zhu, Xiaodan and Ling, Zhenhua and Wei, Si and Jiang, Hui},
  journal = {arXiv},
  title = {Enhancing and Combining Sequential and Tree {LSTM} for Natural Language Inference},
  year = {2016},
}

@inproceedings{zhou2016amr,
  author = {Junsheng Zhou and Feiyu Xu and Hans Uszkoreit and Weiguang Qu and Ran Li and Yanhui Gu},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{AMR} Parsing with an Incremental Joint Model},
  year = {2016},
}

@inproceedings{goodman2016noise,
  author = {James Goodman and Andreas Vlachos and Jason Naradowsky},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Noise reduction and targeted exploration in imitation learning for abstract meaning
representation parsing},
  year = {2016},
}

@inproceedings{pust2015using,
  author = {Michael Pust and Ulf Hermjakob and Kevin Knight and Daniel Marcu and Jonathan May},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Using syntax-based machine translation to parse {E}nglish into abstract meaning representation},
  year = {2015},
}

@inproceedings{werling2015robust,
  author = {Keenon Werling and Gabor Angeli and Christopher Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Robust subgraph generation improves abstract meaning representation parsing},
  year = {2015},
}

% The resource name is braced as a whole so sentence-casing styles keep
% its capitalisation.
@inproceedings{prasad2008penn,
  author = {Rashmi Prasad and Nikhil Dinesh and Alan Lee and Eleni Miltsakaki and Livio Robaldo and Aravind K Joshi and Bonnie L Webber},
  booktitle = {LREC},
  title = {The {Penn Discourse TreeBank} 2.0},
  year = {2008},
}

@article{lin2014pdtb,
  author = {Ziheng Lin and Hwee Tou Ng and Min-Yen Kan},
  journal = {Natural Language Engineering},
  number = {2},
  pages = {151--184},
  title = {A {PDTB}-styled end-to-end discourse parser},
  volume = {20},
  year = {2014},
}

@inproceedings{feizabadi2014crowdsourcing,
  author = {Parvin Sadat Feizabadi and Sebastian Pado},
  booktitle = {European Association for Computational Linguistics (EACL)},
  pages = {226--230},
  title = {Crowdsourcing Annotation of Non-Local Semantic Roles},
  year = {2014},
}

@inproceedings{he2015question,
  author = {Luheng He and Mike Lewis and Luke Zettlemoyer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Question-Answer Driven Semantic Role Labeling: Using Natural Language to Annotate Natural Language},
  year = {2015},
}

@inproceedings{he2016human,
  author = {Luheng He and Julian Michael and Mike Lewis and Luke Zettlemoyer},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Human-in-the-Loop Parsing},
  year = {2016},
}

@article{duan2016generating,
  author = {Manjuan Duan and Ethan Hill and Michael White},
journal = {Proceedings of 10th Linguistic Annotation Workshop}, title = {Generating disambiguating paraphrases for structurally ambiguous sentences}, year = {2016}, } @article{von2008designing, author = {Luis Von Ahn and Laura Dabbish}, journal = {Communications of the ACM}, number = {8}, pages = {58--67}, title = {Designing games with a purpose}, volume = {51}, year = {2008}, } @inproceedings{daume10easyss, author = {Hal {Daum{\'e} III} and Abhishek Kumar and Avishek Saha}, booktitle = {Workshop on Domain Adaptation for NLP}, title = {Frustratingly Easy Semi-Supervised Domain Adaptation}, year = {2010}, } @inproceedings{daume07easyadapt, author = {Hal {Daum{\'e} III}}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Frustratingly Easy Domain Adaptation}, year = {2007}, } @inproceedings{luong2016iclr_multi, author = {Minh-Thang Luong and Quoc V. Le and Ilya Sutskever and Oriol Vinyals and Lukasz Kaiser}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Multi-task Sequence to Sequence Learning}, year = {2016}, } @inproceedings{klerke2016improving, author = {Sigrid Klerke and Yoav Goldberg and Anders S{\o}gaard}, booktitle = {North American Association for Computational Linguistics (NAACL)}, title = {Improving sentence compression by learning to predict gaze}, year = {2016}, } @inproceedings{sogaard2016deep, author = {Anders S{\o}gaard and Yoav Goldberg}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Deep multi-task learning with low level tasks supervised at lower layers}, year = {2016}, } @article{walker2006ace, author = {Christopher Walker and Stephanie Strassel and Julie Medero and Kazuaki Maeda}, journal = {Linguistic Data Consortium}, title = {{ACE} 2005 multilingual training corpus}, volume = {1}, year = {2006}, } @inproceedings{kulick2014inter, author = {Seth Kulick and Ann Bies and Justin Mott}, booktitle = {Association for Computational Linguistics (ACL)}, title = 
{Inter-Annotator Agreement for {ERE} Annotation}, year = {2014}, } @comment{kim2011overview: the braces keep the mixed-case task name intact under styles that sentence-case titles.} @inproceedings{kim2011overview, author = {Jin-Dong Kim and Sampo Pyysalo and Tomoko Ohta and Robert Bossy and Ngan Nguyen and Jun'ichi Tsujii}, booktitle = {Proceedings of the BioNLP Shared Task 2011 Workshop}, title = {Overview of {BioNLP} shared task 2011}, year = {2011}, } @inproceedings{hewlett2016wikireading, author = {Daniel Hewlett and Alexandre Lacoste and Llion Jones and Illia Polosukhin and Andrew Fandrianto and Jay Han and Matthew Kelcey and David Berthelot}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Wikireading: A novel large-scale language understanding task over {W}ikipedia}, year = {2016}, } @inproceedings{kadlec2016text, author = {Rudolf Kadlec and Martin Schmid and Ondrej Bajgar and Jan Kleindienst}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Text Understanding with the Attention Sum Reader Network}, year = {2016}, } @inproceedings{sukhbaatar2015end, author = {Sainbayar Sukhbaatar and Arthur Szlam and Jason Weston and Rob Fergus}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {End-to-end memory networks}, year = {2015}, } @inproceedings{durrett2015neural, author = {Greg Durrett and Dan Klein}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Neural {CRF} parsing}, year = {2015}, } @comment{ribeiro2016lime: the quoted question uses LaTeX opening and closing quote ligatures and is brace-protected as a unit; the title value carries no leading or trailing padding.} @inproceedings{ribeiro2016lime, author = {Marco Tulio Ribeiro and Sameer Singh and Carlos Guestrin}, booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)}, title = {{``Why Should {I} Trust You?''}: Explaining the Predictions of Any Classifier}, year = {2016}, } @inproceedings{lei2016rationalizing, author = {Tao Lei and Regina Barzilay and Tommi Jaakkola}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Rationalizing Neural Predictions}, year = {2016}, } @inproceedings{zaidan2011crowdsourcing, author = {Omar F. 
Zaidan and Chris Callison-Burch}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Crowdsourcing Translation: Professional Quality from Non-Professionals}, year = {2011}, } @inproceedings{chang2008importance, author = {Ming-Wei Chang and Lev-Arie Ratinov and Dan Roth and Vivek Srikumar}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {Importance of Semantic Representation: Dataless Classification}, year = {2008}, } @inproceedings{srikumar2011joint, author = {Vivek Srikumar and Dan Roth}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {A joint model for extended semantic role labeling}, year = {2011}, } @comment{ogorman2016richer: the apostrophe in the first surname is plain ASCII so that 8-bit BibTeX toolchains handle the name.} @inproceedings{ogorman2016richer, author = {Tim O'Gorman and Kristin Wright-Bettner and Martha Palmer}, booktitle = {Computing News Storylines Workshop}, title = {Richer Event Description: Integrating event coreference with temporal, causal and bridging annotation}, year = {2016}, } @inproceedings{roth2005integer, author = {Dan Roth and Wen-tau Yih}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Integer linear programming inference for conditional random fields}, year = {2005}, } @comment{pavlick2015domain: the two-word surname is given in comma form so that both words are parsed as the last name.} @inproceedings{pavlick2015domain, author = {Ellie Pavlick and Juri Ganitkevitch and Tsz Ping Chan and Xuchen Yao and Van Durme, Benjamin and Chris Callison-Burch}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Domain-Specific Paraphrase Extraction}, year = {2015}, } @inproceedings{louvan2016cross, author = {Louvan, Samuel and Chetan Naik and Sadhana Kumaravel and Heeyoung Kwon and Niranjan Balasubramanian and Peter Clark}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Cross-Sentence Inference for Process Knowledge}, year = {2016}, } @inproceedings{louvan2015semantic, author = {Louvan, Samuel and Naik, Chetan and Lynn, Veronica and Arun, Ankit and Balasubramanian, Niranjan and Clark, Peter}, booktitle = 
{K-CAP Scientific Knowledge Workshop}, title = {Semantic Role Labeling for Process Recognition Questions}, year = {2015}, } @article{berant2015efficient, author = {Jonathan Berant and Noga Alon and Ido Dagan and Jacob Goldberger}, journal = {Computational Linguistics}, pages = {221--264}, title = {Efficient Global Learning of Entailment Graphs}, volume = {41}, year = {2015}, } @article{berant2015kb, author = {Roy Bar-Haim and Ido Dagan and Jonathan Berant}, journal = {Journal of Artificial Intelligence Research (JAIR)}, pages = {1--57}, title = {Knowledge-based Textual Inference via Parse-Tree transformations}, volume = {54}, year = {2015}, } @comment{liang2017nsm: every author is separated by the word and; a comma between two names would make BibTeX read them as one person in Last, First form.} @inproceedings{liang2017nsm, author = {Chen Liang and Jonathan Berant and Quoc Le and Kenneth D. Forbus and Ni Lao}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Neural Symbolic Machines: Learning Semantic Parsers on {F}reebase with Weak Supervision}, year = {2017}, } @inproceedings{choi2017coarse, author = {Eunsol Choi and Daniel Hewlett and Alexandre Lacoste and Illia Polosukhin and Jakob Uszkoreit and Jonathan Berant}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Coarse-to-Fine Question Answering for Long Documents}, year = {2017}, } @article{atzmon2016compositions, author = {Yuval Atzmon and Jonathan Berant and Vahid Kazemi and Amir Globerson and Gal Chechik}, journal = {arXiv preprint arXiv:1608.07639}, title = {Learning to generalize to new compositions in image understanding}, year = {2016}, } @inproceedings{zha2001spectral, author = {Hongyuan Zha and Xiaofeng He and Chris Ding and Horst Simon and Ming Gu}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {1057--1064}, title = {Spectral relaxation for {k}-means clustering}, year = {2001}, } @article{chen2014clustering, author = {Yudong Chen and Ali Jalali and Sujay Sanghavi and Huan Xu}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {2213--2238}, title = {Clustering 
partially observed graphs via convex optimization}, volume = {15}, year = {2014}, } @inproceedings{mcsherry2001spectral, author = {Frank McSherry}, booktitle = {Foundations of Computer Science (FOCS)}, pages = {529--537}, title = {Spectral partitioning of random graphs}, year = {2001}, } @comment{oord2016wavenet: the braces keep the camel-case model name intact under styles that sentence-case titles.} @article{oord2016wavenet, author = {Aaron van den Oord and Sander Dieleman and Heiga Zen and Karen Simonyan and Oriol Vinyals and Alex Graves and Nal Kalchbrenner and Andrew Senior and Koray Kavukcuoglu}, journal = {arXiv preprint arXiv:1609.03499}, title = {{WaveNet}: A generative model for raw audio}, year = {2016}, } @article{wu2016google, author = {Yonghui Wu and Mike Schuster and Zhifeng Chen and Quoc V Le and Mohammad Norouzi and Wolfgang Macherey and Maxim Krikun and Yuan Cao and Qin Gao and Klaus Macherey and others}, journal = {arXiv preprint arXiv:1609.08144}, title = {Google's Neural Machine Translation System: Bridging the Gap between Human and Machine Translation}, year = {2016}, } @article{rebrova2015coverings, author = {Elizaveta Rebrova and Konstantin Tikhomirov}, journal = {arXiv}, title = {Coverings of random ellipsoids, and invertibility of matrices with iid heavy-tailed entries}, year = {2015}, } @article{rebrova2016norms, author = {Elizaveta Rebrova and Roman Vershynin}, journal = {arXiv}, title = {Norms of random matrices: local and global problems}, year = {2016}, } @article{kim2015character, author = {Yoon Kim and Yacine Jernite and David Sontag and Alexander M Rush}, journal = {arXiv preprint arXiv:1508.06615}, title = {Character-aware neural language models}, year = {2015}, } @article{sedghi2016training, author = {Hanie Sedghi and Anima Anandkumar}, journal = {arXiv preprint arXiv:1603.00954}, title = {Training Input-Output Recurrent Neural Networks through Spectral Methods}, year = {2016}, } @comment{amodei2016concrete: the accented letter in the last author's surname is written as a LaTeX escape, like the other non-ASCII letters in this file.} @article{amodei2016concrete, author = {Dario Amodei and Chris Olah and Jacob Steinhardt and Paul Christiano and John Schulman and Dan Man{\'e}}, journal = {arXiv preprint 
arXiv:1606.06565}, title = {Concrete problems in {AI} safety}, year = {2016}, } @inproceedings{goodfellow2015explaining, author = {Ian J Goodfellow and Jonathon Shlens and Christian Szegedy}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Explaining and harnessing adversarial examples}, year = {2015}, } @comment{johnson2016google: the accented letter in one author's surname is written as a LaTeX escape, like the other non-ASCII letters in this file.} @article{johnson2016google, author = {Melvin Johnson and Mike Schuster and Quoc V. Le and Maxim Krikun and Yonghui Wu and Zhifeng Chen and Nikhil Thorat and Fernanda Vi{\'e}gas and Martin Wattenberg and Greg Corrado and Macduff Hughes and Jeffrey Dean}, journal = {arXiv preprint arXiv:1611.04558}, title = {Google's Multilingual Neural Machine Translation System: Enabling Zero-Shot Translation}, year = {2016}, } @inproceedings{charikar2017learning, author = {Moses Charikar and Jacob Steinhardt and Gregory Valiant}, booktitle = {Symposium on Theory of Computing (STOC)}, title = {Learning from Untrusted Data}, year = {2017}, } @inproceedings{firat2016multi, author = {Orhan Firat and Kyunghyun Cho and Yoshua Bengio}, booktitle = {North American Association for Computational Linguistics (NAACL)}, title = {Multi-Way, Multilingual Neural Machine Translation with a Shared Attention Mechanism}, year = {2016}, } @comment{haagerup1981best: the proper name in the title is brace-protected so that sentence-casing styles keep its capital.} @article{haagerup1981best, author = {Uffe Haagerup}, journal = {Studia Mathematica}, number = {3}, pages = {231--283}, title = {The best constants in the {K}hintchine inequality}, volume = {70}, year = {1981}, } @inproceedings{quirk2015language, author = {Chris Quirk and Raymond J. 
Mooney and Michel Galley}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Language to Code: Learning Semantic Parsers for If-This-Then-That Recipes}, year = {2015}, } @mastersthesis{steinberg2005computation, author = {Daureen Steinberg}, school = {Technion -- Israel Institute of Technology}, title = {Computation of Matrix Norms with Applications to Robust Optimization}, year = {2005}, } @article{diakonikolas2017practical, author = {Ilias Diakonikolas and Gautam Kamath and Daniel Kane and Jerry Li and Ankur Moitra and Alistair Stewart}, journal = {arXiv}, title = {Being Robust (in High Dimensions) Can Be Practical}, year = {2017}, } @article{feldman2009agnostic, author = {Vitaly Feldman and Parikshit Gopalan and Subhash Khot and Ashok Kumar Ponnuswami}, journal = {SIAM Journal on Computing}, number = {2}, pages = {606--645}, title = {On agnostic learning of parities, monomials, and halfspaces}, volume = {39}, year = {2009}, } @inproceedings{berthet2013complexity, author = {Quentin Berthet and Philippe Rigollet}, booktitle = {Conference on Learning Theory (COLT)}, pages = {1046--1066}, title = {Complexity Theoretic Lower Bounds for Sparse Principal Component Detection}, year = {2013}, } @inproceedings{steinhardt2018resilience, author = {Jacob Steinhardt and Moses Charikar and Gregory Valiant}, booktitle = {Innovations in Theoretical Computer Science (ITCS)}, title = {Resilience: A Criterion for Learning in the Presence of Arbitrary Outliers}, year = {2018}, } @article{katz2017reluplex, author = {Guy Katz and Clark Barrett and David Dill and Kyle Julian and Mykel Kochenderfer}, journal = {arXiv preprint arXiv:1702.01135}, title = {Reluplex: An Efficient {SMT} Solver for Verifying Deep Neural Networks}, year = {2017}, } @article{hoeffding1963probability, author = {Wassily Hoeffding}, journal = {Journal of the American Statistical Association}, number = {301}, pages = {13--30}, title = {Probability inequalities for sums of bounded random 
variables}, volume = {58}, year = {1963}, } @article{kesten1966limit, author = {Harry Kesten and Bernt P. Stigum}, journal = {The Annals of Mathematical Statistics}, number = {5}, pages = {1211--1223}, title = {A limit theorem for multidimensional {G}alton-{W}atson processes}, volume = {37}, year = {1966}, } @article{kesten1966additional, author = {Harry Kesten and Bernt P. Stigum}, journal = {The Annals of Mathematical Statistics}, number = {6}, pages = {1463--1481}, title = {Additional limit theorems for indecomposable multidimensional {G}alton-{W}atson processes}, volume = {37}, year = {1966}, } @article{janson2004robust, author = {Svante Janson and Elchanan Mossel}, journal = {Annals of Probability}, pages = {2630--2649}, title = {Robust reconstruction on trees is determined by the second eigenvalue}, volume = {32}, year = {2004}, } @article{blum1995coloring, author = {Avrim Blum and Joel Spencer}, journal = {Journal of Algorithms}, number = {2}, pages = {204--234}, title = {Coloring random and semi-random {k}-colorable graphs}, volume = {19}, year = {1995}, } @inproceedings{barak2016nearly, author = {Boaz Barak and Samuel B. 
Hopkins and Jonathan Kelner and Pravesh Kothari and Ankur Moitra and Aaron Potechin}, booktitle = {Foundations of Computer Science (FOCS)}, pages = {428--437}, title = {A nearly tight sum-of-squares lower bound for the planted clique problem}, year = {2016}, } @inproceedings{steinhardt2015minimax, author = {Jacob Steinhardt and John Duchi}, booktitle = {Conference on Learning Theory (COLT)}, title = {Minimax rates for memory-constrained sparse linear regression}, year = {2015}, } @inproceedings{steinhardt2012flexible, author = {Jacob Steinhardt and Zoubin Ghahramani}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, title = {Flexible martingale priors for deep hierarchies}, year = {2012}, } @inproceedings{steinhardt2011finite, author = {Jacob Steinhardt and Russ Tedrake}, booktitle = {Robotics: Science and Systems (RSS)}, title = {Finite-time regional verification of stochastic nonlinear systems}, year = {2011}, } @article{steinhardt2010permutations, author = {Jacob Steinhardt}, journal = {Electronic Journal of Combinatorics}, title = {Permutations with ascending and descending blocks}, volume = {17}, year = {2010}, } @article{steinhardt2009coloring, author = {Jacob Steinhardt}, journal = {Electronic Journal of Combinatorics}, title = {On coloring the odd-distance graph}, volume = {16}, year = {2009}, } @inproceedings{balcan2008discriminative, author = {Maria-Florina Balcan and Avrim Blum and Santosh Vempala}, booktitle = {Symposium on Theory of Computing (STOC)}, pages = {671--680}, title = {A discriminative framework for clustering via similarity functions}, year = {2008}, } @inproceedings{newell2014practicality, author = {Andrew Newell and Rahul Potharaju and Luojie Xiang and Cristina Nita-Rotaru}, booktitle = {Workshop on Artificial Intelligence and Security (AISec)}, pages = {83--93}, title = {On the practicality of integrity attacks on document-level sentiment analysis}, year = {2014}, } @article{biggio2014security, author = {Battista Biggio 
and Giorgio Fumera and Fabio Roli}, journal = {IEEE Transactions on Knowledge and Data Engineering}, number = {4}, pages = {984--996}, title = {Security evaluation of pattern classifiers under attack}, volume = {26}, year = {2014}, } @article{laishram2016curie, author = {Ricky Laishram and Vir Virander Phoha}, journal = {arXiv}, title = {Curie: A method for protecting {SVM} Classifier from Poisoning Attack}, year = {2016}, } @article{barreno2010security, author = {Marco Barreno and Blaine Nelson and Anthony D. Joseph and J. D. Tygar}, journal = {Machine Learning}, number = {2}, pages = {121--148}, title = {The security of machine learning}, volume = {81}, year = {2010}, } @inproceedings{park2017resilient, author = {Sangdon Park and James Weimer and Insup Lee}, booktitle = {International Conference on Cyber-Physical Systems}, pages = {155--164}, title = {Resilient linear classification: an approach to deal with attacks on training data}, year = {2017}, } @article{liu2016teaching, author = {Ji Liu and Xiaojin Zhu}, journal = {Journal of Machine Learning Research (JMLR)}, number = {162}, title = {The Teaching Dimension of Linear Learners}, volume = {17}, year = {2016}, } @inproceedings{cretu2008casting, author = {Gabriela F. Cretu and Angelos Stavrou and Michael E. Locasto and Salvatore J. Stolfo and Angelos D. 
Keromytis}, booktitle = {IEEE Symposium on Security and Privacy}, pages = {81--95}, title = {Casting out demons: Sanitizing training data for anomaly sensors}, year = {2008}, } @article{papernot2016towards, author = {Nicolas Papernot and Patrick McDaniel and Arunesh Sinha and Michael Wellman}, journal = {arXiv}, title = {Towards the Science of Security and Privacy in Machine Learning}, year = {2016}, } @article{gardiner2016security, author = {Joseph Gardiner and Shishir Nagaraja}, journal = {ACM Computing Surveys (CSUR)}, number = {3}, title = {On the Security of Machine Learning in Malware {C\&C} Detection: A Survey}, volume = {49}, year = {2016}, } @inproceedings{carlini2016hidden, author = {Nicholas Carlini and Pratyush Mishra and Tavish Vaidya and Yuankai Zhang and Micah Sherr and Clay Shields and David Wagner and Wenchao Zhou}, booktitle = {USENIX Security}, title = {Hidden voice commands}, year = {2016}, } @article{kurakin2016adversarial, author = {Alexey Kurakin and Ian Goodfellow and Samy Bengio}, journal = {arXiv}, title = {Adversarial examples in the physical world}, year = {2016}, } @article{papernot2016transferability, author = {Nicolas Papernot and Patrick McDaniel and Ian Goodfellow}, journal = {arXiv}, title = {Transferability in machine learning: from phenomena to black-box attacks using adversarial samples}, year = {2016}, } @inproceedings{xiao2012adversarial, author = {Han Xiao and Huang Xiao and Claudia Eckert}, booktitle = {European Conference on Artificial Intelligence}, title = {Adversarial Label Flips Attack on Support Vector Machines}, year = {2012}, } @article{xiao2015contamination, author = {Huang Xiao and Battista Biggio and Blaine Nelson and Han Xiao and Claudia Eckert and Fabio Roli}, journal = {Neurocomputing}, pages = {53--62}, title = {Support vector machines under adversarial label contamination}, volume = {160}, year = {2015}, } @inproceedings{li2016data, author = {Bo Li and Yining Wang and Aarti Singh and Yevgeniy Vorobeychik}, 
booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Data Poisoning Attacks on Factorization-Based Collaborative Filtering}, year = {2016}, } @inproceedings{biggio2014securitysvm, author = {Battista Biggio and Igino Corona and Blaine Nelson and Benjamin Rubinstein and Davide Maiorca and Giorgio Fumera and Giorgio Giacinto and Fabio Roli}, booktitle = {Support Vector Machines Applications}, title = {Security evaluation of support vector machines in adversarial environments}, year = {2014}, } @inproceedings{biggio2014malware, author = {Battista Biggio and Konrad Rieck and Davide Ariu and Christian Wressnegger and Igino Corona and Giorgio Giacinto and Fabio Roli}, booktitle = {Workshop on Artificial Intelligence and Security (AISec)}, title = {Poisoning behavioral malware clustering}, year = {2014}, } @inproceedings{biggio2013clustering, author = {Battista Biggio and Ignazio Pillai and Samuel Rota Bul{\`o} and Davide Ariu and Marcello Pelillo and Fabio Roli}, booktitle = {Workshop on Artificial Intelligence and Security (AISec)}, title = {Is data clustering in adversarial settings secure?}, year = {2013}, } @inproceedings{biggio2014linkage, author = {Battista Biggio and Bul{\`o}, Samuel Rota and Pillai, Ignazio and Mura, Michele and Mequanint, Eyasu Zemene and Pelillo, Marcello and Roli, Fabio}, booktitle = {Workshop on Structural, Syntactic, and Statistical Pattern Recognition}, title = {Poisoning Complete-Linkage Hierarchical Clustering}, year = {2014}, } @article{yang2017generative, author = {Chaofei Yang and Qing Wu and Hai Li and Yiran Chen}, journal = {arXiv}, title = {Generative Poisoning Attack Method Against Neural Networks}, year = {2017}, } @comment{laskov2014practical: the second author's surname takes a caron on the initial letter and an acute accent on the final letter, both written as brace-wrapped special characters; the venue name matches the other entries for the same symposium in this file.} @inproceedings{laskov2014practical, author = {Pavel Laskov and Nedim {\v{S}}rndi{\'c}}, booktitle = {IEEE Symposium on Security and Privacy}, title = {Practical evasion of a learning-based classifier: A case study}, year = {2014}, } @inproceedings{xiao2015lasso, author = {Huang Xiao and Battista 
Biggio and Gavin Brown and Giorgio Fumera and Claudia Eckert and Fabio Roli}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Is Feature Selection Secure against Training Data Poisoning?}, year = {2015}, } @inproceedings{burkard2017analysis, author = {Cody Burkard and Brent Lagesse}, booktitle = {International Workshop on Security And Privacy Analytics}, title = {Analysis of Causative Attacks against {SVM}s Learning from Data Streams}, year = {2017}, } @phdthesis{wang2016combating, author = {Gang Wang}, school = {University of California Santa Barbara}, title = {Combating Attacks and Abuse in Large Online Communities}, year = {2016}, } @inproceedings{zhou2016modeling, author = {Yan Zhou and Murat Kantarcioglu}, booktitle = {Pacific-Asia Conference on Knowledge Discovery and Data Mining}, title = {Modeling Adversarial Learning as Nested {S}tackelberg Games}, year = {2016}, } @inproceedings{bruckner2011stackelberg, author = {Michael Br{\"u}ckner and Tobias Scheffer}, booktitle = {SIGKDD}, pages = {547--555}, title = {{S}tackelberg games for adversarial prediction problems}, year = {2011}, } @article{bruckner2012static, author = {Michael Br{\"u}ckner and Christian Kanzow and Tobias Scheffer}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {2617--2654}, title = {Static prediction games for adversarial learning problems}, volume = {13}, year = {2012}, } @article{klivans2009learning, author = {Adam R. Klivans and Philip M. Long and Rocco A. Servedio}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {2715--2740}, title = {Learning halfspaces with malicious noise}, volume = {10}, year = {2009}, } @inproceedings{awasthi2014power, author = {Pranjal Awasthi and Maria Florina Balcan and Philip M. 
Long}, booktitle = {Symposium on Theory of Computing (STOC)}, pages = {449--458}, title = {The power of localization for efficiently learning linear separators with noise}, year = {2014}, } @inproceedings{balcan2009agnostic, author = {Maria Florina Balcan and Heiko R{\"o}glin and Shang-Hua Teng}, booktitle = {International Conference on Algorithmic Learning Theory}, pages = {384--398}, title = {Agnostic clustering}, year = {2009}, } @inproceedings{kushagra2016finding, author = {Shrinu Kushagra and Samira Samadi and Shai Ben-David}, booktitle = {International Conference on Algorithmic Learning Theory}, pages = {339--354}, title = {Finding Meaningful Cluster Structure Amidst Background Noise}, year = {2016}, } @article{nguyen2013exact, author = {Nam H. Nguyen and Trac D. Tran}, journal = {IEEE Transactions on Information Theory}, number = {4}, pages = {2017--2035}, title = {Exact Recoverability From Dense Corrupted Observations via $\ell_1$-Minimization}, volume = {59}, year = {2013}, } @inproceedings{nasrabadi2011robust, author = {Nasser M. Nasrabadi and Trac D. Tran and Nam Nguyen}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Robust lasso with missing and grossly corrupted observations}, year = {2011}, } @inproceedings{newsome2006paragraph, author = {James Newsome and Brad Karp and Dawn Song}, booktitle = {International Workshop on Recent Advances in Intrusion Detection}, title = {Paragraph: Thwarting signature learning by training maliciously}, year = {2006}, } @inproceedings{rubinstein2009antidote, author = {Benjamin Rubinstein and Blaine Nelson and Ling Huang and Anthony D. 
Joseph and Shing-Hon Lau and Satish Rao and Nina Taft and JD Tygar}, booktitle = {ACM SIGCOMM Conference on Internet measurement conference}, title = {Antidote: Understanding and defending against poisoning of anomaly detectors}, year = {2009}, } @article{mozaffari2015systematic, author = {Mehran Mozaffari-Kermani and Susmita Sur-Kolay and Anand Raghunathan and Niraj K. Jha}, journal = {IEEE Journal of Biomedical and Health Informatics}, number = {6}, pages = {1893--1905}, title = {Systematic poisoning attacks on and defenses for machine learning in healthcare}, volume = {19}, year = {2015}, } @book{bard1999, author = {Jonathan F. Bard}, publisher = {Springer}, title = {Practical Bilevel Optimization: Algorithms and Applications}, year = {1999}, } @article{huang2017adversarial, author = {Sandy Huang and Nicolas Papernot and Ian Goodfellow and Yan Duan and Pieter Abbeel}, journal = {arXiv}, title = {Adversarial attacks on neural network policies}, year = {2017}, } @article{lin2017tactics, author = {Yen-Chen Lin and Zhang-Wei Hong and Yuan-Hong Liao and Meng-Li Shih and Ming-Yu Liu and Min Sun}, journal = {arXiv}, title = {Tactics of Adversarial Attack on Deep Reinforcement Learning Agents}, year = {2017}, } @article{behzadan2017vulnerability, author = {Vahid Behzadan and Arslan Munir}, journal = {arXiv}, title = {Vulnerability of Deep Reinforcement Learning to Policy Induction Attacks}, year = {2017}, } @inproceedings{kakade2009complexity, author = {Sham M. 
Kakade and Karthik Sridharan and Ambuj Tewari}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {On the complexity of linear prediction: Risk bounds, margin bounds, and regularization}, year = {2009}, } @article{xiao2010rda, author = {Lin Xiao}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {2543--2596}, title = {Dual Averaging Methods for Regularized Stochastic Learning and Online Optimization}, volume = {11}, year = {2010}, } @inproceedings{maas2011imdb, author = {Andrew L. Maas and Raymond E. Daly and Peter T. Pham and Dan Huang and Andrew Y. Ng and Christopher Potts}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Learning Word Vectors for Sentiment Analysis}, year = {2011}, } @misc{gurobi2016, author = {{{Gurobi {Optimization}, Inc.}}}, title = {Gurobi Optimizer Reference Manual}, year = {2016}, } @inproceedings{metsis2006spam, author = {Vangelis Metsis and Ion Androutsopoulos and Georgios Paliouras}, booktitle = {CEAS}, pages = {28--69}, title = {Spam Filtering with Naive {B}ayes -- Which Naive {B}ayes?}, volume = {17}, year = {2006}, } @inproceedings{tramer2016stealing, author = {Florian Tram{\`e}r and Fan Zhang and Ari Juels and Michael K. 
Reiter and Thomas Ristenpart}, booktitle = {USENIX Security}, title = {Stealing machine learning models via prediction {API}s}, year = {2016}, } @article{kerckhoffs1883security, author = {Auguste Kerckhoffs}, journal = {Journal des sciences militaires}, title = {La cryptographie militaire}, volume = {9}, year = {1883}, } @inproceedings{dosovitskiy2016inverting, author = {Alexey Dosovitskiy and Thomas Brox}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, title = {Inverting visual representations with convolutional networks}, year = {2016}, } @inproceedings{mahendran2015understanding, author = {Aravindh Mahendran and Andrea Vedaldi}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, title = {Understanding deep image representations by inverting them}, year = {2015}, } @inproceedings{lofberg2004, author = {Johan L{\"{o}}fberg}, booktitle = {CACSD}, title = {{YALMIP}: A Toolbox for Modeling and Optimization in {MATLAB}}, year = {2004}, } @article{sturm1999guide, author = {Jos F. Sturm}, journal = {Optimization Methods and Software}, pages = {625--653}, title = {Using {SeDuMi} 1.02, a {MATLAB} toolbox for optimization over symmetric cones}, volume = {11}, year = {1999}, } @inproceedings{balakrishnan2017sparse, author = {Sivaraman Balakrishnan and Simon S. Du and Jerry Li and Aarti Singh}, booktitle = {Conference on Learning Theory (COLT)}, pages = {169--212}, title = {Computationally Efficient Robust Sparse Estimation in High Dimensions}, year = {2017}, } @article{diakonikolas2017learning, author = {Ilias Diakonikolas and Daniel M. Kane and Alistair Stewart}, journal = {arXiv}, title = {Learning Geometric Concepts with Nasty Noise}, year = {2017}, } @article{diakonikolas2017robustly, author = {Ilias Diakonikolas and Gautam Kamath and Daniel M. 
Kane and Jerry Li and Ankur Moitra and Alistair Stewart}, journal = {arXiv}, title = {Robustly Learning a {G}aussian: Getting Optimal Error, Efficiently}, year = {2017}, } @article{diakonikolas2016bayes, author = {Ilias Diakonikolas and Daniel Kane and Alistair Stewart}, journal = {arXiv}, title = {Robust learning of fixed-structure {B}ayesian networks}, year = {2016}, } @article{diakonikolas2016statistical, author = {Ilias Diakonikolas and Daniel M. Kane and Alistair Stewart}, journal = {arXiv}, title = {Statistical query lower bounds for robust estimation of high-dimensional {G}aussians and {G}aussian mixtures}, year = {2016}, } @article{kane2017robust, author = {Daniel Kane and Sushrut Karmalkar and Eric Price}, journal = {arXiv}, title = {Robust polynomial regression up to the information theoretic limit}, year = {2017}, } @comment{you2017provable: the acute accent in the last author's given name needs the backslash accent command; without it the apostrophe is typeset literally.} @article{you2017provable, author = {Chong You and Daniel P. Robinson and Ren{\'e} Vidal}, journal = {arXiv}, title = {Provable Self-Representation Based Outlier Detection in a Union of Subspaces}, year = {2017}, } @article{ashtiani2017sample, author = {Hassan Ashtiani and Shai Ben-David and Abbas Mehrabian}, journal = {arXiv}, title = {Sample-Efficient Learning of Mixtures}, year = {2017}, } @article{li2017sparse, author = {Jerry Li}, journal = {arXiv}, title = {Robust Sparse Estimation Tasks in High Dimensions}, year = {2017}, } @inproceedings{li2017robust, author = {Jerry Li and Ludwig Schmidt}, booktitle = {Conference on Learning Theory (COLT)}, pages = {1302--1382}, title = {Robust and Proper Learning for Mixtures of {G}aussians via Systems of Polynomial Inequalities}, year = {2017}, } @article{meister2017data, author = {Michela Meister and Gregory Valiant}, journal = {arXiv}, title = {A Data Prism: Semi-Verified Learning in the Small-Alpha Regime}, year = {2017}, } @article{khintchine1923uber, author = {Aleksandr Khintchine}, journal = {Mathematische Zeitschrift}, pages = {109--116}, title = {{\"U}ber dyadische Br{\"u}che}, volume = {18}, 
year = {1923}, } @inproceedings{raz2016fast, author = {Ran Raz}, booktitle = {Foundations of Computer Science (FOCS)}, pages = {266--275}, title = {Fast learning requires good memory: {A} time-space lower bound for parity learning}, year = {2016}, } @inproceedings{raz2017time, author = {Ran Raz}, booktitle = {ECCC}, title = {A Time-Space Lower Bound for a Large Class of Learning Problems}, volume = {24}, year = {2017}, } @inproceedings{moshkovitz2017mixing, author = {Dana Moshkovitz and Michal Moshkovitz}, booktitle = {Conference on Learning Theory (COLT)}, title = {Mixing implies lower bounds for space bounded learning}, year = {2017}, } @inproceedings{kol2016time, author = {Gillat Kol and Ran Raz and Avishay Tal}, booktitle = {ECCC}, title = {Time-Space Hardness of Learning Sparse Parities}, volume = {23}, year = {2016}, } @article{beame2017time, author = {Paul Beame and Shayan Oveis Gharan and Xin Yang}, journal = {arXiv}, title = {Time-Space Tradeoffs for Learning from Small Test Spaces: Learning Low Degree Polynomial Functions}, year = {2017}, } @article{garg2017extractor, author = {Sumegha Garg and Ran Raz and Avishay Tal}, journal = {arXiv}, title = {Extractor-Based Time-Space Lower Bounds for Learning}, year = {2017}, } @article{steinhardt2017clique, author = {Jacob Steinhardt}, journal = {arXiv}, title = {Does robustness imply tractability? 
{A} lower bound for planted clique in the semi-random model}, year = {2017}, } @article{madry2017towards, author = {Aleksander Madry and Aleksandar Makelov and Ludwig Schmidt and Dimitris Tsipras and Adrian Vladu}, journal = {arXiv}, title = {Towards deep learning models resistant to adversarial attacks (published at {ICLR} 2018)}, year = {2017}, } @inproceedings{madry2018towards, author = {Aleksander Madry and Aleksandar Makelov and Ludwig Schmidt and Dimitris Tsipras and Adrian Vladu}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Towards deep learning models resistant to adversarial attacks}, year = {2018}, } @article{carlini2017adversarial, author = {Nicholas Carlini and David Wagner}, journal = {arXiv}, title = {Adversarial Examples Are Not Easily Detected: Bypassing Ten Detection Methods}, year = {2017}, } @article{evtimov2017robust, author = {Ivan Evtimov and Kevin Eykholt and Earlence Fernandes and Tadayoshi Kohno and Bo Li and Atul Prakash and Amir Rahmati and Dawn Song}, journal = {arXiv}, title = {Robust Physical-World Attacks on Machine Learning Models}, year = {2017}, } @article{xu2017feature, author = {Weilin Xu and David Evans and Yanjun Qi}, journal = {arXiv}, title = {Feature Squeezing: Detecting Adversarial Examples in Deep Neural Networks}, year = {2017}, } @article{kos2017adversarial, author = {Jernej Kos and Ian Fischer and Dawn Song}, journal = {arXiv}, title = {Adversarial examples for generative models}, year = {2017}, } @inproceedings{papernot2016distillation, author = {Nicolas Papernot and Patrick McDaniel and Xi Wu and Somesh Jha and Ananthram Swami}, booktitle = {IEEE Symposium on Security and Privacy}, pages = {582--597}, title = {Distillation as a defense to adversarial perturbations against deep neural networks}, year = {2016}, } @article{carlini2016defensive, author = {Nicholas Carlini and David Wagner}, journal = {arXiv}, title = {Defensive distillation is not robust to adversarial examples}, 
year = {2016},
}

@inproceedings{papernot2017practical,
  author = {Nicolas Papernot and Patrick McDaniel and Ian Goodfellow and Somesh Jha and Berkay Z. Celik and Ananthram Swami},
  title = {Practical black-box attacks against machine learning},
  booktitle = {Asia Conference on Computer and Communications Security},
  pages = {506--519},
  year = {2017},
}

@book{russell1991right,
  author = {Stuart Russell and Eric Wefald},
  title = {Do the right thing: studies in limited rationality},
  publisher = {MIT Press},
  year = {1991},
}

% daspremont2008smooth: the surname is written with a plain apostrophe. The
% previous value used an accent command with no letter to accent, which is
% not valid LaTeX for an apostrophe.
@article{daspremont2008smooth,
  author = {Alexandre d'Aspremont},
  title = {Smooth optimization with approximate gradient},
  journal = {SIAM Journal on Optimization},
  volume = {19},
  number = {3},
  pages = {1171--1183},
  year = {2008},
}

@article{devolder2014first,
  author = {Olivier Devolder and Fran{\c{c}}ois Glineur and Yurii Nesterov},
  title = {First-order methods of smooth convex optimization with inexact oracle},
  journal = {Mathematical Programming},
  volume = {146},
  pages = {37--75},
  year = {2014},
}

@article{narodytska2017verifying,
  author = {Nina Narodytska and Shiva Prasad Kasiviswanathan and Leonid Ryzhyk and Mooly Sagiv and Toby Walsh},
  title = {Verifying Properties of Binarized Deep Neural Networks},
  journal = {arXiv preprint arXiv:1709.06662},
  year = {2017},
}

@article{adamczak2015concentration,
  author = {Rados{\l{}}aw Adamczak and Pawe{\l{}} Wolff},
  title = {Concentration inequalities for non-{L}ipschitz functions with bounded derivatives of higher order},
  journal = {Probability Theory and Related Fields},
  volume = {162},
  pages = {531--586},
  year = {2015},
}

@article{latala2006estimates,
  author = {Rafa{\l{}} Lata{\l{}}a},
  title = {Estimates of moments and tails of {G}aussian chaoses},
  journal = {The Annals of Probability},
  volume = {34},
  number = {6},
  pages = {2315--2331},
  year = {2006},
}

@incollection{bakry1985diffusions,
  author = {Dominique Bakry and Michel {\'E}mery},
  booktitle = {S{\'e}minaire de Probabilit{\'e}s XIX 1983/84},
  pages =
{177--206},
  title = {Diffusions hypercontractives},
  year = {1985},
}

@article{bardet2018functional,
  author = {Jean-Baptiste Bardet and Natha{\"e}l Gozlan and Florent Malrieu and Pierre-Andr{\'e} Zitt},
  title = {Functional inequalities for {G}aussian convolutions of compactly supported measures: explicit bounds and dimension dependence},
  journal = {Bernoulli},
  volume = {24},
  pages = {333--353},
  year = {2018},
}

@article{gromov1983topological,
  author = {Mikhail Gromov and Vitali D. Milman},
  title = {A topological application of the isoperimetric inequality},
  journal = {American Journal of Mathematics},
  volume = {105},
  number = {4},
  pages = {843--854},
  year = {1983},
}

@article{bobkov1997poincare,
  author = {S. Bobkov and M. Ledoux},
  title = {{P}oincar{\'e}'s inequalities and {T}alagrand's concentration phenomenon for the exponential distribution},
  journal = {Probability Theory and Related Fields},
  volume = {107},
  number = {3},
  pages = {383--400},
  year = {1997},
}

@inproceedings{carlini2017towards,
  author = {Nicholas Carlini and David Wagner},
  title = {Towards evaluating the robustness of neural networks},
  booktitle = {IEEE Symposium on Security and Privacy},
  pages = {39--57},
  year = {2017},
}

@inproceedings{sivaraman2014experimental,
  author = {Anirudh Sivaraman and Keith Winstein and Pratiksha Thaker and Hari Balakrishnan},
  title = {An Experimental Study of the Learnability of Congestion Control},
  booktitle = {SIGCOMM},
  year = {2014},
}

@inproceedings{winstein2013tcp,
  author = {Keith Winstein and Hari Balakrishnan},
  title = {{TCP} ex Machina: Computer-Generated Congestion Control},
  booktitle = {SIGCOMM},
  year = {2013},
}

@article{bernardo2003variational,
  author = {Matthew J. Beal and Zoubin Ghahramani},
  title = {The variational {B}ayesian {EM} algorithm for incomplete data: with application to scoring graphical model structures},
  journal = {Bayesian Statistics},
  year = {2003},
}

@article{mackey2014matrix,
  author = {Lester Mackey and Michael I. Jordan and Richard Y.
Chen and Brendan Farrell and Joel A. Tropp},
  journal = {The Annals of Probability},
  number = {3},
  pages = {906--945},
  title = {Matrix concentration inequalities via the method of exchangeable pairs},
  volume = {42},
  year = {2014},
}

@article{tropp2015introduction,
  author = {Joel A. Tropp},
  title = {An introduction to matrix concentration inequalities},
  journal = {Foundations and Trends in Machine Learning},
  volume = {8},
  pages = {1--230},
  year = {2015},
}

@inproceedings{moitra2010settling,
  author = {Ankur Moitra and Gregory Valiant},
  title = {Settling the polynomial learnability of mixtures of {G}aussians},
  booktitle = {Foundations of Computer Science (FOCS)},
  year = {2010},
}

@inproceedings{belkin2010polynomial,
  author = {Mikhail Belkin and Kaushik Sinha},
  title = {Polynomial learning of distribution families},
  booktitle = {Foundations of Computer Science (FOCS)},
  year = {2010},
}

@inproceedings{bhaskara2014uniqueness,
  author = {Aditya Bhaskara and Moses Charikar and Aravindan Vijayaraghavan},
  title = {Uniqueness of tensor decompositions with applications to polynomial identifiability},
  booktitle = {Conference on Learning Theory (COLT)},
  year = {2014},
}

@inproceedings{goyal2014fourier,
  author = {Navin Goyal and Santosh Vempala and Ying Xiao},
  title = {Fourier {PCA} and robust tensor decomposition},
  booktitle = {Symposium on Theory of Computing (STOC)},
  year = {2014},
}

@inproceedings{ge2015learning,
  author = {Rong Ge and Qingqing Huang and Sham M.
Kakade},
  booktitle = {Symposium on Theory of Computing (STOC)},
  title = {Learning mixtures of {G}aussians in high dimensions},
  year = {2015},
}

@inproceedings{bhaskara2014smoothed,
  author = {Aditya Bhaskara and Moses Charikar and Ankur Moitra and Aravindan Vijayaraghavan},
  title = {Smoothed analysis of tensor decompositions},
  booktitle = {Symposium on Theory of Computing (STOC)},
  year = {2014},
}

@inproceedings{anderson2014blessing,
  author = {Joseph Anderson and Mikhail Belkin and Navin Goyal and Luis Rademacher and James R. Voss},
  title = {The more, the merrier: the blessing of dimensionality for learning large {G}aussian mixtures},
  booktitle = {Conference on Learning Theory (COLT)},
  year = {2014},
}

@book{bishop2002art,
  author = {Matthew A. Bishop},
  title = {The art and science of computer security},
  publisher = {Addison-Wesley Longman Publishing Co., Inc.},
  year = {2002},
}

@article{johnson1978densest,
  author = {D. S. Johnson and F. P. Preparata},
  title = {The densest hemisphere problem},
  journal = {Theoretical Computer Science},
  volume = {6},
  pages = {93--107},
  year = {1978},
}

@inproceedings{tukey1975mathematics,
  author = {John W. Tukey},
  title = {Mathematics and picturing of data},
  booktitle = {ICM},
  volume = {6},
  pages = {523--531},
  year = {1975},
}

@inproceedings{knight2006unsupervised,
  author = {Kevin Knight and Anish Nair and Nishit Rathod and Kenji Yamada},
  title = {Unsupervised analysis for decipherment problems},
  booktitle = {Association for Computational Linguistics (ACL)},
  year = {2006},
}

@article{manski1988identification,
  author = {Charles F. Manski},
  title = {Identification of binary response models},
  journal = {Journal of the American Statistical Association (JASA)},
  volume = {83},
  number = {403},
  pages = {729--738},
  year = {1988},
}

@article{manski1985semiparametric,
  author = {Charles F.
Manski},
  journal = {Journal of Econometrics},
  number = {3},
  pages = {313--333},
  title = {Semiparametric analysis of discrete response: Asymptotic properties of the maximum score estimator},
  volume = {27},
  year = {1985},
}

@article{newey1994asymptotic,
  author = {Whitney K. Newey},
  title = {The asymptotic variance of semiparametric estimators},
  journal = {Econometrica: Journal of the Econometric Society},
  pages = {1349--1382},
  year = {1994},
}

% adelman2008sixth: removed the stray comma after "Bailer-Jones". A trailing
% comma makes BibTeX read the whole name as a surname with an empty first name
% and emit a "comma at the end" warning. The compound surname
% "Allende Prieto" is braced so it is not split into given name + surname.
@article{adelman2008sixth,
  author = {Jennifer K. Adelman-McCarthy and Marcel A. Ag{\"u}eros and Sahar S. Allam and Carlos {Allende Prieto} and Kurt S. J. Anderson and Scott F. Anderson and James Annis and Neta A. Bahcall and C. A. L. Bailer-Jones and Ivan K. Baldry and others},
  title = {The sixth data release of the {S}loan digital sky survey},
  journal = {The Astrophysical Journal Supplement Series},
  volume = {175},
  number = {2},
  year = {2008},
}

% mcmahan2013ad: first author's given names reordered to "H. Brendan" and the
% unnecessary brace inside the surname dropped (author names are not recased).
% NOTE(review): name order taken from the published paper -- confirm.
@inproceedings{mcmahan2013ad,
  author = {H. Brendan McMahan and Gary Holt and D Sculley and Michael Young and Dietmar Ebner and Julian Grady and Lan Nie and Todd Phillips and Eugene Davydov and Daniel Golovin and others},
  title = {Ad click prediction: a view from the trenches},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  year = {2013},
}

@article{assouad1983deux,
  author = {Patrice Assouad},
  title = {Deux remarques sur l'estimation},
  journal = {Comptes rendus des s{\'e}ances de l'Acad{\'e}mie des sciences. S{\'e}rie 1, Math{\'e}matique},
  volume = {296},
  number = {23},
  pages = {1021--1024},
  year = {1983},
}

@article{maronna1976robust,
  author = {Ricardo A. Maronna},
  title = {Robust estimation of multivariate location and scatter},
  journal = {Annals of Statistics},
  volume = {4},
  number = {1},
  pages = {51--67},
  year = {1976},
}

@article{gordon1993novel,
  author = {Neil J. Gordon and David J. Salmond and Adrian F. M.
Smith},
  journal = {IEE Proceedings F (Radar and Signal Processing)},
  number = {2},
  pages = {107--113},
  title = {Novel approach to nonlinear/non-{G}aussian {B}ayesian state estimation},
  volume = {140},
  year = {1993},
}

% gilks2001following: the dash in the title is punctuation, so it is written
% as an em dash (---) rather than an en dash (--).
@article{gilks2001following,
  author = {Walter R. Gilks and Carlo Berzuini},
  title = {Following a moving target---{M}onte {C}arlo inference for dynamic {B}ayesian models},
  journal = {Journal of the Royal Statistical Society: Series B (Statistical Methodology)},
  volume = {63},
  number = {1},
  pages = {127--146},
  year = {2001},
}

@article{lin2013lookahead,
  author = {Ming Lin and Rong Chen and Jun S. Liu},
  title = {Lookahead strategies for sequential {M}onte {C}arlo},
  journal = {Statistical Science},
  volume = {28},
  number = {1},
  pages = {69--94},
  year = {2013},
}

% doucet2000sequential, metropolis1953equation: journal names restored to
% title case; standard styles print the journal field verbatim.
@article{doucet2000sequential,
  author = {Arnaud Doucet and Simon Godsill and Christophe Andrieu},
  title = {On sequential {M}onte {C}arlo sampling methods for {B}ayesian filtering},
  journal = {Statistics and Computing},
  volume = {10},
  number = {3},
  pages = {197--208},
  year = {2000},
}

@article{metropolis1953equation,
  author = {Nicholas Metropolis and Arianna W. Rosenbluth and Marshall N. Rosenbluth and Augusta H. Teller and Edward Teller},
  title = {Equation of state calculations by fast computing machines},
  journal = {The Journal of Chemical Physics},
  volume = {21},
  number = {6},
  pages = {1087--1092},
  year = {1953},
}

@article{hastings1970monte,
  author = {Keith W. Hastings},
  title = {{M}onte {C}arlo sampling methods using {M}arkov chains and their applications},
  journal = {Biometrika},
  volume = {57},
  number = {1},
  pages = {97--109},
  year = {1970},
}

@inproceedings{minka2001ep,
  author = {Thomas P. Minka},
  title = {Expectation propagation for approximate {B}ayesian inference},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  pages = {362--369},
  year = {2001},
}

@article{geyer1995annealing,
  author = {Charles J. Geyer and Elizabeth A.
Thompson},
  journal = {Journal of the American Statistical Association (JASA)},
  pages = {909--920},
  title = {Annealing {M}arkov chain {M}onte {C}arlo with applications to ancestral inference},
  volume = {90},
  year = {1995},
}
% geyer1995annealing: journal spelled with the "(JASA)" suffix, following the
% "Full Name (ACRONYM)" venue convention used elsewhere in this file.

% halpern2011dealing, fagin1987belief: journal name restored to title case;
% standard styles print the journal field verbatim.
@article{halpern2011dealing,
  author = {Joseph Y. Halpern and Riccardo Pucella},
  title = {Dealing with logical omniscience: Expressiveness and pragmatics},
  journal = {Artificial Intelligence},
  volume = {175},
  pages = {220--235},
  year = {2011},
}

@article{fagin1987belief,
  author = {Ronald Fagin and Joseph Y. Halpern},
  title = {Belief, awareness, and limited reasoning},
  journal = {Artificial Intelligence},
  volume = {34},
  pages = {39--76},
  year = {1987},
}

@article{hintikka1975impossible,
  author = {Jaakko Hintikka},
  title = {Impossible Possible Worlds Vindicated},
  journal = {Journal of Philosophical Logic},
  volume = {4},
  number = {4},
  year = {1975},
}

@article{donoho1992breakdown,
  author = {David L. Donoho and Miriam Gasko},
  title = {Breakdown properties of location estimates based on halfspace depth and projected outlyingness},
  journal = {Annals of Statistics},
  volume = {20},
  number = {4},
  pages = {1803--1827},
  year = {1992},
}

% donoho1982breakdown: standard styles ignore a "school" field on a misc
% entry, so the institution is folded into howpublished, which is printed.
@misc{donoho1982breakdown,
  author = {David L. Donoho},
  title = {Breakdown properties of multivariate location estimators},
  howpublished = {Ph.D.~qualifying paper, Department of Statistics, Harvard University},
  year = {1982},
}

@phdthesis{hampel1968thesis,
  author = {Frank R.
Hampel},
  school = {University of California at Berkeley},
  title = {Contributions to the theory of robust estimation},
  year = {1968},
}

@inproceedings{shivaswamy2010empirical,
  author = {Pannagadatta Shivaswamy and Tony Jebara},
  title = {Empirical {B}ernstein boosting},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  pages = {733--740},
  year = {2010},
}

@inproceedings{namkoong2017variance,
  author = {Hongseok Namkoong and John Duchi},
  title = {Variance regularization with convex objectives},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  year = {2017},
}

@article{berk2017convex,
  author = {Richard Berk and Hoda Heidari and Shahin Jabbari and Matthew Joseph and Michael Kearns and Jamie Morgenstern and Seth Neel and Aaron Roth},
  title = {A convex framework for fair regression},
  journal = {arXiv preprint arXiv:1706.02409},
  year = {2017},
}

@article{kim2018fairness,
  author = {Michael P Kim and Omer Reingold and Guy N Rothblum},
  title = {Fairness Through Computationally-Bounded Awareness},
  journal = {arXiv preprint arXiv:1803.03239},
  year = {2018},
}

% angwin2016machine: the typographic (non-ASCII) apostrophe in "There's" is
% replaced by the ASCII apostrophe, which LaTeX typesets as the same glyph and
% which 8-bit BibTeX handles safely.
@article{angwin2016machine,
  author = {Julia Angwin and Jeff Larson and Surya Mattu and Lauren Kirchner},
  journal = {ProPublica},
  title = {Machine bias: There's software used across the country to predict future criminals.
and it's biased against blacks},
  volume = {23},
  year = {2016},
}
% Entry closed above: the typographic (non-ASCII) apostrophe in "it's" is
% replaced by the ASCII apostrophe, which LaTeX typesets as the same glyph and
% which 8-bit BibTeX handles safely.

@article{waddell2016algorithms,
  author = {Kaveh Waddell},
  title = {How algorithms can bring down minorities' credit scores},
  journal = {The Atlantic},
  year = {2016},
}

@inproceedings{corbett2017algorithmic,
  author = {Sam Corbett-Davies and Emma Pierson and Avi Feller and Sharad Goel and Aziz Huq},
  title = {Algorithmic decision making and the cost of fairness},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {797--806},
  year = {2017},
}

@article{binns2018fairness,
  author = {Reuben Binns},
  title = {Fairness in Machine Learning: Lessons from Political Philosophy},
  journal = {Journal of Machine Learning Research (JMLR)},
  volume = {81},
  pages = {1--11},
  year = {2018},
}

@inproceedings{athalye2018obfuscated,
  author = {Anish Athalye and Nicholas Carlini and David Wagner},
  title = {Obfuscated gradients give a false sense of security: Circumventing defenses to adversarial examples},
  booktitle = {International Conference on Machine Learning (ICML)},
  year = {2018},
}

@inproceedings{sinha2018certifiable,
  author = {Aman Sinha and Hongseok Namkoong and John Duchi},
  title = {Certifiable Distributional Robustness with Principled Adversarial Training},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year = {2018},
}

@article{lu2017no,
  author = {Jiajun Lu and Hussein Sibai and Evan Fabry and David Forsyth},
  title = {No need to worry about adversarial examples in object detection in autonomous vehicles},
  journal = {arXiv preprint arXiv:1707.03501},
  year = {2017},
}

@article{athalye2017synthesizing,
  author = {Anish Athalye and Ilya Sutskever},
  title = {Synthesizing robust adversarial examples},
  journal = {arXiv preprint arXiv:1707.07397},
  year = {2017},
}

@article{weng2018towards,
  author = {Tsui-Wei Weng and Huan Zhang and Hongge Chen and Zhao Song and Cho-Jui Hsieh and Duane Boning and Inderjit S Dhillon and Luca Daniel},
  journal = {arXiv preprint
arXiv:1804.09699},
  title = {Towards Fast Computation of Certified Robustness for {ReLU} Networks},
  year = {2018},
}
% Entry closed above: "ReLU" is brace-protected so sentence-casing styles do
% not lowercase it.

% brown2017adversarial: accented letters written as LaTeX escapes, matching
% the escapes used for other accented names in this file and keeping the
% entry safe for 8-bit BibTeX.
@article{brown2017adversarial,
  author = {Tom B Brown and Dandelion Man{\'e} and Aurko Roy and Mart{\'\i}n Abadi and Justin Gilmer},
  title = {Adversarial patch},
  journal = {arXiv preprint arXiv:1712.09665},
  year = {2017},
}

@article{tjeng2017verifying,
  author = {Vincent Tjeng and Russ Tedrake},
  title = {Verifying Neural Networks with Mixed Integer Programming},
  journal = {arXiv preprint arXiv:1711.07356},
  year = {2017},
}

@article{diakonikolas2018sever,
  author = {Ilias Diakonikolas and Gautam Kamath and Daniel M. Kane and Jerry Li and Jacob Steinhardt and Alistair Stewart},
  title = {Sever: A Robust Meta-Algorithm for Stochastic Optimization},
  journal = {arXiv preprint arXiv:1803.02815},
  year = {2018},
}

% prasad2018robust: "Sivaram" corrected to "Sivaraman", the spelling used for
% the same author in du2017sparse below.
@article{prasad2018robust,
  author = {Adarsh Prasad and Arun Sai Suggala and Sivaraman Balakrishnan and Pradeep Ravikumar},
  title = {Robust estimation via robust gradient estimation},
  journal = {arXiv preprint arXiv:1802.06485},
  year = {2018},
}

@article{du2017sparse,
  author = {Simon S. Du and Sivaraman Balakrishnan and Aarti Singh},
  title = {Computationally efficient robust estimation of sparse functionals},
  journal = {arXiv preprint arXiv:1702.07709},
  year = {2017},
}

@misc{barak2016tutorial,
  author = {Boaz Barak and David Steurer},
  title = {Proofs, beliefs, and algorithms through the lens of sum-of-squares},
  howpublished = {\url{https://www.sumofsquares.org/public/index.html}},
  year = {2016},
}

@article{frenkel2014minkowski,
  author = {P{\'e}ter E. Frenkel and P{\'e}ter Horv{\'a}th},
  title = {Minkowski's inequality and sums of squares},
  journal = {Central European Journal of Mathematics},
  volume = {12},
  number = {3},
  pages = {510--516},
  year = {2014},
}

@inproceedings{hopkins2018mixture,
  author = {Samuel B.
Hopkins and Jerry Li},
  booktitle = {Symposium on Theory of Computing (STOC)},
  title = {Mixture Models, Robustness, and Sum of Squares Proofs},
  year = {2018},
}

@inproceedings{diakonikolas2018list,
  author = {Ilias Diakonikolas and Daniel M. Kane and Alistair Stewart},
  title = {List-Decodable Robust Mean Estimation and Learning Mixtures of Spherical {G}aussians},
  booktitle = {Symposium on Theory of Computing (STOC)},
  year = {2018},
}

@book{ledoux1991probability,
  author = {Michel Ledoux and Michel Talagrand},
  title = {Probability in Banach Spaces: Isoperimetry and Processes},
  publisher = {Springer Berlin Heidelberg},
  year = {1991},
}

@article{leek2010tackling,
  author = {Jeffrey T. Leek and Robert B. Scharpf and H{\'e}ctor Corrada Bravo and David Simcha and Benjamin Langmead and W. Evan Johnson and Donald Geman and Keith Baggerly and Rafael A. Irizarry},
  title = {Tackling the widespread and critical impact of batch effects in high-throughput data},
  journal = {Nature Reviews Genetics},
  volume = {11},
  number = {10},
  year = {2010},
}

@article{johnson2007adjusting,
  author = {W.
Evan Johnson and Cheng Li and Ariel Rabinovic},
  journal = {Biostatistics},
  pages = {118--127},
  title = {Adjusting batch effects in microarray expression data using empirical {B}ayes methods},
  volume = {8},
  year = {2007},
}

@article{mckenzie2018robust,
  author = {Theo McKenzie and Hermish Mehta and Luca Trevisan},
  title = {A New Algorithm for the Robust Semi-Random Independent Set Problem},
  journal = {arXiv},
  year = {2018},
}

@phdthesis{steinhardt2018thesis,
  author = {Jacob Steinhardt},
  title = {Robust Learning: Information Theory and Algorithms},
  school = {Stanford University},
  year = {2018},
}

@phdthesis{li2018thesis,
  author = {Jerry Li},
  title = {Principled Approaches to Robust Machine Learning and Beyond},
  school = {Massachusetts Institute of Technology},
  year = {2018},
}

@inproceedings{chen2020simclr,
  author = {Ting Chen and Simon Kornblith and Mohammad Norouzi and Geoffrey Hinton},
  title = {A simple framework for contrastive learning of visual representations},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1597--1607},
  year = {2020},
}

% lowe1999sift: the year field held the value twice ("1999 1999"), which is
% not a valid year; booktitle had the venue name followed by a second,
% redundant spelling of the same proceedings, so only the form used for other
% venues in this file is kept.
@inproceedings{lowe1999sift,
  author = {David G Lowe},
  title = {Object recognition from local scale-invariant features},
  booktitle = {International Conference on Computer Vision (ICCV)},
  volume = {2},
  pages = {1150--1157},
  year = {1999},
}

% hinton2006fast: journal name restored to title case; standard styles print
% the journal field verbatim.
@article{hinton2006fast,
  author = {Geoffrey E Hinton and Simon Osindero and Yee-Whye Teh},
  title = {A fast learning algorithm for deep belief nets},
  journal = {Neural Computation},
  volume = {18},
  number = {7},
  pages = {1527--1554},
  year = {2006},
}

@article{thrun1998lifelong,
  author = {Sebastian Thrun},
  title = {Lifelong learning algorithms},
  journal = {Learning to learn},
  pages = {181--209},
  year = {1998},
}

@article{cortes1995svm,
  author = {Corinna Cortes and Vladimir Vapnik},
  journal = {Machine Learning},
  number = {3},
  pages = {273--297},
  title = {Support-vector networks},
  volume =
{20},
  year = {1995},
}

@article{lecun2015deep,
  author = {Yann LeCun and Yoshua Bengio and Geoffrey Hinton},
  title = {Deep learning},
  journal = {Nature},
  volume = {521},
  number = {7553},
  pages = {436--444},
  year = {2015},
}

@article{creel2021algorithmic,
  author = {Kathleen Creel and Deborah Hellman},
  title = {The Algorithmic Leviathan: Arbitrariness, Fairness, and Opportunity in Algorithmic Decision Making Systems},
  journal = {Virginia Public Law and Legal Theory Research Paper},
  volume = {13},
  year = {2021},
}

@inproceedings{collobert2008unified,
  author = {Ronan Collobert and Jason Weston},
  title = {A unified architecture for natural language processing: Deep neural networks with multitask learning},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {160--167},
  year = {2008},
}

% fukushima1988neocognitron: journal name restored to title case; standard
% styles print the journal field verbatim.
@article{fukushima1988neocognitron,
  author = {Kunihiko Fukushima},
  title = {Neocognitron: A hierarchical neural network capable of visual pattern recognition},
  journal = {Neural Networks},
  volume = {1},
  number = {2},
  pages = {119--130},
  year = {1988},
}

@inproceedings{zellers2019neuralfakenews,
  author = {Rowan Zellers and Ari Holtzman and Hannah Rashkin and Yonatan Bisk and Ali Farhadi and Franziska Roesner and Yejin Choi},
  title = {Defending Against Neural Fake News},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {9054--9065},
  year = {2019},
}

@book{kerr2001university,
  author = {Clark Kerr},
  title = {The Uses of the University},
  publisher = {Harvard University Press},
  year = {2001},
}

@book{rhoten2011knowledge,
  author = {Diana Rhoten and Craig Calhoun},
  title = {Knowledge matters: The public mission of the research university},
  publisher = {Columbia University Press},
  year = {2011},
}

@book{nussbaum2010not,
  author = {Martha Craven Nussbaum},
  title = {Not for profit: Why democracy needs the humanities},
  publisher = {Princeton University Press},
  year = {2010},
}

@article{engstrom2020government,
  author = {David Freeman Engstrom and
Daniel E Ho and Catherine M Sharkey and Mariano-Florentino Cu{\'e}llar},
  journal = {NYU School of Law, Public Law Research Paper},
  title = {Government by algorithm: Artificial intelligence in federal administrative agencies},
  volume = {20},
  year = {2020},
}
% Entry closed above: the accented letter in the last author's surname is
% written as a LaTeX escape, matching the escapes used for other accented
% names in this file.

% hong2004groups: journal corrected from "Science"; volume 101, number 46
% (2004) is the PNAS issue in which this article appeared, and the page range
% is added. NOTE(review): pages taken from the publisher record -- confirm.
@article{hong2004groups,
  author = {Lu Hong and Scott E Page},
  title = {Groups of diverse problem solvers can outperform groups of high-ability problem solvers},
  journal = {Proceedings of the National Academy of Sciences},
  volume = {101},
  number = {46},
  pages = {16385--16389},
  year = {2004},
}

@article{solomon2006norms,
  author = {Miriam Solomon},
  title = {Norms of epistemic diversity},
  journal = {Episteme},
  volume = {3},
  number = {1},
  pages = {23--36},
  year = {2006},
}

% steel2018multiple: journal name restored to title case; standard styles
% print the journal field verbatim.
@article{steel2018multiple,
  author = {Daniel Steel and Sina Fazelpour and Kinley Gillette and Bianca Crewe and Michael Burgess},
  title = {Multiple diversity concepts and their ethical-epistemic implications},
  journal = {European Journal for Philosophy of Science},
  volume = {8},
  number = {3},
  pages = {761--780},
  year = {2018},
}

@article{merton1979normative,
  author = {Robert K Merton},
  title = {The normative structure of science},
  journal = {The sociology of science: Theoretical and empirical investigations},
  pages = {267--278},
  year = {1979},
}

@article{radinsky2015data,
  author = {Kira Radinsky},
  title = {Data monopolists like {G}oogle are threatening the economy},
  journal = {Harvard Business Review},
  volume = {2},
  year = {2015},
}

% rogers2020primer: the acronym had lost its capitals ("bert", "bertology");
% it is restored and brace-protected so sentence-casing styles keep it.
@article{rogers2020primer,
  author = {Anna Rogers and Olga Kovaleva and Anna Rumshisky},
  title = {A primer in {BERTology}: What we know about how {BERT} works},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  volume = {8},
  pages = {842--866},
  year = {2020},
}

@inproceedings{beberg2009folding,
  author = {Adam L Beberg and Daniel L Ensign and Guha Jayachandran and Siraj Khaliq and Vijay S Pande},
  booktitle = {2009 IEEE International Symposium on Parallel \& Distributed Processing},
  pages = {1--8},
  title = {Folding@home: Lessons from eight years of volunteer
distributed computing},
  year = {2009},
}

@inproceedings{turian2010word,
  author = {Joseph Turian and Lev Ratinov and Yoshua Bengio},
  title = {Word representations: a simple and general method for semi-supervised learning},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {384--394},
  year = {2010},
}

@inproceedings{cho2021unifying,
  author = {Jaemin Cho and Jie Lei and Hao Tan and Mohit Bansal},
  title = {Unifying vision-and-language tasks via text generation},
  booktitle = {International Conference on Machine Learning (ICML)},
  year = {2021},
}

@inproceedings{kim2021vilt,
  author = {Wonjae Kim and Bokyung Son and Ildoo Kim},
  title = {{ViLT}: Vision-and-language transformer without convolution or region supervision},
  booktitle = {International Conference on Machine Learning (ICML)},
  year = {2021},
}

@article{rae2021gopher,
  author = {Jack W. Rae and Sebastian Borgeaud and Trevor Cai and Katie Millican and Jordan Hoffmann and Francis Song and J. Aslanides and Sarah Henderson and Roman Ring and Susannah Young and Eliza Rutherford and Tom Hennigan and Jacob Menick and Albin Cassirer and Richard Powell and G. V. D. Driessche and Lisa Anne Hendricks and Maribeth Rauh and Po-Sen Huang and Amelia Glaese and Johannes Welbl and Sumanth Dathathri and Saffron Huang and Jonathan Uesato and John F. J. Mellor and I. Higgins and Antonia Creswell and Nathan McAleese and Amy Wu and Erich Elsen and Siddhant M. Jayakumar and Elena Buchatskaya and D. Budden and Esme Sutherland and K. Simonyan and Michela Paganini and L. Sifre and Lena Martens and Xiang Lorraine Li and A. Kuncoro and Aida Nematzadeh and E. Gribovskaya and Domenic Donato and Angeliki Lazaridou and A. Mensch and J. Lespiau and Maria Tsimpoukelli and N. Grigorev and Doug Fritz and Thibault Sottiaux and Mantas Pajarskas and Tobias Pohlen and Zhitao Gong and Daniel Toyama and Cyprien de Masson d'Autume and Yujia Li and Tayfun Terzi and Vladimir Mikulik and I.
Babuschkin and Aidan Clark and Diego de Las Casas and Aurelia Guy and Chris Jones and James Bradbury and Matthew Johnson and Blake A. Hechtman and Laura Weidinger and Iason Gabriel and William S. Isaac and Edward Lockhart and Simon Osindero and Laura Rimell and Chris Dyer and Oriol Vinyals and Kareem W. Ayoub and Jeff Stanway and L. Bennett and D. Hassabis and K. Kavukcuoglu and Geoffrey Irving},
  journal = {arXiv},
  title = {Scaling Language Models: Methods, Analysis \& Insights from Training {Gopher}},
  year = {2021},
}
% Entry closed above: the model name "Gopher" is brace-protected so
% sentence-casing styles do not lowercase it.

% chowdhery2022palm: the accented letter in "Garcia" is written as a LaTeX
% escape, matching the escapes used for other accented names in this file;
% the system name "Pathways" is brace-protected in the title.
@article{chowdhery2022palm,
  author = {Aakanksha Chowdhery and Sharan Narang and Jacob Devlin and Maarten Bosma and Gaurav Mishra and Adam Roberts and Paul Barham and Hyung Won Chung and Charles Sutton and Sebastian Gehrmann and Parker Schuh and Kensen Shi and Sasha Tsvyashchenko and Joshua Maynez and A. Rao and Parker Barnes and Yi Tay and Noam M. Shazeer and Vinodkumar Prabhakaran and Emily Reif and Nan Du and B. Hutchinson and Reiner Pope and James Bradbury and Jacob Austin and M. Isard and Guy Gur-Ari and Pengcheng Yin and Toju Duke and Anselm Levskaya and S. Ghemawat and Sunipa Dev and Henryk Michalewski and Xavier Garc{\'\i}a and Vedant Misra and Kevin Robinson and Liam Fedus and Denny Zhou and Daphne Ippolito and D. Luan and Hyeontaek Lim and Barret Zoph and A. Spiridonov and Ryan Sepassi and David Dohan and Shivani Agrawal and Mark Omernick and Andrew M. Dai and T. S. Pillai and Marie Pellat and Aitor Lewkowycz and E. Moreira and Rewon Child and Oleksandr Polozov and Katherine Lee and Zongwei Zhou and Xuezhi Wang and Brennan Saeta and Mark Diaz and Orhan Firat and Michele Catasta and Jason Wei and K. Meier-Hellstern and D. Eck and J. Dean and Slav Petrov and Noah Fiedel},
  title = {{PaLM}: Scaling Language Modeling with {Pathways}},
  journal = {arXiv},
  year = {2022},
}

% lewis2020rag: "Aleksandara" corrected to "Aleksandra"; the umlaut in
% "Kuttler" is restored as a LaTeX escape.
% NOTE(review): spellings taken from the published paper -- confirm.
@inproceedings{lewis2020rag,
  author = {Patrick Lewis and Ethan Perez and Aleksandra Piktus and Fabio Petroni and Vladimir Karpukhin and Naman Goyal and Heinrich K{\"u}ttler and M.
Lewis and Wen-tau Yih and Tim Rockt{\"a}schel and Sebastian Riedel and Douwe Kiela},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Retrieval-Augmented Generation for Knowledge-Intensive {NLP} Tasks},
  year = {2020},
}
% Entry closed above: the umlaut in "Rocktaschel" is written as a LaTeX
% escape, matching the escapes used for other accented names in this file
% and keeping the entry safe for 8-bit BibTeX.

@article{nakano2021webgpt,
  author = {Reiichiro Nakano and Jacob Hilton and S. Balaji and Jeff Wu and Long Ouyang and Christina Kim and Christopher Hesse and Shantanu Jain and V. Kosaraju and W. Saunders and Xu Jiang and Karl Cobbe and Tyna Eloundou and Gretchen Krueger and Kevin Button and Matthew Knight and Benjamin Chess and J. Schulman},
  title = {{WebGPT}: Browser-assisted question-answering with human feedback},
  journal = {arXiv},
  year = {2021},
}

@article{ouyang2022instructions,
  author = {Long Ouyang and Jeff Wu and Xu Jiang and Diogo Almeida and Carroll L. Wainwright and Pamela Mishkin and Chong Zhang and Sandhini Agarwal and Katarina Slama and Alex Ray and J. Schulman and Jacob Hilton and Fraser Kelton and Luke E. Miller and Maddie Simens and Amanda Askell and P. Welinder and P. Christiano and J. Leike and Ryan J. Lowe},
  title = {Training language models to follow instructions with human feedback},
  journal = {arXiv},
  year = {2022},
}

@article{bai2022helpful,
  author = {Yuntao Bai and Andy Jones and Kamal Ndousse and Amanda Askell and Anna Chen and Nova DasSarma and Dawn Drain and Stanislav Fort and Deep Ganguli and T. Henighan and Nicholas Joseph and Saurav Kadavath and John Kernion and Tom Conerly and S. El-Showk and Nelson Elhage and Zac Hatfield-Dodds and Danny Hernandez and Tristan Hume and Scott Johnston and S. Kravec and Liane Lovitt and Neel Nanda and Catherine Olsson and Dario Amodei and Tom B. Brown and Jack Clark and Sam McCandlish and C. Olah and Benjamin Mann and J.
Kaplan},
  journal = {arXiv},
  title = {Training a Helpful and Harmless Assistant with Reinforcement Learning from Human Feedback},
  year = {2022},
}

@article{zhang2022opt,
  author = {Susan Zhang and Stephen Roller and Naman Goyal and Mikel Artetxe and Moya Chen and Shuohui Chen and Christopher Dewan and Mona Diab and Xian Li and Xi Victoria Lin and Todor Mihaylov and Myle Ott and Sam Shleifer and Kurt Shuster and Daniel Simig and Punit Singh Koura and Anjali Sridhar and Tianlu Wang and Luke Zettlemoyer},
  title = {{OPT}: Open Pre-trained Transformer Language Models},
  journal = {arXiv},
  year = {2022},
}

@article{du2021glam,
  author = {Nan Du and Yanping Huang and Andrew M. Dai and Simon Tong and Dmitry Lepikhin and Yuanzhong Xu and M. Krikun and Yanqi Zhou and Adams Wei Yu and Orhan Firat and Barret Zoph and Liam Fedus and Maarten Bosma and Zongwei Zhou and Tao Wang and Yu Emma Wang and Kellie Webster and Marie Pellat and Kevin Robinson and K. Meier-Hellstern and Toju Duke and Lucas Dixon and Kun Zhang and Quoc V. Le and Yonghui Wu and Zhifeng Chen and Claire Cui},
  title = {{GLaM}: Efficient Scaling of Language Models with Mixture-of-Experts},
  journal = {arXiv},
  year = {2021},
}

@article{black2022neox,
  author = {Sid Black and Stella Rose Biderman and Eric Hallahan and Quentin G. Anthony and Leo Gao and Laurence Golding and Horace He and Connor Leahy and Kyle McDonell and Jason Phang and M. Pieler and Usvsn Sai Prashanth and Shivanshu Purohit and Laria Reynolds and J. Tow and Ben Wang and Samuel Weinbach},
  title = {{GPT-NeoX-20B}: An Open-Source Autoregressive Language Model},
  journal = {arXiv},
  year = {2022},
}

@article{smith2022mtnlg,
  author = {Shaden Smith and M. Patwary and Brandon Norick and P. LeGresley and Samyam Rajbhandari and J. Casper and Zhun Liu and Shrimai Prabhumoye and George Zerveas and V. Korthikanti and Elton Zhang and Rewon Child and Reza Yazdani Aminabadi and J. Bernauer and Xia Song and M.
Shoeybi and Yuxiong He and Michael Houston and Saurabh Tiwary and Bryan Catanzaro},
  journal = {arXiv},
  title = {Using {DeepSpeed} and {Megatron} to Train {Megatron-Turing} {NLG} {530B}, A Large-Scale Generative Language Model},
  year = {2022},
}
% In the title just above, DeepSpeed, Megatron and 530B are now brace-protected
% (like Megatron-Turing and NLG already were) so that sentence-casing
% bibliography styles do not lowercase them.

% Image translation and autoencoding.
@inproceedings{liu2017imagetoimage,
  author = {Ming-Yu Liu and Thomas Breuel and Jan Kautz},
  title = {Unsupervised Image-to-Image Translation Networks},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  year = {2017},
}

@inproceedings{larsen2016autoencoding,
  author = {Anders Boesen Lindbo Larsen and Søren Kaae Sønderby and Hugo Larochelle and Ole Winther},
  title = {Autoencoding beyond pixels using a learned similarity metric},
  booktitle = {International Conference on Machine Learning (ICML)},
  year = {2016},
}

% Machine learning for remote sensing.
@article{maxwell2018MLremotesensing,
  author = {Aaron E. Maxwell and Timothy A. Warner and Fang Fang},
  title = {Implementation of machine-learning classification in remote sensing: an applied review},
  journal = {International Journal of Remote Sensing},
  volume = {39},
  number = {9},
  pages = {2784--2817},
  year = {2018},
}

@article{lary2016MLremotesensing,
  author = {David J. Lary and Amir H. Alavi and Amir H. Gandomi and Annette L. Walker},
  title = {Machine learning in geosciences and remote sensing},
  journal = {Geoscience Frontiers},
  volume = {7},
  number = {1},
  pages = {3--10},
  year = {2016},
}

@article{ahmad2010soilmoisture,
  author = {Sajjad Ahmad and Ajay Kalra and Haroon Stephen},
  title = {Estimating soil moisture using remote sensing data: A machine learning approach},
  journal = {Advances in Water Resources},
  volume = {33},
  number = {1},
  pages = {69--80},
  year = {2010},
}

@article{gislason2006landcover,
  author = {Pall Oskar Gislason and Jon Atli Benediktsson and Johannes R.
Sveinsson},
  journal = {Pattern Recognition Letters},
  number = {4},
  pages = {294--300},
  title = {Random Forests for land cover classification},
  volume = {27},
  year = {2006},
}

% Land cover and crop modelling from satellite data.
% The second author-list surname below is spelled with its umlaut (K{\"o}rner).
@inproceedings{russwurm2020meta,
  author = {Marc Ru{\ss}wurm and Sherrie Wang and Marco K{\"o}rner and David Lobell},
  title = {Meta-Learning for Few-Shot Land Cover Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops},
  pages = {200--201},
  year = {2020},
}

@article{li2007estimating,
  author = {Ainong Li and Shunlin Liang and Angsheng Wang and Jun Qin},
  title = {Estimating crop yield from multi-temporal satellite data using multivariate regression and neural network techniques},
  journal = {Photogrammetric Engineering \& Remote Sensing},
  volume = {73},
  number = {10},
  pages = {1149--1157},
  year = {2007},
}

@article{kussul2017classification,
  author = {N. {Kussul} and M. {Lavreniuk} and S. {Skakun} and A. {Shelestov}},
  title = {Deep Learning Classification of Land Cover and Crop Types Using Remote Sensing Data},
  journal = {IEEE Geoscience and Remote Sensing Letters},
  volume = {14},
  number = {5},
  pages = {778--782},
  year = {2017},
}

@article{johnson2016crop,
  author = {Michael D. Johnson and William W. Hsieh and Alex J. Cannon and Andrew Davidson and Frédéric Bédard},
  title = {Crop yield forecasting on the Canadian Prairies by remotely sensed vegetation indices and machine learning methods},
  journal = {Agricultural and Forest Meteorology},
  volume = {218},
  pages = {74--84},
  year = {2016},
}

% NOTE(review): the page range of cai2018crop was previously 74--84, a verbatim
% copy of johnson2016crop above. It is set to 35--47 here; confirm against the
% publisher record for Remote Sensing of Environment vol. 210.
@article{cai2018crop,
  author = {Yaping Cai and Kaiyu Guan and Jian Peng and Shaowen Wang and Christopher Seifert and Brian Wardlow and Zhan Li},
  title = {A high-performance and in-season classification system of field-level crop types using time-series Landsat data and a machine learning approach},
  journal = {Remote Sensing of Environment},
  volume = {210},
  pages = {35--47},
  year = {2018},
}

@misc{modis2015landcover,
  author = {E.
Vermote},
  howpublished = {\url{https://doi.org/10.5067/MODIS/MOD09A1.006}},
  title = {{MOD09A1} {MODIS}/Terra surface reflectance 8-Day {L3} global 500m {SIN} grid {V006}},
  year = {2015},
}

@misc{dataset2017era5,
  author = {C3S},
  title = {{ERA5}: Fifth generation of {ECMWF} atmospheric reanalyses of the global climate},
  year = {2017},
}

@article{kiranyaz2019cnn1d,
  author = {Serkan Kiranyaz and Onur Avci and Osama Abdeljaber and Turker Ince and Moncef Gabbouj and Daniel J Inman},
  title = {1D Convolutional Neural Networks and Applications: A Survey},
  journal = {arXiv preprint arXiv:1905.03554},
  year = {2019},
}

% The author list previously read "Ediriwickremaand John G Lyon": the missing
% space before "and" fused two authors into one name. The journal name is also
% capitalised the same way as in defries1995AVHRR below.
@article{lunetta2006land,
  author = {Ross Lunetta and Joseph F Knight and Jayantha Ediriwickrema and John G Lyon and L Dorsey Worthy},
  title = {Land-cover change detection using multi-temporal {MODIS} {NDVI} data},
  journal = {Remote Sensing of Environment},
  volume = {105},
  number = {2},
  pages = {142--154},
  year = {2006},
}

@article{defries1994ndvi,
  author = {R S DeFries and JRG Townshend},
  title = {{NDVI}-derived land cover classifications at a global scale},
  journal = {International Journal of Remote Sensing},
  volume = {15},
  number = {17},
  pages = {3567--3586},
  year = {1994},
}

@article{defries1995AVHRR,
  author = {Ruth DeFries and Matthew Hansen and John Townshend},
  title = {Global discrimination of land cover types from metrics derived from {AVHRR} pathfinder data},
  journal = {Remote Sensing of Environment},
  volume = {54},
  number = {3},
  pages = {209--222},
  year = {1995},
}

@article{rolnick2019tackling,
  author = {David Rolnick and Priya L Donti and Lynn H Kaack and Kelly Kochanski and Alexandre Lacoste and Kris Sankaran and Andrew Ross and Nikola Milojevic-Dupont and Natasha Jaques and Anna Waldman-Brown and others},
  title = {Tackling climate change with machine learning},
  journal = {arXiv preprint arXiv:1906.05433},
  year = {2019},
}

@article{haochen2021spectral,
  author = {Jeff Z.
HaoChen and Colin Wei and Adrien Gaidon and Tengyu Ma},
  journal = {arXiv preprint arXiv:2106.04156},
  title = {Provable guarantees for self-supervised deep learning with spectral contrastive loss},
  year = {2021},
}

@misc{madrylab2019robustnesslib,
  author = {Logan Engstrom and Andrew Ilyas and Hadi Salman and Shibani Santurkar and Dimitris Tsipras},
  title = {Robustness (Python Library)},
  howpublished = {\url{https://github.com/MadryLab/robustness}},
  year = {2019},
}

% Third author's given name corrected from "Honlak" to "Honglak".
@inproceedings{coates2011stl10,
  author = {Adam Coates and Andrew Ng and Honglak Lee},
  title = {An analysis of single-layer networks in unsupervised feature learning},
  booktitle = {Proceedings of the Fourteenth International Conference on Artificial Intelligence and Statistics},
  volume = {15},
  pages = {215--223},
  year = {2011},
}

@article{tan2020coal,
  author = {Shuhan Tan and Xingchao Peng and Kate Saenko},
  title = {Class-imbalanced Domain Adaptation: An Empirical Odyssey},
  journal = {arXiv preprint arXiv:1910.10320},
  year = {2020},
}

% Venue string carries the "(ICLR)" suffix so it matches the other ICLR
% entries in this file and renders identically in the bibliography.
@inproceedings{french2018selfensembling,
  author = {Geoff French and Michal Mackiewicz and Mark Fisher},
  title = {Self-ensembling for visual domain adaptation},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year = {2018},
}

% Theory of contrastive representation learning.
@inproceedings{arora2019contrastive,
  author = {Sanjeev Arora and Hrishikesh Khandeparkar and Mikhail Khodak and Orestis Plevrakis and Nikunj Saunshi},
  title = {A theoretical analysis of contrastive unsupervised representation learning},
  booktitle = {Proceedings of the 36th International Conference on Machine Learning},
  volume = {97},
  pages = {5628--5637},
  year = {2019},
}

@article{tosh2021topic,
  author = {Christopher Tosh and Akshay Krishnamurthy and Daniel Hsu},
  title = {Contrastive estimation reveals topic posterior information to linear models},
  journal = {Journal of Machine Learning Research (JMLR)},
  volume = {22},
  number = {281},
  pages = {1--31},
  year = {2021},
}

@inproceedings{tosh2021redundancy,
  author = {Christopher Tosh and
Akshay Krishnamurthy and Daniel Hsu},
  booktitle = {Proceedings of the 32nd International Conference on Algorithmic Learning Theory},
  pages = {1179--1206},
  title = {Contrastive learning, multi-view redundancy, and linear models},
  volume = {132},
  year = {2021},
}

% Unsupervised domain adaptation.
@article{li2021mdd,
  author = {Jingjing Li and Erpeng Chen and Zhengming Ding and Lei Zhu and Ke Lu and Heng Tao Shen},
  title = {Maximum density divergence for domain adaptation},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  volume = {43},
  number = {11},
  pages = {3918--3930},
  year = {2021},
}

% The next two entries are conference papers. They were typed @book with the
% proceedings name stored in "publisher", which makes styles format them as
% books; they are now @inproceedings with the proceedings name in "booktitle".
@inproceedings{li2020transport,
  author = {Mengxue Li and Yi-Ming Zhai and You-Wei Luo and Peng-Fei Ge and Chuan-Xian Ren},
  title = {Enhanced transport distance for unsupervised domain adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  year = {2020},
}

@inproceedings{xiao2021dynamic,
  author = {Ni Xiao and Lei Zhang},
  title = {Dynamic weighted learning for unsupervised domain adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  year = {2021},
}

@inproceedings{levesque2013best,
  author = {Hector J.
Levesque},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {On our best behaviour},
  year = {2013},
}

@inproceedings{szegedy2014intriguing,
  author = {Christian Szegedy and Wojciech Zaremba and Ilya Sutskever and Joan Bruna and Dumitru Erhan and Ian Goodfellow and Rob Fergus},
  title = {Intriguing properties of neural networks},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year = {2014},
}

@inproceedings{seo2017bidaf,
  author = {Minjoon Seo and Aniruddha Kembhavi and Ali Farhadi and Hannaneh Hajishirzi},
  title = {Bidirectional Attention Flow for Machine Comprehension},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year = {2017},
}

% "Z.Berkay" was a single glued token; a space after the initial lets BibTeX
% see two given-name parts.
@inproceedings{papernot2017blackbox,
  author = {Nicolas Papernot and Patrick McDaniel and Ian Goodfellow and Somesh Jha and Z. Berkay Celik and Ananthram Swami},
  title = {Practical Black-Box Attacks against Deep Learning Systems using Adversarial Examples},
  booktitle = {Proceedings of the ACM Asia Conference on Computer and Communications Security},
  year = {2017},
}

@inproceedings{narodytska2017blackbox,
  author = {Nina Narodytska and Shiva Prasad Kasiviswanathan},
  title = {Simple Black-Box Adversarial Perturbations for Deep Networks},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)},
  year = {2017},
}

% ACM SIGIR Forum is a periodical, so this is an @article with a "journal"
% field rather than @inproceedings with "booktitle".
% NOTE(review): volume/number/pages added from the commonly cited reference
% (SIGIR Forum 24(3), 56--61); confirm against the ACM record.
@article{paice1990lancaster,
  author = {Chris D. Paice},
  title = {Another Stemmer},
  journal = {ACM SIGIR Forum},
  volume = {24},
  number = {3},
  pages = {56--61},
  year = {1990},
}

@manual{marcus1999ptb,
  author = {Mitchell Marcus and Beatrice Santorini and Mary Ann Marcinkiewicz and Ann Taylor},
  title = {Treebank-3},
  year = {1999},
}

@manual{francis1979brown,
  author = {W.
Nelson Francis and Henry Kucera},
  title = {Brown Corpus Manual},
  year = {1979},
}

@inproceedings{hixon2015dialog,
  author = {Ben Hixon and Peter Clark and Hannaneh Hajishirzi},
  title = {Learning knowledge graphs for question answering through conversational dialog},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  year = {2015},
}

% Adversarial evaluation, learning and classification.
@article{smith2012adversarial,
  author = {Noah A. Smith},
  title = {Adversarial Evaluation for Models of Natural Language},
  journal = {arXiv preprint arXiv:1207.0245},
  year = {2012},
}

@inproceedings{bowman2016continuous,
  author = {Samuel R. Bowman and Luke Vilnis and Oriol Vinyals and Andrew M. Dai and Rafal Jozefowicz and Samy Bengio},
  title = {Generating Sentences from a Continuous Space},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  pages = {10--21},
  year = {2016},
}

@inproceedings{li2017adversarial,
  author = {Jiwei Li and Will Monroe and Tianlin Shi and Alan Ritter and Dan Jurafsky},
  title = {Adversarial Learning for Neural Dialogue Generation},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2017},
}

@inproceedings{dalvi2004adversarial,
  author = {Nilesh Dalvi and Pedro Domingos and Mausam and Sumit Sanghai and Deepak Verma},
  title = {Adversarial Classification},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  year = {2004},
}

@inproceedings{lowd2005adversarial,
  author = {Daniel Lowd and Christopher Meek},
  title = {Adversarial learning},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  year = {2005},
}

@inproceedings{paperno2016lambada,
  author = {Denis Paperno and German Kruszewski and Angeliki Lazaridou and Quan Ngoc Pham and Raffaella Bernardi and Sandro Pezzelle and Marco Baroni and Gemma Boleda and Raquel Fernandez},
  title = {The {LAMBADA} dataset: Word prediction requiring a broad discourse context},
  booktitle = {Association for Computational Linguistics (ACL)},
  year = {2016},
}
@inproceedings{rimell2009unbounded,
  author = {Laura Rimell and Stephen Clark and Mark Steedman},
  title = {Unbounded Dependency Recovery for Parser Evaluation},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2009},
}

@inproceedings{goodfellow2014gan,
  author = {Ian J. Goodfellow and Jean Pouget-Abadie and Mehdi Mirza and Bing Xu and David Warde-Farley and Sherjil Ozair and Aaron Courville and Yoshua Bengio},
  title = {Generative Adversarial Nets},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  year = {2014},
}

% Question answering / machine comprehension preprints.
@article{zhang2017jnet,
  author = {Junbei Zhang and Xiaodan Zhu and Qian Chen and Lirong Dai and Si Wei and Hui Jiang},
  title = {Exploring Question Understanding and Adaptation in Neural-Network-Based Question Answering},
  journal = {arXiv preprint arXiv:1703.04617},
  year = {2017},
}

@article{wang2016multi,
  author = {Zhiguo Wang and Haitao Mi and Wael Hamza and Radu Florian},
  title = {Multi-Perspective Context Matching for Machine Comprehension},
  journal = {arXiv preprint arXiv:1612.04211},
  year = {2016},
}

@article{lee2017rasor,
  author = {Kenton Lee and Shimi Salant and Tom Kwiatkowski and Ankur Parikh and Dipanjan Das and Jonathan Berant},
  title = {Learning Recurrent Span Representations for Extractive Question Answering},
  journal = {arXiv},
  year = {2017},
}

@misc{bender2017buildit,
  author = {Emily M.
Bender and Hal {Daum{\'e} III} and Allyson Ettinger and Harita Kannan and Sudha Rao and Ephraim Rothschild},
  howpublished = {\url{https://bibinlp.umiacs.umd.edu/}},
  title = {Build It, Break It: The Language Edition},
  year = {2017},
}

@inproceedings{moosavidezfooli2017universal,
  author = {Seyed-Mohsen Moosavi-Dezfooli and Alhussein Fawzi and Omar Fawzi and Pascal Frossard},
  title = {Universal adversarial perturbations},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  year = {2017},
}

% Machine reading comprehension models.
@inproceedings{shen2017reasonet,
  author = {Yelong Shen and Po-Sen Huang and Jianfeng Gao and Weizhu Chen},
  title = {{ReasoNet}: Learning to Stop Reading in Machine Comprehension},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  year = {2017},
}

@inproceedings{hu2018mnemonic,
  author = {Minghao Hu and Yuxing Peng and Xipeng Qiu},
  title = {Reinforced Mnemonic Reader for Machine Reading Comprehension},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  year = {2018},
}

@inproceedings{liu2017sect,
  author = {Rui Liu and Junjie Hu and Wei Wei and Zi Yang and Eric Nyberg},
  title = {Structural Embedding of Syntactic Trees for Machine Comprehension},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2017},
}

@inproceedings{gong2018ruminating,
  author = {Yichen Gong and Samuel R.
Bowman},
  booktitle = {Workshop on Machine Reading for Question Answering (MRQA)},
  title = {Ruminating Reader: Reasoning with Gated Multi-Hop Attention},
  year = {2018},
}

@article{yu2016dcr,
  author = {Yang Yu and Wei Zhang and Kazi Hasan and Mo Yu and Bing Xiang and Bowen Zhou},
  title = {End-to-End Answer Chunk Extraction and Ranking for Reading Comprehension},
  journal = {arXiv preprint arXiv:1610.09996},
  year = {2016},
}

@inproceedings{weissenborn2017fastqa,
  author = {Dirk Weissenborn and Georg Wiese and Laura Seiffe},
  title = {Making Neural {QA} as Simple as Possible but not Simpler},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  year = {2017},
}

% Generative adversarial networks.
@article{radford2016dcgan,
  author = {Alec Radford and Luke Metz and Soumith Chintala},
  title = {Unsupervised Representation Learning with Deep Convolutional Generative Adversarial Networks},
  journal = {arXiv},
  year = {2016},
}

% "GANs" is brace-protected so sentence-casing styles do not print "gans".
@inproceedings{salimans2016gan,
  author = {Tim Salimans and Ian Goodfellow and Wojciech Zaremba and Vicki Cheung and Alec Radford and Xi Chen},
  title = {Improved Techniques for Training {GANs}},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  year = {2016},
}

% Second author's given name carries its accent (L{\'e}on).
@inproceedings{arjovsky2017gan,
  author = {Martin Arjovsky and L{\'e}on Bottou},
  title = {Towards Principled Methods for Training Generative Adversarial Networks},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year = {2017},
}

@inproceedings{bousmalis2017domain,
  author = {Konstantinos Bousmalis and Nathan Silberman and David Dohan and Dumitru Erhan and Dilip Krishnan},
  title = {Unsupervised Pixel-Level Domain Adaptation with Generative Adversarial Networks},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  year = {2017},
}

@inproceedings{wang2012baselines,
  author = {Sida Wang and Christopher D.
Manning},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Baselines and Bigrams: Simple, Good Sentiment and Topic Classification},
  year = {2012},
}

@inproceedings{li2015gmmn,
  author = {Yujia Li and Kevin Swersky and Richard Zemel},
  title = {Generative Moment Matching Networks},
  booktitle = {International Conference on Machine Learning (ICML)},
  year = {2015},
}

@inproceedings{zhang2017matching,
  author = {Yizhe Zhang and Zhe Gan and Kai Fan and Zhi Chen and Ricardo Henao and Dinghan Shen and Lawrence Carin},
  title = {Adversarial Feature Matching for Text Generation},
  booktitle = {International Conference on Machine Learning (ICML)},
  year = {2017},
}

% "GANs" is brace-protected so sentence-casing styles keep the acronym.
@article{arora2017gan,
  author = {Sanjeev Arora and Rong Ge and Yingyu Liang and Tengyu Ma and Yi Zhang},
  title = {Generalization and Equilibrium in Generative Adversarial Nets ({GANs})},
  journal = {arXiv},
  year = {2017},
}

@inproceedings{tzeng2017domain,
  author = {Eric Tzeng and Judy Hoffman and Kate Saenko and Trevor Darrell},
  title = {Adversarial Discriminative Domain Adaptation},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  year = {2017},
}

% Last author's name carries its accents (Herv{\'e} J{\'e}gou).
@article{conneau2017word,
  author = {Alexis Conneau and Guillaume Lample and Marc'Aurelio Ranzato and Ludovic Denoyer and Herv{\'e} J{\'e}gou},
  title = {Word Translation Without Parallel Data},
  journal = {arXiv},
  year = {2017},
}

@inproceedings{li2017demystifying,
  author = {Yanghao Li and Naiyan Wang and Jiaying Liu and Xiaodi Hou},
  title = {Demystifying Neural Style Transfer},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  year = {2017},
}

@inproceedings{wang2007qa,
  author = {Mengqiu Wang and Noah A. Smith and Teruko Mitamura},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {What is the {Jeopardy} Model?
A Quasi-Synchronous Grammar for {QA}},
  year = {2007},
}

@inproceedings{yih2013enhanced,
  author = {Wen-tau Yih and Ming-Wei Chang and Christopher Meek and Andrzej Pastusiak},
  title = {Question Answering Using Enhanced Lexical Semantic Models},
  booktitle = {Association for Computational Linguistics (ACL)},
  year = {2013},
}

@inproceedings{peters2018elmo,
  author = {Matthew E. Peters and Mark Neumann and Mohit Iyyer and Matt Gardner and Christopher Clark and Kenton Lee and Luke Zettlemoyer},
  title = {Deep contextualized word representations},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  year = {2018},
}

@inproceedings{zhang2017tacred,
  author = {Yuhao Zhang and Victor Zhong and Danqi Chen and Gabor Angeli and Christopher D. Manning},
  title = {Position-aware Attention and Supervised Data Improve Slot Filling},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2017},
}

% Author names "OSeaghdha" and "Pado" now carry their accents, and the task
% name "SemEval-2010" is brace-protected against sentence-casing.
@inproceedings{hendrickx2010relations,
  author = {Iris Hendrickx and Su Nam Kim and Zornitsa Kozareva and Preslav Nakov and Diarmuid {\'O} S{\'e}aghdha and Sebastian Pad{\'o} and Marco Pennacchiotti and Lorenza Romano and Stan Szpakowicz},
  title = {{SemEval-2010} Task 8: Multi-Way Classification of Semantic Relations Between Pairs of Nominals},
  booktitle = {5th International Workshop on Semantic Evaluation},
  year = {2010},
}

% Surname "bernardi" was lowercase and would be printed that way; capitalised.
@inproceedings{marelli2014sick,
  author = {Marco Marelli and Stefano Menini and Marco Baroni and Luisa Bentivogli and Raffaella Bernardi and Roberto Zamparelli},
  title = {A {SICK} cure for the evaluation of compositional distributional semantic models},
  booktitle = {Language Resources and Evaluation Conference (LREC)},
  year = {2014},
}

% Model name "FusionNet" is brace-protected against sentence-casing.
@inproceedings{huang2018fusion,
  author = {Hsin-Yuan Huang and Chenguang Zhu and Yelong Shen and Weizhu Chen},
  title = {{FusionNet}: Fusing via Fully-Aware Attention with Application to Machine Comprehension},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year = {2018},
}
@inproceedings{golub2017transfer,
  author = {David Golub and Po-Sen Huang and Xiaodong He and Li Deng},
  title = {Two-Stage Synthesis Networks for Transfer Learning in Machine Comprehension},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2017},
}

@inproceedings{michael2018qamr,
  author = {Julian Michael and Gabriel Stanovsky and Luheng He and Ido Dagan and Luke Zettlemoyer},
  title = {Crowdsourcing Question--Answer Meaning Representations},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  year = {2018},
}

@inproceedings{min2017transfer,
  author = {Sewon Min and Minjoon Seo and Hannaneh Hajishirzi},
  title = {Question Answering through Transfer Learning from Large Fine-grained Supervision Data},
  booktitle = {Association for Computational Linguistics (ACL)},
  year = {2017},
}

@inproceedings{zhai2017chunking,
  author = {Feifei Zhai and Saloni Potdar and Bing Xiang and Bowen Zhou},
  title = {Neural Models for Sequence Chunking},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  year = {2017},
}

@inproceedings{hakkanitur2016multidomain,
  author = {Dilek Hakkani-T{\"u}r and Gokhan Tur and Asli Celikyilmaz and Yun-Nung Chen and Jianfeng Gao and Li Deng and Ye-Yi Wang},
  title = {Multi-Domain Joint Semantic Frame Parsing using Bi-directional {RNN}-{LSTM}},
  booktitle = {InterSpeech},
  year = {2016},
}

% The second author's surname was written with \H (Hungarian double acute);
% it is an umlaut (Kr{\"o}tzsch). Accents are written as brace-wrapped special
% characters so BibTeX sorts and labels them as single letters, and "Wikidata"
% is brace-protected against sentence-casing.
% NOTE(review): number/pages added from the commonly cited reference
% (CACM 57(10), 78--85); confirm against the ACM record.
@article{vrandecic2014wikidata,
  author = {Denny Vrande{\v{c}}i{\'c} and Markus Kr{\"o}tzsch},
  title = {{Wikidata}: A free collaborative knowledgebase},
  journal = {Communications of the ACM},
  volume = {57},
  number = {10},
  pages = {78--85},
  year = {2014},
}

@inproceedings{alzantot2018adversarial,
  author = {Moustafa Alzantot and Yash Sharma and Ahmed Elgohary and Bo-Jhang Ho and Mani Srivastava and Kai-Wei Chang},
  title = {Generating Natural Language Adversarial Examples},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2018},
}

@inproceedings{iyyer2018adversarial,
  author = {Mohit Iyyer and John
Wieting and Kevin Gimpel and Luke Zettlemoyer},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Adversarial Example Generation with Syntactically Controlled Paraphrase Networks},
  year = {2018},
}

% In the next two entries the accented letters are written as brace-wrapped
% special characters ({\"a}, {\v{s}}, {\'c}, ...) instead of \"{a}, \v{s},
% \'{c}. The rendered names are unchanged; the braced form is what BibTeX
% treats as a single letter when sorting and building labels.
@inproceedings{parikh2016decomposable,
  author = {Ankur Parikh and Oscar T{\"a}ckstr{\"o}m and Dipanjan Das and Jakob Uszkoreit},
  title = {A Decomposable Attention Model for Natural Language Inference},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2016},
}

@inproceedings{mrksic2016counterfitting,
  author = {Nikola Mrk{\v{s}}i{\'c} and Diarmuid {\'O} S{\'e}aghdha and Blaise Thomson and Milica Ga{\v{s}}i{\'c} and Lina Rojas-Barahona and Pei-Hao Su and David Vandyke and Tsung-Hsien Wen and Steve Young},
  title = {Counter-fitting Word Vectors to Linguistic Constraints},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  year = {2016},
}

@inproceedings{ribeiro2018sears,
  author = {Marco Tulio Ribeiro and Sameer Singh and Carlos Guestrin},
  title = {Semantically Equivalent Adversarial Rules for Debugging {NLP} Models},
  booktitle = {Association for Computational Linguistics (ACL)},
  year = {2018},
}

@inproceedings{liu2019inoculation,
  author = {Nelson F. Liu and Roy Schwartz and Noah A. Smith},
  title = {Inoculation by Fine-Tuning: A Method for Analyzing Challenge Datasets},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  year = {2019},
}

@inproceedings{ribeiro2018anchors,
  author = {Marco Tulio Ribeiro and Sameer Singh and Carlos Guestrin},
  title = {Anchors: High-Precision Model-Agnostic Explanations},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  year = {2018},
}

@inproceedings{mudrakarta2018question,
  author = {Pramod K.
Mudrakarta and Ankur Taly and Mukund Sundararajan and Kedar Dhamdhere},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Did the Model Understand the Question?},
  year = {2018},
}

@inproceedings{feng2018pathologies,
  author = {Shi Feng and Eric Wallace and Alvin {Grissom II} and Mohit Iyyer and Pedro Rodriguez and Jordan Boyd-Graber},
  title = {Pathologies of Neural Models Make Interpretations Difficult},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2018},
}

% "Van Durme" is a two-word surname. Unbraced, BibTeX takes only the last
% token ("Durme") as the surname and treats "Van" as a given name, so it is
% braced here, the same way "Grissom II" is braced in feng2018pathologies.
% "ParaBank" is brace-protected against sentence-casing.
@inproceedings{hu2019parabank,
  author = {J. Edward Hu and Rachel Rudinger and Matt Post and Benjamin {Van Durme}},
  title = {{ParaBank}: Monolingual Bitext Generation and Sentential Paraphrasing via Lexically-constrained Neural Machine Translation},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  year = {2019},
}

@inproceedings{pruthi2019misspellings,
  author = {Danish Pruthi and Bhuwan Dhingra and Zachary C. Lipton},
  title = {Combating Adversarial Misspellings with Robust Word Recognition},
  booktitle = {Association for Computational Linguistics (ACL)},
  year = {2019},
}

@inproceedings{michel2019adversarial,
  author = {Paul Michel and Xian Li and Graham Neubig and Juan Miguel Pino},
  title = {On Evaluation of Adversarial Perturbations for Sequence-to-Sequence Models},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  year = {2019},
}

% Whole words are braced instead of single letters ({G}oogle's, {P}erspective);
% the rendered title is unchanged.
@article{hosseini2017deceiving,
  author = {Hossein Hosseini and Sreeram Kannan and Baosen Zhang and Radha Poovendran},
  title = {Deceiving {Google's} {Perspective} {API} Built for Detecting Toxic Comments},
  journal = {arXiv preprint arXiv:1702.08138},
  year = {2017},
}

@inproceedings{ebrahimi2018adversarial,
  author = {Javid Ebrahimi and Daniel Lowd and Dejing Dou},
  title = {On Adversarial Examples for Character-Level Neural Machine Translation},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  year = {2018},
}

@inproceedings{lee2005spam,
  author =
{Honglak Lee and Andrew Y. Ng},
  booktitle = {Conference on Email and Anti-Spam (CEAS)},
  title = {Spam Deobfuscation using a Hidden {M}arkov Model},
  year = {2005},
}

@inproceedings{huang2019achieving,
  author = {Po-Sen Huang and Robert Stanforth and Johannes Welbl and Chris Dyer and Dani Yogatama and Sven Gowal and Krishnamurthy Dvijotham and Pushmeet Kohli},
  title = {Achieving Verified Robustness to Symbol Substitutions via Interval Bound Propagation},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2019},
}

@article{arora2018linear,
  author = {Sanjeev Arora and Yuanzhi Li and Yingyu Liang and Tengyu Ma and Andrej Risteski},
  title = {Linear Algebraic Structure of Word Senses, with Applications to Polysemy},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  volume = {6},
  year = {2018},
}

@inproceedings{kocijan2019winograd,
  author = {Vid Kocijan and Ana-Maria Cretu and Oana-Maria Camburu and Yordan Yordanov and Thomas Lukasiewicz},
  title = {A Surprisingly Robust Trick for the {W}inograd Schema Challenge},
  booktitle = {Association for Computational Linguistics (ACL)},
  year = {2019},
}

@inproceedings{jia2019document,
  author = {Robin Jia and Cliff Wong and Hoifung Poon},
  title = {Document-Level {N}-ary Relation Extraction with Multiscale Representation Learning},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  year = {2019},
}

% The next two entries appeared in journals (Molecular Biology and Evolution;
% PNAS). They were typed @inproceedings with the journal name in "booktitle";
% they are now @article with the name in "journal" so styles format them as
% journal papers.
@article{marcovitz2016reverse,
  author = {Amir Marcovitz and Robin Jia and Gill Bejerano},
  title = {``{R}everse {G}enomics'' Predicts Function of Human Conserved Noncoding Elements},
  journal = {Molecular Biology and Evolution (MBE)},
  year = {2016},
}

@article{braun2015mx,
  author = {Benjamin A. Braun and Amir Marcovitz and J. Gray Camp and Robin Jia and Gill Bejerano},
  title = {{M}x1 and {M}x2 key antiviral proteins are surprisingly lost in toothed whales},
  journal = {Proceedings of the National Academy of Sciences of the United States of America (PNAS)},
  year = {2015},
}

@inproceedings{zhao2017gender,
  author = {Jieyu Zhao and Tianlu Wang and Mark Yatskar and Vicente Ordo{\~n}ez and Kai-Wei Chang},
  title = {Men Also Like Shopping: Reducing Gender Bias Amplification using Corpus-level Constraints},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2017},
}

@inproceedings{lake2018generalization,
  author = {Brenden Lake and Marco Baroni},
  title = {Generalization without Systematicity: On the Compositional Skills of Sequence-to-Sequence Recurrent Networks},
  booktitle = {International Conference on Machine Learning (ICML)},
  year = {2018},
}

@inproceedings{fisch2019mrqa,
  author = {Adam Fisch and Alon Talmor and Robin Jia and Minjoon Seo and Eunsol Choi and Danqi Chen},
  title = {{MRQA} 2019 Shared Task: Evaluating Generalization in Reading Comprehension},
  booktitle = {Workshop on Machine Reading for Question Answering (MRQA)},
  year = {2019},
}

@phdthesis{lehnert1977process,
  author = {Wendy Lehnert},
  title = {The Process of Question Answering},
  school = {Yale University},
  year = {1977},
}

% Selective classification and rejection.
@article{elyaniv2010foundations,
  author = {Ran El-Yaniv and Yair Wiener},
  title = {On the Foundations of Noise-free Selective Classification},
  journal = {Journal of Machine Learning Research (JMLR)},
  volume = {11},
  year = {2010},
}

% IRE Transactions on Electronic Computers is a journal, so this entry is an
% @article with "journal" rather than @inproceedings with "booktitle".
@article{chow1957optimum,
  author = {C. K. Chow},
  title = {An optimum character recognition system using decision functions},
  journal = {IRE Transactions on Electronic Computers},
  year = {1957},
}

@inproceedings{blitzer2006domain,
  author = {John Blitzer and Ryan McDonald and Fernando Pereira},
  title = {Domain Adaptation with Structural Correspondence Learning},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2006},
}

% "I\={n}aki" put a macron on the n; the name takes a tilde (I{\~n}aki), as in
% Pe{\~n}as in the same list. The other accents in the next two entries are
% rewritten as brace-wrapped special characters; their rendering is unchanged.
@inproceedings{penas2009respubliqa,
  author = {Anselmo Pe{\~n}as and Pamela Forner and Richard Sutcliffe and {\'A}lvaro Rodrigo and Corina For{\u{a}}scu and I{\~n}aki Alegria and Danilo Giampiccolo and Nicolas Moreau and Petya Osenova},
  title = {Overview of {ResPubliQA} 2009: Question Answering Evaluation over European Legislation},
  booktitle = {Cross Language Evaluation Forum},
  year = {2009},
}

% The year range in the title uses an en dash (--) instead of a single hyphen.
@inproceedings{penas2013mre,
  author = {Anselmo Pe{\~n}as and Eduard Hovy and Pamela Forner and {\'A}lvaro Rodrigo and Richard Sutcliffe and Roser Morante},
  title = {{QA4MRE} 2011--2013: Overview of Question Answering for Machine Reading Evaluation},
  booktitle = {Cross Language Evaluation Forum},
  year = {2013},
}

@article{gondek2012framework,
  author = {D. C. Gondek and A. Lally and A. Kalyanpur and J. W. Murdock and P. A. Duboue and L. Zhang and Y. Pan and Z. M. Qiu and C.
Welty},
  journal = {{IBM} Journal of Research and Development},
  title = {A framework for merging and ranking of answers in {DeepQA}},
  volume = {56},
  year = {2012},
}

@article{rodriguez2019quizbowl,
  author = {Pedro Rodriguez and Shi Feng and Mohit Iyyer and He He and Jordan Boyd-Graber},
  title = {Quizbowl: The Case for Incremental Question Answering},
  journal = {arXiv preprint arXiv:1904.04792},
  year = {2019},
}

@article{feng2019selective,
  author = {Jean Feng and Arjun Sondhi and Jessica Perry and Noah Simon},
  title = {Selective prediction-set models with coverage guarantees},
  journal = {arXiv preprint arXiv:1906.05473},
  year = {2019},
}

% Accented letters are written as brace-wrapped special characters so BibTeX
% sorts and labels them as single letters; "Blaz" gains its caron.
@article{toplak2014assessment,
  author = {Marko Toplak and Rok Mo{\v{c}}nik and Matija Polajnar and Zoran Bosni{\'c} and Lars Carlsson and Catrin Hasselgren and Janez Dem{\v{s}}ar and Scott Boyer and Bla{\v{z}} Zupan and Jonna St{\aa}lring},
  title = {Assessment of Machine Learning Reliability Methods for Quantifying the Applicability Domain of {QSAR} Regression Models},
  journal = {Journal of Chemical Information and Modeling},
  volume = {54},
  year = {2014},
}

@inproceedings{geifman2017selective,
  author = {Yonatan Geifman and Ran El-Yaniv},
  title = {Selective classification for deep neural networks},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  year = {2017},
}

% The acronym and the capitalised phrase it abbreviates are brace-protected;
% otherwise sentence-casing styles print "Fever" and "fact extraction and
% verification", losing the deliberate casing of the dataset name.
@inproceedings{thorne2018fever,
  author = {James Thorne and Andreas Vlachos and Christos Christodoulopoulos and Arpit Mittal},
  title = {{FEVER}: a large-scale dataset for {Fact Extraction and VERification}},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  year = {2018},
}

@inproceedings{geiger2019posing,
  author = {Atticus Geiger and Ignacio Cases and Lauri Karttunen and Chris Potts},
  title = {Posing Fair Generalization Tasks for Natural Language Inference},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year = {2019},
}

@inproceedings{hendrycks2017baseline,
  author = {Dan Hendrycks and Kevin Gimpel},
  booktitle
= {International Conference on Learning Representations (ICLR)}, title = {A Baseline for Detecting Misclassified and Out-of-Distribution Examples in Neural Networks}, year = {2017}, } @inproceedings{lakshminarayanan2017simple, author = {Balaji Lakshminarayanan and Alexander Pritzel and Charles Blundell}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Simple and Scalable Predictive Uncertainty Estimation using Deep Ensembles}, year = {2017}, } @article{li2019reducing, author = {Zhizhong Li and Derek Hoiem}, journal = {arXiv preprint arXiv:1804.03166}, title = {Reducing Over-confident Errors outside the Known Distribution}, year = {2019}, } @inproceedings{magnini2002right, author = {Bernardo Magnini and Matteo Negri and Roberto Prevete and Hristo Tanev}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Is It the Right Answer? Exploiting Web Redundancy for Answer Validation}, year = {2002}, } @inproceedings{ko2007probabilistic, author = {Jeongwoo Ko and Luo Si and Eric Nyberg}, booktitle = {North American Association for Computational Linguistics (NAACL)}, title = {A Probabilistic Framework for Answer Selection in Question Answering}, year = {2007}, } @inproceedings{gal2016dropout, author = {Yarin Gal and Zoubin Ghahramani}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Dropout as a {Bayesian} Approximation: Representing Model Uncertainty in Deep Learning}, year = {2016}, } @inproceedings{smith2018understanding, author = {Lewis Smith and Yarin Gal}, booktitle = {Uncertainty in Artificial Intelligence (UAI)}, title = {Understanding Measures of Uncertainty for Adversarial Example Detection}, year = {2018}, } @inproceedings{liang2018enhancing, author = {Shiyu Liang and Yixuan Li and R. 
Srikant}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Enhancing The Reliability of Out-of-distribution Image Detection in Neural Networks}, year = {2018}, } @inproceedings{wallace2019universal, author = {Eric Wallace and Shi Feng and Nikhil Kandpal and Matt Gardner and Sameer Singh}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Universal Adversarial Triggers for Attacking and Analyzing {NLP}}, year = {2019}, } @inproceedings{cheng2020seq, author = {Minhao Cheng and Jinfeng Yi and Huan Zhang and Pin-Yu Chen and Cho-Jui Hsieh}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {{Seq2Sick}: Evaluating the Robustness of Sequence-to-Sequence Models with Adversarial Examples}, year = {2020}, } @article{pedregosa2011sklearn, author = {F. Pedregosa and G. Varoquaux and A. Gramfort and V. Michel and B. Thirion and O. Grisel and M. Blondel and P. Prettenhofer and R. Weiss and V. Dubourg and J. Vanderplas and A. Passos and D. Cournapeau and M. Brucher and M. Perrot and E. 
Duchesnay}, journal = {Journal of Machine Learning Research (JMLR)}, title = {Scikit-learn: Machine Learning in {P}ython}, volume = {12}, year = {2011}, } @inproceedings{chen2019evaluating, author = {Anthony Chen and Gabriel Stanovsky and Sameer Singh and Matt Gardner}, booktitle = {Workshop on Machine Reading for Question Answering (MRQA)}, title = {Evaluating Question Answering Evaluation}, year = {2019}, } @inproceedings{chen2019understanding, author = {Jifan Chen and Greg Durrett}, booktitle = {North American Association for Computational Linguistics (NAACL)}, title = {Understanding Dataset Design Choices for Multi-hop Reasoning}, year = {2019}, } @inproceedings{min2019compositional, author = {Sewon Min and Eric Wallace and Sameer Singh and Matt Gardner and Hannaneh Hajishirzi and Luke Zettlemoyer}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Compositional Questions Do Not Necessitate Multi-hop Reasoning}, year = {2019}, } @inproceedings{scholkopf1999support, author = {Bernhard Sch{\"o}lkopf and Robert Williamson and Alex Smola and John Shawe-Taylor and John Platt}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Support vector method for novelty detection}, year = {1999}, } @inproceedings{gillick2019learning, author = {Daniel Gillick and Sayali Kulkarni and Larry Lansing and Alessandro Presta and Jason Baldridge and Eugene Ie and Diego Garcia-Olano}, booktitle = {Computational Natural Language Learning (CoNLL)}, title = {Learning Dense Representations for Entity Retrieval}, year = {2019}, } @inproceedings{lee2019latent, author = {Kenton Lee and Ming-Wei Chang and Kristina Toutanova}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Latent Retrieval for Weakly Supervised Open Domain Question Answering}, year = {2019}, } @inproceedings{ovadia2019uncertainty, author = {Yaniv Ovadia and Emily Fertig and Jie Ren and Zachary Nado and D Sculley and Sebastian Nowozin and Joshua V. 
Dillon and Balaji Lakshminarayanan and Jasper Snoek}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Can You Trust Your Model's Uncertainty? Evaluating Predictive Uncertainty Under Dataset Shift}, year = {2019}, } @inproceedings{glockner2018breaking, author = {Max Glockner and Vered Shwartz and Yoav Goldberg}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Breaking {NLI} Systems with Sentences that Require Simple Lexical Inferences}, year = {2018}, } @inproceedings{shi2020robustness, author = {Zhouxing Shi and Huan Zhang and Kai-Wei Chang and Minlie Huang and Cho-Jui Hsieh}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Robustness Verification for Transformers}, year = {2020}, } @inproceedings{garg2018robust, author = {Shivam Garg and Vatsal Sharan and Brian Hu Zhang and Gregory Valiant}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {A Spectral View of Adversarially Robust Features}, year = {2018}, } @article{liu2019roberta, author = {Yinhan Liu and Myle Ott and Naman Goyal and Jingfei Du and Mandar Joshi and Danqi Chen and Omer Levy and Mike Lewis and Luke Zettlemoyer and Veselin Stoyanov}, journal = {arXiv preprint arXiv:1907.11692}, title = {{R}o{BERT}a: A Robustly Optimized {BERT} Pretraining Approach}, year = {2019}, } @inproceedings{lan2020albert, author = {Zhenzhong Lan and Mingda Chen and Sebastian Goodman and Kevin Gimpel and Piyush Sharma and Radu Soricut}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {{ALBERT}: A Lite {BERT} for Self-supervised Learning of Language Representations}, year = {2020}, } @inproceedings{reimers2019sentence, author = {Nils Reimers and Iryna Gurevych}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Sentence-{BERT}: Sentence Embeddings using Siamese {BERT}-Networks}, year = {2019}, } @inproceedings{garg2020tanda, author = 
{Siddhant Garg and Thuy Vu and Alessandro Moschitti}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {{TANDA}: Transfer and Adapt Pre-Trained Transformer Models for Answer Sentence Selection}, year = {2020}, } @inproceedings{yoon2019compare, author = {Seunghyun Yoon and Franck Dernoncourt and Doo Soon Kim and Trung Bui and Kyomin Jung}, booktitle = {Conference on Information and Knowledge Management (CIKM)}, title = {A Compare-Aggregate Model with Latent Clustering for Answer Selection}, year = {2019}, } @inproceedings{shen2017inter, author = {Gehui Shen and Yunlun Yang and Zhi-Hong Deng}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Inter-Weighted Alignment Network for Sentence Pair Modeling}, year = {2017}, } @inproceedings{zhang2019selection, author = {Guanhua Zhang and Bing Bai and Jian Liang and Kun Bai and Shiyu Chang and Mo Yu and Conghui Zhu and Tiejun Zhao}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Selection Bias Explorations and Debias Methods for Natural Language Sentence Matching Datasets}, year = {2019}, } @article{warstadt2018cola, author = {Alex Warstadt and Amanpreet Singh and Samuel R. Bowman}, journal = {arXiv preprint arXiv:1805.12471}, title = {Neural Network Acceptability Judgments}, year = {2018}, } @article{lewis2004rcv1, author = {David D. Lewis and Yiming Yang and Tony G. Rose and Fan Li}, journal = {Journal of Machine Learning Research (JMLR)}, title = {{RCV1}: A New Benchmark Collection for Text Categorization Research}, volume = {5}, year = {2004}, } @article{sun2009strategies, author = {Aixin Sun and Ee-Peng Lim and Ying Liu}, journal = {Decision Support Systems}, number = {1}, title = {On Strategies for Imbalanced Text Classification Using {SVM}: A Comparative Study}, volume = {48}, year = {2009}, } @article{chawla2004imbalanced, author = {Nitesh V. Chawla and Nathalie Japkowicz and Aleksander R.
Kolcz}, journal = {ACM SIGKDD Explorations Newsletter}, number = {1}, title = {Editorial: Special Issue on Learning from Imbalanced Data Sets}, volume = {6}, year = {2004}, } @inproceedings{dendamrongvit2009undersampling, author = {Sareewan Dendamrongvit and Miroslav Kubat}, booktitle = {PAKDD Workshop on New Frontiers in Applied Data Mining}, title = {Undersampling Approach for Imbalanced Training Sets and Induction from Multi-label Text-Categorization Domains}, year = {2009}, } @inproceedings{attenberg2010why, author = {Josh Attenberg and Foster Provost}, booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)}, title = {Why Label when you can Search? Alternatives to Active Learning for Applying Human Resources to Build Classification Models Under Extreme Class Imbalance}, year = {2010}, } @article{nogueira2019passage, author = {Rodrigo Nogueira and Kyunghyun Cho}, journal = {arXiv preprint arXiv:1901.04085}, title = {Passage Re-ranking with {BERT}}, year = {2019}, } @inproceedings{khattab2020colbert, author = {Omar Khattab and Matei Zaharia}, booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)}, title = {{ColBERT}: Efficient and Effective Passage Search via Contextualized Late Interaction over {BERT}}, year = {2020}, } @article{roland2007frequency, author = {Douglas Roland and Frederic Dick and Jeffrey Elman}, journal = {Journal of Memory and Language}, title = {Frequency of Basic {English} Grammatical Structures: A Corpus Analysis}, volume = {57}, year = {2007}, } @inproceedings{lewis1995evaluating, author = {David D.
Lewis}, booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)}, title = {Evaluating and Optimizing Autonomous Text Classification Systems}, year = {1995}, } @article{johnson2019billion, author = {Jeff Johnson and Matthijs Douze and Herv{\'e} J{\'e}gou}, journal = {IEEE Transactions on Big Data}, title = {Billion-scale similarity search with {GPUs}}, year = {2019}, } @inproceedings{balcan2007margin, author = {Maria-Florina Balcan and Andrei Broder and Tong Zhang}, booktitle = {Conference on Learning Theory (COLT)}, title = {Margin based active learning}, year = {2007}, } @inproceedings{balcan2013active, author = {Maria-Florina Balcan and Phil Long}, booktitle = {Conference on Learning Theory (COLT)}, title = {Active and passive learning of linear separators under log-concave distributions}, year = {2013}, } @misc{iyer2017qqp, author = {Shankar Iyer and Nikhil Dandekar and Korn{\'e}l Csernai}, howpublished = {\url{https://www.quora.com/q/quoradata/First-Quora-Dataset-Release-Question-Pairs}}, title = {First {Quora} Dataset Release: Question Pairs}, year = {2017}, } @article{yang2018benchmark, author = {Yazhou Yang and Marco Loog}, journal = {Pattern Recognition}, title = {A benchmark and comparison of active learning for logistic regression}, volume = {83}, year = {2018}, } @inproceedings{ertekin2007learning, author = {Seyda Ertekin and Jian Huang and Leon Bottou and Lee Giles}, booktitle = {Conference on Information and Knowledge Management (CIKM)}, title = {Learning on the border: active learning in imbalanced data classification}, year = {2007}, } @inproceedings{wang2019superglue, author = {Alex Wang and Yada Pruksachatkun and Nikita Nangia and Amanpreet Singh and Julian Michael and Felix Hill and Omer Levy and Samuel R.
Bowman}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {{SuperGLUE}: A Stickier Benchmark for General-Purpose Language Understanding Systems}, year = {2019}, } @article{clark2019aristo, author = {Peter Clark and Oren Etzioni and Daniel Khashabi and Tushar Khot and Bhavana Dalvi Mishra and Kyle Richardson and Ashish Sabharwal and Carissa Schoenick and Oyvind Tafjord and Niket Tandon and Sumithra Bhakthavatsalam and Dirk Groeneveld and Michal Guerquin and Michael Schmitz}, journal = {arXiv preprint arXiv:1909.01958}, title = {From `{F}' to `{A}' on the {N.Y.} {R}egents Science Exams: An Overview of the {A}risto Project}, year = {2019}, } @article{partee2011origins, author = {Barbara H. Partee}, journal = {Baltic International Yearbook of Cognition, Logic and Communication}, title = {Formal Semantics: Origins, Issues, Early Impact}, volume = {6}, year = {2011}, } @article{partee2007compositionality, author = {Barbara H. Partee}, journal = {Cognitive Foundations of Interpretation}, title = {Compositionality and coercion in semantics: The dynamics of adjective meaning}, year = {2007}, } @incollection{montague1970english, author = {Richard Montague}, booktitle = {Linguaggi nella Societ\`{a} e nella Tecnica}, pages = {189--224}, title = {{E}nglish as a Formal Language}, year = {1970}, } @article{fodor1988connectionism, author = {Jerry A. Fodor and Zenon W. 
Pylyshyn}, journal = {Cognition}, pages = {3--71}, title = {Connectionism and Cognitive Architecture: A Critical Analysis}, volume = {28}, year = {1988}, } @article{shieber2016principles, author = {Stuart Shieber}, journal = {{AI} Magazine}, number = {1}, title = {Principles for Designing an {AI} Competition, or Why the {Turing} Test Fails as an Inducement Prize}, volume = {37}, year = {2016}, } @inproceedings{sap2019risk, author = {Maarten Sap and Dallas Card and Saadia Gabriel and Yejin Choi and Noah A Smith}, booktitle = {Association for Computational Linguistics (ACL)}, title = {The Risk of Racial Bias in Hate Speech Detection}, year = {2019}, } @inproceedings{zhao2018gender, author = {Jieyu Zhao and Tianlu Wang and Mark Yatskar and Vicente Ordo{\~n}ez and Kai-Wei Chang}, booktitle = {North American Association for Computational Linguistics (NAACL)}, title = {Gender Bias in Coreference Resolution: Evaluation and Debiasing Methods}, year = {2018}, } @incollection{winograd1991thinking, author = {Terry Winograd}, booktitle = {The Boundaries of Humanity: Humans, Animals, Machines}, pages = {198--223}, title = {Thinking machines: Can there be? Are we?}, year = {1991}, } @inproceedings{mccarthy1984some, author = {John McCarthy}, booktitle = {Proceedings of a symposium on Computer culture: The scientific, intellectual, and social impact of the computer}, title = {Some expert systems need common sense}, year = {1984}, } @article{lenat1985cyc, author = {Doug Lenat and Mayank Prakash and Mary Shepherd}, journal = {{AI} Magazine}, number = {4}, title = {{CYC}: Using Common Sense Knowledge to Overcome Brittleness and Knowledge Acquisition Bottlenecks}, volume = {6}, year = {1985}, } @article{yahia2000rough, author = {M. E. Yahia and R. Mahmood and N. Sulaiman and F. Ahmad}, journal = {Expert Systems with Applications}, pages = {87--99}, title = {Rough neural expert systems}, volume = {18}, year = {2000}, } @article{gallant1988connectionist, author = {Stephen I.
Gallant}, journal = {Communications of the ACM}, number = {2}, pages = {152--169}, title = {Connectionist expert systems}, volume = {31}, year = {1988}, } @article{zadeh1983computational, author = {Lotfi A. Zadeh}, journal = {Computers and Mathematics with Applications}, number = {1}, title = {A computational approach to fuzzy quantifiers in natural languages}, volume = {9}, year = {1983}, } @inproceedings{jin2020robust, author = {Di Jin and Zhijing Jin and Joey Tianyi Zhou and Peter Szolovits}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {Is {BERT} Really Robust? A Strong Baseline for Natural Language Attack on Text Classification and Entailment}, year = {2020}, } @inproceedings{rudinger2018gender, author = {Rachel Rudinger and Jason Naradowsky and Brian Leonard and Benjamin {Van Durme}}, booktitle = {North American Association for Computational Linguistics (NAACL)}, title = {Gender Bias in Coreference Resolution}, year = {2018}, } @inproceedings{volpi2018generalizing, author = {Riccardo Volpi and Hongseok Namkoong and Ozan Sener and John Duchi and Vittorio Murino and Silvio Savarese}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Generalizing to Unseen Domains via Adversarial Data Augmentation}, year = {2018}, } @article{ganin2016domain, author = {Yaroslav Ganin and Evgeniya Ustinova and Hana Ajakan and Pascal Germain and Hugo Larochelle and Fran{\c{c}}ois Laviolette and Mario Marchand and Victor Lempitsky}, journal = {Journal of Machine Learning Research (JMLR)}, title = {Domain-Adversarial Training of Neural Networks}, volume = {17}, year = {2016}, } @inproceedings{zhu2020freelb, author = {Chen Zhu and Yu Cheng and Zhe Gan and Siqi Sun and Tom Goldstein and Jingjing Liu}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {{FreeLB}: Enhanced Adversarial Training for Natural Language Understanding}, year = {2020}, } @inproceedings{miyato2017adversarial, author = {Takeru Miyato and Andrew M.
Dai and Ian Goodfellow}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Adversarial Training Methods for Semi-Supervised Text Classification}, year = {2017}, } @article{kang2019testing, author = {Daniel Kang and Yi Sun and Dan Hendrycks and Tom Brown and Jacob Steinhardt}, journal = {arXiv preprint arXiv:1908.08016}, title = {Testing Robustness Against Unforeseen Adversaries}, year = {2019}, } @inproceedings{feng2019misleading, author = {Shi Feng and Eric Wallace and Jordan Boyd-Graber}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Misleading Failures of Partial-input Baselines}, year = {2019}, } @inproceedings{zhang2019paws, author = {Yuan Zhang and Jason Baldridge and Luheng He}, booktitle = {North American Association for Computational Linguistics (NAACL)}, title = {{PAWS}: Paraphrase Adversaries from Word Scrambling}, year = {2019}, } @misc{christian2018translate, author = {Jon Christian}, howpublished = {\url{https://www.vice.com/en_us/article/j5npeg/why-is-google-translate-spitting-out-sinister-religious-prophecies}}, title = {Why Is {Google} Translate Spitting Out Sinister Religious Prophecies?}, year = {2018}, } @misc{sussmann2007robust, author = {Gerald Jay Sussman}, howpublished = {\url{https://groups.csail.mit.edu/mac/users/gjs/6.945/readings/robust-systems.pdf}}, title = {Building Robust Systems: An essay}, year = {2007}, } @inproceedings{clark2019dont, author = {Christopher Clark and Mark Yatskar and Luke Zettlemoyer}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Don't Take the Easy Way Out: Ensemble Based Methods for Avoiding Known Dataset Biases}, year = {2019}, } @inproceedings{he2019unlearn, author = {He He and Sheng Zha and Haohan Wang}, booktitle = {Workshop on Deep Learning for Low-Resource Natural Language Processing (DeepLo)}, title = {Unlearn Dataset Bias in Natural Language Inference by Fitting the Residual}, year = {2019}, }
@incollection{gretton2008covariate, author = {Arthur Gretton and Alex Smola and Jiayuan Huang and Marcel Schmittfull and Karsten Borgwardt and Bernhard Sch{\"o}lkopf}, booktitle = {Dataset Shift in Machine Learning}, title = {Covariate Shift by Kernel Mean Matching}, year = {2008}, } @article{bhagat2013paraphrase, author = {Rahul Bhagat and Eduard Hovy}, journal = {Computational Linguistics}, title = {What Is a Paraphrase?}, volume = {39}, year = {2013}, } @inproceedings{drozdov2019unsupervised, author = {Andrew Drozdov and Pat Verga and Mohit Yadav and Mohit Iyyer and Andrew McCallum}, booktitle = {North American Association for Computational Linguistics (NAACL)}, title = {Unsupervised Latent Tree Induction with Deep Inside-Outside Recursive Autoencoders}, year = {2019}, } @inproceedings{liu2018stochastic, author = {Xiaodong Liu and Yelong Shen and Kevin Duh and Jianfeng Gao}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Stochastic Answer Networks for Machine Reading Comprehension}, year = {2018}, } @inproceedings{wang2018multi, author = {Wei Wang and Ming Yan and Chen Wu}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Multi-Granularity Hierarchical Attention Fusion Networks for Reading Comprehension and Question Answering}, year = {2018}, } @inproceedings{lowell2019practical, author = {David Lowell and Zachary C. Lipton and Byron C. Wallace}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Practical Obstacles to Deploying Active Learning}, year = {2019}, } @article{simeoni2019rethinking, author = {Oriane Sim{\'e}oni and Mateusz Budnik and Yannis Avrithis and Guillaume Gravier}, journal = {arXiv preprint arXiv:1911.08177}, title = {Rethinking deep active learning: Using unlabeled data at model training}, year = {2019}, } @inproceedings{fathi2011combining, author = {Alireza Fathi and Maria-Florina Balcan and Xiaofeng Ren and James M. 
Rehg}, booktitle = {British Machine Vision Conference (BMVC)}, title = {Combining Self Training and Active Learning for Video Segmentation}, year = {2011}, } @inproceedings{ribeiro2019red, author = {Marco Tulio Ribeiro and Carlos Guestrin and Sameer Singh}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Are Red Roses Red? Evaluating Consistency of Question-Answering Models}, year = {2019}, } @inproceedings{manning2011pos, author = {Christopher D. Manning}, booktitle = {International Conference on Computational Linguistics and Intelligent Text Processing (CICLing)}, title = {Part-of-Speech Tagging from 97\% to 100\%: Is It Time for Some Linguistics?}, year = {2011}, } @inproceedings{goodwin2020probing, author = {Emily Goodwin and Koustuv Sinha and Timothy J. O'Donnell}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Probing Linguistic Systematicity}, year = {2020}, } @article{brown2020gpt3, author = {Tom B. Brown and Benjamin Mann and Nick Ryder and Melanie Subbiah and Jared Kaplan and Prafulla Dhariwal and Arvind Neelakantan and Pranav Shyam and Girish Sastry and Amanda Askell and Sandhini Agarwal and Ariel Herbert-Voss and Gretchen Krueger and Tom Henighan and Rewon Child and Aditya Ramesh and Daniel M. Ziegler and Jeffrey Wu and Clemens Winter and Christopher Hesse and Mark Chen and Eric Sigler and Mateusz Litwin and Scott Gray and Benjamin Chess and Jack Clark and Christopher Berner and Sam McCandlish and Alec Radford and Ilya Sutskever and Dario Amodei}, journal = {arXiv preprint arXiv:2005.14165}, title = {Language Models are Few-Shot Learners}, year = {2020}, } @article{robey2020modelbased, author = {Alexander Robey and Hamed Hassani and George J.
Pappas}, journal = {arXiv preprint arXiv:2005.10247}, title = {Model-Based Robust Deep Learning}, year = {2020}, } @misc{berger2017translated, author = {Yotam Berger}, howpublished = {\url{https://www.haaretz.com/israel-news/palestinian-arrested-over-mistranslated-good-morning-facebook-post-1.5459427}}, title = {Israel Arrests Palestinian Because Facebook Translated `Good Morning' to `Attack Them'}, year = {2017}, } @inproceedings{maccartney2008nli, author = {Bill MacCartney and Christopher D. Manning}, booktitle = {International Conference on Computational Linguistics (COLING)}, title = {Modeling Semantic Containment and Exclusion in Natural Language Inference}, year = {2008}, } @phdthesis{schain2015robustness, author = {Mariano Schain}, school = {Tel Aviv University}, title = {Machine Learning Algorithms and Robustness}, year = {2015}, } @inproceedings{gowal2019scalable, author = {Sven Gowal and Krishnamurthy Dvijotham and Robert Stanforth and Rudy Bunel and Chongli Qin and Jonathan Uesato and Relja Arandjelovi{\'c} and Timothy Mann and Pushmeet Kohli}, booktitle = {International Conference on Computer Vision (ICCV)}, title = {Scalable Verified Training for Provably Robust Image Classification}, year = {2019}, } @inproceedings{ettinger2017generalizable, author = {Allyson Ettinger and Sudha Rao and Hal {Daum{\'e} III} and Emily M. Bender}, booktitle = {Workshop on Building Linguistically Generalizable NLP Systems}, title = {Towards Linguistically Generalizable {NLP} Systems: A Workshop and Shared Task}, year = {2017}, } @article{wallace2019trick, author = {Eric Wallace and Pedro Rodriguez and Shi Feng and Ikuya Yamada and Jordan Boyd-Graber}, journal = {Transactions of the Association for Computational Linguistics (TACL)}, title = {Trick Me If You Can: Human-in-the-Loop Generation of Adversarial Examples for Question Answering}, volume = {7}, year = {2019}, } @inproceedings{klein2001parsing, author = {Dan Klein and Christopher D. 
Manning}, booktitle = {Association for Computational Linguistics (ACL)}, pages = {338--345}, title = {Parsing with Treebank Grammars: Empirical Bounds, Theoretical Models, and the Structure of the {Penn} Treebank}, year = {2001}, } @inproceedings{azaria2016instructable, author = {Amos Azaria and Jayant Krishnamurthy and Tom M. Mitchell}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, pages = {2681--2689}, title = {Instructable Intelligent Personal Agent}, year = {2016}, } @article{iyyer2016answering, author = {Mohit Iyyer and Wen-tau Yih and Ming-Wei Chang}, journal = {arXiv preprint arXiv:1611.01242}, title = {Answering Complicated Question Intents Expressed in Decomposed Question Sequences}, year = {2016}, } @inproceedings{jia2017concepts, author = {Robin Jia and Larry Heck and Dilek Hakkani-T{\"u}r and Georgi Nikolov}, booktitle = {International Conference on Acoustics, Speech, and Signal Processing (ICASSP)}, title = {Learning Concepts through Conversations in Spoken Dialogue Systems}, year = {2017}, } @article{dijkstra1978ewd667, author = {Edsger W. Dijkstra}, journal = {EWD667}, title = {On the foolishness of ``natural language programming''}, year = {1978}, } @inproceedings{campagna2017almond, author = {Giovanni Campagna and Rakesh Ramesh and Silei Xu and Michael Fischer and Monica S. Lam}, booktitle = {World Wide Web (WWW)}, pages = {341--350}, title = {Almond: The Architecture of an Open, Crowdsourced, Privacy-Preserving, Programmable Virtual Assistant}, year = {2017}, } @inproceedings{gulwani2014nlyze, author = {Sumit Gulwani and Mark Marron}, booktitle = {International Conference on Management of Data (SIGMOD)}, pages = {803--814}, title = {{NLyze}: interactive programming by natural language for spreadsheet data analysis and manipulation}, year = {2014}, } @techreport{lin2017program, author = {Xi Victoria Lin and Chenglong Wang and Deric Pang and Kevin Vu and Luke Zettlemoyer and Michael D.
Ernst}, institution = {University of Washington}, number = {UW-CSE-17-03-01}, title = {Program synthesis from natural language using recurrent neural networks}, year = {2017}, } @book{ullmann1962semantics, author = {S. Ullmann}, publisher = {W. de Gruyter}, title = {Semantics: An Introduction to the Science of Meaning}, year = {1962}, } @book{kittredge1982sublanguage, author = {R. Kittredge and J. Lehrberger}, publisher = {B. Blackwell}, title = {Sublanguage: Studies of Language in Restricted Semantic Domains}, year = {1982}, } @article{srinivasan2017nli, author = {Arjun Srinivasan and John Stasko}, journal = {EuroVis}, title = {Natural Language Interfaces for Data Analysis with Visualization: Considering What Has and Could Be Asked}, year = {2017}, } @article{kuhl2004earlylanguage, author = {Patricia K Kuhl}, journal = {Nature Reviews Neuroscience}, title = {Early language acquisition: cracking the speech code}, year = {2004}, } @book{krashen1982second, author = {Stephen Krashen}, publisher = {Pergamon Press}, title = {Principles and Practice in Second Language Acquisition}, year = {1982}, } @article{sachs1981language, author = {Jacqueline Sachs and Barbara Bard and Marie L Johnson}, journal = {Applied Psycholinguistics}, title = {Language learning with restricted input: Case studies of two hearing children of deaf parents}, volume = {2}, year = {1981}, } @article{partee1995lexical, author = {Barbara H. Partee}, journal = {An Invitation to Cognitive Science}, title = {Lexical semantics and compositionality}, volume = {1}, year = {1995}, } @inproceedings{dostert1969rel2, author = {Bozena Dostert and Frederick B. Thompson}, booktitle = {International Conference on Computational Linguistics (COLING)}, title = {{REL}: A Rapidly Extensible Language System {II}. {REL} {English}}, year = {1969}, } @inproceedings{dostert1969rel, author = {Bozena Dostert and Frederick B.
Thompson}, booktitle = {International Conference on Computational Linguistics (COLING)}, title = {{REL}: A Rapidly Extensible Language System {I}}, year = {1969}, } @article{thompson1975rel, author = {Frederick B. Thompson and Bozena Henisz Thompson}, journal = {Advances in Computers}, pages = {109--168}, title = {Practical Natural Language Processing: The {REL} System as Prototype}, volume = {13}, year = {1975}, } @book{campbell1998historical, author = {L. Campbell}, publisher = {Edinburgh University Press}, title = {Historical Linguistics: An Introduction}, year = {1998}, } @book{bar1964language, author = {Y Bar-Hillel}, publisher = {Addison-Wesley/The Jerusalem Academic Press}, title = {Language and Information: Selected Essays on Their Theory and Application}, year = {1964}, } @article{konstas2017neural, author = {Ioannis Konstas and Srinivasan Iyer and Mark Yatskar and Yejin Choi and Luke Zettlemoyer}, journal = {arXiv preprint arXiv:1704.08381}, title = {Neural {AMR}: Sequence-to-Sequence Models for Parsing and Generation}, year = {2017}, } @inproceedings{iyer2017neural, author = {Srinivasan Iyer and Ioannis Konstas and Alvin Cheung and Jayant Krishnamurthy and Luke Zettlemoyer}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Learning a Neural Semantic Parser from User Feedback}, year = {2017}, } @article{scassellati2012robots, author = {Brian Scassellati and Henny Admoni and Maja Matari{\'c}}, journal = {Annual Review of Biomedical Engineering}, pages = {275--294}, title = {Robots for Use in Autism Research}, volume = {14}, year = {2012}, } @inproceedings{knepper2013ikeabot, author = {Ross A. Knepper and Todd Layton and John Romanishin and Daniela Rus}, booktitle = {International Conference on Robotics and Automation (ICRA)}, pages = {855--862}, title = {{IkeaBot}: An autonomous multi-robot coordinated furniture assembly system}, year = {2013}, } @inproceedings{thomason2015learning, author = {Jesse Thomason and Shiqi Zhang and Raymond J.
Mooney and Peter Stone}, booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)}, title = {Learning to Interpret Natural Language Commands through Human-Robot Dialog}, year = {2015}, } @inproceedings{koch2015siamese, author = {Gregory R. Koch and Richard Zemel and Ruslan Salakhutdinov}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Siamese Neural Networks for One-Shot Image Recognition}, year = {2015}, } @inproceedings{johnson2016malmo, author = {Matthew Johnson and Katja Hofmann and Tim Hutton and David Bignell}, booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)}, title = {The Malmo Platform for Artificial Intelligence Experimentation}, year = {2016}, } @inproceedings{arumugam2017accurately, author = {Dilip Arumugam and Siddharth Karamcheti and Nakul Gopalan and Lawson L. S. Wong and Stefanie Tellex}, booktitle = {Robotics: Science and Systems (RSS)}, title = {Accurately and Efficiently Interpreting Human-Robot Instructions of Varying Granularities}, year = {2017}, } @inproceedings{karamcheti2017draggns, author = {Siddharth Karamcheti and Edward C. Williams and Dilip Arumugam and Mina Rhee and Nakul Gopalan and Lawson L. S. 
Wong and Stefanie Tellex},
  booktitle = {First Workshop on Language Grounding for Robotics @ ACL},
  title = {A Tale of Two {DRAGGNs}: A Hybrid Approach for Interpreting Action-Oriented and Goal-Oriented Instructions},
  year = {2017},
}

@inproceedings{koehn2017six,
  author = {Philipp Koehn and Rebecca Knowles},
  booktitle = {NMT@ACL},
  title = {Six Challenges for Neural Machine Translation},
  year = {2017},
}

@article{hermann2017grounded,
  author = {Karl Moritz Hermann and Felix Hill and Simon Green and Fumin Wang and Ryan Faulkner and Hubert Soyer and David Szepesvari and Wojciech Czarnecki and Max Jaderberg and Denis Teplyashin and Marcus Wainwright and Chris Apps and Demis Hassabis and Phil Blunsom},
  journal = {arXiv preprint arXiv:1706.06551},
  title = {Grounded Language Learning in a Simulated {3D} World},
  year = {2017},
}

@article{kolve2017ai2thor,
  author = {Eric Kolve and Roozbeh Mottaghi and Daniel Gordon and Yuke Zhu and Abhinav Gupta and Ali Farhadi},
  journal = {arXiv preprint arXiv:1712.05474},
  title = {{AI2-THOR}: An Interactive {3D} Environment for Visual {AI}},
  year = {2017},
}

@inproceedings{labutov2018lia,
  author = {Igor Labutov and Shashank Srivastava and Tom Michael Mitchell},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{LIA}: A Natural Language Programmable Personal Assistant},
  year = {2018},
}

@inproceedings{chaplot2018gated,
  author = {Devendra Singh Chaplot and Kanthashree Mysore Sathyendra and Rama Kumar Pasumarthi and Dheeraj Rajagopal and Ruslan Salakhutdinov},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Gated-Attention Architectures for Task-Oriented Language Grounding},
  year = {2018},
}

@inproceedings{ott2018analyzing,
  author = {Myle Ott and Michael Auli and David Grangier and Marc'Aurelio Ranzato},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Analyzing Uncertainty in Neural Machine Translation},
  year = {2018},
}

@inproceedings{damen2018kitchens,
author = {Dima Damen and Hazel Doughty and Giovanni Maria Farinella and Sanja Fidler and Antonino Furnari and Evangelos Kazakos and Davide Moltisanti and Jonathan Munro and Toby Perrett and Will Price and Michael Wray},
  booktitle = {European Conference on Computer Vision (ECCV)},
  title = {Scaling Egocentric Vision: The {EPIC}-{KITCHENS} Dataset},
  year = {2018},
}

@inproceedings{fried2018speakerfollower,
  author = {Daniel Fried and Ronghang Hu and Volkan Cirik and Anna Rohrbach and Jacob Andreas and Louis-Philippe Morency and Taylor Berg-Kirkpatrick and Kate Saenko and Dan Klein and Trevor Darrell},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Speaker-Follower Models for Vision-and-Language Navigation},
  year = {2018},
}

@inproceedings{yu2019cosql,
  author = {Tao Yu and Rui Zhang and He Yang Er and Suyi Li and Eric Xue and Bo Pang and Xi Victoria Lin and Yi Chern Tan and Tianze Shi and Zihan Li and Youxuan Jiang and Michihiro Yasunaga and Sungrok Shim and Tao Chen and Alexander R. Fabbri and Zifan Li and Luyao Chen and Yuwen Zhang and Shreya Dixit and Vincent Zhang and Caiming Xiong and Richard Socher and Walter S. Lasecki and Dragomir R.
Radev},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{CoSQL}: A Conversational Text-to-{SQL} Challenge Towards Cross-Domain Natural Language Interfaces to Databases},
  year = {2019},
}

@inproceedings{chevalierboisvert2019babyai,
  author = {Maxime Chevalier-Boisvert and Dzmitry Bahdanau and Salem Lahlou and Lucas Willems and Chitwan Saharia and Thien Huu Nguyen and Yoshua Bengio},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {{BabyAI}: A Platform to Study the Sample Efficiency of Grounded Language Learning},
  year = {2019},
}

@inproceedings{yao2019model,
  author = {Ziyu Yao and Yu Su and Huan Sun and Wen-tau Yih},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Model-based Interactive Semantic Parsing: A Unified Framework and A Text-to-{SQL} Case Study},
  year = {2019},
}

@article{gray2019craftassist,
  author = {Jonathan Gray and Kavya Srinet and Yacine Jernite and Haonan Yu and Zhuoyuan Chen and Demi Guo and Siddharth Goyal and C. Lawrence Zitnick and Arthur Szlam},
  journal = {arXiv preprint arXiv:1907.08584},
  title = {{CraftAssist}: A Framework for Dialogue-enabled Interactive Agents},
  year = {2019},
}

@article{lee2019ikea,
  author = {Youngwoon Lee and Edward S. Hu and Zhengyu Yang and Alex Yin and Joseph J Lim},
  journal = {arXiv preprint arXiv:1911.07246},
  title = {{IKEA} Furniture Assembly Environment for Long-Horizon Complex Manipulation Tasks},
  year = {2019},
}

@inproceedings{thomason2019improving,
  author = {Jesse Thomason and Aishwarya Padmakumar and Jivko Sinapov and Nick Walker and Yuqian Jiang and Harel Yedidsion and Justin W. Hart and Peter Stone and Raymond J. Mooney},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  title = {Improving Grounded Natural Language Understanding through Human-Robot Dialog},
  year = {2019},
}

@inproceedings{weigelt2020programmingfuse,
  author = {Sebastian Weigelt and Vanessa Steurer and Tobias Hey and W.
Tichy},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Programming in Natural Language with {fuSE}: Synthesizing Methods from Spoken Utterances Using Deep Natural Language Understanding},
  year = {2020},
}

@inproceedings{shridhar2020alfred,
  author = {Mohit Shridhar and Jesse Thomason and Daniel Gordon and Yonatan Bisk and Winson Han and Roozbeh Mottaghi and Luke Zettlemoyer and Dieter Fox},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {{ALFRED}: A Benchmark for Interpreting Grounded Instructions for Everyday Tasks},
  year = {2020},
}

@article{wilson1996relative,
  author = {William J Wilson and CC Williams Hulls and Graham S Bell},
  journal = {IEEE Transactions on Robotics (T-RO)},
  pages = {684--696},
  title = {Relative end-effector control using {Cartesian} position based visual servoing},
  volume = {12},
  year = {1996},
}

@article{ciocarlie2009hand,
  author = {Matei T Ciocarlie and Peter K Allen},
  journal = {International Journal of Robotics Research (IJRR)},
  pages = {851--867},
  title = {Hand posture subspaces for dexterous robotic grasping},
  volume = {28},
  year = {2009},
}

@article{artemiadis2010emg,
  author = {Panagiotis K Artemiadis and Kostas J Kyriakopoulos},
  journal = {IEEE Transactions on Robotics (T-RO)},
  pages = {393--398},
  title = {{EMG}-based control of a robot arm using low-dimensional embeddings},
  volume = {26},
  year = {2010},
}

@inproceedings{lai2012detection,
  author = {Kevin Lai and Liefeng Bo and Xiaofeng Ren and Dieter Fox},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages = {1330--1337},
  title = {Detection-based object labeling in {3D} scenes},
  year = {2012},
}

@article{matrone2012real,
  author = {Giulia C Matrone and Christian Cipriani and Maria Chiara Carrozza and Giovanni Magenes},
  journal = {Journal of Neuroengineering and Rehabilitation},
  pages = {40},
  title = {Real-time myoelectric control of a multi-fingered hand prosthesis using principal components analysis},
  volume =
{9},
  year = {2012},
}

@inproceedings{todorov2012mujoco,
  author = {E. Todorov and T. Erez and Y. Tassa},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  pages = {5026--5033},
  title = {{MuJoCo}: A physics engine for model-based control},
  year = {2012},
}

@article{dragan2013policy,
  author = {Anca D Dragan and Siddhartha S Srinivasa},
  journal = {International Journal of Robotics Research (IJRR)},
  pages = {790--805},
  title = {A policy-blending formalism for shared control},
  volume = {32},
  year = {2013},
}

@article{chen2013robots,
  author = {T. L. Chen and M. Ciocarlie and S. Cousins and Phillip M. Grice and Kelsey P. Hawkins and K. Hsiao and Charles C. Kemp and C. King and Daniel A. Lazewatsky and A. Leeper and H. Nguyen and A. Paepcke and C. Pantofaru and W. Smart and L. Takayama},
  journal = {IEEE Robotics \& Automation Magazine (RAM)},
  pages = {30--39},
  title = {Robots for humanity: using assistive robotics to empower people with disabilities},
  volume = {20},
  year = {2013},
}

@article{carlson2013brain,
  author = {Tom Carlson and Jose del R Millan},
  journal = {IEEE Robotics \& Automation Magazine (RAM)},
  pages = {65--73},
  title = {Brain-controlled wheelchairs: a robotic architecture},
  volume = {20},
  year = {2013},
}

@article{goodrich2013teleoperation,
  author = {M. A. Goodrich and J. Crandall and E.
Barakova},
  journal = {Reviews of Human Factors and Ergonomics},
  pages = {175--226},
  title = {Teleoperation and Beyond for Assistive Humanoid Robots},
  volume = {9},
  year = {2013},
}

@inproceedings{conti2014interface,
  author = {Fran{\c{c}}ois Conti and Jaeheung Park and Oussama Khatib},
  booktitle = {Experimental Robotics},
  pages = {97--113},
  title = {Interface design and control strategies for a robot assisted ultrasonic examination system},
  year = {2014},
}

@misc{tzutalin2015labelimg,
  author = {Tzutalin},
  howpublished = {\url{https://github.com/tzutalin/labelImg}},
  title = {{LabelImg}},
  year = {2015},
}

@inproceedings{jain2015assistive,
  author = {Siddarth Jain and Ali Farshchiansadegh and Alexander Broad and Farnaz Abdollahi and Ferdinando Mussa-Ivaldi and Brenna Argall},
  booktitle = {IEEE International Conference on Rehabilitation Robotics (ICORR)},
  pages = {526--531},
  title = {Assistive robotic manipulation through shared autonomy and a body-machine interface},
  year = {2015},
}

@inproceedings{watter2015embed,
  author = {Manuel Watter and Jost Springenberg and Joschka Boedecker and Martin Riedmiller},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2746--2754},
  title = {Embed to control: a locally linear latent dynamics model for control from raw images},
  year = {2015},
}

@article{muelling2015autonomy,
  author = {Katharina Muelling and Arun Venkatraman and Jean-Sebastien Valois and John Downey and Jeffrey Weiss and Shervin Javdani and Martial Hebert and Andrew B Schwartz and Jennifer L Collinger and J Andrew Bagnell},
  journal = {arXiv preprint arXiv:1503.05451},
  title = {Autonomy infused teleoperation with application to {BCI} manipulation},
  year = {2015},
}

@article{jonschkowski2015statereps,
  author = {Rico Jonschkowski and Oliver Brock},
  journal = {Autonomous Robots},
  pages = {407--428},
  title = {Learning state representations with robotic priors},
  volume = {39},
  year = {2015},
}

@inproceedings{redmon2016yolo,
  author = {Joseph Redmon
and Santosh Divvala and Ross B. Girshick and Ali Farhadi},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {779--788},
  title = {You Only Look Once: Unified, Real-Time Object Detection},
  year = {2016},
}

@inproceedings{herlant2016assistive,
  author = {Laura V Herlant and Rachel M Holladay and Siddhartha S Srinivasa},
  booktitle = {ACM/IEEE International Conference on Human Robot Interaction (HRI)},
  pages = {35--42},
  title = {Assistive teleoperation of robot arms via automatic time-optimal mode switching},
  year = {2016},
}

@article{levine2016end,
  author = {S. Levine and Chelsea Finn and Trevor Darrell and P. Abbeel},
  journal = {Journal of Machine Learning Research (JMLR)},
  title = {End-to-End Training of Deep Visuomotor Policies},
  volume = {17},
  year = {2016},
}

@article{gopinath2016human,
  author = {Deepak Gopinath and Siddarth Jain and Brenna D Argall},
  journal = {IEEE Robotics and Automation Letters (RA-L)},
  pages = {247--254},
  title = {Human-in-the-loop optimization of shared autonomy in assistive robotics},
  volume = {2},
  year = {2016},
}

@inproceedings{nikolaidis2017human,
  author = {Stefanos Nikolaidis and Yu Xiang Zhu and David Hsu and Siddhartha Srinivasa},
  booktitle = {ACM/IEEE International Conference on Human Robot Interaction (HRI)},
  pages = {294--302},
  title = {Human-robot mutual adaptation in shared autonomy},
  year = {2017},
}

@inproceedings{zhu2017target,
  author = {Yuke Zhu and Roozbeh Mottaghi and Eric Kolve and Joseph J Lim and Abhinav Gupta and Li Fei-Fei and Ali Farhadi},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages = {3357--3364},
  title = {Target-driven visual navigation in indoor scenes using deep reinforcement learning},
  year = {2017},
}

@inproceedings{laghi2017teleimpedance,
  author = {Marco Laghi and A. Ajoudani and M. Catalano and A.
Bicchi},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  pages = {2564--2571},
  title = {Tele-impedance with force feedback under communication time delay},
  year = {2017},
}

@book{taylor2018americans,
  author = {Danielle M Taylor},
  publisher = {US Census Bureau},
  title = {Americans With Disabilities: 2014},
  year = {2018},
}

@article{newman2018harmonic,
  author = {Benjamin A. Newman and Reuben M. Aronson and S. Srinivasa and K. Kitani and Henny Admoni},
  journal = {arXiv preprint arXiv:1807.11154},
  title = {{HARMONIC}: A Multimodal Dataset of Assistive Human-Robot Collaboration},
  year = {2018},
}

@inproceedings{aronson2018eye,
  author = {Reuben M Aronson and Thiago Santini and Thomas C K{\"u}bler and Enkelejda Kasneci and Siddhartha Srinivasa and Henny Admoni},
  booktitle = {ACM/IEEE International Conference on Human Robot Interaction (HRI)},
  pages = {4--13},
  title = {Eye-hand behavior in human-robot shared manipulation},
  year = {2018},
}

@inproceedings{reddy2018shared,
  author = {Siddharth Reddy and Anca D Dragan and Sergey Levine},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Shared autonomy via deep reinforcement learning},
  year = {2018},
}

@article{javdani2018shared,
  author = {Shervin Javdani and Henny Admoni and Stefania Pellegrinelli and Siddhartha S Srinivasa and J Andrew Bagnell},
  journal = {International Journal of Robotics Research (IJRR)},
  pages = {717--742},
  title = {Shared autonomy via hindsight optimization for teleoperation and teaming},
  volume = {37},
  year = {2018},
}

@article{losey2018review,
  author = {Dylan P Losey and Craig G McDonald and Edoardo Battaglia and Marcia K O'Malley},
  journal = {Applied Mechanics Reviews},
  title = {A review of intent detection, arbitration, and communication aspects of shared control for physical human-robot interaction},
  volume = {70},
  year = {2018},
}

@article{argall2018autonomy,
  author = {Brenna D Argall},
  journal = {Annual Review of Control, Robotics, and Autonomous Systems},
pages = {441--463},
  title = {Autonomy in rehabilitation robotics: an intersection},
  volume = {1},
  year = {2018},
}

@misc{openvino2018cvat,
  author = {OpenVinoToolKit},
  howpublished = {\url{https://github.com/openvinotoolkit/cvat}},
  title = {Computer Vision Annotation Tool},
  year = {2018},
}

@inproceedings{fan2018surreal,
  author = {Linxi Fan and Yuke Zhu and Jiren Zhu and Zihua Liu and Orien Zeng and Anchit Gupta and Joan Creus-Costa and Silvio Savarese and Li Fei-Fei},
  booktitle = {Conference on Robot Learning},
  title = {{SURREAL}: Open-Source Reinforcement Learning Framework and Robot Manipulation Benchmark},
  year = {2018},
}

@inproceedings{reyes2018self,
  author = {John Co-Reyes and YuXuan Liu and Abhishek Gupta and Benjamin Eysenbach and Pieter Abbeel and Sergey Levine},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1009--1018},
  title = {Self-consistent trajectory autoencoder: hierarchical reinforcement learning with trajectory embeddings},
  year = {2018},
}

@inproceedings{broad2018learning,
  author = {Alexander Broad and Todd Murphey and Brenna Argall},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Learning models for shared control of human-machine systems with unknown dynamics},
  year = {2018},
}

@article{jain2019probabilistic,
  author = {Siddarth Jain and Brenna Argall},
  journal = {ACM Transactions on Human-Robot Interaction (THRI)},
  pages = {1--23},
  title = {Probabilistic human intent recognition for shared autonomy in assistive robotics},
  volume = {9},
  year = {2019},
}

@inproceedings{yu2019unsupervised,
  author = {Tianhe Yu and Gleb Shevchuk and Dorsa Sadigh and Chelsea Finn},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Unsupervised Visuomotor Control through Distributional Planning Networks},
  year = {2019},
}

@inproceedings{wang2019learning,
  author = {Angelina Wang and Thanard Kurutach and Kara Liu and P. Abbeel and A.
Tamar},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Learning Robotic Manipulation through Visual Planning and Acting},
  year = {2019},
}

@inproceedings{broad2019highly,
  author = {Alexander Broad and Todd Murphey and Brenna Argall},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Highly parallelized data-driven {MPC} for minimal intervention shared control},
  year = {2019},
}

@inproceedings{chandak2019learning,
  author = {Yash Chandak and Georgios Theocharous and James Kostas and Scott Jordan and Philip Thomas},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {941--950},
  title = {Learning action representations for reinforcement learning},
  year = {2019},
}

@article{lynch2019learning,
  author = {Corey Lynch and Mohi Khansari and Ted Xiao and Vikash Kumar and Jonathan Tompson and Sergey Levine and Pierre Sermanet},
  journal = {arXiv preprint arXiv:1903.01973},
  title = {Learning Latent Plans from Play},
  year = {2019},
}

@article{feng2019robot,
  author = {Ryan Feng and Young-sun Kim and Gilwoo Lee and E. Gordon and Matt Schmittle and Shivaum Kumar and T. Bhattacharjee and S. Srinivasa},
  journal = {arXiv preprint arXiv:1906.02350},
  title = {Robot-Assisted Feeding: Generalizing Skewering Strategies across Food Items on a Realistic Plate},
  year = {2019},
}

@inproceedings{edwards2019imitating,
  author = {Ashley Edwards and Himanshu Sahni and Yannick Schroecker and Charles Isbell},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1755--1763},
  title = {Imitating latent policies from observation},
  year = {2019},
}

@inproceedings{bhattacharjee2020more,
  author = {Tapomayukh Bhattacharjee and Ethan K Gordon and Rosario Scalise and Maria E Cabrera and Anat Caspi and Maya Cakmak and Siddhartha S Srinivasa},
  booktitle = {ACM/IEEE International Conference on Human Robot Interaction (HRI)},
  pages = {181--190},
  title = {Is More Autonomy Always Better?
Exploring Preferences of Users with Mobility Impairments in Robot-assisted Feeding},
  year = {2020},
}

@manual{jocher2020yolov5,
  author = {Glenn Jocher and Alex Stoken and Jirka Borovec and NanoCode012 and ChristopherSTAN and Laughing and tkianai and Adam Hogan and lorenzomammana and yxNONG and AlexWang1900 and Laurentiu Diaconu and Marc and wanghaoyang0106 and ml5ah and Doug and Francisco Ingham and Frederik and Guilhen and Hatovix and Jake Poznanski and Jiacong Fang and Lijun Yu and changyu98 and Mingyu Wang and Naman Gupta and Osama Akhtar and PetrDvoracek and Prashant Rai},
  title = {{YOLO}-v5 repository},
  year = {2020},
}

@article{broad2020datadriven,
  author = {A. Broad and Ian Abraham and T. Murphey and Brenna Argall},
  journal = {International Journal of Robotics Research (IJRR)},
  pages = {1178--1195},
  title = {Data-driven {Koopman} operators for model-based shared control of human--machine systems},
  volume = {39},
  year = {2020},
}

@article{jing2020selfsupervised,
  author = {Longlong Jing and Yingli Tian},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)},
  title = {Self-supervised Visual Feature Learning with Deep Neural Networks: A Survey},
  year = {2020},
}

@article{park2020toward,
  author = {Daehyung Park and Yuuna Hoshi and Harshal P. Mahajan and W. Rogers and Charles C. Kemp},
  journal = {Robotics and Autonomous Systems},
  title = {Toward Active Robot-Assisted Feeding with a General-Purpose Mobile Manipulator: Design, Evaluation, and Lessons Learned},
  volume = {124},
  year = {2020},
}

@article{laghi2020unifying,
  author = {Marco Laghi and A. Ajoudani and M. Catalano and A. Bicchi},
  journal = {International Journal of Robotics Research (IJRR)},
  pages = {514--539},
  title = {Unifying bilateral teleoperation and tele-impedance for enhanced user experience},
  volume = {39},
  year = {2020},
}

@inproceedings{losey2020latent,
  author = {Dylan P.
Losey and Krishnan Srinivasan and Ajay Mandlekar and Animesh Garg and Dorsa Sadigh},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages = {378--384},
  title = {Controlling Assistive Robots with Learned Latent Actions},
  year = {2020},
}

@inproceedings{jeon2020sharedlatent,
  author = {Hong Jun Jeon and Dylan P. Losey and Dorsa Sadigh},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Shared Autonomy with Learned Latent Actions},
  year = {2020},
}

@inproceedings{li2020intuitive,
  author = {Mengxi Li and Dylan P. Losey and Jeannette Bohg and Dorsa Sadigh},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  title = {Learning User-Preferred Mappings for Intuitive Robot Control},
  year = {2020},
}

@inproceedings{freund1995adaboost,
  author = {Y. Freund and R. Schapire},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {A decision-theoretic generalization of on-line learning and an application to boosting},
  year = {1995},
}

@inproceedings{kumar2010self,
  author = {M Pawan Kumar and Benjamin Packer and Daphne Koller},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1189--1197},
  title = {Self-paced learning for latent variable models},
  year = {2010},
}

@article{young2014image,
  author = {P. Young and A. Lai and M. Hodosh and J.
Hockenmaier},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  pages = {67--78},
  title = {From image descriptions to visual denotations: New similarity metrics for semantic inference over event descriptions},
  volume = {2},
  year = {2014},
}

@inproceedings{ma2017self,
  author = {Fan Ma and Deyu Meng and Qi Xie and Zina Li and Xuanyi Dong},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Self-paced co-training},
  year = {2017},
}

@inproceedings{chang2017active,
  author = {Haw-Shiuan Chang and Erik Learned-Miller and Andrew McCallum},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1002--1012},
  title = {Active bias: Training more accurate neural networks by emphasizing high variance samples},
  year = {2017},
}

@inproceedings{ren2018reweighting,
  author = {Mengye Ren and Wenyuan Zeng and B. Yang and R. Urtasun},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Learning to Reweight Examples for Robust Deep Learning},
  year = {2018},
}

@inproceedings{romanov2018mednli,
  author = {Alexey Romanov and Chaitanya Shivade},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Lessons from Natural Language Inference in the Clinical Domain},
  year = {2018},
}

@inproceedings{belinkov2019premise,
  author = {Yonatan Belinkov and Adam Poliak and S. Shieber and Benjamin Van Durme and Alexander M.
Rush},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Don't Take the Premise for Granted: Mitigating Artifacts in Natural Language Inference},
  year = {2019},
}

@inproceedings{jiang2018mentornet,
  author = {Lu Jiang and Zhengyuan Zhou and Thomas Leung and Li-Jia Li and Li Fei-Fei},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {2304--2313},
  title = {{MentorNet}: Learning data-driven curriculum for very deep neural networks on corrupted labels},
  year = {2018},
}

@inproceedings{shu2019meta,
  author = {Jun Shu and Qi Xie and Lixuan Yi and Qian Zhao and Sanping Zhou and Zongben Xu and Deyu Meng},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1919--1930},
  title = {{Meta-Weight-Net}: Learning an explicit mapping for sample weighting},
  year = {2019},
}

@article{grefenstette2019higher,
  author = {Edward Grefenstette and Brandon Amos and Denis Yarats and Phu Mon Htut and Artem Molchanov and F. Meier and Douwe Kiela and Kyunghyun Cho and Soumith Chintala},
  journal = {arXiv preprint arXiv:1910.01727},
  title = {Generalized Inner Loop Meta-Learning},
  year = {2019},
}

@inproceedings{nie2020adversarial,
  author = {Yixin Nie and Adina Williams and Emily Dinan and Mohit Bansal and J. Weston and Douwe Kiela},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Adversarial {NLI}: A New Benchmark for Natural Language Understanding},
  year = {2020},
}

@inproceedings{mccoy2020berts,
  author = {R.
Thomas McCoy and Junghyun Min and Tal Linzen},
  booktitle = {Proceedings of the Third BlackBoxNLP Workshop on Analyzing and Interpreting Neural Networks for NLP @ EMNLP},
  title = {{BERTs} of a feather do not generalize together: Large variability in generalization across models with similar test set performance},
  year = {2020},
}

@inproceedings{lewis1994heterogeneous,
  author = {David D Lewis and Jason Catlett},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {148--156},
  title = {Heterogeneous uncertainty sampling for supervised learning},
  year = {1994},
}

@inproceedings{cohn1994active,
  author = {David A. Cohn and Zoubin Ghahramani and Michael I. Jordan},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Active Learning with Statistical Models},
  year = {1994},
}

@book{han2000datamining,
  author = {Jiawei Han and Micheline Kamber},
  publisher = {Morgan Kaufmann},
  title = {Data Mining: Concepts and Techniques},
  year = {2000},
}

@inproceedings{scheffer2001active,
  author = {Tobias Scheffer and Christian Decomain and Stefan Wrobel},
  booktitle = {International Symposium on Intelligent Data Analysis},
  pages = {309--318},
  title = {Active hidden {Markov} models for information extraction},
  year = {2001},
}

@inproceedings{krymolowski2002distinguishing,
  author = {Yuval Krymolowski},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  title = {Distinguishing easy and hard instances},
  year = {2002},
}

@inproceedings{jones2003active,
  author = {Rosie Jones and Rayid Ghani and Tom Mitchell and Ellen Riloff},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {26--34},
  title = {Active learning for information extraction with multiple view feature sets},
  year = {2003},
}

@inproceedings{finn2003active,
  author = {Aidan Finn and Nicolas Kushmerick},
  booktitle = {Proceedings of the International Workshop on Adaptive Text Extraction and Mining (ATEM-03)},
  pages =
{18--25},
  title = {Active learning selection strategies for information extraction},
  year = {2003},
}

@techreport{abramson2004active,
  author = {Yotam Abramson and Yoav Freund},
  institution = {University of California, San Diego},
  title = {Active learning for visual object recognition},
  year = {2004},
}

@inproceedings{hachey2005investigating,
  author = {Ben Hachey and Beatrice Alex and Markus Becker},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  pages = {144--151},
  title = {Investigating the effects of selective sampling on the annotation task},
  year = {2005},
}

@inproceedings{hoi2006batch,
  author = {Steven CH Hoi and Rong Jin and Jianke Zhu and Michael R Lyu},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {417--424},
  title = {Batch mode active learning and its application to medical image classification},
  year = {2006},
}

@article{schein2007active,
  author = {A. Schein and Lyle H. Ungar},
  journal = {Machine Learning},
  pages = {235--265},
  title = {Active learning for logistic regression: An evaluation},
  volume = {68},
  year = {2007},
}

@inproceedings{collins2008towards,
  author = {Brendan Collins and Jia Deng and Kai Li and Li Fei-Fei},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages = {86--98},
  title = {Towards scalable dataset construction: An active learning approach},
  year = {2008},
}

@inproceedings{joshi2009multi,
  author = {Ajay J Joshi and Fatih Porikli and Nikolaos Papanikolopoulos},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {2372--2379},
  title = {Multi-class active learning for image classification},
  year = {2009},
}

@techreport{settles2009active,
  author = {Burr Settles},
  institution = {University of Wisconsin, Madison},
  title = {Active learning literature survey},
  year = {2009},
}

@inproceedings{bigham2010vizwiz,
  author = {Jeffrey P Bigham and Chandrika Jayant and Hanjie Ji and Greg Little and Andrew Miller and Robert C Miller and Robin Miller and
Aubrey Tatarowicz and Brandyn White and Samual White and Tom Yeh},
  booktitle = {User Interface Software and Technology (UIST)},
  pages = {333--342},
  title = {{VizWiz}: nearly real-time answers to visual questions},
  year = {2010},
}

@article{houlsby2011bayesian,
  author = {Neil Houlsby and Ferenc Husz{\'a}r and Zoubin Ghahramani and M{\'a}t{\'e} Lengyel},
  journal = {arXiv preprint arXiv:1112.5745},
  title = {{B}ayesian active learning for classification and preference learning},
  year = {2011},
}

@inproceedings{khosla2012undoing,
  author = {Aditya Khosla and Tinghui Zhou and Tomasz Malisiewicz and Alexei A Efros and Antonio Torralba},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages = {158--171},
  title = {Undoing the damage of dataset bias},
  year = {2012},
}

@article{zhou2015simple,
  author = {Bolei Zhou and Yuandong Tian and Sainbayar Sukhbaatar and Arthur Szlam and Rob Fergus},
  journal = {arXiv preprint arXiv:1512.02167},
  title = {Simple baseline for visual question answering},
  year = {2015},
}

@article{ren2015frcnn,
  author = {Shaoqing Ren and Kaiming He and Ross B. Girshick and Jian Sun},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)},
  pages = {1137--1149},
  title = {Faster {R}-{CNN}: Towards Real-Time Object Detection with Region Proposal Networks},
  volume = {39},
  year = {2015},
}

@article{agrawal2015vqa1,
  author = {Aishwarya Agrawal and Jiasen Lu and Stanislaw Antol and Margaret Mitchell and C.
Lawrence Zitnick and Devi Parikh and Dhruv Batra},
  journal = {International Journal of Computer Vision},
  pages = {4--31},
  title = {{VQA}: Visual Question Answering},
  volume = {123},
  year = {2015},
}

@inproceedings{malinowski2015ask,
  author = {Mateusz Malinowski and Marcus Rohrbach and Mario Fritz},
  booktitle = {International Conference on Computer Vision (ICCV)},
  pages = {1--9},
  title = {Ask your neurons: A neural-based approach to answering questions about images},
  year = {2015},
}

@inproceedings{ren2015exploring,
  author = {Mengye Ren and Ryan Kiros and Richard Zemel},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2953--2961},
  title = {Exploring models and data for image question answering},
  year = {2015},
}

@inproceedings{lu2016hierarchical,
  author = {Jiasen Lu and Jianwei Yang and Dhruv Batra and Devi Parikh},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Hierarchical question-image co-attention for visual question answering},
  year = {2016},
}

@inproceedings{fukui2016multimodal,
  author = {Akira Fukui and Dong Huk Park and Daylen Yang and Anna Rohrbach and Trevor Darrell and Marcus Rohrbach},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Multimodal compact bilinear pooling for visual question answering and visual grounding},
  year = {2016},
}

@inproceedings{wu2016ask,
  author = {Qi Wu and Peng Wang and Chunhua Shen and Anthony Dick and Anton van den Hengel},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {4622--4630},
  title = {Ask me anything: Free-form visual question answering based on knowledge from external sources},
  year = {2016},
}

@inproceedings{zhu2016visual7w,
  author = {Yuke Zhu and Oliver Groth and Michael Bernstein and Li Fei-Fei},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {4995--5004},
  title = {Visual7{W}: Grounded question answering in images},
  year = {2016},
}

@article{lin2017active,
  author =
{Xiao Lin and Devi Parikh}, journal = {arXiv preprint arXiv:1711.01732}, title = {Active Learning for Visual Question Answering: An Empirical Study}, year = {2017}, } @inproceedings{shen2017deep, author = {Yanyao Shen and Hyokun Yun and Zachary C Lipton and Yakov Kronrod and Animashree Anandkumar}, booktitle = {Proceedings of the Second Workshop on Representation Learning for NLP (Repl4NLP)}, title = {Deep active learning for named entity recognition}, year = {2017}, } @inproceedings{kendall2017uncertainties, author = {Alex Kendall and Yarin Gal}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {5574--5584}, title = {What uncertainties do we need in {B}ayesian deep learning for computer vision?}, year = {2017}, } @article{krishna2017visual, author = {Ranjay Krishna and Yuke Zhu and Oliver Groth and Justin Johnson and Kenji Hata and Joshua Kravitz and Stephanie Chen and Yannis Kalantidi and Li-Jia Li and David A. Shamma and Michael S. Bernstein and Fei-Fei Li}, journal = {International Journal of Computer Vision}, pages = {32--73}, title = {Visual genome: Connecting language and vision using crowdsourced dense image annotations}, volume = {123}, year = {2017}, } @inproceedings{gal2017dbal, author = {Yarin Gal and R. Islam and Zoubin Ghahramani}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Deep {B}ayesian Active Learning with Image Data}, year = {2017}, } @inproceedings{deng2018adversarial, author = {Yue Deng and KaWai Chen and Yilin Shen and Hongxia Jin}, booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)}, pages = {4012--4018}, title = {Adversarial Active Learning for Sequences Labeling and Generation}, year = {2018}, } @inproceedings{teney2018tips, author = {Damien Teney and Peter Anderson and Xiaodong He and Anton V. D. 
Hengel},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {4223--4232},
  title = {Tips and Tricks for Visual Question Answering: Learnings from the 2017 Challenge},
  year = {2018},
}

@inproceedings{anderson2018butd,
  author = {Peter Anderson and Xiaodong He and Chris Buehler and Damien Teney and Mark Johnson and Stephen Gould and Lei Zhang},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {6077--6086},
  title = {Bottom-Up and Top-Down Attention for Image Captioning and Visual Question Answering},
  year = {2018},
}

@inproceedings{siddhant2018deep,
  author = {Aditya Siddhant and Zachary C Lipton},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Deep {B}ayesian active learning for natural language processing: Results of a large-scale empirical study},
  year = {2018},
}

@inproceedings{sener2018active,
  author = {Ozan Sener and Silvio Savarese},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Active learning for convolutional neural networks: A core-set approach},
  year = {2018},
}

@inproceedings{perez2018film,
  author = {Ethan Perez and Florian Strub and Harm de Vries and Vincent Dumoulin and Aaron C. Courville},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {{FiLM}: Visual Reasoning with a General Conditioning Layer},
  year = {2018},
}

@inproceedings{misra2018learning,
  author = {Ishan Misra and Ross Girshick and Rob Fergus and Martial Hebert and Abhinav Gupta and Laurens van der Maaten},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {11--20},
  title = {Learning by asking questions},
  year = {2018},
}

@inproceedings{hudson2018mac,
  author = {Drew A. Hudson and Christopher D.
Manning},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Compositional Attention Networks for Machine Reasoning},
  year = {2018},
}

@inproceedings{park2019ai,
  author = {Junwon Park and Ranjay Krishna and Pranav Khadpe and Li Fei-Fei and Michael Bernstein},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {115--124},
  title = {{AI}-based request augmentation to increase crowdsourcing participation},
  volume = {7},
  year = {2019},
}

@inproceedings{suhr2019nlvr2,
  author = {Alane Suhr and Stephanie Zhou and Ally Zhang and Iris Zhang and Huajun Bai and Yoav Artzi},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {A corpus for reasoning about natural language grounded in photographs},
  year = {2019},
}

@inproceedings{tan2019lxmert,
  author = {Hao Tan and Mohit Bansal},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {{LXMERT}: Learning Cross-Modality Encoder Representations from Transformers},
  year = {2019},
}

@inproceedings{paszke2019pytorch,
  author = {Adam Paszke and Sam Gross and Francisco Massa and Adam Lerer and James Bradbury and Gregory Chanan and Trevor Killeen and Zeming Lin and Natalia Gimelshein and Luca Antiga and Alban Desmaison and Andreas K{\"o}pf and Edward Yang and Zach DeVito and Martin Raison and Alykhan Tejani and Sasank Chilamkurthy and Benoit Steiner and Lu Fang and Junjie Bai and Soumith Chintala},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {{PyTorch}: An Imperative Style, High-Performance Deep Learning Library},
  year = {2019},
}

@inproceedings{zellers2019recognition,
  author = {Rowan Zellers and Yonatan Bisk and Ali Farhadi and Yejin Choi},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {6720--6731},
  title = {From recognition to cognition: Visual commonsense reasoning},
  year = {2019},
}

@article{jedoui2019deep,
  author = {Khaled Jedoui and Ranjay Krishna and
Michael Bernstein and Li Fei-Fei},
  journal = {arXiv preprint arXiv:1912.01119},
  title = {Deep {B}ayesian active learning for multiple correct outputs},
  year = {2019},
}

@inproceedings{li2019repair,
  author = {Yi Li and Nuno Vasconcelos},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {9572--9581},
  title = {Repair: Removing representation bias by dataset resampling},
  year = {2019},
}

@inproceedings{toneva2019empirical,
  author = {Mariya Toneva and Alessandro Sordoni and {Tachet des Combes}, Remi and Adam Trischler and Yoshua Bengio and Geoffrey J Gordon},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {An empirical study of example forgetting during deep neural network learning},
  year = {2019},
}

@inproceedings{hudson2019nsm,
  author = {Drew A. Hudson and Christopher D. Manning},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Learning by Abstraction: The Neural State Machine},
  year = {2019},
}

@inproceedings{chen2020uniter,
  author = {Yen-Chun Chen and Linjie Li and Licheng Yu and Ahmed El Kholy and Faisal Ahmed and Zhe Gan and Yu Cheng and Jingjing Liu},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages = {104--120},
  title = {{UNITER}: Universal image-text representation learning},
  year = {2020},
}

@inproceedings{le2020adversarial,
  author = {Le Bras, Ronan and Swabha Swayamdipta and Chandra Bhagavatula and Rowan Zellers and Matthew Peters and Ashish Sabharwal and Yejin Choi},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1078--1088},
  title = {Adversarial filters of dataset biases},
  year = {2020},
}

@inproceedings{swayamdipta2020dataset,
  author = {Swabha Swayamdipta and Roy Schwartz and Nicholas Lourie and Yizhong Wang and Hannaneh Hajishirzi and Noah A.
Smith and Yejin Choi},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Dataset cartography: Mapping and diagnosing datasets with training dynamics},
  year = {2020},
}

@article{deming1944theory,
  author = {W. E. Deming and John von Neumann and Oskar Morgenstern},
  journal = {Journal of the American Statistical Association (JASA)},
  title = {Theory of Games and Economic Behavior},
  volume = {40},
  year = {1944},
}

@article{nash1950bargaining,
  author = {John Nash},
  journal = {Econometrica},
  pages = {155--162},
  title = {The Bargaining Problem},
  volume = {18},
  year = {1950},
}

@article{nash1951noncooperative,
  author = {John Nash},
  journal = {Annals of Mathematics},
  title = {Non-Cooperative Games},
  volume = {54},
  year = {1951},
}

@article{panait2005cooperative,
  author = {Liviu Panait and Sean Luke},
  journal = {Autonomous Agents and Multi-Agent Systems},
  number = {3},
  pages = {387--434},
  title = {Cooperative Multi-Agent Learning: The State of the Art},
  volume = {11},
  year = {2005},
}

@inproceedings{he2016opponent,
  author = {He He and Jordan L. Boyd-Graber and Kevin Kwok and Daum{\'{e}}, III, Hal},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Opponent Modeling in Deep Reinforcement Learning},
  year = {2016},
}

@inproceedings{baarslag2016negotiation,
  author = {Tim Baarslag and Alper T. Alan and Richard C. Gomer and Ilaria Liccardi and Helia Marreiros and Enrico Gerding and M. C. Schraefel},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  title = {Negotiation as an Interaction Mechanism for Deciding App Permissions},
  year = {2016},
}

@inproceedings{khanpour2016dialogue,
  author = {Hamed Khanpour and Nishitha Guntakandla and Rodney D.
Nielsen},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  title = {Dialogue Act Classification in Domain-Independent Conversations Using a Deep Recurrent Neural Network},
  year = {2016},
}

@inproceedings{yarats2018hierarchical,
  author = {Denis Yarats and Mike Lewis},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Hierarchical Text Generation and Planning for Strategic Dialogue},
  year = {2018},
}

@inproceedings{yang2018mastering,
  author = {Zhilin Yang and Saizheng Zhang and Jack Urbanek and Will Feng and Alexander H. Miller and Arthur Szlam and Douwe Kiela and Jason Weston},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Mastering the Dungeon: Grounded Language Learning by Mechanical Turker Descent},
  year = {2018},
}

@inproceedings{le2018preference,
  author = {Tiep Le and Atena M. Tabakhi and Long Tran-Thanh and William Yeoh and Tran Cao Son},
  booktitle = {International Conference on Autonomous Agents and Multiagent Systems (AAMAS)},
  title = {Preference Elicitation with Interdependency and User Bother Cost},
  year = {2018},
}

@inproceedings{chen2018planning,
  author = {Min Chen and Stefanos Nikolaidis and Harold Soh and David Hsu and Siddhartha Srinivasa},
  booktitle = {ACM/IEEE International Conference on Human Robot Interaction (HRI)},
  title = {Planning with Trust for Human-Robot Collaboration},
  year = {2018},
}

@inproceedings{raileanu2018modeling,
  author = {Roberta Raileanu and Emily L. Denton and Arthur Szlam and Rob Fergus},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Modeling Others using Oneself in Multi-Agent Reinforcement Learning},
  year = {2018},
}

@inproceedings{kang2019recommendation,
  author = {Dongyeop Kang and Anusha Balakrishnan and Pararth Shah and Paul A.
Crook and Y-Lan Boureau and Jason Weston},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Recommendation as a Communication Game: Self-Supervised Bot-Play for Goal-oriented Dialogue},
  year = {2019},
}

@inproceedings{coreyes2019guiding,
  author = {John D. Co-Reyes and Abhishek Gupta and Suvansh Sanjeev and Nick Altieri and John DeNero and Pieter Abbeel and Sergey Levine},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Guiding Policies with Language via Meta-Learning},
  year = {2019},
}

@inproceedings{zhao2019rethinking,
  author = {Tiancheng Zhao and Kaige Xie and Maxine Eskenazi},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Rethinking Action Spaces for Reinforcement Learning in End-to-end Dialog Agents with Latent Variable Models},
  year = {2019},
}

@article{yang2020generating,
  author = {Runzhe Yang and Jingxiao Chen and Karthik Narasimhan},
  journal = {arXiv preprint arXiv:2010.09954},
  title = {Generating Strategic Dialogue for Negotiation with Theory of Mind},
  year = {2020},
}

@inproceedings{arzate2020survey,
  author = {Arzate Cruz, Christian and Takeo Igarashi},
  booktitle = {Proceedings of the 2020 ACM Designing Interactive Systems Conference},
  pages = {1195--1209},
  title = {A survey on interactive reinforcement learning: Design principles and open challenges},
  year = {2020},
}

@inproceedings{lowe2020selfplay,
  author = {Ryan Lowe and Abhinav Gupta and Jakob N. Foerster and Douwe Kiela and Joelle Pineau},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {On the interaction between supervision and self-play in emergent communication},
  year = {2020},
}

@article{shuster2020deploying,
  author = {Kurt Shuster and Jack Urbanek and Emily Dinan and Arthur Szlam and Jason
Weston},
  journal = {arXiv preprint arXiv:2008.08076},
  title = {Deploying Lifelong Open-Domain Dialogue Learning},
  year = {2020},
}

@article{dafoe2020open,
  author = {Allan Dafoe and Edward Hughes and Yoram Bachrach and Tantum Collins and Kevin R McKee and Joel Z Leibo and Kate Larson and Thore Graepel},
  journal = {arXiv preprint arXiv:2012.08630},
  title = {Open Problems in Cooperative {AI}},
  year = {2020},
}

@article{vries2020ecological,
  author = {Harm de Vries and Dzmitry Bahdanau and Christopher D. Manning},
  journal = {arXiv preprint arXiv:2007.14435},
  title = {Towards Ecologically Valid Research on Language User Interfaces},
  year = {2020},
}

@article{schuurmans2020intent,
  author = {J. Schuurmans and F. Frasincar and E. Cambria},
  journal = {IEEE Intelligent Systems},
  pages = {82--88},
  title = {Intent Classification for Dialogue Utterances},
  volume = {35},
  year = {2020},
}

@inproceedings{hawkins2020continual,
  author = {Robert D. Hawkins and Minae Kwon and Dorsa Sadigh and Noah D. Goodman},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  title = {Continual adaptation for efficient machine communication},
  year = {2020},
}

@inproceedings{xie2020lili,
  author = {Annie Xie and Dylan P. Losey and Ryan Tolsma and Chelsea Finn and Dorsa Sadigh},
  booktitle = {Conference on Robot Learning (CoRL)},
  title = {Learning Latent Representations to Influence Multi-Agent Interaction},
  year = {2020},
}

@inproceedings{shih2021critical,
  author = {Andy Shih and Arjun Sawhney and Jovana Kondic and Stefano Ermon and Dorsa Sadigh},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {On the Critical Role of Conventions in Adaptive Human-{AI} Collaboration},
  year = {2021},
}

@techreport{schmidhuber1991adaptive,
  author = {J{\"{u}}rgen Schmidhuber},
  institution = {Institut f{\"{u}}r Informatik, Technische Universit{\"{a}}t M{\"{u}}nchen, Arcisstr.
21, 8000 M{\"{u}}nchen 2},
  title = {Adaptive Confidence And Adaptive Curiosity},
  year = {1991},
}

@inproceedings{randlov1998learning,
  author = {Jette Randl{\o{}}v and Preben Alstr{\o{}}m},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Learning to Drive a Bicycle Using Reinforcement Learning and Shaping},
  year = {1998},
}

@inproceedings{mcgovern2001subgoals,
  author = {Amy McGovern and Andrew G. Barto},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Automatic Discovery of Subgoals in Reinforcement Learning using Diverse Density},
  year = {2001},
}

@inproceedings{stolle2002options,
  author = {Martin Stolle and Doina Precup},
  booktitle = {Proceedings of the 5th International Symposium on Abstraction, Reformulation and Approximation},
  title = {Learning Options in Reinforcement Learning},
  year = {2002},
}

@inproceedings{devlin2012dynamic,
  author = {Sam Devlin and Daniel Kudenko},
  booktitle = {International Conference on Autonomous Agents and Multiagent Systems (AAMAS)},
  title = {Dynamic potential-based reward shaping},
  year = {2012},
}

@article{hausknecht2015deeprq,
  author = {Matthew Hausknecht and Peter Stone},
  journal = {arXiv preprint arXiv:1507.06527},
  title = {Deep Recurrent {Q}-Learning for Partially Observable {MDPs}},
  year = {2015},
}

@inproceedings{misra2017mapping,
  author = {Dipendra K.
Misra and John Langford and Yoav Artzi},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Mapping Instructions and Visual Observations to Actions with Reinforcement Learning},
  year = {2017},
}

@inproceedings{andreas2017sketches,
  author = {Jacob Andreas and Dan Klein and Sergey Levine},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Modular Multitask Reinforcement Learning with Policy Sketches},
  year = {2017},
}

@inproceedings{grzes2017reward,
  author = {Marek Grzes},
  booktitle = {International Conference on Autonomous Agents and Multiagent Systems (AAMAS)},
  title = {Reward Shaping in Episodic Reinforcement Learning},
  year = {2017},
}

@article{schulman2017ppo,
  author = {John Schulman and Filip Wolski and Prafulla Dhariwal and Alec Radford and Oleg Klimov},
  journal = {arXiv preprint arXiv:1707.06347},
  title = {Proximal Policy Optimization Algorithms},
  year = {2017},
}

@article{yu2017compositional,
  author = {Haonan Yu and Haichao Zhang and Wei Xu},
  journal = {arXiv preprint arXiv:1703.09831},
  title = {A Deep Compositional Framework for Human-like Language Acquisition in Virtual Environment},
  year = {2017},
}

@inproceedings{das2018modular,
  author = {Abhishek Das and Georgia Gkioxari and Stefan Lee and Devi Parikh and Dhruv Batra},
  booktitle = {Conference on Robot Learning (CoRL)},
  title = {Neural Modular Control for Embodied Question Answering},
  year = {2018},
}

@inproceedings{zheng2018learning,
  author = {Zeyu Zheng and Junhyuk Oh and Satinder Singh},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {On Learning Intrinsic Rewards for Policy Gradient Methods},
  year = {2018},
}

@inproceedings{cideron2019selfeducated,
  author = {Geoffrey Cideron and Mathieu Seurin and Florian Strub and Olivier Pietquin},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Self-Educated Language Agent with Hindsight Experience Replay for Instruction Following},
  year
= {2019},
}

@inproceedings{goyal2019shaping,
  author = {Prasoon Goyal and Scott Niekum and Raymond J. Mooney},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {Using Natural Language for Reward Shaping in Reinforcement Learning},
  year = {2019},
}

@inproceedings{luketina2019survey,
  author = {Jelena Luketina and Nantas Nardelli and Gregory Farquhar and Jakob Foerster and Jacob Andreas and Edward Grefenstette and Shimon Whiteson and Tim Rockt{\"{a}}schel},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {A Survey of Reinforcement Learning Informed by Natural Language},
  year = {2019},
}

@inproceedings{waytowich2019narration,
  author = {Nicholas Waytowich and Sean L. Barton and Vernon Lawhern and Garrett Warnell},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {A Narration-based Reward Shaping Approach using Grounded Natural Language Commands},
  year = {2019},
}

@inproceedings{burda2019curiosity,
  author = {Yuri Burda and Harri Edwards and Deepak Pathak and Amos Storkey and Trevor Darrell and Alexei A. Efros},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Large-Scale Study of Curiosity-Driven Learning},
  year = {2019},
}

@inproceedings{bahdanau2019reward,
  author = {Dzmitry Bahdanau and Felix Hill and Jan Leike and Edward Hughes and S. A.
Hosseini and Pushmeet Kohli and Edward Grefenstette},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Learning to Understand Goal Specifications by Modelling Reward},
  year = {2019},
}

@inproceedings{wang2019rcm,
  author = {Xin Eric Wang and Qiuyuan Huang and Asli Celikyilmaz and Jianfeng Gao and Dinghan Shen and Yuan-Fang Wang and William Yang Wang and Lei Zhang},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Reinforced Cross-Modal Matching and Self-Supervised Imitation Learning for Vision-Language Navigation},
  year = {2019},
}

@inproceedings{fu2019lang2goals,
  author = {Justin Fu and Anoop Korattikara and Sergey Levine and Sergio Guadarrama},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {From Language to Goals: Inverse Reinforcement Learning for Vision-Based Instruction Following},
  year = {2019},
}

@inproceedings{jiang2019abstraction,
  author = {Yiding Jiang and Shixiang Gu and Kevin P.
Murphy and Chelsea Finn},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Language as an Abstraction for Hierarchical Deep Reinforcement Learning},
  year = {2019},
}

@article{lynch2020grounding,
  author = {Corey Lynch and Pierre Sermanet},
  journal = {arXiv preprint arXiv:2005.07648},
  title = {Grounding Language in Play},
  year = {2020},
}

@inproceedings{bisk2020experience,
  author = {Yonatan Bisk and Ari Holtzman and Jesse Thomason and Jacob Andreas and Yoshua Bengio and Joyce Chai and Mirella Lapata and Angeliki Lazaridou and Jonathan May and Aleksandr Nisnevich and Nicolas Pinto and Joseph Turian},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Experience Grounds Language},
  year = {2020},
}

@article{hill2020human,
  author = {Felix Hill and Sona Mokra and Nathaniel Wong and Tim Harley},
  journal = {arXiv preprint arXiv:2005.09382},
  title = {Human Instruction-Following with Deep Reinforcement Learning via Transfer-Learning from Text},
  year = {2020},
}

@article{behboudian2020useful,
  author = {Paniz Behboudian and Yash Satsangi and Matthew E. Taylor and Anna Harutyunyan and Michael Bowling},
  journal = {arXiv preprint arXiv:2011.01297},
  title = {Useful Policy Invariant Shaping from Arbitrary Advice},
  year = {2020},
}

@techreport{yun2020evaluating,
  author = {Anthony Yun},
  institution = {The University of Texas at Austin},
  title = {Evaluating the Robustness of Natural Language Reward Shaping Models to Spatial Relations},
  year = {2020},
}

@article{campero2020learning,
  author = {Andres Campero and Roberta Raileanu and Heinrich K{\"{u}}ttler and Joshua B. Tenenbaum and Tim Rockt{\"{a}}schel and Edward Grefenstette},
  journal = {arXiv preprint arXiv:2006.12122},
  title = {Learning with {AMIG}o: Adversarially Motivated Intrinsic Goals},
  year = {2020},
}

@inproceedings{colas2020language,
  author = {C{\'{e}}dric Colas and Tristan Karch and Nicolas Lair and Jean-Michel Dussoux and Cl{\'{e}}ment Moulin-Frier and Peter F.
Dominey and Pierre-Yves Oudeyer},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Language as a Cognitive Tool to Imagine Goals in Curiosity Driven Exploration},
  year = {2020},
}

@inproceedings{cobbe2020leveraging,
  author = {Karl Cobbe and Christopher Hesse and Jacob Hilton and John Schulman},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Leveraging Procedural Generation to Benchmark Reinforcement Learning},
  year = {2020},
}

@inproceedings{raileanu2020ride,
  author = {Roberta Raileanu and Tim Rockt{\"{a}}schel},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {{RIDE}: Rewarding Impact-Driven Exploration for Procedurally-Generated Environments},
  year = {2020},
}

@inproceedings{andreas2020geca,
  author = {Jacob Andreas},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Good-Enough Compositional Data Augmentation},
  year = {2020},
}

@article{khatib1987osc,
  author = {Oussama Khatib},
  journal = {IEEE Journal on Robotics and Automation},
  pages = {43--53},
  title = {A unified approach for motion and force control of robot manipulators: The operational space formulation},
  volume = {3},
  year = {1987},
}

@inproceedings{macglashan2015grounding,
  author = {James MacGlashan and Monica Babes-Vroman and Marie desJardins and Michael Littman and Smaranda Muresan and Shawn Squire and Stefanie Tellex and Dilip Arumugam and Lei Yang},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Grounding {E}nglish Commands to Reward Functions},
  year = {2015},
}

@inproceedings{laskey2017dart,
  author = {Michael Laskey and Jonathan N. Lee and Roy Fox and Anca D. Dragan and Ken Goldberg},
  booktitle = {Conference on Robot Learning (CoRL)},
  title = {{DART}: Noise Injection for Robust Imitation Learning},
  year = {2017},
}

@inproceedings{blukis2018following,
  author = {Valts Blukis and Nataly Brukhim and Andrew Bennett and Ross A.
Knepper and Yoav Artzi},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Following High-level Navigation Instructions on a Simulated Quadcopter with Imitation Learning},
  year = {2018},
}

@article{scalise2018natural,
  author = {Rosario Scalise and Shen Li and Henny Admoni and Stephanie Rosenthal and Siddhartha Srinivasa},
  journal = {International Journal of Robotics Research (IJRR)},
  pages = {558--565},
  title = {Natural language instructions for human--robot collaborative manipulation},
  volume = {37},
  year = {2018},
}

@inproceedings{matuszek2018groundedlang,
  author = {Cynthia Matuszek},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {Grounded Language Learning: Where Robotics and {NLP} Meet},
  year = {2018},
}

@inproceedings{reimers2020multisbert,
  author = {Nils Reimers and Iryna Gurevych},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Making Monolingual Sentence Embeddings Multilingual using Knowledge Distillation},
  year = {2020},
}

@article{zhu2020robosuite,
  author = {Yuke Zhu and Josiah Wong and Ajay Mandlekar and Roberto Mart{\'{i}}n-Mart{\'{i}}n},
  journal = {arXiv preprint arXiv:2009.12293},
  title = {Robosuite: A Modular Simulation Framework and Benchmark for Robot Learning},
  year = {2020},
}

@article{tellex2020robonlp,
  author = {Stefanie Tellex and Nakul Gopalan and Hadas Kress-Gazit and Cynthia Matuszek},
  journal = {Annual Review of Control, Robotics, and Autonomous Systems},
  number = {1},
  pages = {25--55},
  title = {Robots That Use Language},
  volume = {3},
  year = {2020},
}

@article{marzoev2020unnatural,
  author = {Alana Marzoev and Samuel Madden and M. Frans Kaashoek and Michael J.
Cafarella and Jacob Andreas},
  journal = {arXiv preprint arXiv:2004.13645},
  title = {Unnatural Language Processing: Bridging the Gap Between Synthetic and Natural Language Data},
  year = {2020},
}

@inproceedings{ku2020rxr,
  author = {Alexander Ku and Peter Anderson and Roma Patel and Eugene Ie and Jason Baldridge},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Room-Across-Room: Multilingual Vision-and-Language Navigation with Dense Spatiotemporal Grounding},
  year = {2020},
}

@inproceedings{schaff2020residual,
  author = {Charles B. Schaff and Matthew R. Walter},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Residual Policy Learning for Shared Autonomy},
  year = {2020},
}

@inproceedings{karamcheti2021vla,
  author = {Siddharth Karamcheti and Albert J. Zhai and Dylan P. Losey and Dorsa Sadigh},
  booktitle = {Learning for Dynamics \& Control Conference (L4DC)},
  title = {Learning Visually Guided Latent Actions for Assistive Teleoperation},
  year = {2021},
}

@inproceedings{matuszek2014unscripted,
  author = {Cynthia Matuszek and Liefeng Bo and Luke Zettlemoyer and Dieter Fox},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Learning from Unscripted Deictic Gesture and Language for Human-Robot Interactions},
  year = {2014},
}

@inproceedings{kollar2013towards,
  author = {Thomas Kollar and Jayant Krishnamurthy and Grant P. Strimel},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Toward Interactive Grounded Language Acquisition},
  year = {2013},
}

@inproceedings{kennington2013situated,
  author = {Casey Kennington and Spyros Kousidis and David Schlangen},
  booktitle = {SIGDIAL Conference},
  title = {Interpreting Situated Dialogue Utterances: an Update Model that Uses Speech, Gaze, and Gesture Information},
  year = {2013},
}

@inproceedings{whitney2016multimodal,
  author = {David Whitney and Miles Eldon and John G.
Oberlin and Stefanie Tellex},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages = {3331--3338},
  title = {Interpreting multimodal referring expressions in real time},
  year = {2016},
}

@inproceedings{duvallet2013imitation,
  author = {Felix Duvallet and Thomas Kollar and Anthony Stentz},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages = {1047--1053},
  title = {Imitation learning for natural language direction following through unknown environments},
  year = {2013},
}

@article{losey2021latentactions,
  author = {Dylan P. Losey and Hong Jun Jeon and Mengxi Li and Krishna Parasuram Srinivasan and Ajay Mandlekar and Animesh Garg and Jeannette Bohg and Dorsa Sadigh},
  journal = {Autonomous Robots (AURO)},
  pages = {1--33},
  title = {Learning latent actions to control assistive robots},
  year = {2021},
}

@inproceedings{kaelbling1993learning,
  author = {Leslie Kaelbling},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {Learning to Achieve Goals},
  year = {1993},
}

@inproceedings{russell1998learning,
  author = {Stuart J. Russell},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {Learning agents for uncertain environments},
  year = {1998},
}

@inproceedings{schaul2015uvf,
  author = {Tom Schaul and Dan Horgan and Karol Gregor and David Silver},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Universal Value Function Approximators},
  year = {2015},
}

@inproceedings{taylor2016alignment,
  author = {Jessica Taylor and Eliezer Yudkowsky and Patrick LaVictoire and Andrew Critch},
  booktitle = {Ethics of Artificial Intelligence},
  title = {Alignment for Advanced Machine Learning Systems},
  year = {2016},
}

@inproceedings{berkenkamp2017safe,
  author = {Felix Berkenkamp and Matteo Turchetta and Angela P.
Schoellig and Andreas Krause},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Safe Model-based Reinforcement Learning with Stability Guarantees},
  year = {2017},
}

@article{leike2017gridworlds,
  author = {Jan Leike and Miljan Martic and Victoria Krakovna and Pedro A. Ortega and Tom Everitt and Andrew Lefrancq and Laurent Orseau and Shane Legg},
  journal = {arXiv preprint arXiv:1711.09883},
  title = {{AI} Safety Gridworlds},
  year = {2017},
}

@inproceedings{dreossi2017compositional,
  author = {Tommaso Dreossi and Alexandre Donz{\'{e}} and Sanjit A. Seshia},
  booktitle = {NASA Formal Methods Symposium (NFM)},
  title = {Compositional Falsification of Cyber-Physical Systems with Machine Learning Components},
  year = {2017},
}

@inproceedings{bajcsy2017learning,
  author = {Andrea Bajcsy and Dylan P. Losey and Marcia K. O'Malley and Anca D. Dragan},
  booktitle = {Conference on Robot Learning (CoRL)},
  title = {Learning Robot Objectives from Physical Human Interaction},
  year = {2017},
}

@article{eysenbach2017leave,
  author = {Benjamin Eysenbach and Shixiang Gu and Julian Ibarz and Sergey Levine},
  journal = {arXiv preprint arXiv:1711.06782},
  title = {Leave no Trace: Learning to Reset for Safe and Autonomous Reinforcement Learning},
  year = {2017},
}

@inproceedings{finn2017deep,
  author = {Chelsea Finn and Sergey Levine},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  title = {Deep visual foresight for planning robot motion},
  year = {2017},
}

@inproceedings{fu2018variational,
  author = {Justin Fu and Avi Singh and Dibya Ghosh and Larry Yang and Sergey Levine},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Variational Inverse Control with Events: A General Framework for Data-Driven Reward Definition},
  year = {2018},
}

@inproceedings{sharma2018mime,
  author = {Pratyusha Sharma and Lekha Mohan and Lerrel Pinto and Abhinav
Gupta},
  booktitle = {Conference on Robot Learning (CoRL)},
  title = {Multiple Interactions Made Easy ({MIME}): Large Scale Demonstrations Data for Imitation},
  year = {2018},
}

@inproceedings{biyik2018batch,
  author = {Erdem Biyik and Dorsa Sadigh},
  booktitle = {Conference on Robot Learning (CoRL)},
  title = {Batch Active Preference-Based Learning of Reward Functions},
  year = {2018},
}

@inproceedings{chow2018lyapunov,
  author = {Yinlam Chow and Ofir Nachum and Edgar A. Du{\'{e}}{\~{n}}ez-Guzm{\'{a}}n and Mohammad Ghavamzadeh},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {A Lyapunov-based Approach to Safe Reinforcement Learning},
  year = {2018},
}

@inproceedings{singh2019endtoend,
  author = {Avi Singh and Larry Yang and Kristian Hartikainen and Chelsea Finn and Sergey Levine},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {End-to-End Robotic Reinforcement Learning without Reward Engineering},
  year = {2019},
}

@inproceedings{mandlekar2019scaling,
  author = {Ajay Mandlekar and Jonathan Booher and Max Spero and Albert Tung and Anchit Gupta and Yuke Zhu and Animesh Garg and Silvio Savarese and Li Fei-Fei},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  title = {Scaling Robot Supervision to Hundreds of Hours with {RoboTurk}: Robotic Manipulation Dataset through Human Reasoning and Dexterity},
  year = {2019},
}

@inproceedings{dasari2019robonet,
  author = {Sudeep Dasari and Frederik Ebert and Stephen Tian and Suraj Nair and Bernadette Bucher and Karl Schmeckpeper and Siddharth Singh and Sergey Levine and Chelsea Finn},
  booktitle = {Conference on Robot Learning (CoRL)},
  title = {{RoboNet}: Large-Scale Multi-Robot Learning},
  year = {2019},
}

@inproceedings{ding2019goal,
  author = {Yiming Ding and Carlos Florensa and Mariano Phielipp and Pieter Abbeel},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Goal-conditioned Imitation Learning},
  year = {2019},
}

@inproceedings{fisac2019bridging,
  author = {Jaime F.
Fisac and Neil F. Lugovoy and Vicen{\c{c}} R{\'{u}}bies Royo and Shromona Ghosh and Claire J. Tomlin},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  title = {Bridging {Hamilton-Jacobi} Safety Analysis and Reinforcement Learning},
  year = {2019},
}

@inproceedings{hafner2019latent,
  author = {Danijar Hafner and Timothy Lillicrap and Ian S. Fischer and Ruben Villegas and David R Ha and Honglak Lee and James Davidson},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Learning Latent Dynamics for Planning from Pixels},
  year = {2019},
}

@inproceedings{stepputtis2020lcil,
  author = {Simon Stepputtis and Joseph Campbell and Mariano Phielipp and Stefan Lee and Chitta Baral and Ben Amor, Heni},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Language-Conditioned Imitation Learning for Robot Manipulation Tasks},
  year = {2020},
}

@inproceedings{shao2020concept2robot,
  author = {Lin Shao and Toki Migimatsu and Qiang Zhang and Karen Yang and Jeannette Bohg},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {{Concept2Robot}: Learning Manipulation Concepts from Instructions and Human Demonstrations},
  year = {2020},
}

@article{corso2020survey,
  author = {Anthony Corso and Robert J. Moss and Mark Koren and Ritchie Lee and Mykel J. Kochenderfer},
  journal = {arXiv preprint arXiv:2005.02979},
  title = {A Survey of Algorithms for Black-Box Safety Validation},
  year = {2020},
}

@article{lee2020detect,
  author = {Michelle A.
Lee and Matthew Tan and Yuke Zhu and Jeannette Bohg},
  journal   = {arXiv preprint arXiv:2012.00201},
  title     = {Detect, Reject, Correct: Crossmodal Compensation of Corrupted Sensors},
  year      = {2020},
}

@inproceedings{lee2020addressing,
  author    = {Seunghyun Lee and Younggyo Seo and Kimin Lee and Pieter Abbeel and Jinwoo Shin},
  booktitle = {Offline Reinforcement Learning Workshop @ NeurIPS},
  title     = {Addressing Distribution Shift in Online Reinforcement Learning with Offline Datasets},
  year      = {2020},
}

@article{gupta2021reset,
  author    = {Abhishek Gupta and Justin Yu and Tony Zhao and Vikash Kumar and Aaron Rovinsky and Kelvin Xu and Thomas Devlin and Sergey Levine},
  journal   = {arXiv preprint arXiv:2104.11203},
  title     = {Reset-Free Reinforcement Learning via Multi-Task Learning: Learning Dexterous Manipulation Behaviors without Human Intervention},
  year      = {2021},
}

% The title uses TeX opening and closing quote ligatures; a straight double
% quote would be typeset as a closing quote on both sides.
@inproceedings{chen2021generalizable,
  author    = {Annie S. Chen and Suraj Nair and Chelsea Finn},
  booktitle = {Robotics: Science and Systems (RSS)},
  title     = {Learning Generalizable Robotic Reward Functions from ``In-The-Wild'' Human Videos},
  year      = {2021},
}

@article{deletang2021causal,
  author    = {Grégoire Déletang and J. Grau-Moya and Miljan Martic and Tim Genewein and Tom McGrath and Vladimir Mikulik and M. Kunesch and S. Legg and Pedro A.
Ortega},
  journal   = {arXiv preprint arXiv:2103.03938},
  title     = {Causal Analysis of Agent Behavior for {AI} Safety},
  year      = {2021},
}

@inproceedings{jaegle2021perceiver,
  author    = {Andrew Jaegle and Felix Gimeno and Andrew Brock and Andrew Zisserman and Oriol Vinyals and Jo{\~a}o Carreira},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Perceiver: General Perception with Iterative Attention},
  year      = {2021},
}

@article{janner2021reinforcement,
  author    = {Michael Janner and Qiyang Li and Sergey Levine},
  journal   = {arXiv preprint arXiv:2106.02039},
  title     = {Reinforcement Learning as One Big Sequence Modeling Problem},
  year      = {2021},
}

% Given names follow the full form used by other entries of this file.
@article{chen2021decisiontransformer,
  author    = {Lili Chen and Kevin Lu and Aravind Rajeswaran and Kimin Lee and Aditya Grover and Michael Laskin and Pieter Abbeel and A. Srinivas and Igor Mordatch},
  journal   = {arXiv preprint arXiv:2106.01345},
  title     = {Decision Transformer: Reinforcement Learning via Sequence Modeling},
  year      = {2021},
}

@article{herbert2021scalable,
  author    = {Sylvia L. Herbert and Jason J. Choi and Suvansh Qazi and Marsalis Gibson and K. Sreenath and C. Tomlin},
  journal   = {arXiv preprint arXiv:2101.05916},
  title     = {Scalable Learning of Safety Guarantees for Autonomous Systems using {Hamilton-Jacobi} Reachability},
  year      = {2021},
}

@article{wu2021greedy,
  author    = {Bohan Wu and Suraj Nair and Roberto Martín-Martín and Li Fei-Fei and Chelsea Finn},
  journal   = {arXiv preprint arXiv:2103.04174},
  title     = {Greedy Hierarchical Variational Autoencoders for Large-Scale Video Prediction},
  year      = {2021},
}

% Title is stored in plain title case (no brace forcing a lowercase letter)
% and the journal name is stored unabbreviated.
@article{osa2018algorithmic,
  author    = {Takayuki Osa and Joni Pajarinen and Gerhard Neumann and J. Andrew Bagnell and Pieter Abbeel and Jan Peters},
  journal   = {Foundations and Trends in Robotics},
  pages     = {1--179},
  title     = {An Algorithmic Perspective on Imitation Learning},
  volume    = {7},
  year      = {2018},
}

@inproceedings{kelly2019hgdagger,
  author    = {Michael Kelly and Chelsea Sidrane and K. Driggs-Campbell and Mykel J.
Kochenderfer},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages     = {8077--8083},
  title     = {{HG-DAgger}: Interactive Imitation Learning with Human Experts},
  year      = {2019},
}

% Conference paper: typed as inproceedings with the venue in booktitle, named
% in the same style as the other conference entries; the volume number that
% accompanied the conference name was dropped.
@inproceedings{hoque2021lazydagger,
  author    = {Ryan Hoque and Ashwin Balakrishna and Carl Putterman and Michael Luo and Daniel S. Brown and Daniel Seita and Brijen Thananjeyan and Ellen R. Novoseller and Ken Goldberg},
  booktitle = {International Conference on Automation Science and Engineering (CASE)},
  pages     = {502--509},
  title     = {{LazyDAgger}: Reducing Context Switching in Interactive Imitation Learning},
  year      = {2021},
}

@inproceedings{hoque2021thriftydagger,
  author    = {Ryan Hoque and Ashwin Balakrishna and Ellen R. Novoseller and Albert Wilcox and Daniel S. Brown and Ken Goldberg},
  booktitle = {Conference on Robot Learning (CoRL)},
  title     = {{ThriftyDAgger}: Budget-Aware Novelty and Risk Gating for Interactive Imitation Learning},
  year      = {2021},
}

% This article appeared in Trends in Cognitive Sciences, volume 3, issue 6.
@article{schaal1999imitation,
  author    = {Stefan Schaal},
  journal   = {Trends in Cognitive Sciences},
  number    = {6},
  pages     = {233--242},
  title     = {Is imitation learning the route to humanoid robots?},
  volume    = {3},
  year      = {1999},
}

% Conference paper: typed as inproceedings with the venue in booktitle; the
% volume number that accompanied the conference name was dropped.
@inproceedings{goil2013blend,
  author    = {Aditya Goil and Matthew Derry and Brenna Argall},
  booktitle = {International Conference on Rehabilitation Robotics (ICORR)},
  pages     = {1--6},
  title     = {Using machine learning to blend human and robot controls for assisted wheelchair navigation},
  year      = {2013},
}

@article{kim1992force,
  author    = {Won S. Kim and Blake Hannaford and Antal K. Bejczy},
  journal   = {IEEE Trans.
Robotics Autom.},
  pages     = {176--185},
  title     = {Force-reflection and shared compliant control in operating telemanipulators with time delay},
  volume    = {8},
  year      = {1992},
}

% The braces keep the mixed-case system name intact under sentence-casing styles.
@inproceedings{shridhar2021clipport,
  author    = {Mohit Shridhar and Lucas Manuelli and Dieter Fox},
  booktitle = {Conference on Robot Learning (CoRL)},
  title     = {{CLIPort}: What and Where Pathways for Robotic Manipulation},
  year      = {2021},
}

@inproceedings{thomason2019visdial,
  author    = {Jesse Thomason and Michael Murray and Maya Cakmak and Luke Zettlemoyer},
  booktitle = {Conference on Robot Learning (CoRL)},
  title     = {Vision-and-Dialog Navigation},
  year      = {2019},
}

@inproceedings{rakelly2021mutual,
  author    = {Kate Rakelly and Abhishek Gupta and Carlos Florensa and Sergey Levine},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Which Mutual-Information Representation Learning Objectives are Sufficient for Control?},
  year      = {2021},
}

@article{oord2018cpc,
  author    = {Aäron van den Oord and Yazhe Li and Oriol Vinyals},
  journal   = {arXiv preprint arXiv:1807.03748},
  title     = {Representation Learning with Contrastive Predictive Coding},
  year      = {2018},
}

@inproceedings{anand2019unsupervised,
  author    = {Ankesh Anand and Evan Racah and Sherjil Ozair and Yoshua Bengio and Marc{-}Alexandre Côté and R.
Devon Hjelm},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {8766--8779},
  title     = {Unsupervised State Representation Learning in {Atari}},
  year      = {2019},
}

@inproceedings{stooke2021decoupling,
  author    = {Adam Stooke and Kimin Lee and Pieter Abbeel and Michael Laskin},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {9870--9879},
  title     = {Decoupling Representation Learning from Reinforcement Learning},
  volume    = {139},
  year      = {2021},
}

@inproceedings{torabi2018bco,
  author    = {Faraz Torabi and Garrett Warnell and Peter Stone},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  pages     = {4950--4957},
  title     = {Behavioral Cloning from Observation},
  year      = {2018},
}

@inproceedings{lee2020slac,
  author    = {Alex X. Lee and Anusha Nagabandi and Pieter Abbeel and Sergey Levine},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Stochastic Latent Actor-Critic: Deep Reinforcement Learning with a Latent Variable Model},
  year      = {2020},
}

@inproceedings{yang2021representation,
  author    = {Mengjiao Yang and Ofir Nachum},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Representation Matters: Offline Pretraining for Sequential Decision Making},
  year      = {2021},
}

@article{torabi2018gaifo,
  author    = {Faraz Torabi and Garrett Warnell and Peter Stone},
  journal   = {arXiv preprint arXiv:1807.06158},
  title     = {Generative Adversarial Imitation from Observation},
  year      = {2018},
}

% The third author's given name is spelled out as in stooke2021decoupling and
% lee2020slac above; the surname follows on the next physical line.
@inproceedings{liu2018ifo,
  author    = {Yuxuan Liu and Abhishek Gupta and Pieter
Abbeel and Sergey Levine},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages     = {1118--1125},
  title     = {Imitation from Observation: Learning to Imitate Behaviors from Raw Video via Context Translation},
  year      = {2018},
}

@inproceedings{sharma2019third,
  author    = {Pratyusha Sharma and Deepak Pathak and Abhinav Kumar Gupta},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Third-Person Visual Imitation Learning via Decoupled Hierarchical Controller},
  year      = {2019},
}

% The acronym is braced so sentence-casing styles keep it uppercase; the
% fourth author's given name uses the full form found elsewhere in this file.
@inproceedings{smith2020avid,
  author    = {Laura Smith and Nikita Dhawan and Marvin Zhang and Pieter Abbeel and Sergey Levine},
  booktitle = {Robotics: Science and Systems (RSS)},
  title     = {{AVID}: Learning Multi-Stage Tasks via Pixel-Level Translation of Human Videos},
  year      = {2020},
}

@inproceedings{schmeckpeper2020predictive,
  author    = {Karl Schmeckpeper and Annie Xie and Oleh Rybkin and Stephen Tian and Kostas Daniilidis and Sergey Levine and Chelsea Finn},
  booktitle = {European Conference on Computer Vision (ECCV)},
  title     = {Learning Predictive Models From Observation and Interaction},
  year      = {2020},
}

@inproceedings{schmeckpeper2020reinforcement,
  author    = {Karl Schmeckpeper and Oleh Rybkin and Kostas Daniilidis and Sergey Levine and Chelsea Finn},
  booktitle = {Conference on Robot Learning (CoRL)},
  title     = {Reinforcement Learning with Videos: Combining Offline Observations with Interaction},
  year      = {2020},
}

@inproceedings{sermanet2018tcn,
  author    = {Pierre Sermanet and Corey Lynch and Yevgen Chebotar and Jasmine Hsu and Eric Jang and Stefan Schaal and Sergey Levine},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages     = {1134--1141},
  title     = {Time-Contrastive Networks: Self-Supervised Learning from Video},
  year      = {2018},
}

@inproceedings{rybkin2019learning,
  author    = {Oleh Rybkin and Karl Pertsch and Konstantinos G.
Derpanis and Kostas Daniilidis and Andrew Jaegle},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Learning what you can do before doing anything},
  year      = {2019},
}

% The third author's given name uses the full form found elsewhere in this file.
@inproceedings{agrawal2016poking,
  author    = {Pulkit Agrawal and Ashvin Nair and Pieter Abbeel and Jitendra Malik and Sergey Levine},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Learning to Poke by Poking: Experiential Learning of Intuitive Physics},
  year      = {2016},
}

@inproceedings{pathak2017curiosity,
  author    = {Deepak Pathak and Pulkit Agrawal and Alexei A. Efros and Trevor Darrell},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)},
  title     = {Curiosity-Driven Exploration by Self-Supervised Prediction},
  year      = {2017},
}

@inproceedings{shelhamer2017loss,
  author    = {Evan Shelhamer and Parsa Mahmoudieh and Max Argus and Trevor Darrell},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Loss is its own Reward: Self-Supervision for Reinforcement Learning},
  year      = {2017},
}

% The braces keep the mixed-case system name intact under sentence-casing styles.
@inproceedings{kollar2021simnet,
  author    = {Thomas Kollar and Michael Laskey and Kevin Stone and Brijen Thananjeyan and Mark Tjersland},
  booktitle = {Conference on Robot Learning (CoRL)},
  title     = {{SimNet}: Enabling Robust Unknown Object Manipulation from Pure Synthetic Data via Stereo},
  year      = {2021},
}

@inproceedings{mandlekar2018roboturk,
  author    = {Ajay Mandlekar and Yuke Zhu and Animesh Garg and Jonathan Booher and Max Spero and Albert Tung and Julian Gao and John Emmons and Anchit Gupta and Emre Orbay and Silvio Savarese and Li Fei-Fei},
  booktitle = {Conference on Robot Learning (CoRL)},
  title     = {{ROBOTURK}: A Crowdsourcing Platform for Robotic Skill Learning through Imitation},
  year      = {2018},
}

@inproceedings{mandlekar2021robomimic,
  author    = {Ajay Mandlekar and Danfei Xu and Josiah Wong and Soroush Nasiriany and Chen Wang and Rohun Kulkarni and Li Fei-Fei and Silvio Savarese and Yuke Zhu and
Roberto Martín-Martín},
  booktitle = {Conference on Robot Learning (CoRL)},
  title     = {What Matters in Learning from Offline Human Demonstrations for Robot Manipulation},
  year      = {2021},
}

@article{chen2021batch,
  author    = {Annie S. Chen and Hyunji Alex Nam and Suraj Nair and Chelsea Finn},
  journal   = {IEEE Robotics and Automation Letters (RA-L)},
  pages     = {4401--4408},
  title     = {Batch Exploration With Examples for Scalable Robotic Reinforcement Learning},
  volume    = {6},
  year      = {2021},
}

@inproceedings{gupta2018robothomes,
  author    = {Abhinav Kumar Gupta and Adithyavairavan Murali and Dhiraj Gandhi and Lerrel Pinto},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Robot Learning in Homes: Improving Generalization and Reducing Dataset Bias},
  year      = {2018},
}

@article{ebert2018foresight,
  author    = {Frederik Ebert and Chelsea Finn and Sudeep Dasari and Annie Xie and Alex X. Lee and Sergey Levine},
  journal   = {arXiv preprint arXiv:1812.00568},
  title     = {Visual Foresight: Model-Based Deep Reinforcement Learning for Vision-Based Robotic Control},
  year      = {2018},
}

@inproceedings{nair2018visualrl,
  author    = {Ashvin Nair and Vitchyr H. Pong and Murtaza Dalal and Shikhar Bahl and Steven Lin and Sergey Levine},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Visual Reinforcement Learning with Imagined Goals},
  year      = {2018},
}

@inproceedings{kalashnikov2018qtopt,
  author    = {Dmitry Kalashnikov and Alex Irpan and Peter Pastor and Julian Ibarz and Alexander Herzog and Eric Jang and Deirdre Quillen and Ethan Holly and Mrinal Kalakrishnan and Vincent Vanhoucke and Sergey Levine},
  booktitle = {Conference on Robot Learning (CoRL)},
  title     = {{QT-Opt}: Scalable Deep Reinforcement Learning for Vision-Based Robotic Manipulation},
  year      = {2018},
}

@inproceedings{mazoure2020infomax,
  author    = {Bogdan Mazoure and Rémi Tachet des Combes and Thang Van Doan and Philip Bachman and R.
Devon Hjelm},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Deep Reinforcement and {InfoMax} Learning},
  year      = {2020},
}

@inproceedings{nachum2019nearoptimal,
  author    = {Ofir Nachum and Shixiang Shane Gu and Honglak Lee and Sergey Levine},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Near-Optimal Representation Learning for Hierarchical Reinforcement Learning},
  year      = {2019},
}

@inproceedings{schwarzer2021dataefficient,
  author    = {Max Schwarzer and Ankesh Anand and Rishab Goel and R. Devon Hjelm and Aaron C. Courville and Philip Bachman},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Data-Efficient Reinforcement Learning with Self-Predictive Representations},
  year      = {2021},
}

@inproceedings{shu2020predictive,
  author    = {Rui Shu and Tung D. Nguyen and Yinlam Chow and Tu Pham and Khoat Than and Mohammad Ghavamzadeh and Stefano Ermon and Hung Hai Bui},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Predictive Coding for Locally-Linear Control},
  year      = {2020},
}

@article{levine2020offlinerl,
  author    = {Sergey Levine and Aviral Kumar and G. Tucker and Justin Fu},
  journal   = {arXiv preprint arXiv:2005.01643},
  title     = {Offline Reinforcement Learning: Tutorial, Review, and Perspectives on Open Problems},
  year      = {2020},
}

@inproceedings{kumar2020cql,
  author    = {Aviral Kumar and Aurick Zhou and G.
Tucker and Sergey Levine},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Conservative {Q-}Learning for Offline Reinforcement Learning},
  year      = {2020},
}

% Acronyms at the start of a title are braced so that sentence-casing styles
% do not lowercase everything after their first letter.
@inproceedings{yu2021combo,
  author    = {Tianhe Yu and Aviral Kumar and Rafael Rafailov and Aravind Rajeswaran and Sergey Levine and Chelsea Finn},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {{COMBO}: Conservative Offline Model-Based Policy Optimization},
  year      = {2021},
}

@inproceedings{fujimoto2021minimalist,
  author    = {Scott Fujimoto and Shixiang Shane Gu},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {A Minimalist Approach to Offline Reinforcement Learning},
  year      = {2021},
}

@article{zhao2021offline,
  author    = {Tony Z. Zhao and Jianlan Luo and Oleg O. Sushkov and Rugile Pevceviciute and Nicolas Manfred Otto Heess and Jonathan Scholz and Stefan Schaal and Sergey Levine},
  journal   = {arXiv preprint arXiv:2110.04276},
  title     = {Offline Meta-Reinforcement Learning for Industrial Insertion},
  year      = {2021},
}

@inproceedings{pomerleau1988alvinn,
  author    = {Dean A. Pomerleau},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {{ALVINN}: An Autonomous Land Vehicle in a Neural Network},
  year      = {1988},
}

@inproceedings{yu2019metaworld,
  author    = {Tianhe Yu and Deirdre Quillen and Zhanpeng He and Ryan C.
Julian and Karol Hausman and Chelsea Finn and Sergey Levine},
  booktitle = {Conference on Robot Learning (CoRL)},
  title     = {{Meta-World}: A Benchmark and Evaluation for Multi-Task and Meta Reinforcement Learning},
  year      = {2019},
}

% Benchmark and model names are braced so sentence-casing styles keep their
% internal capitals.
@misc{kannan2021robodesk,
  author       = {Harini Kannan and Danijar Hafner and Chelsea Finn and Dumitru Erhan},
  howpublished = {\url{https://github.com/google-research/robodesk}},
  title        = {{RoboDesk}: A Multi-Task Reinforcement Learning Benchmark},
  year         = {2021},
}

@article{xiao2022mvp,
  author    = {Tete Xiao and Ilija Radosavovic and Trevor Darrell and Jitendra Malik},
  journal   = {arXiv preprint arXiv:2203.06173},
  title     = {Masked Visual Pre-training for Motor Control},
  year      = {2022},
}

@article{nair2022r3m,
  author    = {Suraj Nair and Aravind Rajeswaran and Vikash Kumar and Chelsea Finn and Abhinav Gupta},
  journal   = {arXiv preprint arXiv:2203.12601},
  title     = {{R3M}: A Universal Visual Representation for Robot Manipulation},
  year      = {2022},
}

@article{parisi2022unsurprising,
  author    = {Simone Parisi and Aravind Rajeswaran and Senthil Purushwalkam and Abhinav Kumar Gupta},
  journal   = {arXiv preprint arXiv:2203.03580},
  title     = {The Unsurprising Effectiveness of Pre-Trained Vision Models for Control},
  year      = {2022},
}

% The last author's given name uses the full form found elsewhere in this file.
@article{seo2022actionfree,
  author    = {Younggyo Seo and Kimin Lee and Stephen James and Pieter Abbeel},
  journal   = {arXiv preprint arXiv:2203.13880},
  title     = {Reinforcement Learning with Action-Free Pre-Training from Videos},
  year      = {2022},
}

@inproceedings{pari2022surprising,
  author    = {Jyothish Pari and Nur Muhammad (Mahi) Shafiullah and Sridhar Pandian Arunachalam and Lerrel Pinto},
  booktitle = {Robotics: Science and Systems (RSS)},
  title     = {The Surprising Effectiveness of Representation Learning for Visual Imitation},
  year      = {2022},
}

@inproceedings{zhang2021correspondence,
  author    = {Qiang Zhang and Tete Xiao and Alexei A.
Efros and Lerrel Pinto and Xiaolong Wang},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Learning Cross-Domain Correspondence for Control with Dynamics Cycle-Consistency},
  year      = {2021},
}

% Pieter Abbeel is written with his full given name, as in other entries of
% this file.
@inproceedings{chen2021representation,
  author    = {Cynthia Chen and Xin Chen and Sam Toyer and Cody Wild and Scott Emmons and Ian S. Fischer and Kuang-Huei Lee and Neel Alex and Steven H. Wang and Ping Luo and Stuart J. Russell and Pieter Abbeel and Rohin Shah},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {An Empirical Investigation of Representation Learning for Imitation},
  year      = {2021},
}

@inproceedings{zakka2021xirl,
  author    = {Kevin Zakka and Andy Zeng and Peter R. Florence and Jonathan Tompson and Jeannette Bohg and Debidatta Dwibedi},
  booktitle = {Conference on Robot Learning (CoRL)},
  title     = {{XIRL}: Cross-embodiment Inverse Reinforcement Learning},
  year      = {2021},
}

@inproceedings{srinivas2020curl,
  author    = {A. Srinivas and Michael Laskin and Pieter Abbeel},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {{CURL}: Contrastive Unsupervised Representations for Reinforcement Learning},
  year      = {2020},
}

% The braces keep the mixed-case model name intact under sentence-casing styles.
@inproceedings{gelada2019deepmdp,
  author    = {Carles Gelada and Saurabh Kumar and Jacob Buckman and Ofir Nachum and Marc G. Bellemare},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {{DeepMDP}: Learning Continuous Latent Space Models for Representation Learning},
  year      = {2019},
}

@inproceedings{lange2010dae,
  author    = {Sascha Lange and Martin A.
Riedmiller},
  booktitle = {International Joint Conference on Neural Networks (IJCNN)},
  pages     = {1--8},
  title     = {Deep auto-encoder neural networks in reinforcement learning},
  year      = {2010},
}

@inproceedings{zhang2021invariant,
  author    = {Amy Zhang and Rowan McAllister and Roberto Calandra and Yarin Gal and Sergey Levine},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Learning Invariant Representations for Reinforcement Learning without Reconstruction},
  year      = {2021},
}

@inproceedings{jaderberg2017auxiliary,
  author    = {Max Jaderberg and Volodymyr Mnih and Wojciech M. Czarnecki and Tom Schaul and Joel Z. Leibo and David Silver and Koray Kavukcuoglu},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Reinforcement Learning with Unsupervised Auxiliary Tasks},
  year      = {2017},
}

@article{wiles2021finegrained,
  author    = {Olivia Wiles and Sven Gowal and Florian Stimberg and Sylvestre-Alvise Rebuffi and Ira Ktena and Krishnamurthy Dvijotham and Ali Taylan Cemgil},
  journal   = {arXiv preprint arXiv:2110.11328},
  title     = {A Fine-Grained Analysis on Distribution Shift},
  year      = {2021},
}

@inproceedings{kumar2019navigation,
  author    = {Ashish Kumar and Saurabh Gupta and Jitendra Malik},
  booktitle = {Conference on Robot Learning (CoRL)},
  title     = {Learning Navigation Subroutines from Egocentric Videos},
  year      = {2019},
}

% Product and system names are braced so sentence-casing styles keep their
% internal capitals.
@inproceedings{chang2020semanticnav,
  author    = {Matthew Chang and Arjun Gupta and Saurabh Gupta},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Semantic Visual Navigation by Watching {YouTube} Videos},
  year      = {2020},
}

@inproceedings{mandikal2021dexvip,
  author    = {Priyanka Mandikal and Kristen Grauman},
  booktitle = {Conference on Robot Learning (CoRL)},
  title     = {{DexVIP}: Learning Dexterous Grasping with Human Hand Pose Priors from Video},
  year      = {2021},
}

@inproceedings{nagarajan2021shaping,
  author    = {Tushar Nagarajan and Kristen Grauman},
  booktitle = {Advances in Neural
Information Processing Systems (NeurIPS)},
  title     = {Shaping embodied agent behavior with activity-context priors from egocentric video},
  year      = {2021},
}

@inproceedings{pinto2017robust,
  author    = {Lerrel Pinto and James Davidson and Rahul Sukthankar and Abhinav Kumar Gupta},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Robust Adversarial Reinforcement Learning},
  year      = {2017},
}

@inproceedings{lee2018unified,
  author    = {Kimin Lee and Kibok Lee and Honglak Lee and Jinwoo Shin},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {A Simple Unified Framework for Detecting Out-of-Distribution Samples and Adversarial Attacks},
  year      = {2018},
}

% NOTE(review): recorded as an arXiv preprint, in the same form as the other
% preprint entries of this file; confirm against the arXiv listing.
@article{tzeng2014confusion,
  author    = {Eric Tzeng and Judy Hoffman and N. Zhang and Kate Saenko and Trevor Darrell},
  journal   = {arXiv preprint arXiv:1412.3474},
  title     = {Deep Domain Confusion: Maximizing for Domain Invariance},
  year      = {2014},
}

@article{sun2019unsupervised,
  author    = {Yu Sun and Eric Tzeng and Trevor Darrell and Alexei A. Efros},
  journal   = {arXiv preprint arXiv:1909.11825},
  title     = {Unsupervised Domain Adaptation through Self-Supervision},
  year      = {2019},
}

@inproceedings{xiao2021noise,
  author    = {Kai Y. Xiao and Logan Engstrom and Andrew Ilyas and Aleksander Madry},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Noise or Signal: The Role of Image Backgrounds in Object Recognition},
  year      = {2021},
}

@article{tzeng2015towards,
  author    = {Eric Tzeng and Coline Devin and Judy Hoffman and Chelsea Finn and Xingchao Peng and Sergey Levine and Kate Saenko and Trevor Darrell},
  journal   = {arXiv preprint arXiv:1511.07111},
  title     = {Towards Adapting Deep Visuomotor Representations from Simulated to Real Environments},
  year      = {2015},
}

% The fourth author's given name is spelled out in the form used elsewhere in
% this file; the surname follows on the next physical line.
@inproceedings{gupta2017invariant,
  author    = {Abhishek Gupta and Coline Devin and Yuxuan Liu and Pieter
Abbeel and Sergey Levine},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Learning Invariant Feature Spaces to Transfer Skills with Reinforcement Learning},
  year      = {2017},
}

@article{christiano2016sim2real,
  author    = {Paul Francis Christiano and Zain Shah and Igor Mordatch and Jonas Schneider and Trevor Blackwell and Joshua Tobin and Pieter Abbeel and Wojciech Zaremba},
  journal   = {arXiv preprint arXiv:1610.03518},
  title     = {Transfer from Simulation to Real World through Learning Deep Inverse Dynamics Model},
  year      = {2016},
}

@inproceedings{tobin2017domain,
  author    = {Joshua Tobin and Rachel Fong and Alex Ray and Jonas Schneider and Wojciech Zaremba and Pieter Abbeel},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  pages     = {23--30},
  title     = {Domain randomization for transferring deep neural networks from simulation to the real world},
  year      = {2017},
}

@inproceedings{sadeghi2017cad2rl,
  author    = {Fereshteh Sadeghi and Sergey Levine},
  booktitle = {Robotics: Science and Systems (RSS)},
  title     = {{(CAD)$^2$RL}: Real Single-Image Flight without a Single Real Image},
  year      = {2017},
}

% The last author's given name is spelled out as in the two entries above;
% the surname follows on the next physical line.
@inproceedings{peng2018sim2real,
  author    = {Xue Bin Peng and Marcin Andrychowicz and Wojciech Zaremba and Pieter
Abbeel},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages     = {1--8},
  title     = {Sim-to-Real Transfer of Robotic Control with Dynamics Randomization},
  year      = {2018},
}

@inproceedings{tan2018sim2real,
  author    = {Jie Tan and Tingnan Zhang and Erwin Coumans and Atil Iscen and Yunfei Bai and Danijar Hafner and Steven Bohez and Vincent Vanhoucke},
  booktitle = {Robotics: Science and Systems (RSS)},
  title     = {Sim-to-Real: Learning Agile Locomotion For Quadruped Robots},
  year      = {2018},
}

% The organization listed as first author is braced so it is handled as one
% indivisible name; the proper noun in the title is braced against
% sentence-casing styles.
@article{openai2019rubiks,
  author    = {{OpenAI} and Ilge Akkaya and Marcin Andrychowicz and Maciek Chociej and Mateusz Litwin and Bob McGrew and Arthur Petron and Alex Paino and Matthias Plappert and Glenn Powell and Raphael Ribas and Jonas Schneider and Nikolas A. Tezak and Jerry Tworek and Peter Welinder and Lilian Weng and Qiming Yuan and Wojciech Zaremba and Lei M. Zhang},
  journal   = {arXiv preprint arXiv:1910.07113},
  title     = {Solving {Rubik's} Cube with a Robot Hand},
  year      = {2019},
}

@inproceedings{mattner2012swing,
  author    = {Jan Mattner and Sascha Lange and Martin A.
Riedmiller},
  booktitle = {International Conference on Neural Information Processing (ICONIP)},
  title     = {Learn to Swing Up and Balance a Real Pole Based on Raw Visual Input Data},
  year      = {2012},
}

@inproceedings{finn2016deepsa,
  author    = {Chelsea Finn and Xin Yu Tan and Yan Duan and Trevor Darrell and Sergey Levine and Pieter Abbeel},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages     = {512--519},
  title     = {Deep Spatial Autoencoders for Visuomotor Learning},
  year      = {2016},
}

@inproceedings{karl2017deepvb,
  author    = {Maximilian Karl and Maximilian Sölch and Justin Bayer and Patrick van der Smagt},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Deep Variational {Bayes} Filters: Unsupervised Learning of State Space Models from Raw Data},
  year      = {2017},
}

@inproceedings{alvernaz2017autoencoder,
  author    = {Samuel Alvernaz and Julian Togelius},
  booktitle = {IEEE Conference on Computational Intelligence and Games (CIG)},
  pages     = {1--8},
  title     = {Autoencoder-Augmented Neuroevolution for Visual {DOOM} Playing},
  year      = {2017},
}

@inproceedings{goroshin2015linearize,
  author    = {Ross Goroshin and Michaël Mathieu and Yann LeCun},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Learning to Linearize under Uncertainty},
  year      = {2015},
}

@inproceedings{hoof2016stablerl,
  author    = {Herke van Hoof and Nutan Chen and Maximilian Karl and Patrick van der Smagt and Jan Peters},
  booktitle = {International Conference on Intelligent Robots and Systems (IROS)},
  pages     = {3928--3934},
  title     = {Stable Reinforcement Learning with Autoencoders for Tactile and Visual Data},
  year      = {2016},
}

@inproceedings{hafner2020dream2control,
  author    = {Danijar Hafner and Timothy P.
Lillicrap and Jimmy Ba and Mohammad Norouzi},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Dream to Control: Learning Behaviors by Latent Imagination},
  year      = {2020},
}

@inproceedings{zhang2018decoupling,
  author    = {Amy Zhang and Harsh Satija and Joelle Pineau},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Decoupling Dynamics and Reward for Transfer Learning},
  year      = {2018},
}

@inproceedings{guo2020bootstrap,
  author    = {Zhaohan Daniel Guo and Bernardo Ávila Pires and Bilal Piot and Jean-Bastien Grill and Florent Altché and Rémi Munos and Mohammad Gheshlaghi Azar},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Bootstrap Latent-Predictive Representations for Multitask Reinforcement Learning},
  year      = {2020},
}

% The quoted phrase in the title is closed with the matching TeX closing
% quotes after the second word.
@inproceedings{goyal2017sthsth,
  author    = {Raghav Goyal and Samira Ebrahimi Kahou and Vincent Michalski and Joanna Materzynska and Susanne Westphal and Heuna Kim and Valentin Haenel and Ingo Fründ and Peter N. Yianilos and Moritz Mueller-Freitag and Florian Hoppe and Christian Thurau and Ingo Bax and Roland Memisevic},
  booktitle = {International Conference on Computer Vision (ICCV)},
  title     = {The ``Something Something'' Video Database for Learning and Evaluating Visual Common Sense},
  year      = {2017},
}

@inproceedings{miech2019howto100m,
  author    = {Antoine Miech and Dimitri Zhukov and Jean-Baptiste Alayrac and Makarand Tapaswi and Ivan Laptev and Josef Sivic},
  booktitle = {International Conference on Computer Vision (ICCV)},
  pages     = {2630--2640},
  title     = {{HowTo100M}: Learning a Text-Video Embedding by Watching Hundred Million Narrated Video Clips},
  year      = {2019},
}

@inproceedings{grauman2022ego4d,
  author    = {Kristen Grauman and Andrew Westbury and Eugene Byrne and Zachary Q. Chavis and Antonino Furnari and Rohit Girdhar and Jackson Hamburger and Hao Jiang and Miao Liu and Xingyu Liu and Miguel Martin and Tushar Nagarajan and Ilija Radosavovic and Santhosh K.
Ramakrishnan and F. Ryan and Jayant Sharma and Michael Wray and Mengmeng Xu and
               Eric Z. Xu and Chen Zhao and Siddhant Bansal and Dhruv Batra and Vincent Cartillier and
               Sean Crane and Tien Do and Morrie Doulaty and Akshay Erapalli and Christoph Feichtenhofer and
               Adriano Fragomeni and Qichen Fu and Christian Fuegen and Abrham Gebreselasie and
               Cristina González and James M. Hillis and Xuhua Huang and Yifei Huang and Wenqi Jia and
               Weslie Yu Heng Khoo and Jáchym Kolár and Satwik Kottur and Anurag Kumar and
               Federico Landini and Chao Li and Yanghao Li and Zhenqiang Li and Karttikeya Mangalam and
               Raghava Modhugu and Jonathan Munro and Tullie Murrell and Takumi Nishiyasu and
               Will Price and Paola Ruiz Puentes and Merey Ramazanova and Leda Sari and
               Kiran K. Somasundaram and Audrey Southerland and Yusuke Sugano and Ruijie Tao and
               Minh Vo and Yuchen Wang and Xindi Wu and Takuma Yagi and Yunyi Zhu and
               Pablo Arbeláez and David J. Crandall and Dima Damen and Giovanni Maria Farinella and
               Bernard Ghanem and Vamsi Krishna Ithapu and C. V. Jawahar and Hanbyul Joo and
               Kris Kitani and Haizhou Li and Richard A. Newcombe and Aude Oliva and
               Hyun Soo Park and James M. Rehg and Yoichi Sato and Jianbo Shi and
               Mike Zheng Shou and Antonio Torralba and Lorenzo Torresani and Mingfei Yan and
               Jitendra Malik},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title     = {{Ego4D}: Around the World in 3,000 Hours of Egocentric Video},
  year      = {2022},
}

@inproceedings{lange2012autonomousrl,
  author    = {Sascha Lange and Martin A.
Riedmiller and Arne Voigtländer},
  booktitle = {International Joint Conference on Neural Networks (IJCNN)},
  pages     = {1--8},
  title     = {Autonomous Reinforcement Learning on Raw Visual Input Data in a Real World Application},
  year      = {2012},
}

@inproceedings{okada2021dreaming,
  author    = {Masashi Okada and Tadahiro Taniguchi},
  booktitle = {International Conference on Robotics and Automation (ICRA)},
  pages     = {4209--4215},
  title     = {Dreaming: Model-based Reinforcement Learning by Latent Imagination without Reconstruction},
  year      = {2021},
}

% The journal field holds only the journal name, without the society subtitle.
@article{lesort2018staterl,
  author    = {Timothée Lesort and Natalia Díaz Rodríguez and Jean-François Goudou and David Filliat},
  journal   = {Neural Networks},
  pages     = {379--392},
  title     = {State Representation Learning for Control: An Overview},
  volume    = {108},
  year      = {2018},
}

% Given names below follow the full forms used by other entries of this file.
@inproceedings{liu2021behavior,
  author    = {Hao Liu and Pieter Abbeel},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Behavior From the Void: Unsupervised Active Pre-Training},
  year      = {2021},
}

@inproceedings{he2022mae,
  author    = {Kaiming He and Xinlei Chen and Saining Xie and Yanghao Li and Piotr Dollár and Ross B. Girshick},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title     = {Masked Autoencoders Are Scalable Vision Learners},
  year      = {2022},
}

@article{babaeizadeh2021fitvid,
  author    = {Mohammad Babaeizadeh and Mohammad Taghi Saffar and Suraj Nair and Sergey Levine and Chelsea Finn and Dumitru Erhan},
  journal   = {arXiv preprint arXiv:2106.13195},
  title     = {{FitVid}: Overfitting in Pixel-Level Video Prediction},
  year      = {2021},
}

@inproceedings{hu2018squeeze,
  author    = {Jie Hu and Li Shen and Gang Sun},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title     = {Squeeze-and-Excitation Networks},
  year      = {2018},
}

@article{ramachandran2018searching,
  author    = {Prajit Ramachandran and Barret Zoph and Quoc V.
Le}, journal = {arXiv preprint arXiv:1710.05941}, title = {Searching for Activation Functions}, year = {2018}, }

@misc{polymetis2021,
  author = {Yixin Lin and Austin S. Wang and Giovanni Sutanto and Akshara Rai and Franziska Meier},
  howpublished = {\url{https://facebookresearch.github.io/fairo/polymetis/}},
  title = {Polymetis},
  year = {2021},
}

% The trailing acronym is braced so sentence-casing styles keep its capitals.
@article{hendrycks2016gelu,
  author = {Dan Hendrycks and Kevin Gimpel},
  journal = {arXiv preprint arXiv:1606.08415},
  title = {{Gaussian} Error Linear Units ({GELUs})},
  year = {2016},
}

% Both occurrences of the acronym are braced, not only the first.
@inproceedings{hart2006nasa,
  author = {Sandra G Hart},
  booktitle = {Proceedings of the Human Factors and Ergonomics Society Annual Meeting},
  pages = {904--908},
  title = {{NASA} Task Load Index ({NASA-TLX}); 20 Years Later},
  volume = {50},
  year = {2006},
}

@article{ba2016layer,
  author = {Jimmy Lei Ba and Jamie Ryan Kiros and Geoffrey E Hinton},
  journal = {arXiv preprint arXiv:1607.06450},
  title = {Layer Normalization},
  year = {2016},
}

% The arXiv identifier is the bare number; abs/ is part of the URL path only.
@article{peng2019awr,
  author = {Xue Bin Peng and Aviral Kumar and Grace H. Zhang and Sergey Levine},
  journal = {arXiv preprint arXiv:1910.00177},
  title = {Advantage-Weighted Regression: Simple and Scalable Off-Policy Reinforcement Learning},
  year = {2019},
}

@inproceedings{spencer2020eil,
  author = {Jonathan Spencer and Sanjiban Choudhury and Matt Barnes and Matt Schmittle and Mung Chiang and Peter J. Ramadge and Siddhartha S. Srinivasa},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Learning from Interventions: Human-robot Interaction as both Explicit and Implicit Feedback},
  year = {2020},
}

@inproceedings{kim2013mmd,
  author = {Beomjoon Kim and Joelle Pineau},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Maximum Mean Discrepancy Imitation Learning},
  year = {2013},
}

@inproceedings{menda2019ensemble, author = {Kunal Menda and K. Driggs-Campbell and Mykel J.
Kochenderfer}, booktitle = {International Conference on Intelligent Robots and Systems (IROS)}, pages = {5041--5048}, title = {EnsembleDAgger: A {Bayesian} Approach to Safe Imitation Learning}, year = {2019}, } @inproceedings{zhang2017queryefficient, author = {Jiakai Zhang and Kyunghyun Cho}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {Query-Efficient Imitation Learning for End-to-End Autonomous Driving}, year = {2017}, } @inproceedings{wang2020criticrr, author = {Ziyun Wang and Alexander Novikov and Konrad Zolna and Jost Tobias Springenberg and Scott E. Reed and Bobak Shahriari and Noah Siegel and Josh Merel and Caglar Gulcehre and Nicolas Manfred Otto Heess and Nando de Freitas}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Critic Regularized Regression}, year = {2020}, } @inproceedings{yang2022trail, author = {Mengjiao Yang and Sergey Levine and Ofir Nachum}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {TRAIL: Near-Optimal Imitation Learning with Suboptimal Data}, year = {2022}, } @inproceedings{karamcheti2021outliers, author = {Siddharth Karamcheti and Ranjay Krishna and Li Fei-Fei and Christopher D. Manning}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Mind Your Outliers! 
Investigating the Negative Impact of Outliers on Active Learning for Visual Question Answering}, year = {2021}, } @article{grigsby2021filteredbc, author = {Jake Grigsby and Yanjun Qi}, journal = {arXiv preprint arXiv:2110.04698}, title = {A Closer Look at Advantage-Filtered Behavioral Cloning in High-Noise Datasets}, year = {2021}, } @inproceedings{emmons2022rvs, author = {Scott Emmons and Benjamin Eysenbach and Ilya Kostrikov and Sergey Levine}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {RvS: What is Essential for Offline {RL} via Supervised Learning?}, year = {2022}, } @inproceedings{jang2021bcz, author = {Eric Jang and Alex Irpan and Mohi Khansari and Daniel Kappler and Frederik Ebert and Corey Lynch and Sergey Levine and Chelsea Finn}, booktitle = {Conference on Robot Learning (CoRL)}, title = {{BC-Z}: Zero-Shot Task Generalization with Robotic Imitation Learning}, year = {2021}, } @inproceedings{ebert2022bridge, author = {Frederik Ebert and Yanlai Yang and Karl Schmeckpeper and Bernadette Bucher and Georgios Georgakis and Kostas Daniilidis and Chelsea Finn and Sergey Levine}, booktitle = {Robotics: Science and Systems (RSS)}, title = {Bridge Data: Boosting Generalization of Robotic Skills with Cross-Domain Datasets}, year = {2022}, } @inproceedings{dasari2021rb2, author = {Sudeep Dasari and Jianren Wang and Joyce Hong and Shikhar Bahl and Yixin Lin and Austin S. 
Wang and Abitha Thankaraj and Karanbir Singh Chahal and Berk Çalli and Saurabh Gupta and David Held and Lerrel Pinto and Deepak Pathak and Vikash Kumar and Abhinav Kumar Gupta}, booktitle = {Neural Information Processing Systems Track on Datasets and Benchmarks (NeurIPS Datasets and Benchmarks)}, title = {RB2: Robotics Benchmarking with a Twist}, year = {2021}, } @inproceedings{beliaev2022ileed, author = {Mark Beliaev and Andy Shih and Stefano Ermon and Dorsa Sadigh and Ramtin Pedarsani}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Imitation Learning by Estimating Expertise of Demonstrators}, year = {2022}, } @article{ahn2022saycan, author = {Michael Ahn and Anthony Brohan and Noah Brown and Yevgen Chebotar and Omar Cortes and Byron David and Chelsea Finn and Keerthana Gopalakrishnan and Karol Hausman and Alexander Herzog and Daniel Ho and Jasmine Hsu and Julian Ibarz and Brian Ichter and Alex Irpan and Eric Jang and Rosario Jauregui Ruano and Kyle Jeffrey and Sally Jesmonth and Nikhil Jayant Joshi and Ryan C. Julian and Dmitry Kalashnikov and Yuheng Kuang and Kuang-Huei Lee and Sergey Levine and Yao Lu and Linda Luu and Carolina Parada and Peter Pastor and Jornell Quiambao and Kanishka Rao and Jarek Rettinghouse and Diego M Reyes and Pierre Sermanet and Nicolas Sievers and Clayton Tan and Alexander Toshev and Vincent Vanhoucke and Fei Xia and Ted Xiao and Peng Xu and Sichun Xu and Mengyuan Yan}, journal = {arXiv preprint arXiv:2204.01691}, title = {Do As {I} Can, Not As {I} Say: Grounding Language in Robotic Affordances}, year = {2022}, } @inproceedings{florence2021implicitbc, author = {Peter R. Florence and Corey Lynch and Andy Zeng and Oscar Ramirez and Ayzaan Wahid and Laura Downs and Adrian S. Wong and Johnny Lee and Igor Mordatch and Jonathan Tompson}, booktitle = {Conference on Robot Learning (CoRL)}, title = {Implicit Behavioral Cloning}, year = {2021}, } @inproceedings{bishop1994mdn, author = {Christopher M. 
Bishop}, booktitle = {NCRG Report}, title = {Mixture density networks}, year = {1994}, }

@inproceedings{zhang2021cail,
  author = {Songyuan Zhang and Zhangjie Cao and Dorsa Sadigh and Yanan Sui},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Confidence-Aware Imitation Learning from Demonstrations with Varying Optimality},
  year = {2021},
}

% Four authors; a stray affiliation word had been parsed as a fifth author name.
@inproceedings{gopalan2022negativelfd,
  author = {Nakul Gopalan and Nina Moorman and Manisha Natarajan and Matthew Craig Gombolay},
  booktitle = {Robotics: Science and Systems (RSS)},
  title = {Negative Result for Learning from Demonstration: Challenges for End-Users Teaching Robots with Task And Motion Planning Abstractions},
  year = {2022},
}

@inproceedings{hausman2017multimodal,
  author = {Karol Hausman and Yevgen Chebotar and Stefan Schaal and Gaurav S. Sukhatme and Joseph J. Lim},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Multi-Modal Imitation Learning from Unstructured Demonstrations using Generative Adversarial Nets},
  year = {2017},
}

@inproceedings{kuefler2018burnin,
  author = {Alex Kuefler and Mykel J. Kochenderfer},
  booktitle = {International Conference on Autonomous Agents and Multiagent Systems (AAMAS)},
  title = {Burn-In Demonstrations for Multi-Modal Imitation Learning},
  year = {2018},
}

@inproceedings{chen2020suboptimal,
  author = {Letian Chen and Rohan R. Paleja and Matthew Craig Gombolay},
  booktitle = {Conference on Robot Learning (CoRL)},
  title = {Learning from Suboptimal Demonstration via Self-Supervised Reward Regression},
  year = {2020},
}

@inproceedings{brown2019extrapolating, author = {Daniel S.
Brown and Wonjoon Goo and Prabhat Nagarajan and Scott Niekum}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Extrapolating Beyond Suboptimal Demonstrations via Inverse Reinforcement Learning from Observations}, year = {2019}, } @inproceedings{myers2021multimodal, author = {Vivek Myers and Erdem Biyik and Nima Anari and Dorsa Sadigh}, booktitle = {Conference on Robot Learning (CoRL)}, title = {Learning Multimodal Rewards from Rankings}, year = {2021}, } @article{zhu2022buds, author = {Yifeng Zhu and Peter Stone and Yuke Zhu}, journal = {IEEE Robotics and Automation Letters (RA-L)}, pages = {4126--4133}, title = {Bottom-Up Skill Discovery From Unsegmented Demonstrations for Long-Horizon Robot Manipulation}, volume = {7}, year = {2022}, } @inproceedings{chernova2014robot, author = {S. Chernova and Andrea Lockerd Thomaz}, booktitle = {Robot Learning from Human Teachers}, title = {Robot Learning from Human Teachers}, year = {2014}, } @article{broad2017realtime, author = {Alexander Broad and Jacob Arkin and Nathan D. Ratliff and Thomas M. 
Howard and Brenna Argall}, journal = {International Journal of Robotics Research (IJRR)}, pages = {684--698}, title = {Real-time natural language corrections for assistive robotic manipulators}, volume = {36}, year = {2017}, } @inproceedings{cui2018active, author = {Yuchen Cui and Scott Niekum}, booktitle = {International Conference on Robotics and Automation (ICRA)}, pages = {6907--6914}, title = {Active Reward Learning from Critiques}, year = {2018}, } @article{sanh2019distilbert, author = {Victor Sanh and Lysandre Debut and Julien Chaumond and Thomas Wolf}, journal = {arXiv preprint arXiv:1910.01108}, title = {{DistilBERT}, a distilled version of {BERT}: smaller, faster, cheaper and lighter}, year = {2019}, } @article{mandlekar2020human, author = {Ajay Mandlekar and Danfei Xu and Roberto Martín-Martín and Yuke Zhu and Li Fei-Fei and Silvio Savarese}, journal = {arXiv preprint arXiv:2012.06733}, title = {Human-in-the-Loop Imitation Learning using Remote Teleoperation}, year = {2020}, } @inproceedings{schmittle2020learning, author = {Matthew Schmittle and Sanjiban Choudhury and Siddhartha S Srinivasa}, booktitle = {Conference on Robot Learning (CoRL)}, title = {Learning Online from Corrective Feedback: A Meta-Algorithm for Robotics}, year = {2020}, } @inproceedings{li2021learning, author = {Mengxi Li and Alper Canberk and Dylan P. Losey and Dorsa Sadigh}, booktitle = {International Conference on Robotics and Automation (ICRA)}, pages = {2877--2883}, title = {Learning Human Objectives from Sequences of Physical Corrections}, year = {2021}, } @inproceedings{sharma2022correcting, author = {Pratyusha Sharma and Balakumar Sundaralingam and Valts Blukis and Chris Paxton and Tucker Hermans and Antonio Torralba and Jacob Andreas and Dieter Fox}, booktitle = {Robotics: Science and Systems (RSS)}, title = {Correcting Robot Plans with Natural Language Feedback}, year = {2022}, } @inproceedings{bucker2022reshaping, author = {Arthur Fender C. Bucker and Luis F. C. 
Figueredo and Sami Haddadin and Ashish Kapoor and Shuang Ma and Rogerio Bonatti}, booktitle = {International Conference on Intelligent Robots and Systems (IROS)}, pages = {978--984}, title = {Reshaping Robot Trajectories Using Natural Language Commands: A Study of Multi-Modal Data Alignment Using Transformers}, year = {2022}, } @article{bucker2022latte, author = {Arthur Fender C. Bucker and Luis F. C. Figueredo and Sami Haddadin and Ashish Kapoor and Shuang Ma and Sai Vemprala and Rogerio Bonatti}, journal = {arXiv preprint arXiv:2208.02918}, title = {LaTTe: Language Trajectory TransformEr}, year = {2022}, } @article{mees2022matters, author = {Oier Mees and Lukás Hermann and Wolfram Burgard}, journal = {IEEE Robotics and Automation Letters (RA-L)}, pages = {11205--11212}, title = {What Matters in Language Conditioned Robotic Imitation Learning Over Unstructured Data}, volume = {7}, year = {2022}, } @article{rockafellar2000optimization, author = {R. Tyrrell Rockafellar and Stanislav Uryasev}, journal = {Journal of Risk}, pages = {21--41}, title = {Optimization of Conditional Value-at-Risk}, volume = {2}, year = {2000}, } @article{nemirovski2009robust, author = {Arkadi Nemirovski and Anatoli Juditsky and Guanghui Lan and Alexander Shapiro}, journal = {SIAM Journal on optimization}, number = {4}, pages = {1574--1609}, title = {Robust stochastic approximation approach to stochastic programming}, volume = {19}, year = {2009}, } @article{azzalini2012some, author = {Adelchi Azzalini and Giuliana Regoli}, journal = {Annals of the Institute of Statistical Mathematics}, number = {4}, pages = {857--879}, title = {Some properties of skew-symmetric distributions}, volume = {64}, year = {2012}, } @inproceedings{ni2019justifying, author = {Jianmo Ni and Jiacheng Li and Julian McAuley}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, pages = {188--197}, title = {Justifying recommendations using distantly-labeled reviews and fine-grained aspects}, year = 
{2019}, } @article{zhang2020adaptive, author = {Marvin Zhang and Henrik Marklund and Abhishek Gupta and Sergey Levine and Chelsea Finn}, journal = {arXiv preprint arXiv:2007.02931}, title = {Adaptive Risk Minimization: A Meta-Learning Approach for Tackling Group Shift}, year = {2020}, } @article{caldas2018leaf, author = {Sebastian Caldas and Peter Wu and Tian Li and Jakub Kone{\v{c}}n{\`y} and H Brendan McMahan and Virginia Smith and Ameet Talwalkar}, journal = {arXiv preprint arXiv:1812.01097}, title = {Leaf: A benchmark for federated settings}, year = {2018}, } @article{li2019fair, author = {Tian Li and Maziar Sanjabi and Ahmad Beirami and Virginia Smith}, journal = {arXiv preprint arXiv:1905.10497}, title = {Fair resource allocation in federated learning}, year = {2019}, } @article{west2014exploiting, author = {Robert West and Hristo S Paskov and Jure Leskovec and Christopher Potts}, journal = {Transactions of the Association for Computational Linguistics (TACL)}, pages = {297--310}, title = {Exploiting social network structure for person-to-person sentiment analysis}, volume = {2}, year = {2014}, } @inproceedings{patro2020fairrec, author = {Gourab K Patro and Arpita Biswas and Niloy Ganguly and Krishna P Gummadi and Abhijnan Chakraborty}, booktitle = {Proceedings of The Web Conference 2020}, pages = {1194--1204}, title = {FairRec: Two-Sided Fairness for Personalized Recommendations in Two-Sided Platforms}, year = {2020}, } @article{lau2014social, author = {Raymond YK Lau and Chunping Li and Stephen SY Liao}, journal = {Decision Support Systems}, pages = {80--94}, title = {Social analytics: Learning fuzzy product ontologies for aspect-oriented sentiment analysis}, volume = {65}, year = {2014}, } @inproceedings{muandet2013domain, author = {Krikamol Muandet and David Balduzzi and Bernhard Sch{\"o}lkopf}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {10--18}, title = {Domain generalization via invariant feature representation}, year = 
{2013}, } @inproceedings{blanchard2011generalizing, author = {Gilles Blanchard and Gyemin Lee and Clayton Scott}, booktitle = {Advances in neural information processing systems}, pages = {2178--2186}, title = {Generalizing from several related classification tasks to a new unlabeled sample}, year = {2011}, } @inproceedings{sun2020test, author = {Yu Sun and Xiaolong Wang and Zhuang Liu and John Miller and Alexei A Efros and Moritz Hardt}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Test-time training with self-supervision for generalization under distribution shifts}, year = {2020}, } @inproceedings{worrall2017harmonic, author = {Daniel E Worrall and Stephan J Garbin and Daniyar Turmukhambetov and Gabriel J Brostow}, booktitle = {Computer Vision and Pattern Recognition (CVPR)}, pages = {5028--5037}, title = {Harmonic networks: Deep translation and rotation equivariance}, year = {2017}, } @article{gulrajani2020search, author = {Ishaan Gulrajani and David Lopez-Paz}, journal = {arXiv preprint arXiv:2007.01434}, title = {In search of lost domain generalization}, year = {2020}, } @article{taori2020measuring, author = {Rohan Taori and Achal Dave and Vaishaal Shankar and Nicholas Carlini and Benjamin Recht and Ludwig Schmidt}, journal = {arXiv preprint arXiv:2007.00644}, title = {Measuring Robustness to Natural Distribution Shifts in Image Classification}, year = {2020}, } @inproceedings{ros2016synthia, author = {German Ros and Laura Sellart and Joanna Materzynska and David Vazquez and Antonio M Lopez}, booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition}, pages = {3234--3243}, title = {The synthia dataset: A large collection of synthetic images for semantic segmentation of urban scenes}, year = {2016}, } @inproceedings{richter2016playing, author = {Stephan R Richter and Vibhav Vineet and Stefan Roth and Vladlen Koltun}, booktitle = {European conference on computer vision}, pages = {102--118}, title = 
{Playing for data: Ground truth from computer games}, year = {2016}, }

% Dataset name is braced with its original capitalisation.
@inproceedings{barbu2019objectnet,
  author = {Andrei Barbu and David Mayo and Julian Alverio and William Luo and Christopher Wang and Dan Gutfreund and Josh Tenenbaum and Boris Katz},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {9453--9463},
  title = {{ObjectNet}: A large-scale bias-controlled dataset for pushing the limits of object recognition models},
  year = {2019},
}

% Benchmark name is braced with its original capitalisation.
@inproceedings{peng2018visda,
  author = {Xingchao Peng and Ben Usman and Neela Kaushik and Dequan Wang and Judy Hoffman and Kate Saenko},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {2021--2026},
  title = {{VisDA}: A synthetic-to-real benchmark for visual domain adaptation},
  year = {2018},
}

@inproceedings{venkateswara2017deep,
  author = {Hemanth Venkateswara and Jose Eusebio and Shayok Chakraborty and Sethuraman Panchanathan},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {5018--5027},
  title = {Deep hashing network for unsupervised domain adaptation},
  year = {2017},
}

@inproceedings{fang2013unbiased,
  author = {Chen Fang and Ye Xu and Daniel N Rockmore},
  booktitle = {International Conference on Computer Vision (ICCV)},
  pages = {1657--1664},
  title = {Unbiased metric learning: On the utilization of multiple datasets and web images for softening bias},
  year = {2013},
}

@article{hendrycks2020pretrained,
  author = {Dan Hendrycks and Xiaoyuan Liu and Eric Wallace and Adam Dziedzic and Rishabh Krishnan and Dawn Song},
  journal = {arXiv preprint arXiv:2004.06100},
  title = {Pretrained transformers improve out-of-distribution robustness},
  year = {2020},
}

% Published in the ACL-IJCNLP 2009 proceedings (pages 701--709).
@inproceedings{dasgupta2009mine,
  author = {Sajib Dasgupta and Vincent Ng},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {701--709},
  title = {Mine the easy, classify the hard: a semi-supervised approach to automatic sentiment classification},
  year = {2009},
}
@inproceedings{li2011semi, author = {Shoushan Li and Zhongqing Wang and Guodong Zhou and Sophia Yat Mei Lee}, booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)}, title = {Semi-supervised learning for imbalanced sentiment classification}, year = {2011}, } @inproceedings{glorot2011domain, author = {Xavier Glorot and Antoine Bordes and Yoshua Bengio}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Domain adaptation for large-scale sentiment classification: A deep learning approach}, year = {2011}, } @book{ripley2009stochastic, author = {Brian D Ripley}, publisher = {John Wiley \& Sons}, title = {Stochastic simulation}, year = {2009}, } @inproceedings{ranganath2014black, author = {Rajesh Ranganath and Sean Gerrish and David Blei}, booktitle = {Artificial Intelligence and Statistics (AISTATS)}, pages = {814--822}, title = {Black box variational inference}, year = {2014}, } @inproceedings{paisley2012variational, author = {John Paisley and David M Blei and Michael I Jordan}, booktitle = {International Conference on Machine Learning (ICML)}, pages = {1363--1370}, title = {Variational {B}ayesian inference with stochastic search}, year = {2012}, } @article{greensmith2004variance, author = {Evan Greensmith and Peter L Bartlett and Jonathan Baxter}, journal = {Journal of Machine Learning Research (JMLR)}, pages = {1471--1530}, title = {Variance reduction techniques for gradient estimates in reinforcement learning}, volume = {5}, year = {2004}, } @article{kulkarni2016hierarchical, author = {T. D. Kulkarni and K. Narasimhan and A. Saeedi and J. Tenenbaum}, journal = {Advances in neural information processing systems}, pages = {3675--3683}, title = {Hierarchical deep reinforcement learning: Integrating temporal abstraction and intrinsic motivation}, year = {2016}, } @article{brafman2002r, author = {R. Brafman and M. 
Tennenholtz}, journal = {Journal of Machine Learning Research}, pages = {213--231}, title = {{R}-max-a general polynomial time algorithm for near-optimal reinforcement learning}, year = {2002}, } @article{strehl2005theoretical, author = {A. L. Strehl and M. L. Littman}, journal = {Proceedings of the 22nd international conference on Machine learning}, pages = {856--863}, title = {A theoretical analysis of model-based interval estimation}, year = {2005}, } @article{strehl2009reinforcement, author = {A. L. Strehl and L. Li and M. L. Littman}, journal = {Journal of Machine Learning Research}, pages = {2413--2444}, title = {Reinforcement learning in finite MDPs: {PAC} analysis}, year = {2009}, } @article{osband2013more, author = {I. Osband and D. Russo and B. Van Roy}, journal = {Advances in Neural Information Processing Systems}, pages = {3003--3011}, title = {(More) efficient reinforcement learning via posterior sampling}, year = {2013}, } @article{osband2016posterior, author = {I. Osband and B. Van Roy}, journal = {arXiv preprint arXiv:1607.00215}, title = {Why is posterior sampling better than optimism for reinforcement learning}, year = {2016}, } @article{jaksch2010near, author = {T. Jaksch and R. Ortner and P. Auer}, journal = {Journal of Machine Learning Research}, pages = {1563--1600}, title = {Near-optimal regret bounds for reinforcement learning}, year = {2010}, } @article{dann2017unifying, author = {C. Dann and T. Lattimore and E. Brunskill}, journal = {Advances in Neural Information Processing Systems}, pages = {5713--5723}, title = {Unifying {PAC} and regret: Uniform {PAC} bounds for episodic reinforcement learning}, year = {2017}, } @inproceedings{azar2017minimax, author = {M. G. Azar and I. Osband and R. Munos}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Minimax regret bounds for reinforcement learning}, year = {2017}, } @article{singh1995reinforcement, author = {S. P. Singh and T. Jaakkola and M. 
Jordan}, journal = {Advances in neural information processing systems}, pages = {361--368}, title = {Reinforcement learning with soft state aggregation}, year = {1995}, }

@article{dietterich2000hierarchical,
  author = {T. G. Dietterich},
  journal = {Journal of Artificial Intelligence Research},
  pages = {227--303},
  title = {Hierarchical reinforcement learning with the {MAXQ} value function decomposition},
  year = {2000},
}

% Every initial carries a period; the product name is braced against recasing.
@article{aytar2018playing,
  author = {Y. Aytar and T. Pfaff and D. Budden and T. L. Paine and Z. Wang and N. de Freitas},
  journal = {arXiv preprint arXiv:1805.11592},
  title = {Playing hard exploration games by watching {YouTube}},
  year = {2018},
}

% The acute accent over the dotless i is written as a proper accent command.
@article{pohlen2018observe,
  author = {T. Pohlen and B. Piot and T. Hester and M. G. Azar and D. Horgan and D. Budden and G. Barth-Maron and H. van Hasselt and J. Quan and M. Ve{\v{c}}er{\'\i}k and others},
  journal = {arXiv preprint arXiv:1805.11593},
  title = {Observe and Look Further: Achieving Consistent Performance on {ATARI}},
  year = {2018},
}

% Conference paper (ICML 1995 proceedings), so typed as inproceedings with a booktitle.
@inproceedings{sutton1995td,
  author = {R. S. Sutton},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {531--539},
  title = {{TD} models: Modeling the world at a mixture of time scales},
  year = {1995},
}

@article{vezhnevets2017feudal,
  author = {A. S. Vezhnevets and S. Osindero and T. Schaul and N. Heess and M. Jaderberg and D. Silver and K. Kavukcuoglu},
  journal = {arXiv preprint arXiv:1703.01161},
  title = {Feudal networks for hierarchical reinforcement learning},
  year = {2017},
}

% Journal names are printed verbatim by styles, so the proper-noun capitals are spelled out.
@article{kirkpatrick2017overcoming,
  author = {J. Kirkpatrick and R. Pascanu and N. Rabinowitz and J. Veness and G. Desjardins and A. A. Rusu and K. Milan and J. Quan and T. Ramalho and A. Grabska-Barwinska and others},
  journal = {Proceedings of the National Academy of Sciences},
  title = {Overcoming catastrophic forgetting in neural networks},
  year = {2017},
}

@article{keramati2018strategic, author = {R. Keramati and J. Whang and P. Cho and E.
Brunskill}, journal = {arXiv preprint arXiv:1806.00175}, title = {Strategic Object Oriented Reinforcement Learning}, year = {2018}, }

% arXiv identifier uses a single colon after the prefix.
@article{oh2018self,
  author = {J. Oh and Y. Guo and S. Singh and H. Lee},
  journal = {arXiv preprint arXiv:1806.05635},
  title = {Self-Imitation Learning},
  year = {2018},
}

@article{dann2018polynomial,
  author = {C. Dann and N. Jiang and A. Krishnamurthy and A. Agarwal and J. Langford and R. E. Schapire},
  journal = {arXiv preprint arXiv:1803.00606},
  title = {On Polynomial Time {PAC} Reinforcement Learning with Rich Observations},
  year = {2018},
}

% The proper noun in the title is braced alongside the already-protected acronym.
@article{jiang2016contextual,
  author = {N. Jiang and A. Krishnamurthy and A. Agarwal and J. Langford and R. E. Schapire},
  journal = {arXiv preprint arXiv:1610.09512},
  title = {Contextual decision processes with low {Bellman} rank are {PAC}-learnable},
  year = {2016},
}

% NeurIPS paper typed as inproceedings; the two-word surname is braced so it is not split.
@inproceedings{russo2013eluder,
  author = {D. Russo and B. {Van Roy}},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2256--2264},
  title = {Eluder dimension and the sample complexity of optimistic exploration},
  year = {2013},
}

% NeurIPS paper typed as inproceedings; the two-word surname is braced so it is not split.
@inproceedings{wen2013efficient,
  author = {Z. Wen and B. {Van Roy}},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {3021--3029},
  title = {Efficient exploration and value function generalization in deterministic systems},
  year = {2013},
}

@article{islam2017reproducibility,
  author = {R. Islam and P. Henderson and M. Gomrokchi and D. Precup},
  journal = {arXiv preprint arXiv:1708.04133},
  title = {Reproducibility of benchmarked deep reinforcement learning tasks for continuous control},
  year = {2017},
}

@article{machado2017revisiting,
  author = {M. C. Machado and M. G. Bellemare and E. Talvitie and J. Veness and M. Hausknecht and M. Bowling},
  journal = {arXiv preprint arXiv:1709.06009},
  title = {Revisiting the arcade learning environment: Evaluation protocols and open problems for general agents},
  year = {2017},
}

@inproceedings{talvitie2014model, author = {E.
Talvitie}, booktitle = {Uncertainty in Artificial Intelligence (UAI)}, pages = {780--789}, title = {Model Regularization for Stable Sample Rollouts}, year = {2014}, }

@inproceedings{talvitie2017self,
  author = {E. Talvitie},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages = {2597--2603},
  title = {Self-Correcting Models for Model-Based Reinforcement Learning},
  year = {2017},
}

% The braced proper noun carries its capital letter.
@inproceedings{nair2010rectified,
  author = {V. Nair and G. E. Hinton},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {807--814},
  title = {Rectified linear units improve restricted {Boltzmann} machines},
  year = {2010},
}

% A doctoral thesis: the institution goes in the school field, not journal.
@phdthesis{watkins1989learning,
  author = {C. Watkins},
  school = {King's College, Cambridge},
  title = {Learning from delayed rewards},
  year = {1989},
}

% Appeared at the 36th Annual Symposium on Foundations of Computer Science, pages 322--331.
@inproceedings{auer1995gambling,
  author = {P. Auer and N. Cesa-Bianchi and Y. Freund and R. E. Schapire},
  booktitle = {Foundations of Computer Science (FOCS)},
  pages = {322--331},
  title = {Gambling in a rigged casino: The adversarial multi-armed bandit problem},
  year = {1995},
}

% NeurIPS paper typed as inproceedings, matching the other NeurIPS entries in this file.
@inproceedings{oh2017value,
  author = {J. Oh and S. Singh and H. Lee},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {6118--6128},
  title = {Value prediction network},
  year = {2017},
}

% Conference paper, so the venue is a booktitle rather than a journal.
@inproceedings{simard2003best,
  author = {Patrice Y. Simard and Dave Steinkraus and John C. Platt},
  booktitle = {International Conference on Document Analysis and Recognition (ICDAR)},
  pages = {958--964},
  title = {Best Practices for Convolutional Neural Networks Applied to Visual Document Analysis},
  volume = {2},
  year = {2003},
}

@inproceedings{yaeger1996effective,
  author = {Larry Yaeger and Richard Lyon and Brandyn Webb},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {807--813},
  title = {Effective Training of a Neural Network Character Classifier for Word Recognition},
  year = {1996},
}

@article{ciresan2011high, author = {Dan C.
Ciresan and Ueli Meier and Jonathan Masci and Luca M. Gambardella and Jurgen Schmidhuber}, journal = {arXiv}, title = {High-Performance Neural Networks for Visual Object Classification}, year = {2011}, }

@inproceedings{ravuri2019seeing,
  author = {Suman Ravuri and Oriol Vinyals},
  booktitle = {International Conference on Learning Representations Workshop (ICLR)},
  title = {Seeing is Not Necessarily Believing: Limitations of BigGANs for Data Augmentation},
  year = {2019},
}

@book{rao2007linear,
  author = {C. Radhakrishna Rao and Helge Toutenburg and Shalabh and Christian Heumann},
  publisher = {Springer Publishing Company},
  title = {Linear Models and Generalizations: Least Squares and Alternatives},
  year = {2007},
}

@article{lamb2019interpolated,
  author = {Alex Lamb and Vikas Verma and Juho Kannala and Yoshua Bengio},
  journal = {arXiv},
  title = {Interpolated Adversarial Training: Achieving Robust Neural Networks without Sacrificing Too Much Accuracy},
  year = {2019},
}

@inproceedings{prabhu2019understanding,
  author = {Vinay Uday Prabhu and Joyce Xu and Dian Ang Yap and John Whaley},
  booktitle = {International Conference on Learning Representations Workshop (ICLR)},
  title = {Understanding Adversarial Robustness Through Loss Landscape Geometries},
  year = {2019},
}

@article{dobriban2015high,
  author = {Edgar Dobriban and Stefan Wager},
  journal = {arXiv},
  title = {High-Dimensional Asymptotics of Prediction: Ridge Regression and Classification},
  year = {2015},
}

% The accented given name is written with a LaTeX accent command instead of a detached accent mark.
@article{bartlett2019benign,
  author = {Peter L. Bartlett and Philip M. Long and G{\'a}bor Lugosi and Alexander Tsigler},
  journal = {arXiv},
  title = {Benign Overfitting in Linear Regression},
  year = {2019},
}

@article{kleinman1968design, author = {D. Kleinman and M.
Athans}, journal = {IEEE Transactions on Automatic Control}, pages = {150--159}, title = {The design of suboptimal linear time-varying systems}, volume = {13}, year = {1968}, }

@article{kovanic1979pseudoinverse,
  author = {Pavel Kovanic},
  journal = {Kybernetika},
  title = {On the Pseudoinverse of a Sum of Symmetric Matrices with Applications to Estimation},
  volume = {15},
  year = {1979},
}

@article{berthelot2019mixmatch,
  author = {David Berthelot and Nicholas Carlini and Ian Goodfellow and Nicolas Papernot and Avital Oliver and Colin Raffel},
  journal = {arXiv},
  title = {MixMatch: A Holistic Approach to Semi-Supervised Learning},
  year = {2019},
}

@article{belkin2019two,
  author = {Mikhail Belkin and Daniel Hsu and Ji Xu},
  journal = {arXiv},
  title = {Two models of double descent for weak features},
  year = {2019},
}

% First author's surname is spelled as in the following entry by the same author (citation key kept for existing citations).
@article{schwartz2006ranking,
  author = {S. Shalev-Shwartz and Y. Singer},
  journal = {Journal of Machine Learning Research (JMLR)},
  title = {Efficient learning of label ranking by soft projections onto polyhedra},
  volume = {7},
  year = {2006},
}

% The norm symbol is typeset as braced math so it survives title recasing.
@inproceedings{duchi2008projections,
  author = {J. Duchi and S. Shalev-Shwartz and Y. Singer and T. Chandra},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Efficient Projections onto the {$\ell_1$}-Ball for Learning in High Dimensions},
  year = {2008},
}

@article{sennrich2016monolingual,
  author = {R. Sennrich and B. Haddow and A. Birch},
  journal = {arXiv},
  title = {Improving neural machine translation models with monolingual data},
  year = {2016},
}

@inproceedings{cheng2016sslnlp,
  author = {Y. Cheng and W. Xu and Z. He and W. He and H. Wu and M. Sun and Y. Liu},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Semi-supervised learning for neural machine translation},
  year = {2016},
}

@article{ramachandran2018pretraining, author = {P. Ramachandran and P. J. Liu and Q. V.
Le},
  journal = {arXiv},
  title = {Unsupervised pretraining for sequence to sequence learning},
  year = {2018},
}

@inproceedings{skorokhodov2018ssl,
  author = {I. Skorokhodov and A. Rykachevskiy and D. Emelyanenko and S. Slotin and A. Ponkratov},
  booktitle = {AMTA 2018 Workshop on Technologies for MT of Low Resource Languages (LoResMT)},
  title = {Semi-supervised neural machine translation with language models},
  year = {2018},
}

@article{ronneberger2015unet,
  author = {Olaf Ronneberger and Philipp Fischer and Thomas Brox},
  journal = {arXiv},
  title = {{U-Net}: Convolutional Networks for Biomedical Image Segmentation},
  year = {2015},
}

@article{savarese2019function,
  author = {Pedro Savarese and Itay Evron and Daniel Soudry and Nathan Srebro},
  journal = {arXiv},
  title = {How do infinite width bounded norm networks look in function space?},
  year = {2019},
}

@article{neyshabur2014implicit,
  author = {Behnam Neyshabur and Ryota Tomioka and Nathan Srebro},
  journal = {arXiv},
  title = {In search of the real inductive bias: On the role of implicit regularization in deep learning},
  year = {2014},
}

@inproceedings{eldan2016depth,
  author = {R. Eldan and O. Shamir},
  booktitle = {Conference on Learning Theory (COLT)},
  title = {The Power of Depth for Feedforward Neural Networks},
  year = {2016},
}

@article{parhi2019minnorm,
  author = {R. Parhi and R. D. Nowak},
  journal = {arXiv},
  title = {Minimum ``Norm'' Neural Networks are Splines},
  year = {2019},
}

@misc{bernhardsson2016fonts,
  author = {E.
Bernhardsson}, title = {Analyzing 50k fonts using deep neural networks}, year = {2016}, } @inproceedings{kudo2018sentencepiece, author = {Taku Kudo and John Richardson}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {SentencePiece: A simple and language independent subword tokenizer and detokenizer for Neural Text Processing}, year = {2018}, } @inproceedings{sennrich2016bpe, author = {Rico Sennrich and Barry Haddow and Alexandra Birch}, booktitle = {Association for Computational Linguistics (ACL)}, title = {Neural Machine Translation of Rare Words with Subword Units}, year = {2016}, } @inproceedings{you2018moleculegraph, author = {J. You and B. Liu and Z. Ying and V. Pande and J. Leskovec}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Graph Convolutional Policy Network for Goal-Directed Molecular Graph Generation}, year = {2018}, } @article{tsuda2017chemts, author = {X. Yang and J. Zhang and K. Yoshizoe and K. Terayama and K. Tsuda}, journal = {arXiv}, title = {ChemTS: An Efficient {Python} Library for de novo Molecular Generation}, year = {2017}, } @inproceedings{lipton2018labelshift, author = {Z. C. Lipton and Y. Wang and A. J. 
Smola}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Detecting and Correcting for Label Shift with Black Box Predictors}, year = {2018}, } @inproceedings{azizzadenesheli2019reglabel, author = {Kamyar Azizzadenesheli and Anqi Liu and Fanny Yang and Animashree Anandkumar}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Regularized Learning for Domain Adaptation under Label Shifts}, year = {2019}, } @article{guzman2019flores, author = {Francisco Guzmán and Peng-Jen Chen and Myle Ott and Juan Pino and Guillaume Lample and Philipp Koehn and Vishrav Chaudhary and Marc'Aurelio Ranzato}, journal = {arXiv}, title = {Two New Evaluation Datasets for Low-Resource Machine Translation: Nepali-{English} and Sinhala-{English}}, year = {2019}, } @article{lucio2020molecule, author = {Oscar Méndez-Lucio and Benoit Baillif and Djork-Arné Clevert and David Rouquié and Joerg Wichard}, journal = {Nature Communications}, title = {De novo generation of hit-like molecules from gene expression signatures using artificial intelligence}, volume = {11}, year = {2020}, } @article{senior2020protein, author = {Andrew W. Senior and Richard Evans and John Jumper and James Kirkpatrick and Laurent Sifre and Tim Green and Chongli Qin and Augustin Žídek and Alexander W. R. Nelson and Alex Bridgland and Hugo Penedones and Stig Petersen and Karen Simonyan and Steve Crossan and Pushmeet Kohli and David T. 
Jones and David Silver and Koray Kavukcuoglu and Demis Hassabis}, journal = {Nature}, title = {Improved protein structure prediction using potentials from deep learning}, volume = {577}, year = {2020}, } @inproceedings{neyshabur2017generalization, author = {Behnam Neyshabur and Srinadh Bhojanapalli and David McAllester and Nathan Srebro}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Exploring Generalization in Deep Learning}, year = {2017}, } @inproceedings{bartlett2017spectral, author = {Peter Bartlett and Dylan J. Foster and Matus Telgarsky}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Spectrally-normalized margin bounds for neural networks}, year = {2017}, } @inproceedings{wei2020improved, author = {Colin Wei and Tengyu Ma}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Improved Sample Complexities for Deep Networks and Robust Classification via an All-Layer Margin}, year = {2020}, } @inproceedings{wei2019data, author = {Colin Wei and Tengyu Ma}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, title = {Data-dependent Sample Complexity of Deep Neural Networks via {Lipschitz} Augmentation}, year = {2019}, } @inproceedings{chen2020more, author = {Lin Chen and Yifei Min and Mingrui Zhang and Amin Karbasi}, booktitle = {International Conference on Machine Learning (ICML)}, title = {More Data Can Expand the Generalization Gap Between Adversarially Robust and Standard Models}, year = {2020}, } @inproceedings{gu2015robustdenoise, author = {Shixiang Gu and Luca Rigazio}, booktitle = {International Conference on Learning Representations Workshop (ICLR)}, title = {Towards deep neural network architectures robust to adversarial examples}, year = {2015}, } @article{wong2020learningpert, author = {Eric Wong and J. 
Zico Kolter}, journal = {arXiv}, title = {Learning perturbation sets for robust machine learning}, year = {2020}, } @article{vincent2010stacked, author = {Pascal Vincent and Hugo Larochelle and Isabelle Lajoie and Yoshua Bengio and Pierre-Antoine Manzagol}, journal = {Journal of Machine Learning Research (JMLR)}, title = {Stacked Denoising Autoencoders: Learning Useful Representations in a Deep Network with a Local Denoising Criterion}, volume = {11}, year = {2010}, } @article{zhang2013denoising, author = {Xiao-Lei Zhang and Ji Wu}, journal = {arXiv}, title = {Denoising deep neural networks based voice activity detection}, year = {2013}, } @inproceedings{jagannatha2016structured, author = {Abhyuday Jagannatha and Hong Yu}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Structured prediction models for {RNN} based sequence labeling in clinical text}, year = {2016}, } @article{huang2015bidirectional, author = {Zhiheng Huang and Wei Xu and Kai Yu}, journal = {arXiv}, title = {Bidirectional {LSTM-CRF} Models for Sequence Tagging}, year = {2015}, } @inproceedings{recht2019doimagenet, author = {Benjamin Recht and Rebecca Roelofs and Ludwig Schmidt and Vaishaal Shankar}, booktitle = {International Conference on Machine Learning (ICML)}, title = {Do ImageNet Classifiers Generalize to ImageNet?}, year = {2019}, } @article{santurkar2020breeds, author = {Shibani Santurkar and Dimitris Tsipras and Aleksander Madry}, journal = {arXiv}, title = {BREEDS: Benchmarks for Subpopulation Shift}, year = {2020}, } @inproceedings{xie2016transfer, author = {Michael Xie and Neal Jean and Marshall Burke and David Lobell and Stefano Ermon}, booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)}, title = {Transfer Learning from Deep Features for Remote Sensing and Poverty Mapping}, year = {2016}, } @article{jean2016combining, author = {Neal Jean and Marshall Burke and Michael Xie and W. Matthew Davis and David B. 
Lobell and Stefano Ermon},
  journal = {Science},
  title = {Combining satellite imagery and machine learning to predict poverty},
  volume = {353},
  year = {2016},
}

@article{wang2020weakly,
  author = {Sherrie Wang and William Chen and Sang Michael Xie and George Azzari and David B. Lobell},
  journal = {Remote Sensing},
  title = {Weakly Supervised Deep Learning for Segmentation of Remote Sensing Imagery},
  volume = {12},
  year = {2020},
}

@article{albadawy2018tumor,
  author = {E. A. AlBadawy and A. Saha and M. A. Mazurowski},
  journal = {Medical Physics},
  title = {Deep learning for segmentation of brain tumors: Impact of cross-institutional training and testing},
  volume = {45},
  year = {2018},
}

@article{tripuraneni2020multitask,
  author = {Nilesh Tripuraneni and Michael I. Jordan and Chi Jin},
  journal = {arXiv},
  title = {On the Theory of Transfer Learning: The Importance of Task Diversity},
  year = {2020},
}

@article{du2020fewshot,
  author = {Simon S. Du and Wei Hu and Sham M. Kakade and Jason D. Lee and Qi Lei},
  journal = {arXiv},
  title = {Few-Shot Learning via Learning the Representation, Provably},
  year = {2020},
}

@inproceedings{wu2020multitask,
  author = {Sen Wu and Hongyang R. Zhang and Christopher Ré},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Understanding and Improving Information Transfer in Multi-Task Learning},
  year = {2020},
}

@article{caruana2003outputs,
  author = {Rich Caruana and Virginia R. de Sa},
  journal = {Journal of Machine Learning Research (JMLR)},
  title = {Benefitting from the Variables that Variable Selection Discards},
  volume = {3},
  year = {2003},
}

@inproceedings{simonyan2015verydeep,
  author = {Simonyan, K. and Zisserman, A.},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Very deep convolutional networks for large-scale image recognition},
  year = {2015},
}

@article{zoph2020rethinking,
  author = {Barret Zoph and Golnaz Ghiasi and Tsung-Yi Lin and Yin Cui and Hanxiao Liu and Ekin D.
Cubuk and Quoc V. Le},
  journal = {arXiv},
  title = {Rethinking Pre-training and Self-training},
  year = {2020},
}

@inproceedings{hendrycks2019selfsupervised,
  author = {Dan Hendrycks and Mantas Mazeika and Saurav Kadavath and Dawn Song},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Using Self-Supervised Learning Can Improve Model Robustness and Uncertainty},
  year = {2019},
}

@article{blitzer2007adaptation,
  author = {John Blitzer and Fernando Pereira},
  journal = {University of Pennsylvania},
  title = {Domain adaptation of natural language processing systems},
  year = {2007},
}

@article{yeh2020poverty,
  author = {Christopher Yeh and Anthony Perez and Anne Driscoll and George Azzari and Zhongyi Tang and David Lobell and Stefano Ermon and Marshall Burke},
  journal = {Nature Communications},
  title = {Using publicly available satellite imagery and deep learning to understand economic well-being in Africa},
  volume = {11},
  year = {2020},
}

@inproceedings{chen2020selftraining,
  author = {Yining Chen and Colin Wei and Ananya Kumar and Tengyu Ma},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Self-Training Avoids Using Spurious Features Under Domain Shift},
  year = {2020},
}

@article{blumenstock2015poverty,
  author = {J. Blumenstock and G. Cadamuro and R. On},
  journal = {Science},
  title = {Predicting poverty and wealth from mobile phone metadata},
  volume = {350},
  year = {2015},
}

@article{epsey2015development,
  author = {Jessica Espey and Eric Swanson and Shaida Badiee and Zach Christensen and Alex Fischer and Marc Levy and Greg Yetman and Alex de Sherbinin and Robert Chen and Yue Qiu and Geoffrey Greenwell and Thilo Klein and Johannes Jutting and Morten Jerven and Grant Cameron and Ana Milena Aguilar Rivera and Victoriano C.
Arias and Samuel Lantei Mills and Albert Motivans}, journal = {Sustainable Development Solutions Network}, title = {Data for Development: A Needs Assessment for {SDG} Monitoring and Statistical Capacity Development}, year = {2015}, } @article{noor2008nighttime, author = {Abdisalan Noor and Victor Alegana and Peter Gething and Andrew Tatem and Robert Snow}, journal = {Population Health Metrics}, title = {Using remotely sensed night-time light as a proxy for poverty in Africa}, volume = {6}, year = {2008}, } @article{elvidge2009poverty, author = {Christopher D. Elvidge and Paul C. Sutton and Tilottama Ghosh and Benjamin T. Tuttle and Kimberly E. Baugh and Budhendra Bhaduri and Edward Bright}, journal = {Computers and Geosciences}, title = {A global poverty map derived from satellite data}, volume = {35}, year = {2009}, } @article{osgood2018mapping, author = {Aaron Osgood-Zimmerman and Anoushka I. Millear and Rebecca W. Stubbs and Chloe Shields and Brandon V. Pickering and Lucas Earl and Nicholas Graetz and Damaris K. Kinyoki and Sarah E. Ray and Samir Bhatt and Annie J. Browne and Roy Burstein and Ewan Cameron and Daniel C. Casey and Aniruddha Deshpande and Nancy Fullman and Peter W. Gething and Harry S. Gibson and Nathaniel J. Henry and Mario Herrero and L. Kendall Krause and Ian D. Letourneau and Aubrey J. Levine and Patrick Y. Liu and Joshua Longbottom and Benjamin K. Mayala and Jonathan F. Mosser and Abdisalan M. Noor and David M. Pigott and Ellen G. Piwoz and Puja Rao and Rahul Rawat and Robert C. Reiner and David L. Smith and Daniel J. Weiss and Kirsten E. Wiens and Ali H. Mokdad and Stephen S. Lim and Christopher J. L. Murray and Nicholas J. Kassebaum and Simon I. Hay}, journal = {Nature}, title = {Mapping child growth failure in Africa between 2000 and 2015}, volume = {555}, year = {2018}, } @article{reiner2018mortality, author = {Robert C. Reiner and Nicholas Graetz and Daniel C. Casey and Christopher Troeger and Gregory M. Garcia and Jonathan F. 
Mosser and Aniruddha Deshpande and Scott J. Swartz and Sarah E. Ray and Brigette F. Blacker and Puja C. Rao and Aaron Osgood-Zimmerman and Roy Burstein and David M. Pigott and Ian M. Davis and Ian D. Letourneau and Lucas Earl and Jennifer M. Ross and Ibrahim A. Khalil and Tamer H. Farag and Oliver J. Brady and Moritz U.G. Kraemer and David L. Smith and Samir Bhatt and Daniel J. Weiss and Peter W. Gething and Nicholas J. Kassebaum and Ali H. Mokdad and Christopher J.L. Murray and Simon I. Hay}, journal = {New England Journal of Medicine}, title = {Variation in Childhood Diarrheal Morbidity and Mortality in Africa, 2000–2015}, volume = {379}, year = {2018}, } @article{bengio2013estimating, author = {Yoshua Bengio and Nicholas Leonard and Aaron Courville}, journal = {arXiv}, title = {Estimating or Propagating Gradients Through Stochastic Neurons for Conditional Computation}, year = {2013}, } @article{burke2016mortality, author = {Marshall Burke and Sam Heft-Neal and Eran Bendavid}, journal = {Lancet Global Health}, title = {Sources of variation in under-5 mortality across sub-Saharan Africa: a spatial analysis}, volume = {4}, year = {2016}, } @article{graetz2018education, author = {Nicholas Graetz and Joseph Friedman and Aaron Osgood-Zimmerman and Roy Burstein and Molly H. Biehl and Chloe Shields and Jonathan F. Mosser and Daniel C. Casey and Aniruddha Deshpande and Lucas Earl and Robert C. Reiner and Sarah E. Ray and Nancy Fullman and Aubrey J. Levine and Rebecca W. Stubbs and Benjamin K. Mayala and Joshua Longbottom and Annie J. Browne and Samir Bhatt and Daniel J. Weiss and Peter W. Gething and Ali H. Mokdad and Stephen S. Lim and Christopher J. L. Murray and Emmanuela Gakidou and Simon I. 
Hay},
  journal = {Nature},
  title = {Mapping local variation in educational attainment across Africa},
  volume = {555},
  year = {2018},
}

@inproceedings{you2017crop,
  author = {Jiaxuan You and Xiaocheng Li and Melvin Low and David Lobell and Stefano Ermon},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Deep {Gaussian} process for crop yield prediction based on remote sensing data},
  year = {2017},
}

@inproceedings{jean2018ssdkl,
  author = {Neal Jean and Sang Michael Xie and Stefano Ermon},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Semi-supervised Deep Kernel Learning: Regression with Unlabeled Data by Minimizing Predictive Variance},
  year = {2018},
}

@inproceedings{abelson2014poor,
  author = {Brian Abelson and Kush R. Varshney and Joy Sun},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  title = {Targeting Direct Cash Transfers to the Extremely Poor},
  year = {2014},
}

@article{hansen2013forest,
  author = {M. C. Hansen and P. V. Potapov and R. Moore and M. Hancher and S. A. Turubanova and A. Tyukavina and D. Thau and S. V. Stehman and S. J. Goetz and T. R. Loveland and A. Kommareddy and A. Egorov and L. Chini and C. O. Justice and J. R. G. Townshend},
  journal = {Science},
  title = {High-Resolution Global Maps of 21st-Century Forest Cover Change},
  volume = {342},
  year = {2013},
}

@article{tiecke2017population,
  author = {Tobias G. Tiecke and Xianming Liu and Amy Zhang and Andreas Gros and Nan Li and Gregory Yetman and Talip Kilic and Siobhan Murray and Brian Blankespoor and Espen B. Prydz and Hai-Anh H. Dang},
  journal = {arXiv},
  title = {Mapping the world population one building at a time},
  year = {2017},
}

@article{katona2018parking,
  author = {Zsolt Katona and Marcus Painter and Panos N.
Patatoukas and Jean Zeng},
  journal = {Miami Behavioral Finance Conference},
  title = {On the Capital Market Consequences of Alternative Data: Evidence from Outer Space},
  year = {2018},
}

@inproceedings{christie2018fmow,
  author = {Gordon Christie and Neil Fendley and James Wilson and Ryan Mukherjee},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Functional Map of the World},
  year = {2018},
}

@inproceedings{uzkent2020zoom,
  author = {Burak Uzkent and Stefano Ermon},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Learning When and Where to Zoom with Deep Reinforcement Learning},
  year = {2020},
}

@article{kim2016multiresolution,
  author = {Jae Hyun Kim and Michael Xie and Neal Jean and Stefano Ermon},
  journal = {Stanford University},
  title = {Incorporating Spatial Context and Fine-grained Detail from Satellite Imagery to Predict Poverty},
  year = {2016},
}

@article{yang2010landuse,
  author = {Yi Yang and Shawn Newsam},
  journal = {Geographic Information Systems},
  title = {Bag-of-visual-words and spatial extensions for land-use classification},
  year = {2010},
}

@inproceedings{wang2017torontocity,
  author = {Shenlong Wang and Min Bai and Gellert Mattyus and Hang Chu and Wenjie Luo and Bin Yang and Justin Liang and Joel Cheverie and Sanja Fidler and Raquel Urtasun},
  booktitle = {International Conference on Computer Vision (ICCV)},
  title = {TorontoCity: Seeing the World with a Million Eyes},
  year = {2017},
}

@misc{digitalglobe2016spacenet,
  author = {N. DigitalGlobe and {CosmiQ Works}},
  howpublished = {\url{https://aws.amazon.com/publicdatasets/spacenet/}},
  title = {SpaceNet},
  year = {2016},
}

@article{sahn2003asset,
  author = {David E.
Sahn and David Stifel},
  journal = {The Review of Income and Wealth},
  title = {Exploring Alternative Measures of Welfare in the Absence of Expenditure Data},
  volume = {49},
  year = {2003},
}

@article{filmer2011asset,
  author = {Deon Filmer and Kinnon Scott},
  journal = {Demography},
  title = {Assessing Asset Indices},
  volume = {49},
  year = {2011},
}

@inproceedings{rolf2020post,
  author = {Esther Rolf and Michael I. Jordan and Benjamin Recht},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  title = {Post-Estimation Smoothing: A Simple Baseline for Learning with Side Information},
  year = {2020},
}

@inproceedings{lewis2020bart,
  author = {Mike Lewis and Yinhan Liu and Naman Goyal and Marjan Ghazvininejad and Abdelrahman Mohamed and Omer Levy and Ves Stoyanov and Luke Zettlemoyer},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {BART: Denoising Sequence-to-Sequence Pre-training for Natural Language Generation, Translation, and Comprehension},
  year = {2020},
}

@article{french1999catastrophic,
  author = {Robert M French},
  journal = {Trends in cognitive sciences},
  title = {Catastrophic forgetting in connectionist networks},
  volume = {3},
  year = {1999},
}

@article{mccloskey1989catastrphic,
  author = {Michael McCloskey and Neal J Cohen},
  journal = {The psychology of learning and motivation},
  title = {Catastrophic interference in connectionist networks: The sequential learning problem},
  volume = {24},
  year = {1989},
}

@article{ratcliff1990connectionist,
  author = {Roger Ratcliff},
  journal = {Psychological review},
  title = {Connectionist models of recognition memory: constraints imposed by learning and forgetting functions},
  volume = {97},
  year = {1990},
}

@inproceedings{zhang2021revisiting,
  author = {Tianyi Zhang and Felix Wu and Arzoo Katiyar and Kilian Q.
Weinberger and Yoav Artzi}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Revisiting Few-sample {BERT} Fine-tuning}, year = {2021}, } @article{dodge2020finetuning, author = {Jesse Dodge and Gabriel Ilharco and Roy Schwartz and Ali Farhadi and Hannaneh Hajishirzi and Noah Smith}, journal = {arXiv}, title = {Finetuning pretrained language models: Weight initializations, data orders, and early stopping}, year = {2020}, } @inproceedings{lee2020mixout, author = {Cheolhyoung Lee and Kyunghyun Cho and Wanmo Kang}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Mixout: Effective regularization to finetune large-scale pretrained language models}, year = {2020}, } @article{houlsby2019parameter, author = {Neil Houlsby and Andrei Giurgiu and Stanislaw Jastrzebski and Bruna Morrone and Quentin de Laroussilhe and Andrea Gesmundo and Mona Attariyan and Sylvain Gelly}, journal = {arXiv}, title = {Parameter-Efficient Transfer Learning for {NLP}}, year = {2019}, } @misc{github2021repos, author = {Github}, howpublished = {\url{https://github.com/search?q=is:public}}, title = {Repository search for public repositories}, year = {2021}, } @article{miyazaki2020automatic, author = {Tomo Miyazaki and Tatsunori Tsuchiya and Yoshihiro Sugaya and Shinichiro Omachi and Masakazu Iwamura and Seiichi Uchida and Koichi Kise}, journal = {IEEE Computer Graphics and Applications}, title = {Automatic Generation of Typographic Font from a Small Font Subset}, volume = {40}, year = {2020}, } @article{tenenbaum2000separating, author = {Joshua B. Tenenbaum and William T. 
Freeman},
  journal = {Neural Computation},
  title = {Separating Style and Content with Bilinear Models},
  volume = {12},
  year = {2000},
}

@inproceedings{mostajabi2018regularizing,
  author = {Mohammadreza Mostajabi and Michael Maire and Gregory Shakhnarovich},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {Regularizing Deep Networks by Modeling and Predicting Label Structure},
  year = {2018},
}

@article{reed2021self,
  author = {Colorado J. Reed and Xiangyu Yue and Ani Nrusimha and Sayna Ebrahimi and Vivek Vijaykumar and Richard Mao and Bo Li and Shanghang Zhang and Devin Guillory and Sean Metzger and Kurt Keutzer and Trevor Darrell},
  journal = {arXiv},
  title = {Self-Supervised Pretraining Improves Self-Supervised Pretraining},
  year = {2021},
}

@article{wei2021finetuned,
  author = {Jason Wei and Maarten Bosma and Vincent Y. Zhao and Kelvin Guu and Adams Wei Yu and Brian Lester and Nan Du and Andrew M. Dai and Quoc V. Le},
  journal = {arXiv},
  title = {Finetuned Language Models Are Zero-Shot Learners},
  year = {2021},
}

@article{gao2021making,
  author = {Tianyu Gao and Adam Fisch and Danqi Chen},
  journal = {arXiv},
  title = {Making Pre-trained Language Models Better Few-shot Learners},
  year = {2021},
}

@article{kleijn2012bernstein,
  author = {B. J. K. Kleijn and A. W. van der Vaart},
  journal = {Electronic Journal of Statistics},
  title = {The {Bernstein}-von {Mises} theorem under misspecification},
  volume = {6},
  year = {2012},
}

@article{wei2021why,
  author = {Colin Wei and Sang Michael Xie and Tengyu Ma},
  journal = {arXiv},
  title = {Why Do Pretrained Language Models Help in Downstream Tasks?
An Analysis of Head and Prompt Tuning}, year = {2021}, } @misc{rong2021extrapolating, author = {Frieda Rong}, title = {Extrapolating to Unnatural Language Processing with {GPT-3}'s In-context Learning: The Good, the Bad, and the Mysterious}, year = {2021}, } @article{pires2016multiclass, author = {Bernardo Ávila Pires and Csaba Szepesvári}, journal = {arXiv}, title = {Multiclass Classification Calibration Functions}, year = {2016}, } @article{steinwart2007how, author = {Ingo Steinwart}, journal = {Constructive Approximation}, title = {How to Compare Different Loss Functions and Their Risks}, volume = {26}, year = {2007}, } @inproceedings{chiu2020scaling, author = {Justin T. Chiu and Alexander M. Rush}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, title = {Scaling Hidden {Markov} Language Models}, year = {2020}, } @inproceedings{ravi2017metalearning, author = {Sachin Ravi and Hugo Larochelle}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {Optimization as a Model for Few-shot Learning}, year = {2017}, } @inproceedings{holtzman2020curious, author = {Ari Holtzman and Jan Buys and Li Du and Maxwell Forbes and Yejin Choi}, booktitle = {International Conference on Learning Representations (ICLR)}, title = {The Curious Case of Neural Text Degeneration}, year = {2020}, } @article{jones2004markov, author = {Galin L. Jones}, journal = {Probability Surveys}, title = {On the {Markov} chain central limit theorem}, volume = {1}, year = {2004}, } @inproceedings{zhao2021calibrate, author = {Tony Z. 
Zhao and Eric Wallace and Shi Feng and Dan Klein and Sameer Singh},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Calibrate Before Use: Improving Few-Shot Performance of Language Models},
  year = {2021},
}

@inproceedings{kuhn1994hmm,
  author = {Thomas Kuhn and Heinrich Niemann and Ernst Gunter Schukat-Talamazzini},
  booktitle = {International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  title = {Ergodic hidden {Markov} models and polygrams for language modeling},
  year = {1994},
}

@inproceedings{tu2019benchmarking,
  author = {Lifu Tu and Kevin Gimpel},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  title = {Benchmarking Approximate Inference Methods for Neural Structured Prediction},
  year = {2019},
}

@inproceedings{power2021grokking,
  author = {Alethea Power and Yuri Burda and Harri Edwards and Igor Babuschkin and Vedant Misra},
  booktitle = {International Conference on Learning Representations Workshop (ICLR)},
  title = {Grokking: Generalization beyond overfitting on small algorithmic datasets},
  year = {2021},
}

@inproceedings{jiang2020how,
  author = {Zhengbao Jiang and Frank F Xu and Jun Araki and Graham Neubig},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {How can we know what language models know?},
  year = {2020},
}

@article{gunst2008asymptotic,
  author = {M. Gunst and O.
Shcherbakova}, journal = {Mathematical Methods of Statistics}, title = {Asymptotic behavior of {Bayes} estimators for hidden {Markov} models with application to ion channels}, volume = {17}, year = {2008}, } @misc{wang2021gptj, author = {Wang, Ben and Komatsuzaki, Aran}, title = {{GPT}-{J}-{6B}: A 6 Billion Parameter Autoregressive Language Model}, year = {2021}, } @article{baum1966statistical, author = {Baum, Leonard E and Petrie, Ted}, journal = {The Annals of Mathematical Statistics}, title = {Statistical inference for probabilistic functions of finite state {Markov} chains}, volume = {37}, year = {1966}, } @article{sanh2021multitask, author = {Victor Sanh and Albert Webson and Colin Raffel and Stephen H. Bach and Lintang Sutawika and Zaid Alyafeai and Antoine Chaffin and Arnaud Stiegler and Teven Le Scao and Arun Raja and Manan Dey and M Saiful Bari and Canwen Xu and Urmish Thakker and Shanya Sharma Sharma and Eliza Szczechla and Taewoon Kim and Gunjan Chhablani and Nihal Nayak and Debajyoti Datta and Jonathan Chang and Mike Tian-Jian Jiang and Han Wang and Matteo Manica and Sheng Shen and Zheng Xin Yong and Harshit Pandey and Rachel Bawden and Thomas Wang and Trishala Neeraj and Jos Rozen and Abheesht Sharma and Andrea Santilli and Thibault Fevry and Jason Alan Fries and Ryan Teehan and Stella Biderman and Leo Gao and Tali Bers and Thomas Wolf and Alexander M. Rush}, journal = {arXiv}, title = {Multitask Prompted Training Enables Zero-Shot Task Generalization}, year = {2021}, } @inproceedings{clark2020electra, author = {Kevin Clark and Minh-Thang Luong and Quoc V. Le and Christopher D. 
Manning},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {ELECTRA: Pre-training Text Encoders as Discriminators Rather Than Generators},
  year = {2020},
}

@inproceedings{gruber2007hidden,
  author = {Gruber, Amit and Weiss, Yair and Rosen-Zvi, Michal},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  title = {Hidden Topic {Markov} Models},
  year = {2007},
}

@inproceedings{dosovitskiy2021vit,
  author = {Alexey Dosovitskiy and Lucas Beyer and Alexander Kolesnikov and Dirk Weissenborn and Xiaohua Zhai and Thomas Unterthiner and Mostafa Dehghani and Matthias Minderer and Georg Heigold and Sylvain Gelly and Jakob Uszkoreit and Neil Houlsby},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale},
  year = {2021},
}

@article{gao2020pile,
  author = {Leo Gao and Stella Biderman and Sid Black and Laurence Golding and Travis Hoppe and Charles Foster and Jason Phang and Horace He and Anish Thite and Noa Nabeshima and Shawn Presser and Connor Leahy},
  journal = {arXiv},
  title = {The Pile: An 800GB Dataset of Diverse Text for Language Modeling},
  year = {2020},
}

@inproceedings{yao2022scratch,
  author = {Xingcheng Yao and Yanan Zheng and Xiaocong Yang and Zhilin Yang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {{NLP} From Scratch Without Large-Scale Pretraining: A Simple and Efficient Framework},
  year = {2022},
}

@inproceedings{joulin2017bag,
  author = {Armand Joulin and Edouard Grave and Piotr Bojanowski and Tomas Mikolov},
  booktitle = {European Chapter of the Association for Computational Linguistics (EACL)},
  title = {Bag of Tricks for Efficient Text Classification},
  volume = {2},
  year = {2017},
}

@inproceedings{lee2022dedup,
  author = {Katherine Lee and Daphne Ippolito and Andrew Nystrom and Chiyuan Zhang and Douglas Eck and Chris Callison-Burch and Nicholas Carlini},
  booktitle = {Association for Computational
Linguistics (ACL)}, title = {Deduplicating Training Data Makes Language Models Better}, year = {2022}, } @article{hernandez2022repeated, author = {Danny Hernandez and Tom Brown and Tom Conerly and Nova DasSarma and Dawn Drain and Sheer El-Showk and Nelson Elhage and Zac Hatfield-Dodds and Tom Henighan and Tristan Hume and Scott Johnston and Ben Mann and Chris Olah and Catherine Olsson and Dario Amodei and Nicholas Joseph and Jared Kaplan and Sam McCandlish}, journal = {arXiv}, title = {Scaling Laws and Interpretability of Learning from Repeated Data}, year = {2022}, } @article{baevski2019cloze, author = {Alexei Baevski and Sergey Edunov and Yinhan Liu and Luke Zettlemoyer and Michael Auli}, journal = {arXiv}, title = {Cloze-driven Pretraining of Self-attention Networks}, year = {2019}, } @article{sorscher2022beyond, author = {Ben Sorscher and Robert Geirhos and Shashank Shekhar and Surya Ganguli and Ari S. Morcos}, journal = {arXiv}, title = {Beyond neural scaling laws: beating power law scaling via data pruning}, year = {2022}, } @inproceedings{mindermann2022prioritized, author = {Sören Mindermann and Jan Brauner and Muhammed Razzak and Mrinank Sharma and Andreas Kirsch and Winnie Xu and Benedikt Höltgen and Aidan N. 
Gomez and Adrien Morisot and Sebastian Farquhar and Yarin Gal},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Prioritized Training on Points that are Learnable, Worth Learning, and Not Yet Learnt},
  year = {2022},
}

@inproceedings{kaushal2019learning,
  author = {Vishal Kaushal and Rishabh Iyer and Suraj Kothawade and Rohan Mahadev and Khoshrav Doctor and Ganesh Ramakrishnan},
  booktitle = {IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  title = {Learning From Less Data: A Unified Data Subset Selection and Active Learning Framework for Computer Vision},
  year = {2019},
}

@inproceedings{killamsetty2021retrieve,
  author = {Krishnateja Killamsetty and Xujiang Zhao and Feng Chen and Rishabh Iyer},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {RETRIEVE: Coreset Selection for Efficient and Robust Semi-Supervised Learning},
  year = {2021},
}

@inproceedings{killamsetty2021gradmatch,
  author = {Krishnateja Killamsetty and Durga S and Ganesh Ramakrishnan and Abir De and Rishabh Iyer},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {{GRAD-MATCH}: Gradient Matching based Data Subset Selection for Efficient Deep Model Training},
  year = {2021},
}

@inproceedings{wang2020optimizing,
  author = {Xinyi Wang and Hieu Pham and Paul Michel and Antonios Anastasopoulos and Jaime Carbonell and Graham Neubig},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Optimizing Data Usage via Differentiable Rewards},
  year = {2020},
}

@inproceedings{wei2015submodular,
  author = {Kai Wei and Rishabh Iyer and Jeff Bilmes},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Submodularity in Data Subset Selection and Active Learning},
  year = {2015},
}

@inproceedings{killamsetty2021glister,
  author = {Krishnateja Killamsetty and Durga Sivasubramanian and Ganesh Ramakrishnan and Rishabh Iyer},
  booktitle = {Association for the Advancement of Artificial
Intelligence (AAAI)}, title = {GLISTER: Generalization based Data Subset Selection for Efficient and Robust Learning}, year = {2021}, }

% This paper appeared at NeurIPS 2021, not AAAI.
@inproceedings{paul2021diet,
  author = {Mansheej Paul and Surya Ganguli and Gintare Karolina Dziugaite},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title = {Deep Learning on a Data Diet: Finding Important Examples Early in Training},
  year = {2021},
}

@inproceedings{mirzasoleiman2020coresets,
  author = {Baharan Mirzasoleiman and Jeff Bilmes and Jure Leskovec},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Coresets for Data-efficient Training of Machine Learning Models},
  year = {2020},
}

% NOTE(review): volume 27 of this journal is the 1997 volume, so the year is
% 1997; the citation key keeps its historical 1999 so existing cites resolve.
@article{musser1999introspective,
  author = {David R. Musser},
  journal = {Software: Practice and Experience},
  title = {Introspective Sorting and Selection Algorithms},
  volume = {27},
  year = {1997},
}

@inproceedings{kool2019stochastic,
  author = {Wouter Kool and Herke van Hoof and Max Welling},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Stochastic Beams and Where to Find Them: The {Gumbel}-Top-{k} Trick for Sampling Sequences Without Replacement},
  year = {2019},
}

@inproceedings{xie2019subset,
  author = {Sang Michael Xie and Stefano Ermon},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  title = {Reparameterizable Subset Sampling via Continuous Relaxations},
  year = {2019},
}

@misc{vieira2014gumbel,
  author = {Tim Vieira},
  title = {{Gumbel}-max trick and weighted reservoir sampling},
  year = {2014},
}

@inproceedings{kim2016exact,
  author = {Carolyn Kim and Ashish Sabharwal and Stefano Ermon},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title = {Exact sampling with integer linear programs and random perturbations},
  year = {2016},
}

@article{kringelum2016chemprot, author = {Jens Kringelum and Sonny Kim Kjærulff and Søren Brunak and Ole Lund and Tudor I.
Oprea and Olivier Taboureau}, journal = {Database}, title = {ChemProt-3.0: a global chemical biology diseases mapping}, year = {2016}, }

% IJCNLP is a conference: inproceedings with the venue in booktitle.
% PubMed and RCT are braced so sentence-casing styles keep their capitals.
@inproceedings{dernoncourt2017rct,
  author = {Franck Dernoncourt and Ji Young Lee},
  booktitle = {International Joint Conference on Natural Language Processing (IJCNLP)},
  title = {{PubMed} 200k {RCT}: a dataset for sequential sentence classification in medical abstracts},
  year = {2017},
}

@article{jurgens2018citation,
  author = {David Jurgens and Srijan Kumar and Raine Hoover and Daniel A. McFarland and Dan Jurafsky},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  title = {Measuring the evolution of a scientific field through citation frames},
  volume = {6},
  year = {2018},
}

@inproceedings{luan2018scierc,
  author = {Yi Luan and Luheng He and Mari Ostendorf and Hannaneh Hajishirzi},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Multi-task identification of entities, relations, and coreference for scientific knowledge graph construction},
  year = {2018},
}

% SemEval is a workshop: inproceedings with the venue in booktitle.
@inproceedings{kiesel2019hyp,
  author = {Johannes Kiesel and Maria Mestre and Rishabh Shukla and Emmanuel Vincent and Payam Adineh and David Corney and Benno Stein and Martin Potthast},
  booktitle = {International Workshop on Semantic Evaluation (SemEval)},
  title = {{SemEval}-2019 {Task} 4: Hyperpartisan News Detection},
  year = {2019},
}

% SIGIR is a conference: inproceedings, with the venue written out the way
% the other SIGIR entries in this file name it.
@inproceedings{mcauley2015amazon,
  author = {Julian McAuley and Christopher Targett and Qinfeng Shi and Anton van den Hengel},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  title = {Image-based Recommendations on Styles and Substitutes},
  year = {2015},
}

@article{razeghi2022impact, author = {Yasaman Razeghi and Robert L.
{Logan IV} and Matt Gardner and Sameer Singh}, journal = {arXiv}, title = {Impact of Pretraining Term Frequencies on Few-Shot Reasoning}, year = {2022}, }
% In the entry above the surname and its generational suffix are braced
% together (same convention as {Grissom II} in he2015syntax); unbraced, BibTeX
% takes the last token, IV, as the family name.

@inproceedings{izsak2021how,
  author = {Peter Izsak and Moshe Berchansky and Omer Levy},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {How to Train {BERT} with an Academic Budget},
  year = {2021},
}

@inproceedings{katharopoulos2018not,
  author = {Angelos Katharopoulos and François Fleuret},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Not All Samples Are Created Equal: Deep Learning with Importance Sampling},
  year = {2018},
}

@inproceedings{alain2016variance,
  author = {Guillaume Alain and Alex Lamb and Chinnadhurai Sankar and Aaron Courville and Yoshua Bengio},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title = {Variance Reduction in {SGD} by Distributed Importance Sampling},
  year = {2016},
}

@article{bordes2005fast,
  author = {Antoine Bordes and Seyda Ertekin and Jason Weston and Leon Bottou},
  journal = {Journal of Machine Learning Research (JMLR)},
  title = {Fast Kernel Classifiers with Online and Active Learning},
  volume = {6},
  year = {2005},
}

@article{richtarik2013optimal,
  author = {Peter Richtárik and Martin Takáč},
  journal = {arXiv},
  title = {On Optimal Probabilities in Stochastic Coordinate Descent Methods},
  year = {2013},
}

@inproceedings{zhao2015stochastic,
  author = {Peilin Zhao and Tong Zhang},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Stochastic Optimization with Importance Sampling for Regularized Loss Minimization},
  year = {2015},
}

@inproceedings{bengio2009curriculum,
  author = {Yoshua Bengio and Jerome Louradour and Ronan Collobert and Jason Weston},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Curriculum Learning},
  year = {2009},
}

@inproceedings{serra2015discriminative, author = {Edgar Simo-Serra and Eduard Trulls and Luis Ferraz and Iasonas
Kokkinos and Pascal Fua and Francesc Moreno-Noguer}, booktitle = {International Conference on Computer Vision (ICCV)}, title = {Discriminative Learning of Deep Convolutional Feature Point Descriptors}, year = {2015}, }

% The system name is braced so sentence-casing styles keep its inner capital.
@inproceedings{schroff2015facenet,
  author = {Florian Schroff and Dmitry Kalenichenko and James Philbin},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  title = {{FaceNet}: A Unified Embedding for Face Recognition and Clustering},
  year = {2015},
}

@inproceedings{loshchilov2016online,
  author = {Ilya Loshchilov and Frank Hutter},
  booktitle = {International Conference on Learning Representations Workshop (ICLR)},
  title = {Online batch selection for faster training of neural networks},
  year = {2016},
}

@article{kaplan2020scaling,
  author = {Jared Kaplan and Sam McCandlish and Tom Henighan and Tom B. Brown and Benjamin Chess and Rewon Child and Scott Gray and Alec Radford and Jeffrey Wu and Dario Amodei},
  journal = {arXiv},
  title = {Scaling Laws for Neural Language Models},
  year = {2020},
}

% The corpus acronym and its expansion are proper names; both are braced.
@inproceedings{lo2020s2orc,
  author = {Kyle Lo and Lucy Lu Wang and Mark Neumann and Rodney Kinney and Daniel S. Weld},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {{S2ORC}: The {Semantic Scholar Open Research Corpus}},
  year = {2020},
}

@article{bengtsson2008curse,
  author = {Thomas Bengtsson and Peter Bickel and Bo Li},
  journal = {arXiv},
  title = {Curse-of-dimensionality revisited: Collapse of the particle filter in very large scale systems},
  year = {2008},
}

@article{snyder2008obstacles,
  author = {Chris Snyder and Thomas Bengtsson and Peter Bickel and Jeff Anderson},
  journal = {Mathematical Advances in Data Assimilation (MADA)},
  title = {Obstacles to High-Dimensional Particle Filtering},
  year = {2008},
}

@article{rubin1988sir, author = {Donald B.
Rubin}, journal = {Bayesian Statistics}, title = {Using the {SIR} Algorithm to Simulate Posterior Distributions}, year = {1988}, }

@article{gelman2004applied,
  author = {Andrew Gelman and Xiao-Li Meng},
  journal = {Wiley Series in Probability and Statistics},
  title = {Applied {Bayesian} modeling and causal inference from incomplete-data perspectives},
  year = {2004},
}

@inproceedings{weinberger2009feature,
  author = {Kilian Weinberger and Anirban Dasgupta and John Langford and Alex Smola and Josh Attenberg},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Feature Hashing for Large Scale Multitask Learning},
  year = {2009},
}

% NOTE(review): the article is Psychological Review 93(1), pages 3--22; the
% former page range 1--3 looks like the issue and first page run together.
@article{tversky1986nearest,
  author = {Amos Tversky and J. Wesley Hutchinson},
  journal = {Psychological Review},
  number = {1},
  pages = {3--22},
  title = {Nearest neighbor analysis of psychological spaces},
  volume = {93},
  year = {1986},
}

@inproceedings{gershman2015phrase,
  author = {Samuel J. Gershman and Joshua B. Tenenbaum},
  booktitle = {CogSci},
  title = {Phrase similarity in humans and machines},
  year = {2015},
}

@article{wood1994simulation, author = {Andrew T.
Wood}, journal = {Communications in Statistics - Simulation and Computation}, pages = {157--164}, title = {Simulation of the {von Mises Fisher} distribution}, year = {1994}, }
% In the entry above the distribution name is braced so sentence-casing styles
% keep the capitals of the two surnames; the journal name is capitalised.

@inproceedings{mueller2017sequence,
  author = {Jonas Mueller and David Gifford and Tommi Jaakkola},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {2536--2544},
  title = {Sequence to better sequence: continuous revision of combinatorial structures},
  year = {2017},
}

@inproceedings{athanasopoulou2014low,
  author = {Georgia Athanasopoulou and Elias Iosif and Alexandros Potamianos},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages = {731--740},
  title = {Low-Dimensional Manifold Distributional Semantic Models},
  year = {2014},
}

% First author's given name is Nicholas.
@inproceedings{andrews2012name,
  author = {Nicholas Andrews and Jason Eisner and Mark Dredze},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {344--355},
  title = {Name phylogeny: A generative model of string variation},
  year = {2012},
}

@inproceedings{alexandrescu2009graph,
  author = {Andrei Alexandrescu and Katrin Kirchhoff},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {119--127},
  title = {Graph-based learning for statistical machine translation},
  year = {2009},
}

@inproceedings{agirre2014semeval,
  author = {Eneko Agirre and Carmen Banea and Claire Cardie and Daniel M Cer and Mona T Diab and Aitor Gonzalez-Agirre and Weiwei Guo and Rada Mihalcea and German Rigau and Janyce Wiebe},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages = {81--91},
  title = {Sem{E}val-2014 {T}ask 10: Multilingual Semantic Textual Similarity},
  year = {2014},
}

@article{song2016retrieval,
  author = {Yiping Song and Rui Yan and Xiang Li and Dongyan Zhao and Ming Zhang},
  journal = {arXiv preprint arXiv:1610.07149},
  title = {Two are Better than One: An Ensemble of Retrieval- and Generation-Based Dialog Systems},
  year = {2016},
}
@inproceedings{hu2017toward,
  author = {Zhiting Hu and Zichao Yang and Xiaodan Liang and Ruslan Salakhutdinov and Eric P Xing},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Toward Controlled Generation of Text},
  year = {2017},
}

@article{ficler2017controlling,
  author = {Jessica Ficler and Yoav Goldberg},
  journal = {arXiv preprint arXiv:1707.02633},
  title = {Controlling Linguistic Style Aspects in Natural Language Generation},
  year = {2017},
}

% The particle "de" is lowercase so BibTeX parses it as the von part of the
% surname (de Silva); capitalised, it is treated as a second given name.
@article{tenenbaum2000global,
  author = {Joshua B Tenenbaum and Vin de Silva and John C Langford},
  journal = {Science},
  pages = {2319--2323},
  title = {A Global Geometric Framework for Nonlinear Dimensionality Reduction},
  year = {2000},
}

@article{hashimoto2016word,
  author = {Tatsunori B Hashimoto and David Alvarez-Melis and Tommi S Jaakkola},
  journal = {Transactions of the Association for Computational Linguistics (TACL)},
  pages = {273--286},
  title = {Word Embeddings as Metric Recovery in Semantic Spaces},
  volume = {4},
  year = {2016},
}

@inproceedings{heafield2013scalable, author = {Kenneth Heafield and Ivan Pouzyrevsky and Jonathan H.
Clark and Philipp Koehn}, booktitle = {Association for Computational Linguistics (ACL)}, pages = {690--696}, title = {Scalable Modified {K}neser-{N}ey Language Model Estimation}, year = {2013}, }
% The title above must not start with a space: sentence-casing styles only
% preserve the very first character, so a leading blank lowercases the S.

@misc{yelp2017yelp,
  author = {Yelp},
  howpublished = {\url{https://www.yelp.com/dataset_challenge}},
  title = {Yelp {D}ataset {C}hallenge, {R}ound 8},
  year = {2017},
}

% Koehn's given name is spelled Philipp, as in heafield2013scalable.
@article{chelba2013one,
  author = {Ciprian Chelba and Tomas Mikolov and Mike Schuster and Qi Ge and Thorsten Brants and Philipp Koehn and Tony Robinson},
  journal = {arXiv preprint arXiv:1312.3005},
  title = {One Billion Word Benchmark for Measuring Progress in Statistical Language Modeling},
  year = {2013},
}

% Initials are separated so styles that abbreviate given names see two of them.
@article{gu2017search,
  author = {Jiatao Gu and Yong Wang and Kyunghyun Cho and Victor O. K. Li},
  journal = {arXiv preprint arXiv:1705.07267},
  title = {Search Engine Guided Non-Parametric Neural Machine Translation},
  year = {2017},
}

@article{hayes1986writing,
  author = {John R Hayes and Linda S Flower},
  journal = {American Psychologist},
  number = {10},
  pages = {1106--1113},
  title = {Writing research and the writer},
  volume = {41},
  year = {1986},
}

@inproceedings{mikolov2013linguistic,
  author = {Tomas Mikolov and Wen-tau Yih and Geoffrey Zweig},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages = {746--751},
  title = {Linguistic regularities in continuous space word representations},
  volume = {13},
  year = {2003},
}

% Journal name matches bordes2005fast; the placeholder issue number 0 is
% dropped because it would print as a bogus issue.
@article{bengio2003neural,
  author = {Yoshua Bengio and Rejean Ducharme and Pascal Vincent and Christian Jauvin},
  journal = {Journal of Machine Learning Research (JMLR)},
  pages = {1137--1155},
  title = {A neural probabilistic language model},
  volume = {3},
  year = {2003},
}

@inproceedings{he2015syntax, author = {He He and Alvin {Grissom II} and Jordan Boyd-Graber and Hal {Daum{\'e} III}}, booktitle = {Empirical Methods in Natural Language Processing (EMNLP)}, pages = {55--64}, title = {Syntax-based Rewriting for Simultaneous
Machine Translation}, year = {2015}, }

@article{parzen1962,
  author = {Emanuel Parzen},
  journal = {Annals of Mathematical Statistics},
  pages = {1065--1076},
  title = {On Estimation of a Probability Density Function and Mode},
  volume = {33},
  year = {1962},
}

% Title punctuation restored (colon, hyphenated End-to-End); the system and
% language names are braced against sentence casing.
@inproceedings{amodei2016,
  author = {Dario Amodei and others},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {173--182},
  title = {{Deep Speech 2}: End-to-End Speech Recognition in {English} and {Mandarin}},
  year = {2016},
}

% Full published title; the former value kept only the subtitle.
@article{chouldechova2017,
  author = {Alexandra Chouldechova},
  journal = {Big Data},
  pages = {153--163},
  title = {Fair prediction with disparate impact: A study of bias in recidivism prediction instruments},
  year = {2017},
}

@inproceedings{joseph2016,
  author = {Matthew Joseph and Michael Kearns and Jamie Morgenstern and Seth Neel and Aaron Roth},
  booktitle = {FATML},
  title = {Rawlsian Fairness for Machine Learning},
  year = {2016},
}

@inproceedings{jabbari2017,
  author = {Shahin Jabbari and Matthew Joseph and Michael Kearns and Jamie Morgenstern and Aaron Roth},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1617--1626},
  title = {Fairness in Reinforcement Learning},
  year = {2017},
}

@inproceedings{woodworth2017,
  author = {Blake Woodworth and Suriya Gunasekar and Mesrob I. Ohannessian and Nathan Srebro},
  booktitle = {Conference on Learning Theory (COLT)},
  pages = {1920--1953},
  title = {Learning Non-Discriminatory Predictors},
  year = {2017},
}

% Third author is Solon Barocas, spelled as in barocas2016.
@article{kroll2017, author = {Joshua A. Kroll and Joanna Huey and Solon Barocas and Edward W. Felten and Joel R.
Reidenberg and David G Robinson and Harlan Yu}, journal = {University of Pennsylvania Law Review}, number = {3}, pages = {633--706}, title = {Accountable Algorithms}, volume = {165}, year = {2017}, }
% NOTE(review): the entry above is 165 U. Pa. L. Rev. 633; the former volume 3
% is kept as the issue number -- confirm the issue against the journal.

@book{rawls2009,
  author = {John Rawls},
  publisher = {Harvard University Press},
  title = {A theory of justice: Revised edition},
  year = {2009},
}

@book{rawls2001,
  author = {John Rawls},
  publisher = {Harvard University Press},
  title = {Justice as fairness: a restatement},
  year = {2001},
}

@article{duchi2016,
  author = {John Duchi and Peter Glynn and Hongseok Namkoong},
  journal = {arXiv},
  title = {Statistics of Robust Optimization: A Generalized Empirical Likelihood Approach},
  year = {2016},
}

@inproceedings{kula2015,
  author = {Maciej Kula},
  booktitle = {Proceedings of the 2nd Workshop on New Trends on Content-Based Recommender Systems},
  pages = {14--21},
  title = {Metadata Embeddings for User and Item Cold-start Recommendations},
  year = {2015},
}

@techreport{grother2011,
  author = {Patrick J. Grother and George W. Quinn and P. Jonathon Phillips},
  institution = {NIST},
  title = {Report on the Evaluation of 2D Still-Image Face Recognition Algorithms},
  year = {2011},
}

% No leading blank in the title: sentence-casing styles preserve only the
% first character, so a leading space would lowercase the first word.
@article{harsanyi1975,
  author = {John C. Harsanyi},
  journal = {The American Political Science Review},
  pages = {594--606},
  title = {Can the Maximin Principle Serve as a Basis for Morality? A Critique of John Rawls's Theory},
  volume = {69},
  year = {1975},
}

% Third author's surname is Willett.
@article{mueller1974,
  author = {Dennis C. Mueller and Robert D. Tollison and Thomas D. Willett},
  journal = {Theory and Decision},
  pages = {345--367},
  title = {The Utilitarian Contract: A Generalization of Rawls' Theory of Justice},
  volume = {4},
  year = {1974},
}

% Initials are written separately so each is recognised as a given name.
@article{altham1973, author = {J. E. J.
Altham}, journal = {Philosophy}, pages = {75--78}, title = {Rawls' Difference Principle}, volume = {48}, year = {1973}, }

@inproceedings{sapiezynski2017,
  author = {Piotr Sapiezynski and Valentin Kassarnig and Christo Wilson and Sune Lehmann and Alan Mislove},
  booktitle = {FATREC},
  pages = {48--51},
  title = {Academic performance prediction in a gender-imbalanced environment},
  volume = {1},
  year = {2017},
}

@inproceedings{tatman2017,
  author = {Rachael Tatman},
  booktitle = {Workshop on Ethics in Natural Language Processing},
  pages = {53--59},
  title = {Gender and Dialect Bias in {Y}ou{T}ube's Automatic Captions},
  volume = {1},
  year = {2017},
}

@inproceedings{jurgens2017,
  author = {David Jurgens and Yulia Tsvetkov and Dan Jurafsky},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {51--57},
  title = {Incorporating Dialectal Variability for Socially Equitable Language Identification},
  year = {2017},
}

% NOTE(review): published title reads "... Correlates with Author Age".
@inproceedings{hovy2015,
  author = {Dirk Hovy and Anders Søgaard},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {483--488},
  title = {Tagging Performance Correlates with Author Age},
  year = {2015},
}

@inproceedings{jorgensen2015,
  author = {Anna Katrine Jørgensen and Dirk Hovy and Anders Søgaard},
  booktitle = {ACL Workshop on Noisy User-generated Text},
  pages = {9--18},
  title = {Challenges of studying and processing dialects in social media},
  year = {2015},
}

@inproceedings{blodgett2016,
  author = {Su Lin Blodgett and Lisa Green and Brendan O'Connor},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1119--1130},
  title = {Demographic Dialectal Variation in Social Media: A Case Study of {A}frican-{A}merican {E}nglish},
  year = {2016},
}

@article{barocas2016, author = {Solon Barocas and Andrew D.
Selbst}, journal = {California Law Review}, number = {3}, pages = {671--732}, title = {Big Data's Disparate Impact}, volume = {104}, year = {2016}, }
% In the entry above, 104 is the volume (it was embedded in the journal name)
% and the former volume value 3 is the issue number.

@inproceedings{kusner2017,
  author = {Matt J Kusner and Joshua R Loftus and Chris Russell and Ricardo Silva},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {4069--4079},
  title = {Counterfactual Fairness},
  year = {2017},
}

@inproceedings{dwork2012,
  author = {Cynthia Dwork and Moritz Hardt and Toniann Pitassi and Omer Reingold and Rich Zemel},
  booktitle = {Innovations in Theoretical Computer Science (ITCS)},
  pages = {214--226},
  title = {Fairness through awareness},
  year = {2012},
}

@inproceedings{feldman2015,
  author = {Michael Feldman and Sorelle Friedler and John Moeller and Carlos Scheidegger and Suresh Venkatasubramanian},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages = {259--268},
  title = {Certifying and removing disparate impact},
  year = {2015},
}

% Third author is Nathan Srebro, spelled as in woodworth2017.
@inproceedings{hardt2016,
  author = {Moritz Hardt and Eric Price and Nathan Srebro},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {3315--3323},
  title = {Equality of Opportunity in Supervised Learning},
  year = {2016},
}

@inproceedings{kleinberg2017,
  author = {Jon Kleinberg and Sendhil Mullainathan and Manish Raghavan},
  booktitle = {Innovations in Theoretical Computer Science (ITCS)},
  title = {Inherent Trade-offs in the Fair Determination of Risk Scores},
  year = {2017},
}

@inproceedings{pleiss2017, author = {Geoff Pleiss and Manish Raghavan and Felix Wu and Jon Kleinberg and Kilian Q.
Weinberger}, booktitle = {Advances in Neural Information Processing Systems (NeurIPS)}, pages = {5684--5693}, title = {On Fairness and Calibration}, year = {2017}, }

% Two ICML papers and two arXiv preprints; the preprints carry their arXiv
% identifier inside the journal string.
@inproceedings{kearns2018preventing,
  author = {Michael Kearns and Seth Neel and Aaron Roth and Zhiwei Steven Wu},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {2564--2572},
  title = {Preventing fairness gerrymandering: Auditing and learning for subgroup fairness},
  year = {2018},
}

@article{hebertjohnson2017,
  author = {{\'U}rsula H{\'e}bert-Johnson and Michael P. Kim and Omer Reingold and Guy N. Rothblum},
  journal = {arXiv preprint arXiv:1711.08513},
  title = {Calibration for the (Computationally-Identifiable) Masses},
  year = {2017},
}

@inproceedings{zemel2013,
  author = {Richard Zemel and Yu Wu and Kevin Swersky and Toniann Pitassi and Cynthia Dwork},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {325--333},
  title = {Learning Fair Representations},
  year = {2013},
}

@article{cifka2018,
  author = {Ondřej Cífka and Aliaksei Severyn and Enrique Alfonseca and Katja Filippova},
  journal = {arXiv preprint arXiv:1804.07972},
  title = {Eval all, trust a few, do wrong to none: Comparing sentence generation models},
  year = {2018},
}

@article{davidson2018, author = {Tim R. Davidson and Luca Falorsi and Nicola De Cao and Thomas Kipf and Jakub M.
Tomczak}, journal = {arXiv preprint arXiv:1804.00891}, title = {Hyperspherical Variational Auto-Encoders}, year = {2018}, }

@article{stone1977,
  author = {Charles J Stone},
  journal = {Annals of Statistics},
  title = {Consistent Nonparametric Regression},
  volume = {5},
  year = {1977},
}

@inproceedings{andrew2013deep,
  author = {Galen Andrew and Raman Arora and Jeff Bilmes and Karen Livescu},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {1247--1255},
  title = {Deep canonical correlation analysis},
  year = {2013},
}

@inproceedings{yan2015deep,
  author = {Fei Yan and Krystian Mikolajczyk},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages = {3441--3450},
  title = {Deep correlation for matching images and text},
  year = {2015},
}

% Venue spelling: Retrieval.
@inproceedings{severyn2015learning,
  author = {Aliaksei Severyn and Alessandro Moschitti},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  pages = {373--382},
  title = {Learning to rank short text pairs with convolutional deep neural networks},
  year = {2015},
}

@article{tan2015lstm,
  author = {Ming Tan and Cicero dos Santos and Bing Xiang and Bowen Zhou},
  journal = {arXiv preprint arXiv:1511.04108},
  title = {{LSTM}-based deep learning models for non-factoid answer selection},
  year = {2015},
}

@inproceedings{srivastava2012multimodal,
  author = {Nitish Srivastava and Ruslan R Salakhutdinov},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {2222--2230},
  title = {Multimodal Learning with Deep {B}oltzmann Machines},
  year = {2012},
}

@inproceedings{green2013efficacy,
  author = {Spence Green and Jeffrey Heer and Christopher D Manning},
  booktitle = {Conference on Human Factors in Computing Systems (CHI)},
  pages = {439--448},
  title = {The efficacy of human post-editing for language translation},
  year = {2013},
}

@article{kalbfleisch1984least, author = {John David Kalbfleisch and Jerald F Lawless}, journal = {Canadian Journal of Statistics}, number = {3},
pages = {169--182}, title = {Least-squares estimation of transition probabilities from aggregate data}, volume = {12}, year = {1984}, }

@inproceedings{bernstein2016consistently,
  author = {Garrett Bernstein and Daniel Sheldon},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  pages = {1142--1150},
  title = {Consistently Estimating {M}arkov Chains with Noisy Aggregate Data},
  year = {2016},
}

% NOTE(review): stone1977 in this file records Annals of Statistics volume 5
% for 1977, so 1983 is volume 11; the former value 1 is kept as the issue.
% Lowercase particles let BibTeX parse "van der" as part of the surname.
@article{van1983estimation,
  author = {Adriaan P. van der Plas},
  journal = {Annals of Statistics},
  number = {1},
  pages = {78--85},
  title = {On the estimation of the parameters of {M}arkov probability models using macro data},
  volume = {11},
  year = {1983},
}

@book{king2013solution,
  author = {Gary King},
  publisher = {Princeton University Press},
  title = {A Solution to the Ecological Inference Problem: Reconstructing Individual Behavior from Aggregate Data},
  year = {2013},
}

@article{moffitt1993identification,
  author = {Robert Moffitt},
  journal = {Journal of Econometrics},
  number = {1},
  pages = {99--123},
  title = {Identification and estimation of dynamic models with a time series of repeated cross-sections},
  volume = {59},
  year = {1993},
}

@article{collado1997estimating,
  author = {M Dolores Collado},
  journal = {Journal of Econometrics},
  number = {1},
  pages = {37--62},
  title = {Estimating dynamic models from time series of independent cross-sections},
  volume = {82},
  year = {1997},
}

% Initials are separated so both are recognised as given-name initials.
@article{hawkins2000estimating,
  author = {D. L. Hawkins and Chien-Pai Han},
  journal = {Biometrics},
  number = {3},
  pages = {848--854},
  title = {Estimating transition probabilities from aggregate samples plus partial transition data},
  volume = {56},
  year = {2000},
}

% Venue spelling: Thirty-Fourth.
@inproceedings{charikar2002similarity,
  author = {Moses S Charikar},
  booktitle = {Proceedings of the Thirty-Fourth Annual {ACM} Symposium on Theory of Computing},
  pages = {380--388},
  title = {Similarity estimation techniques from rounding algorithms},
  year = {2002},
}

@book{stein2011fourier, author = {Elias M Stein and Rami Shakarchi}, publisher =
{Princeton University Press}, title = {Fourier Analysis: an Introduction}, volume = {1}, year = {2011}, }

% System name is DeepCoder; braced so sentence casing keeps the inner capital.
@article{balog2016deepcoder,
  author = {Matej Balog and Alexander L Gaunt and Marc Brockschmidt and Sebastian Nowozin and Daniel Tarlow},
  journal = {arXiv preprint arXiv:1611.01989},
  title = {{DeepCoder}: Learning to write programs},
  year = {2016},
}

@inproceedings{maddison2014structured,
  author = {Chris Maddison and Daniel Tarlow},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {649--657},
  title = {Structured generative models of natural source code},
  year = {2014},
}

@inproceedings{allamanis2015bimodal,
  author = {Miltos Allamanis and Daniel Tarlow and Andrew Gordon and Yi Wei},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages = {2123--2132},
  title = {Bimodal modelling of source code and natural language},
  year = {2015},
}

@inproceedings{hayati2018retrieval,
  author = {Shirley Anugrah Hayati and Raphael Olivier and Pravalika Avvaru and Pengcheng Yin and Anthony Tomasic and Graham Neubig},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Retrieval-based neural code generation},
  year = {2018},
}

@article{sun2018contextual,
  author = {Wen Sun and Alina Beygelzimer and Hal {Daum{\'e} III} and John Langford and Paul Mineiro},
  journal = {arXiv preprint arXiv:1807.06473},
  title = {Contextual memory trees},
  year = {2018},
}

% The acronym is braced so sentence-casing styles do not lowercase it.
@inproceedings{shen2018nash,
  author = {Dinghan Shen and Qinliang Su and Paidamoyo Chapfuwa and Wenlin Wang and Guoyin Wang and Ricardo Henao and Lawrence Carin},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages = {2041--2050},
  title = {{NASH}: Toward End-to-End Neural Architecture for Generative Semantic Hashing},
  year = {2018},
}

% Venue spelling: Retrieval.
@inproceedings{chaidaroon2017variational, author = {Suthee Chaidaroon and Yi Fang}, booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)}, pages = {75--84}, title = {Variational Deep Semantic Hashing for
Text Documents}, year = {2017}, }

@article{goldenshluger1997spatially,
  author = {Alexander Goldenshluger and Arkadi Nemirovski},
  journal = {Mathematical Methods of Statistics},
  pages = {135--170},
  title = {On spatially adaptive estimation of nonparametric regression},
  volume = {6},
  year = {1997},
}

@inproceedings{hu2018does,
  author = {Weihua Hu and Gang Niu and Issei Sato and Masashi Sugiyama},
  booktitle = {International Conference on Machine Learning (ICML)},
  title = {Does Distributionally Robust Supervised Learning Give Robust Classifiers?},
  year = {2018},
}

% Middle initials are separated so name-abbreviating styles see both of them.
@book{luo2012regularity,
  author = {Albert C. J. Luo},
  publisher = {Springer},
  title = {Regularity and complexity in dynamical systems},
  year = {2012},
}

@article{ensign2017runaway,
  author = {Danielle Ensign and Sorelle A Friedler and Scott Neville and Carlos Scheidegger and Suresh Venkatasubramanian},
  journal = {arXiv preprint arXiv:1706.09847},
  title = {Runaway feedback loops in predictive policing},
  year = {2017},
}

@techreport{fuster2017predictably, author = {Andreas Fuster and Paul Goldsmith-Pinkham and Tarun Ramadorai and Ansgar Walther}, institution = {CEPR Discussion Papers}, title = {Predictably Unequal?
The Effects of Machine Learning on Credit Markets}, year = {2017}, }

% Venue spelling: Retrieval.
@inproceedings{yan2016learning,
  author = {Rui Yan and Yiping Song and Hua Wu},
  booktitle = {ACM Special Interest Group on Information Retrieval (SIGIR)},
  pages = {55--64},
  title = {Learning to respond with deep neural networks for retrieval-based human-computer conversation system},
  year = {2016},
}

@inproceedings{lei2016semisupervised,
  author = {Tao Lei and Hrishikesh Joshi and Regina Barzilay and Tommi Jaakkola and Kateryna Tymoshenko and Alessandro Moschitti and Lluis Marquez},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages = {1279--1289},
  title = {Semi-supervised Question Retrieval with Gated Convolutions},
  year = {2016},
}

% Third author's given name is Shaohan (stray capital removed).
@article{wu2018response,
  author = {Yu Wu and Furu Wei and Shaohan Huang and Zhoujun Li and Ming Zhou},
  journal = {arXiv preprint arXiv:1806.07042},
  title = {Response Generation by Context-aware Prototype Editing},
  year = {2018},
}

@inproceedings{xu2018spherical,
  author = {Jiacheng Xu and Greg Durrett},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title = {Spherical Latent Spaces for Stable Variational Autoencoders},
  year = {2018},
}

@inproceedings{sumita1991experiments,
  author = {Eiichiro Sumita and Hitoshi Iida},
  booktitle = {Association for Computational Linguistics (ACL)},
  title = {Experiments and prospects of Example-Based Machine Translation},
  year = {1991},
}

% Math in a title is braced so sentence-casing styles do not lowercase the L.
@inproceedings{jiao2016minimax,
  author = {Jiantao Jiao and Yanjun Han and Tsachy Weissman},
  booktitle = {IEEE International Symposium on Information Theory},
  pages = {750--754},
  title = {Minimax estimation of the {$L_1$} distance},
  year = {2016},
}

@article{ali1966general, author = {S M Ali and Samuel David Silvey}, journal = {Journal of the Royal Statistical Society.
Series B (Methodological)}, title = {A General Class of Coefficients of Divergence of One Distribution from Another}, volume = {28}, year = {1966}, }

@article{balakrishnan2017hypothesis,
  author = {Sivaraman Balakrishnan and Larry Wasserman},
  journal = {arXiv preprint arXiv:1712.06120},
  title = {Hypothesis Testing for High-Dimensional Multinomials: A Selective Review},
  year = {2017},
}

% Surname carries its umlaut; written as UTF-8 like other names in this file.
@inproceedings{tolstikhin2016minimax,
  author = {Ilya Tolstikhin and Bharath K. Sriperumbudur and Bernhard Schölkopf},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {1930--1938},
  title = {Minimax Estimation of Maximum Mean Discrepancy With Radial Kernels},
  year = {2016},
}

% Last author's name carries its accents.
@inproceedings{singh2018nonparametric,
  author = {Shashank Singh and Ananya Uppal and Boyue Li and Chun-Liang Li and Manzil Zaheer and Barnabás Póczos},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages = {246--257},
  title = {Nonparametric Density Estimation under Adversarial Losses},
  year = {2018},
}

% The two-word surname De Waegenaere is braced; unbraced, the capitalised
% "De" is parsed as a second given name.
@article{bental2013robust,
  author = {Aharon Ben-Tal and Dick den Hertog and Anja {De Waegenaere} and Bertrand Melenberg and Gijs Rennen},
  journal = {Management Science},
  pages = {341--357},
  title = {Robust Solutions of Optimization Problems Affected by Uncertain Probabilities},
  volume = {59},
  year = {2013},
}

@article{duchi2021learning,
  author = {John Duchi and Hongseok Namkoong},
  journal = {Annals of Statistics},
  title = {Learning Models with Uniform Performance via Distributionally Robust Optimization},
  year = {2021},
}

@inproceedings{vaswani2013decoding,
  author = {Ashish Vaswani and Yinggong Zhao and Victoria Fossum and David Chiang},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages = {1387--1392},
  title = {Decoding with Large-Scale Neural Language Models Improves Translation},
  year = {2013},
}

@article{feder1994relations, author = {Meir Feder and Neri Merhav}, journal = {IEEE Transactions on Information Theory}, pages =
{259--266},
  title     = {Relations between entropy and error probability},
  volume    = {40},
  year      = {1994},
}

@article{sudhakar2015bayesian,
  author    = {Sudhakar Prasad},
  journal   = {IEEE Transactions on Information Theory},
  pages     = {5052--5062},
  title     = {{Bayesian} Error-Based Sequences of Statistical Information Bounds},
  volume    = {61},
  year      = {2015},
}

@inproceedings{kannan2016smart,
  author    = {Anjuli Kannan and Karol Kurach and Sujith Ravi and Tobias Kaufmann and Andrew Tomkins and Balint Miklos and Greg Corrado and Laszlo Lukacs and Marina Ganea and Peter Young and Vivek Ramavajjala},
  booktitle = {International Conference on Knowledge Discovery and Data Mining (KDD)},
  pages     = {955--964},
  title     = {Smart Reply: Automated Response Suggestion for Email},
  year      = {2016},
}

@inproceedings{levy2007speakers,
  author    = {Roger Levy and T. Florian Jaeger},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {849--856},
  title     = {Speakers optimize information density through syntactic reduction},
  year      = {2007},
}

@inproceedings{levy2018communicative,
  author    = {Roger Levy},
  booktitle = {Proceedings of the 40th Annual Meeting of the Cognitive Science Society},
  pages     = {684--689},
  title     = {Communicative Efficiency, Uniform Information Density, and the Rational Speech Act Theory},
  year      = {2018},
}

@inproceedings{fedus2018maskgan,
  author    = {William Fedus and Ian Goodfellow and Andrew M.
Dai},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {MaskGAN: Better Text Generation via Filling in the \_\_\_\_\_\_},
  year      = {2018},
}

@inproceedings{miao2016language,
  author    = {Yishu Miao and Phil Blunsom},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages     = {319--328},
  title     = {Language as a Latent Variable: Discrete Generative Models for Sentence Compression},
  year      = {2016},
}

@inproceedings{turner2005supervised,
  author    = {Jenine Turner and Eugene Charniak},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {290--297},
  title     = {Supervised and unsupervised learning for sentence compression},
  year      = {2005},
}

@inproceedings{filippova2013overcoming,
  author    = {Katja Filippova and Yasemin Altun},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  title     = {Overcoming the Lack of Parallel Data in Sentence Compression},
  year      = {2013},
}

@article{knight2002summarization,
  author    = {Kevin Knight and Daniel Marcu},
  journal   = {Artificial Intelligence},
  pages     = {91--107},
  title     = {Summarization beyond sentence extraction: A probabilistic approach to sentence compression},
  volume    = {139},
  year      = {2002},
}

@inproceedings{cohn2008sentence,
  author    = {Trevor Cohn and Mirella Lapata},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages     = {137--144},
  title     = {Sentence Compression Beyond Word Deletion},
  year      = {2008},
}

@inproceedings{fevry2018unsupervised,
  author    = {Thibault Fevry and Jason Phang},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  pages     = {413--422},
  title     = {Unsupervised Sentence Compression using Denoising Auto-Encoders},
  year      = {2018},
}

@inproceedings{yossef2011context,
  author    = {Ziv Bar-Yossef and Naama Kraus},
  booktitle = {World Wide Web (WWW)},
  pages     = {107--116},
  title     = {Context-sensitive query auto-completion},
  year      = {2011},
}

@book{hwang1979multiple,
  author    = {Ching-Lai Hwang and Abu Syed Md.
Masud},
  publisher = {Springer},
  title     = {Multiple Objective Decision Making Methods and Applications},
  year      = {1979},
}

@article{witten1987arithmetic,
  author    = {Ian H. Witten and Radford M. Neal and John G. Cleary},
  journal   = {Communications of the ACM},
  pages     = {520--540},
  title     = {Arithmetic coding for data compression},
  volume    = {30},
  year      = {1987},
}

@inproceedings{mccann2017learned,
  author    = {Bryan McCann and James Bradbury and Caiming Xiong and Richard Socher},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {6297--6308},
  title     = {Learned in translation: Contextualized word vectors},
  year      = {2017},
}

@inproceedings{wen2014robust,
  author    = {Junfeng Wen and Chun-Nam Yu and Russell Greiner},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {631--639},
  title     = {Robust Learning under Uncertain Test Distributions: Relating Covariate Shift to Model Misspecification},
  year      = {2014},
}

@inproceedings{hu2014polylingual,
  author    = {Yuening Hu and Ke Zhai and Vladimir Eidelman and Jordan Boyd-Graber},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {1166--1176},
  title     = {Polylingual Tree-Based Topic Models for Translation Domain Adaptation},
  year      = {2014},
}

@inproceedings{eidelman2012topic,
  author    = {Vladimir Eidelman and Jordan Boyd-Graber and Philip Resnik},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {115--119},
  title     = {Topic Models for Dynamic Translation Model Adaptation},
  year      = {2012},
}

@inproceedings{rakhlin2013optimization,
  author    = {Alexander Rakhlin and Karthik Sridharan},
  booktitle = {Conference on Learning Theory (COLT)},
  title     = {Optimization, Learning, and Games with Predictable Sequences},
  year      = {2013},
}

@inproceedings{namkoong2016stochastic,
  author    = {Hongseok Namkoong and John Duchi},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Stochastic Gradient Methods for Distributionally Robust Optimization with
f-Divergences},
  year      = {2016},
}

@article{peters2016causal,
  author    = {Jonas Peters and Peter B{\"u}hlmann and Nicolai Meinshausen},
  journal   = {Journal of the Royal Statistical Society. Series B (Statistical Methodology)},
  title     = {Causal inference by using invariant prediction: identification and confidence intervals},
  volume    = {78},
  year      = {2016},
}

@article{meinshausen2015maximin,
  author    = {Nicolai Meinshausen and Peter B{\"u}hlmann},
  journal   = {Annals of Statistics},
  title     = {Maximin effects in inhomogeneous large-scale data},
  volume    = {43},
  year      = {2015},
}

@article{rothenhausler2018anchor,
  author    = {Dominik Rothenh{\"a}usler and Peter B{\"u}hlmann and Nicolai Meinshausen and Jonas Peters},
  journal   = {arXiv preprint arXiv:1801.06229},
  title     = {Anchor regression: heterogeneous data meets causality},
  year      = {2018},
}

@article{buhlmann2016magging,
  author    = {Peter B{\"u}hlmann and Nicolai Meinshausen},
  journal   = {Proceedings of the IEEE},
  pages     = {126--135},
  title     = {Magging: maximin aggregation for inhomogeneous large-scale data},
  volume    = {104},
  year      = {2016},
}

@article{bertsimas2018data,
  author    = {Dimitris Bertsimas and Vishal Gupta and Nathan Kallus},
  journal   = {Mathematical Programming Series A},
  title     = {Data-driven robust optimization},
  volume    = {167},
  year      = {2018},
}

@inproceedings{lam2015quantifying,
  author    = {Henry Lam and Enlu Zhou},
  booktitle = {2015 Winter Simulation Conference},
  title     = {Quantifying Input Uncertainty in Stochastic Optimization},
  year      = {2015},
}

@inproceedings{shafieezadeh2015distributionally,
  author    = {Soroosh Shafieezadeh-Abadeh and Peyman Mohajerin Esfahani and Daniel Kuhn},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Distributionally Robust Logistic Regression},
  year      = {2015},
}

@article{lee2017minimax,
  author    = {Jaeho Lee and Maxim Raginsky},
  journal   = {arXiv preprint arXiv:1705.07815},
  title     = {Minimax Statistical Learning and Domain Adaptation with Wasserstein Distances},
  year      = {2017},
}

@misc{duchi2019distributionally,
  author    = {John Duchi and
Tatsunori Hashimoto and Hongseok Namkoong},
  howpublished = {\url{https://cs.stanford.edu/~thashim/assets/publications/condrisk.pdf}},
  title     = {Distributionally Robust Losses Against Mixture Covariate Shifts},
  year      = {2019},
}

@book{michele2004eliminating,
  author    = {Ver Ploeg, Michele and Perrin, Edward and {Panel on DHHS Collection of Race and Ethnic Data}},
  publisher = {National Academies Press},
  title     = {Eliminating Health Disparities: Measurement and Data Needs},
  year      = {2004},
}

@inproceedings{cho2014statmt,
  author    = {Kyunghyun Cho and Bart van Merrienboer and Caglar Gulcehre and Dzmitry Bahdanau and Fethi Bougares and Holger Schwenk and Yoshua Bengio},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages     = {1724--1734},
  title     = {Learning Phrase Representations using {RNN} Encoder-Decoder for Statistical Machine Translation},
  year      = {2014},
}

@inproceedings{ling2016latent,
  author    = {Wang Ling and Edward Grefenstette and Karl Moritz Hermann and Tom{\'a}{\v{s}} Ko{\v{c}}isk{\'y} and Andrew Senior and Fumin Wang and Phil Blunsom},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {599--609},
  title     = {Latent Predictor Networks for Code Generation},
  year      = {2016},
}

@inproceedings{yin2017syntactic,
  author    = {Pengcheng Yin and Graham Neubig},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {440--450},
  title     = {A Syntactic Neural Model for General-Purpose Code Generation},
  year      = {2017},
}

@inproceedings{dosovitskiy2016generating,
  author    = {Alexey Dosovitskiy and Thomas Brox},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {658--666},
  title     = {Generating Images with Perceptual Similarity Metrics based on Deep Networks},
  year      = {2016},
}

@inproceedings{krizhevsky2011verydeep,
  author    = {Alex Krizhevsky and Geoffrey E.
Hinton},
  booktitle = {19th European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning (ESANN)},
  pages     = {489--494},
  title     = {Using Very Deep Autoencoders for Content-Based Image Retrieval},
  year      = {2011},
}

@inproceedings{feng2014cross,
  author    = {Fangxiang Feng and Xiaojie Wang and Ruifan Li},
  booktitle = {Proceedings of the 22nd ACM International Conference on Multimedia},
  pages     = {7--16},
  title     = {Cross-modal Retrieval with Correspondence Autoencoder},
  year      = {2014},
}

@article{zhou2016community,
  author    = {Guangyou Zhou and Yin Zhou and Tingting He and Wensheng Wu},
  journal   = {Knowledge-Based Systems},
  pages     = {75--83},
  title     = {Learning semantic representation with neural networks for community question answering retrieval},
  year      = {2016},
}

@inproceedings{grover2017unfolding,
  author    = {Jeenu Grover and Pabitra Mitra},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {16--20},
  title     = {Sentence Alignment using Unfolding Recursive Autoencoders},
  year      = {2017},
}

@inproceedings{p2017latent,
  author    = {Deepak P and Dinesh Garg and Shirish Shevade},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages     = {855--865},
  title     = {Latent Space Embedding for Retrieval in Question-Answer Archives},
  year      = {2017},
}

@inproceedings{clinchant2013aggregating,
  author    = {St{\'e}phane Clinchant and Florent Perronnin},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {100--109},
  title     = {Aggregating Continuous Word Embeddings for Information Retrieval},
  year      = {2013},
}

@inproceedings{ganin2015domain,
  author    = {Yaroslav Ganin and Victor Lempitsky},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {1180--1189},
  title     = {Unsupervised Domain Adaptation by Backpropagation},
  year      = {2015},
}

@inproceedings{fu2017domain,
  author    = {Lisheng Fu and Thien Huu Nguyen and Bonan Min and Ralph Grishman},
  booktitle = {Proceedings of the 8th International Joint
Conference on Natural Language Processing},
  pages     = {425--429},
  title     = {Domain Adaptation for Relation Extraction with Domain Adversarial Neural Network},
  year      = {2017},
}

@inproceedings{yang2018nmtadv,
  author    = {Zhen Yang and Wei Chen and Feng Wang and Bo Xu},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages     = {1346--1355},
  title     = {Improving Neural Machine Translation with Conditional Sequence Generative Adversarial Nets},
  year      = {2018},
}

@article{zhang2017aspect,
  author    = {Yuan Zhang and Regina Barzilay and Tommi Jaakkola},
  journal   = {Transactions of the Association for Computational Linguistics (TACL)},
  pages     = {515--528},
  title     = {Aspect-augmented Adversarial Networks for Domain Adaptation},
  volume    = {5},
  year      = {2017},
}

@inproceedings{pryzant2017domainmix,
  author    = {Reid Pryzant and Denny Britz and Quoc V. Le},
  booktitle = {Proceedings of the Second Conference on Machine Translation},
  pages     = {118--126},
  title     = {Effective Domain Mixing for Neural Machine Translation},
  year      = {2017},
}

@article{chen2018adversarial,
  author    = {Xilun Chen and Yu Sun and Ben Athiwaratkun and Claire Cardie and Kilian Weinberger},
  journal   = {arXiv preprint arXiv:1606.01614},
  title     = {Adversarial Deep Averaging Networks for Cross-Lingual Sentiment Classification},
  year      = {2018},
}

@inproceedings{purushotham2017variational,
  author    = {Sanjay Purushotham and Wilka Carvalho and Tanachat Nilanon and Yan Liu},
  booktitle = {International Conference on Learning Representations (ICLR)},
  title     = {Variational Recurrent Adversarial Deep Domain Adaptation},
  year      = {2017},
}

@inproceedings{shen2018WassersteinDG,
  author    = {Jian Shen and Yanru Qu and Weinan Zhang and Yong Yu},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title     = {Wasserstein Distance Guided Representation Learning for Domain Adaptation},
  year      = {2018},
}

@inproceedings{sun2016return,
  author    = {Baochen Sun and Jiashi
Feng and Kate Saenko},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title     = {Return of Frustratingly Easy Domain Adaptation},
  year      = {2016},
}

@inproceedings{liu2015addressing,
  author    = {Anqi Liu and Kaiser Asif},
  booktitle = {International Conference on Machine Learning (ICML)},
  title     = {Addressing Covariate Shift in Active Learning with Adversarial Prediction},
  year      = {2015},
}

@article{zhao2017multiple,
  author    = {Han Zhao and Shanghang Zhang and Guanhang Wu and Jo{\~a}o P. Costeira and Jos{\'e} M. F. Moura and Geoffrey J. Gordon},
  journal   = {CoRR},
  title     = {Multiple Source Domain Adaptation with Adversarial Training of Neural Networks},
  volume    = {0},
  year      = {2017},
}

@inproceedings{hoffman2012discovering,
  author    = {Judy Hoffman and Brian Kulis and Trevor Darrell and Kate Saenko},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages     = {702--715},
  title     = {Discovering Latent Domains for Multisource Domain Adaptation},
  year      = {2012},
}

@inproceedings{lau2015unsupervised,
  author    = {Jey Han Lau and Alexander Clark and Shalom Lappin},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {1618--1628},
  title     = {Unsupervised Prediction of Acceptability Judgements},
  year      = {2015},
}

@inproceedings{xiong2014latent,
  author    = {Caiming Xiong and Scott McCloskey and Shao-Hang Hsieh and Jason J.
Corso},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  title     = {Latent Domains Modeling for Visual Domain Adaptation},
  year      = {2014},
}

@inproceedings{gong2013reshaping,
  author    = {Boqing Gong and Kristen Grauman and Fei Sha},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  title     = {Reshaping Visual Datasets for Domain Adaptation},
  year      = {2013},
}

@inproceedings{marcheggiani2014hierarchical,
  author    = {Diego Marcheggiani and Oscar T{\"a}ckstr{\"o}m and Andrea Esuli and Fabrizio Sebastiani},
  booktitle = {European Conference on Information Retrieval (ECIR)},
  title     = {Hierarchical Multi-Label Conditional Random Fields for Aspect-Oriented Opinion Mining},
  year      = {2014},
}

@inproceedings{yuan2015lightlda,
  author    = {Jinhui Yuan and Fei Gao and Qirong Ho and Wei Dai and Jinliang Wei and Xun Zheng and Eric P. Xing and Tie-Yan Liu and Wei-Ying Ma},
  booktitle = {World Wide Web (WWW)},
  title     = {LightLDA: Big Topic Models on Modest Compute Clusters},
  year      = {2015},
}

@inproceedings{honnibal2015nmdp,
  author    = {Matthew Honnibal and Mark Johnson},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages     = {1373--1378},
  title     = {An Improved Non-monotonic Transition System for Dependency Parsing},
  year      = {2015},
}

@inproceedings{mansour2009dams,
  author    = {Yishay Mansour and Mehryar Mohri and Afshin Rostamizadeh},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {1041--1048},
  title     = {Domain Adaptation with Multiple Sources},
  year      = {2009},
}

@inproceedings{hoffman2018msda,
  author    = {Judy Hoffman and Mehryar Mohri and Ningshan Zhang},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  pages     = {8256--8266},
  title     = {Algorithms and Theory for Multiple-source Adaptation},
  year      = {2018},
}