CLAW Publications

REM: Evaluating LLM Embodied Spatial Reasoning through Multi-Frame Trajectories

Second Conference on Language Modeling (2025)
Jacob Thompson, Emiliano Garcia-Lopez,

Yonatan Bisk

PDF

@inproceedings{CoLM:Thompson2025,
    author    = {Jacob Thompson and Emiliano Garcia-Lopez and Yonatan Bisk},
    title     = {REM: Evaluating LLM Embodied Spatial Reasoning through Multi-Frame Trajectories},
    booktitle = {Second Conference on Language Modeling},
    year      = {2025},
    url       = {https://openreview.net/forum?id=qbWpEufkqk},
}

Position: You Can't Manufacture a NeRF

Forty-second International Conference on Machine Learning Position Paper Track (2025)
Ani Kimmel, Mueed Ur Rehman,

Yonatan Bisk

, Gary K. Fedder

PDF

@inproceedings{ICML:Kimmel2025,
    author    = {Ani Kimmel and Mueed Ur Rehman and Yonatan Bisk and Gary K. Fedder},
    title     = {Position: You Can't Manufacture a NeRF},
    booktitle = {Forty-second International Conference on Machine Learning Position Paper Track},
    year      = {2025},
    url       = {https://openreview.net/forum?id=kJzB6lQmcb},
}

Looking beyond the next token

ArXiv (2025)

Abitha Thankaraj

, Yiding Jiang, J. Zico Kolter,

Yonatan Bisk

@article{ArXiv:Thankaraj2025,
    author    = {Abitha Thankaraj and Yiding Jiang and J. Zico Kolter and Yonatan Bisk},
    title     = {Looking beyond the next token},
    journal = {ArXiv},
    year      = {2025},
    url       = {https://arxiv.org/abs/2504.11336},
}

Model Successor Functions

ArXiv (2025)

Yingshan Chang

,

Yonatan Bisk

@article{ArXiv:Chang2025,
    author    = {Yingshan Chang and Yonatan Bisk},
    title     = {Model Successor Functions},
    journal = {ArXiv},
    year      = {2025},
    url       = {https://arxiv.org/abs/2502.00197},
}

Casper: Inferring Diverse Intents for Assistive Teleoperation with Vision Language Models

ArXiv (2025)
Huihan Liu, Rutav Shah, Shuijing Liu, Jack Pittenger, Mingyo Seo, Yuchen Cui,

Yonatan Bisk

, Roberto Martín-Martín, Yuke Zhu

@article{ArXiv:Liu2025,
    author    = {Huihan Liu and Rutav Shah and Shuijing Liu and Jack Pittenger and Mingyo Seo and Yuchen Cui and Yonatan Bisk and Roberto Martín-Martín and Yuke Zhu},
    title     = {Casper: Inferring Diverse Intents for Assistive Teleoperation with Vision Language Models},
    journal = {ArXiv},
    year      = {2025},
    url       = {https://arxiv.org/abs/2506.14727},
}

Energy Considerations of Large Language Model Inference and Efficiency Optimizations

The 63rd Annual Meeting of the Association for Computational Linguistics (2025)

Jared Fernandez

, Clara Na, Vashisth Tiwari,

Yonatan Bisk

, Sasha Luccioni, Emma Strubell

@inproceedings{ACL:Fernandez2025,
    author    = {Jared Fernandez and Clara Na and Vashisth Tiwari and Yonatan Bisk and Sasha Luccioni and Emma Strubell},
    title     = {Energy Considerations of Large Language Model Inference and Efficiency Optimizations},
    booktitle = {The 63rd Annual Meeting of the Association for Computational Linguistics},
    year      = {2025},
    url       = {https://arxiv.org/abs/2504.17674},
}

Self-Regulation and Requesting Interventions

ArXiv (2025)
So Yeon Min, Yue Wu, Jimin Sun, Max Kaufmann, Fahim Tajwar,

Yonatan Bisk

, Ruslan Salakhutdinov

@article{ArXiv:Min2025,
    author    = {So Yeon Min and Yue Wu and Jimin Sun and Max Kaufmann and Fahim Tajwar and Yonatan Bisk and Ruslan Salakhutdinov},
    title     = {Self-Regulation and Requesting Interventions},
    journal = {ArXiv},
    year      = {2025},
    url       = {https://arxiv.org/abs/2502.04576},
}

Re-thinking Temporal Search for Long-Form Video Understanding

The IEEE/CVF Conference on Computer Vision and Pattern Recognition (2025)
Jinhui Ye, Zihan Wang, Haosen Sun, Keshigeyan Chandrasegaran, Zane Durante, Cristobal Eyzaguirre,

Yonatan Bisk

, Juan Carlos Niebles, Ehsan Adeli, Li Fei-Fei, Jiajun Wu, Manling Li

@inproceedings{CVPR:Ye2025,
    author    = {Jinhui Ye and Zihan Wang and Haosen Sun and Keshigeyan Chandrasegaran and Zane Durante and Cristobal Eyzaguirre and Yonatan Bisk and Juan Carlos Niebles and Ehsan Adeli and Li Fei-Fei and Jiajun Wu and Manling Li},
    title     = {Re-thinking Temporal Search for Long-Form Video Understanding},
    booktitle = {The IEEE/CVF Conference on Computer Vision and Pattern Recognition},
    year      = {2025},
    url       = {https://arxiv.org/abs/2504.02259},
}

Explore Theory-of-Mind: Program-Guided Adversarial Data Generation for Theory of Mind Reasoning

The Thirteenth International Conference on Learning Representations (2025)
Melanie Sclar, Jane Yu, Maryam Fazel-Zarandi, Yulia Tsvetkov,

Yonatan Bisk

, Yejin Choi, Asli Celikyilmaz

Meta

@inproceedings{ICLR:Sclar2025,
    author    = {Melanie Sclar and Jane Yu and Maryam Fazel-Zarandi and Yulia Tsvetkov and Yonatan Bisk and Yejin Choi and Asli Celikyilmaz},
    title     = {Explore Theory-of-Mind: Program-Guided Adversarial Data Generation for Theory of Mind Reasoning},
    booktitle = {The Thirteenth International Conference on Learning Representations},
    year      = {2025},
    url       = {https://arxiv.org/abs/2412.12175},
}

Efficient Hardware Scaling and Diminishing Returns in Large-Scale Training of Language Models

Transactions on Machine Learning Research (2025)

Jared Fernandez

, Luca Wehrstedt, Leonid Shamis, Mostafa Elhoushi, Kalyan Saladi,

Yonatan Bisk

, Emma Strubell, Jacob Kahn

@article{TMLR:Fernandez2025,
    author    = {Jared Fernandez and Luca Wehrstedt and Leonid Shamis and Mostafa Elhoushi and Kalyan Saladi and Yonatan Bisk and Emma Strubell and Jacob Kahn},
    title     = {Efficient Hardware Scaling and Diminishing Returns in Large-Scale Training of Language Models},
    journal = {Transactions on Machine Learning Research},
    year      = {2025},
    url       = {https://arxiv.org/abs/2411.13055},
}

Embodied-RAG: General non-parametric Embodied Memory for Retrieval and Generation

ArXiv (2024)

Quanting Xie

, So Yeon Min, Tianyi Zhang, Aarav Bajaj, Ruslan Salakhutdinov, Matthew Johnson-Roberson,

Yonatan Bisk

Website

@article{ArXiv:Xie2024,
    author    = {Quanting Xie and So Yeon Min and Tianyi Zhang and Aarav Bajaj and Ruslan Salakhutdinov and Matthew Johnson-Roberson and Yonatan Bisk},
    title     = {Embodied-RAG: General non-parametric Embodied Memory for Retrieval and Generation},
    journal = {ArXiv},
    year      = {2024},
    url       = {https://arxiv.org/abs/2409.18313},
}

MotIF: Motion Instruction Fine-tuning

IEEE Robotics and Automation Letters (2025)
Minyoung Hwang, Joey Hejna, Dorsa Sadigh,

Yonatan Bisk

Website

@article{RA-L:Hwang2025,
    author    = {Minyoung Hwang and Joey Hejna and Dorsa Sadigh and Yonatan Bisk},
    title     = {MotIF: Motion Instruction Fine-tuning},
    journal = {IEEE Robotics and Automation Letters},
    year      = {2025},
    url       = {https://arxiv.org/abs/2409.10683},
}

ANAVI: Audio Noise Awareness using Visuals of Indoor environments for NAVIgation

Conference on Robot Learning (2024)
Vidhi Jain, Rishi Veerapaneni,

Yonatan Bisk

Website

@inproceedings{CoRL:Jain2024,
    author    = {Vidhi Jain and Rishi Veerapaneni and Yonatan Bisk},
    title     = {ANAVI: Audio Noise Awareness using Visuals of Indoor environments for NAVIgation},
    booktitle = {Conference on Robot Learning},
    year      = {2024},
    url       = {https://arxiv.org/abs/2410.18932},
}

Situated Instruction Following

European Conference on Computer Vision (2024)
So Yeon Min, Xavi Puig, Devendra Singh Chaplot, Tsung-Yen Yang, Akshara Rai, Priyam Parashar, Ruslan Salakhutdinov,

Yonatan Bisk

, Roozbeh Mottaghi

Website

@inproceedings{ECCV:Min2024,
    author    = {So Yeon Min and Xavi Puig and Devendra Singh Chaplot and Tsung-Yen Yang and Akshara Rai and Priyam Parashar and Ruslan Salakhutdinov and Yonatan Bisk and Roozbeh Mottaghi},
    title     = {Situated Instruction Following},
    booktitle = {European Conference on Computer Vision},
    year      = {2024},
    url       = {https://arxiv.org/abs/2407.12061},
}

Gradient Localization Improves Lifelong Pretraining of Language Models

Findings of the Conference on Empirical Methods in Natural Language Processing (2024)

Jared Fernandez

,

Yonatan Bisk

, Emma Strubell

@inproceedings{EMNLP-Findings:Fernandez2024,
    author    = {Jared Fernandez and Yonatan Bisk and Emma Strubell},
    title     = {Gradient Localization Improves Lifelong Pretraining of Language Models},
    booktitle = {Findings of the Conference on Empirical Methods in Natural Language Processing},
    year      = {2024},
    url       = {https://arxiv.org/abs/2411.04448},
}

How to Train Your Fact Verifier: Knowledge Transfer with Multimodal Open Models

Findings of the Conference on Empirical Methods in Natural Language Processing (2024)
Jaeyoung Lee, Ximing Lu, Jack Hessel, Faeze Brahman, Youngjae Yu,

Yonatan Bisk

, Yejin Choi, Saadia Gabriel

@inproceedings{EMNLP-Findings:Lee2024,
    author    = {Jaeyoung Lee and Ximing Lu and Jack Hessel and Faeze Brahman and Youngjae Yu and Yonatan Bisk and Yejin Choi and Saadia Gabriel},
    title     = {How to Train Your Fact Verifier: Knowledge Transfer with Multimodal Open Models},
    booktitle = {Findings of the Conference on Empirical Methods in Natural Language Processing },
    year      = {2024},
    url       = {https://arxiv.org/abs/2407.00369},
}

Tools Fail: Detecting Silent Errors in Faulty Tools

Conference on Empirical Methods in Natural Language Processing (2024)
Jimin Sun, So Yeon Min,

Yingshan Chang

,

Yonatan Bisk

@inproceedings{EMNLP:Sun2024,
    author    = {Jimin Sun and So Yeon Min and Yingshan Chang and Yonatan Bisk},
    title     = {Tools Fail: Detecting Silent Errors in Faulty Tools},
    booktitle = {Conference on Empirical Methods in Natural Language Processing },
    year      = {2024},
    url       = {https://arxiv.org/abs/2406.19228},
}

DegustaBot: Zero-Shot Visual Preference Estimation for Personalized Multi-Object Rearrangement

ArXiv (2024)
Benjamin A. Newman, Pranay Gupta, Kris Kitani,

Yonatan Bisk

, Henny Admoni, Chris Paxton

@article{ArXiv:Newman2024,
    author    = {Benjamin A. Newman and Pranay Gupta and Kris Kitani and Yonatan Bisk and Henny Admoni and Chris Paxton},
    title     = {DegustaBot: Zero-Shot Visual Preference Estimation for Personalized Multi-Object Rearrangement},
    journal = {ArXiv},
    year      = {2024},
    url       = {https://arxiv.org/abs/2407.08876},
}

Language Models Need Inductive Biases to Count Inductively

The Thirteenth International Conference on Learning Representations (2025)

Yingshan Chang

,

Yonatan Bisk

@inproceedings{ICLR:Chang2025,
    author    = {Yingshan Chang and Yonatan Bisk},
    title     = {Language Models Need Inductive Biases to Count Inductively},
    booktitle = {The Thirteenth International Conference on Learning Representations},
    year      = {2025},
    url       = {https://arxiv.org/abs/2405.20131},
}

DiffusionPID: Interpreting Diffusion via Partial Information Decomposition

Thirty-Eighth Annual Conference on Neural Information Processing Systems (2024)
Shaurya Dewan, Rushikesh Zawar, Prakanshul Saxena,

Yingshan Chang

, Andrew Luo,

Yonatan Bisk

@inproceedings{NeurIPS:Dewan2024,
    author    = {Shaurya Dewan and Rushikesh Zawar and Prakanshul Saxena and Yingshan Chang and Andrew Luo and Yonatan Bisk},
    title     = {DiffusionPID: Interpreting Diffusion via Partial Information Decomposition},
    booktitle = {Thirty-Eighth Annual Conference on Neural Information Processing Systems},
    year      = {2024},
    url       = {https://arxiv.org/abs/2406.05191},
}

Dialogue with Robots: Proposals for Broadening Participation and Research in the SLIVAR Community

ArXiv (2024)
Casey Kennington, Malihe Alikhani, Heather Pon-Barry, Katherine Atwell,

Yonatan Bisk

, Daniel Fried, Felix Gervits, Zhao Han, Mert Inan, Michael Johnston, Raj Korpan, Diane Litman, Matthew Marge, Cynthia Matuszek, Ross Mead, Shiwali Mohan, Raymond Mooney, Natalie Parde, Jivko Sinapov, Angela Stewart, Matthew Stone, Stefanie Tellex, Tom Williams

@article{ArXiv:Kennington2024,
    author    = {Casey Kennington and Malihe Alikhani and Heather Pon-Barry and Katherine Atwell and Yonatan Bisk and Daniel Fried and Felix Gervits and Zhao Han and Mert Inan and Michael Johnston and Raj Korpan and Diane Litman and Matthew Marge and Cynthia Matuszek and Ross Mead and Shiwali Mohan and Raymond Mooney and Natalie Parde and Jivko Sinapov and Angela Stewart and Matthew Stone and Stefanie Tellex and Tom Williams},
    title     = {Dialogue with Robots: Proposals for Broadening Participation and Research in the SLIVAR Community},
    journal = {ArXiv},
    year      = {2024},
    url       = {https://arxiv.org/abs/2404.01158},
}

VISREAS: Complex Visual Reasoning with Unanswerable Questions

Findings of the 62nd Annual Meeting of the Association for Computational Linguistics (2024)
Syeda Nahida Akter, Sangwu Lee,

Yingshan Chang

,

Yonatan Bisk

, Eric Nyberg

@inproceedings{ACL-Findings:Akter2024,
    author    = {Syeda Nahida Akter and Sangwu Lee and Yingshan Chang and Yonatan Bisk and Eric Nyberg},
    title     = {VISREAS: Complex Visual Reasoning with Unanswerable Questions},
    booktitle = {Findings of the 62nd Annual Meeting of the Association for Computational Linguistics},
    year      = {2024},
    url       = {https://arxiv.org/abs/2403.10534},
}

AgentKit: Flow Engineering with Graphs, not Coding

Conference on Language Modeling (2024)
Yue Wu, Yewen Fan, So Yeon Min, Shrimai Prabhumoye, Stephen McAleer,

Yonatan Bisk

, Ruslan Salakhutdinov, Yuanzhi Li, Tom Mitchell

@inproceedings{COLM:Wu2024,
    author    = {Yue Wu and Yewen Fan and So Yeon Min and Shrimai Prabhumoye and Stephen McAleer and Yonatan Bisk and Ruslan Salakhutdinov and Yuanzhi Li and Tom Mitchell},
    title     = {AgentKit: Flow Engineering with Graphs, not Coding},
    booktitle = {Conference on Language Modeling},
    year      = {2024},
    url       = {https://arxiv.org/abs/2404.11483},
}

Skews in the Phenomenon Space Hinder Generalization in Text-to-Image Generation

European Conference on Computer Vision (2024)

Yingshan Chang

, Yasi Zhang, Zhiyuan Fang, Yingnian Wu,

Yonatan Bisk

, Feng Gao

@inproceedings{ECCV:Chang2024,
    author    = {Yingshan Chang and Yasi Zhang and Zhiyuan Fang and Yingnian Wu and Yonatan Bisk and Feng Gao},
    title     = {Skews in the Phenomenon Space Hinder Generalization in Text-to-Image Generation},
    booktitle = {European Conference on Computer Vision},
    year      = {2024},
    url       = {https://arxiv.org/abs/2403.16394},
}

Direct Preference Optimization of Video Large Multimodal Models from Language Model Reward

Annual Conference of the Nations of the Americas Chapter of the ACL (2025)
Ruohong Zhang, Liangke Gui, Zhiqing Sun, Yihao Feng, Keyang Xu, Yuanhan Zhang, Di Fu, Chunyuan Li, Alexander Hauptmann,

Yonatan Bisk

, Yiming Yang

@inproceedings{NAACL:Zhang2025,
    author    = {Ruohong Zhang and Liangke Gui and Zhiqing Sun and Yihao Feng and Keyang Xu and Yuanhan Zhang and Di Fu and Chunyuan Li and Alexander Hauptmann and Yonatan Bisk and Yiming Yang},
    title     = {Direct Preference Optimization of Video Large Multimodal Models from Language Model Reward},
    booktitle = {Annual Conference of the Nations of the Americas Chapter of the ACL},
    year      = {2025},
    url       = {https://arxiv.org/abs/2404.01258},
}

Vid2Robot: End-to-end Video-conditioned Policy Learning with Cross-Attention Transformers

Robotics: Science and Systems (2024)
Vidhi Jain, Maria Attarian, Nikhil J Joshi, Ayzaan Wahid, Danny Driess, Quan Vuong, Pannag R Sanketi, Pierre Sermanet, Stefan Welker, Christine Chan, Igor Gilitschenski,

Yonatan Bisk

, Debidatta Dwibedi

Website

@inproceedings{RSS:Jain2024,
    author    = {Vidhi Jain and Maria Attarian and Nikhil J Joshi and Ayzaan Wahid and Danny Driess and Quan Vuong and Pannag R Sanketi and Pierre Sermanet and Stefan Welker and Christine Chan and Igor Gilitschenski and Yonatan Bisk and Debidatta Dwibedi},
    title     = {Vid2Robot: End-to-end Video-conditioned Policy Learning with Cross-Attention Transformers},
    booktitle = {Robotics: Science and Systems},
    year      = {2024},
    url       = {https://arxiv.org/abs/2403.12943},
}

SOTOPIA-π: Interactive Learning of Socially Intelligent Language Agents

The 62nd Annual Meeting of the Association for Computational Linguistics (2024)
Ruiyi Wang, Haofei Yu, Wenxin Zhang, Zhengyang Qi, Maarten Sap, Graham Neubig,

Yonatan Bisk

, Hao Zhu

Website

@inproceedings{ACL:Wang2024,
    author    = {Ruiyi Wang and Haofei Yu and Wenxin Zhang and Zhengyang Qi and Maarten Sap and Graham Neubig and Yonatan Bisk and Hao Zhu},
    title     = {SOTOPIA-π: Interactive Learning of Socially Intelligent Language Agents},
    booktitle = {The 62nd Annual Meeting of the Association for Computational Linguistics},
    year      = {2024},
    url       = {https://arxiv.org/abs/2403.08715},
}

OpenEQA: Embodied Question Answering in the Era of Foundation Models

Conference on Computer Vision and Pattern Recognition (2024)
Arjun Majumdar, Anurag Ajay, Xiaohan Zhang, Pranav Putta, Sriram Yenamandra, Mikael Henaff, Sneha Silwal, Paul Mcvay, Oleksandr Maksymets, Sergio Arnaud, Karmesh Yadav, Qiyang Li, Ben Newman, Mohit Sharma, Vincent Berges, Shiqi Zhang, Pulkit Agrawal,

Yonatan Bisk

, Dhruv Batra, Mrinal Kalakrishnan, Franziska Meier, Chris Paxton, Sasha Sax, Aravind Rajeswaran

PDF

Website Blog

@inproceedings{CVPR:Majumdar2024,
    author    = {Arjun Majumdar and Anurag Ajay and Xiaohan Zhang and Pranav Putta and Sriram Yenamandra and Mikael Henaff and Sneha Silwal and Paul Mcvay and Oleksandr Maksymets and Sergio Arnaud and Karmesh Yadav and Qiyang Li and Ben Newman and Mohit Sharma and Vincent Berges and Shiqi Zhang and Pulkit Agrawal and Yonatan Bisk and Dhruv Batra and Mrinal Kalakrishnan and Franziska Meier and Chris Paxton and Sasha Sax and Aravind Rajeswaran},
    title     = {OpenEQA: Embodied Question Answering in the Era of Foundation Models},
    booktitle = {Conference on Computer Vision and Pattern Recognition},
    year      = {2024},
    url       = {https://open-eqa.github.io/assets/pdfs/paper.pdf},
}

Toward General-Purpose Robots via Foundation Models: A Survey and Meta-Analysis

ArXiv (2023)
Yafei Hu,

Quanting Xie

, Vidhi Jain, Jonathan Francis, Jay Patrikar, Nikhil Keetha, Seungchan Kim, Yaqi Xie, Tianyi Zhang, Shibo Zhao, Yu Quan Chong, Chen Wang, Katia Sycara, Matthew Johnson-Roberson, Dhruv Batra, Xiaolong Wang, Sebastian Scherer, Zsolt Kira, Fei Xia,

Yonatan Bisk

Website

@article{ArXiv:Hu2023,
    author    = {Yafei Hu and Quanting Xie and Vidhi Jain and Jonathan Francis and Jay Patrikar and Nikhil Keetha and Seungchan Kim and Yaqi Xie and Tianyi Zhang and Shibo Zhao and Yu Quan Chong and Chen Wang and Katia Sycara and Matthew Johnson-Roberson and Dhruv Batra and Xiaolong Wang and Sebastian Scherer and Zsolt Kira and Fei Xia and Yonatan Bisk},
    title     = {Toward General-Purpose Robots via Foundation Models: A Survey and Meta-Analysis},
    journal = {ArXiv},
    year      = {2023},
    url       = {https://arxiv.org/abs/2312.08782},
}

SOTOPIA: Interactive Evaluation for Social Intelligence in Language Agents

The Twelfth International Conference on Learning Representations (2024)
Xuhui Zhou, Hao Zhu,

Leena Mathur

, Ruohong Zhang, Haofei Yu, Zhengyang Qi, Louis-Philippe Morency,

Yonatan Bisk

, Daniel Fried, Graham Neubig, Maarten Sap

@inproceedings{ICLR:Zhou2024,
    author    = {Xuhui Zhou and Hao Zhu and Leena Mathur and Ruohong Zhang and Haofei Yu and Zhengyang Qi and Louis-Philippe Morency and Yonatan Bisk and Daniel Fried and Graham Neubig and Maarten Sap},
    title     = {SOTOPIA: Interactive Evaluation for Social Intelligence in Language Agents},
    booktitle = {The Twelfth International Conference on Learning Representations},
    year      = {2024},
    url       = {http://arxiv.org/abs/2310.11667},
}

Open X-Embodiment: Robotic Learning Datasets and RT-X Models: Open X-Embodiment Collaboration

IEEE International Conference on Robotics and Automation (ICRA) (2024)
Abby O’Neill, Abdul Rehman, Abhiram Maddukuri, Abhishek Gupta, Abhishek Padalkar, Abraham Lee, Acorn Pooley, Agrim Gupta, Ajay Mandlekar, Ajinkya Jain, Albert Tung, Alex Bewley, Alex Herzog, Alex Irpan, Alexander Khazatsky, Anant Rai, Anchit Gupta, Andrew Wang, Anikait Singh, Animesh Garg, Aniruddha Kembhavi, Annie Xie, Anthony Brohan, Antonin Raffin, Archit Sharma, Arefeh Yavary, Arhan Jain, Ashwin Balakrishna, Ayzaan Wahid, Ben Burgess-Limerick, Beomjoon Kim, Bernhard Schölkopf, Blake Wulfe, Brian Ichter, Cewu Lu, Charles Xu, Charlotte Le, Chelsea Finn, Chen Wang, Chenfeng Xu, Cheng Chi, Chenguang Huang, Christine Chan, Christopher Agia, Chuer Pan, Chuyuan Fu, Coline Devin, Danfei Xu, Daniel Morton, Danny Driess, Daphne Chen, Deepak Pathak, Dhruv Shah, Dieter Büchler, Dinesh Jayaraman, Dmitry Kalashnikov, Dorsa Sadigh, Edward Johns, Ethan Foster, Fangchen Liu, Federico Ceola, Fei Xia, Feiyu Zhao, Freek Stulp, Gaoyue Zhou, Gaurav S. Sukhatme, Gautam Salhotra, Ge Yan, Gilbert Feng, Giulio Schiavi, Glen Berseth, Gregory Kahn, Guanzhi Wang, Hao Su, Hao-Shu Fang, Haochen Shi, Henghui Bao, Heni Ben Amor, Henrik I Christensen, Hiroki Furuta, Homer Walke, Hongjie Fang, Huy Ha, Igor Mordatch, Ilija Radosavovic, Isabel Leal, Jacky Liang, Jad Abou-Chakra, Jaehyung Kim, Jaimyn Drake, Jan Peters, Jan Schneider, Jasmine Hsu, Jeannette Bohg, Jeffrey Bingham, Jeffrey Wu, Jensen Gao, Jiaheng Hu, Jiajun Wu, Jialin Wu, Jiankai Sun, Jianlan Luo, Jiayuan Gu, Jie Tan, Jihoon Oh, Jimmy Wu, Jingpei Lu, Jingyun Yang, Jitendra Malik, João Silvério, Joey Hejna, Jonathan Booher, Jonathan Tompson, Jonathan Yang, Jordi Salvador, Joseph J. Lim, Junhyek Han, Kaiyuan Wang, Kanishka Rao, Karl Pertsch, Karol Hausman, Keegan Go, Keerthana Gopalakrishnan, Ken Goldberg, Kendra Byrne, Kenneth Oslund, Kento Kawaharazuka, Kevin Black, Kevin Lin, Kevin Zhang, Kiana Ehsani, Kiran Lekkala, Kirsty Ellis, Krishan Rana, Krishnan Srinivasan, Kuan Fang, Kunal Pratap Singh, Kuo-Hao Zeng, Kyle Hatch, Kyle Hsu, Laurent Itti, Lawrence Yunliang Chen, Lerrel Pinto, Li Fei-Fei, Liam Tan, Linxi Jim Fan, Lionel Ott, Lisa Lee, Luca Weihs, Magnum Chen, Marion Lepert, Marius Memmel, Masayoshi Tomizuka, Masha Itkina, Mateo Guaman Castro, Max Spero, Maximilian Du, Michael Ahn, Michael C. Yip, Mingtong Zhang, Mingyu Ding, Minho Heo, Mohan Kumar Srirama, Mohit Sharma, Moo Jin Kim, Naoaki Kanazawa, Nicklas Hansen, Nicolas Heess, Nikhil J Joshi, Niko Suenderhauf, Ning Liu, Norman Di Palo, Nur Muhammad MahiShafiullah, Oier Mees, Oliver Kroemer, Osbert Bastani, Pannag R Sanketi, Patrick Tree Miller, Patrick Yin, Paul Wohlhart, Peng Xu, Peter David Fagan, Peter Mitrano, Pierre Sermanet, Pieter Abbeel, Priya Sundaresan, Qiuyu Chen, Quan Vuong, Rafael Rafailov, Ran Tian, Ria Doshi, Roberto Martín-Martín, Rohan Baijal, Rosario Scalise, Rose Hendrix, Roy Lin, Runjia Qian, Ruohan Zhang, Russell Mendonca, Rutav Shah, Ryan Hoque, Ryan Julian, Samuel Bustamante, Sean Kirmani, Sergey Levine, Shan Lin, Sherry Moore, Shikhar Bahl, Shivin Dass, Shubham Sonawani, Shuran Song, Sichun Xu, Siddhant Haldar, Siddharth Karamcheti, Simeon Adebola, Simon Guist, Soroush Nasiriany, Stefan Schaal, Stefan Welker, Stephen Tian, Subramanian Ramamoorthy, Sudeep Dasari, Suneel Belkhale, Sungjae Park, Suraj Nair, Suvir Mirchandani, Takayuki Osa, Tanmay Gupta, Tatsuya Harada, Tatsuya Matsushima, Ted Xiao, Thomas Kollar, Tianhe Yu, Tianli Ding, Todor Davchev, Tony Z. Zhao, Travis Armstrong, Trevor Darrell, Trinity Chung, Vidhi Jain, Vincent Vanhoucke, Wei Zhan, Wenxuan Zhou, Wolfram Burgard, Xi Chen, Xiaolong Wang, Xinghao Zhu, Xinyang Geng, Xiyuan Liu, Xu Liangwei, Xuanlin Li, Yao Lu, Yecheng Jason Ma, Yejin Kim, Yevgen Chebotar, Yifan Zhou, Yifeng Zhu, Yilin Wu, Ying Xu, Yixuan Wang, Yonatan Bisk, Yoonyoung Cho, Youngwoon Lee, Yuchen Cui, Yue Cao, Yueh-Hua Wu, Yujin Tang, Yuke Zhu, Yunchu Zhang, Yunfan Jiang, Yunshuang Li, Yunzhu Li, Yusuke Iwasawa, Yutaka Matsuo, Zehan Ma, Zhuo Xu, Zichen Jeff Cui, Zichen Zhang, Zipeng Lin

Website

@inproceedings{ICRA:O’Neill2024,
    author    = {Abby O’Neill and Abdul Rehman and Abhiram Maddukuri and Abhishek Gupta and Abhishek Padalkar and Abraham Lee and Acorn Pooley and Agrim Gupta and Ajay Mandlekar and Ajinkya Jain and Albert Tung and Alex Bewley and Alex Herzog and Alex Irpan and Alexander Khazatsky and Anant Rai and Anchit Gupta and Andrew Wang and Anikait Singh and Animesh Garg and Aniruddha Kembhavi and Annie Xie and Anthony Brohan and Antonin Raffin and Archit Sharma and Arefeh Yavary and Arhan Jain and Ashwin Balakrishna and Ayzaan Wahid and Ben Burgess-Limerick and Beomjoon Kim and Bernhard Schölkopf and Blake Wulfe and Brian Ichter and Cewu Lu and Charles Xu and Charlotte Le and Chelsea Finn and Chen Wang and Chenfeng Xu and Cheng Chi and Chenguang Huang and Christine Chan and Christopher Agia and Chuer Pan and Chuyuan Fu and Coline Devin and Danfei Xu and Daniel Morton and Danny  Driess and Daphne Chen and Deepak Pathak and Dhruv Shah and Dieter Büchler and Dinesh Jayaraman and Dmitry Kalashnikov and Dorsa Sadigh and Edward Johns and Ethan Foster and Fangchen Liu and Federico   Ceola and Fei  Xia and Feiyu  Zhao and Freek  Stulp and Gaoyue Zhou and Gaurav S.  Sukhatme and Gautam Salhotra and Ge   Yan and Gilbert    Feng and Giulio   Schiavi and Glen Berseth and Gregory    Kahn and Guanzhi    Wang and Hao  Su and Hao-Shu    Fang and Haochen  Shi and Henghui  Bao and Heni   Ben Amor and Henrik I Christensen and Hiroki   Furuta and Homer  Walke and Hongjie    Fang and Huy  Ha and Igor   Mordatch and Ilija    Radosavovic and Isabel Leal and Jacky  Liang and Jad  Abou-Chakra and Jaehyung Kim and Jaimyn Drake and Jan  Peters and Jan    Schneider and Jasmine  Hsu and Jeannette  Bohg and Jeffrey  Bingham and Jeffrey  Wu and Jensen   Gao and Jiaheng  Hu and Jiajun   Wu and Jialin   Wu and Jiankai  Sun and Jianlan  Luo and Jiayuan  Gu and Jie  Tan and Jihoon   Oh and Jimmy    Wu and Jingpei  Lu and Jingyun    Yang and Jitendra   Malik and João   Silvério and Joey   Hejna and Jonathan Booher and Jonathan Tompson and Jonathan   Yang and Jordi  Salvador and Joseph J.    Lim and Junhyek  Han and Kaiyuan    Wang and Kanishka Rao and Karl Pertsch and Karol    Hausman and Keegan   Go and Keerthana    Gopalakrishnan and Ken    Goldberg and Kendra Byrne and Kenneth  Oslund and Kento  Kawaharazuka and Kevin  Black and Kevin    Lin and Kevin  Zhang and Kiana    Ehsani and Kiran    Lekkala and Kirsty Ellis and Krishan    Rana and Krishnan Srinivasan and Kuan   Fang and Kunal Pratap   Singh and Kuo-Hao    Zeng and Kyle   Hatch and Kyle Hsu and Laurent    Itti and Lawrence Yunliang  Chen and Lerrel Pinto and Li   Fei-Fei and Liam Tan and Linxi Jim    Fan and Lionel   Ott and Lisa Lee and Luca   Weihs and Magnum Chen and Marion   Lepert and Marius   Memmel and Masayoshi  Tomizuka and Masha    Itkina and Mateo Guaman Castro and Max    Spero and Maximilian   Du and Michael  Ahn and Michael C.   Yip and Mingtong   Zhang and Mingyu Ding and Minho    Heo and Mohan Kumar  Srirama and Mohit    Sharma and Moo Jin  Kim and Naoaki Kanazawa and Nicklas  Hansen and Nicolas    Heess and Nikhil J   Joshi and Niko Suenderhauf and Ning Liu and Norman   Di Palo and Nur Muhammad MahiShafiullah and Oier   Mees and Oliver   Kroemer and Osbert   Bastani and Pannag R Sanketi and Patrick Tree Miller and Patrick  Yin and Paul   Wohlhart and Peng Xu and Peter David    Fagan and Peter    Mitrano and Pierre Sermanet and Pieter   Abbeel and Priya    Sundaresan and Qiuyu  Chen and Quan   Vuong and Rafael Rafailov and Ran    Tian and Ria    Doshi and Roberto    Martín-Martín and Rohan    Baijal and Rosario  Scalise and Rose Hendrix and Roy  Lin and Runjia Qian and Ruohan Zhang and Russell    Mendonca and Rutav  Shah and Ryan   Hoque and Ryan Julian and Samuel   Bustamante and Sean Kirmani and Sergey   Levine and Shan Lin and Sherry Moore and Shikhar    Bahl and Shivin Dass and Shubham    Sonawani and Shuran Song and Sichun   Xu and Siddhant Haldar and Siddharth    Karamcheti and Simeon   Adebola and Simon  Guist and Soroush    Nasiriany and Stefan   Schaal and Stefan   Welker and Stephen    Tian and Subramanian  Ramamoorthy and Sudeep   Dasari and Suneel Belkhale and Sungjae    Park and Suraj  Nair and Suvir    Mirchandani and Takayuki Osa and Tanmay Gupta and Tatsuya  Harada and Tatsuya  Matsushima and Ted    Xiao and Thomas   Kollar and Tianhe   Yu and Tianli Ding and Todor    Davchev and Tony Z.    Zhao and Travis Armstrong and Trevor   Darrell and Trinity    Chung and Vidhi  Jain and Vincent    Vanhoucke and Wei    Zhan and Wenxuan    Zhou and Wolfram  Burgard and Xi Chen and Xiaolong   Wang and Xinghao  Zhu and Xinyang    Geng and Xiyuan   Liu and Xu Liangwei and Xuanlin  Li and Yao  Lu and Yecheng Jason    Ma and Yejin    Kim and Yevgen Chebotar and Yifan  Zhou and Yifeng   Zhu and Yilin    Wu and Ying Xu and Yixuan Wang and Yonatan    Bisk and Yoonyoung    Cho and Youngwoon    Lee and Yuchen   Cui and Yue  Cao and Yueh-Hua Wu and Yujin  Tang and Yuke Zhu and Yunchu Zhang and Yunfan Jiang and Yunshuang    Li and Yunzhu   Li and Yusuke   Iwasawa and Yutaka   Matsuo and Zehan    Ma and Zhuo Xu and Zichen Jeff  Cui and Zichen Zhang and Zipeng   Lin},
    title     = {Open X-Embodiment: Robotic Learning Datasets and RT-X Models: Open X-Embodiment Collaboration},
    booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    year      = {2024},
    url       = {https://arxiv.org/abs/2310.08864},
}

Reasoning about the Unseen for Efficient Outdoor Object Navigation

ArXiv (2023)

Quanting Xie

, Tianyi Zhang, Kedi Xu, Matthew Johnson-Roberson,

Yonatan Bisk

@article{ArXiv:Xie2023,
    author    = {Quanting Xie and Tianyi Zhang and Kedi Xu and Matthew Johnson-Roberson and Yonatan Bisk},
    title     = {Reasoning about the Unseen for Efficient Outdoor Object Navigation},
    journal = {ArXiv},
    year      = {2023},
    url       = {https://arxiv.org/abs/2309.10103},
}

MOSAIC: Learning Unified Multi-Sensory Object Property Representations for Robot Perception

IEEE International Conference on Robotics and Automation (2024)
Gyan Tatiya, Jonathan Francis, Ho-Hsiang Wu,

Yonatan Bisk

, Jivko Sinapov

@inproceedings{ICRA:Tatiya2024,
    author    = {Gyan Tatiya and Jonathan Francis and Ho-Hsiang Wu and Yonatan Bisk and Jivko Sinapov},
    title     = {MOSAIC: Learning Unified Multi-Sensory Object Property Representations for Robot Perception},
    booktitle = {IEEE International Conference on Robotics and Automation},
    year      = {2024},
    url       = {https://arxiv.org/abs/2309.08508},
}

WebArena: A Realistic Web Environment for Building Autonomous Agents

The Twelfth International Conference on Learning Representations (2024)
Shuyan Zhou, Frank F. Xu, Hao Zhu, Xuhui Zhou, Robert Lo, Abishek Sridhar, Xianyi Cheng, Tianyue Ou,

Yonatan Bisk

, Daniel Fried, Uri Alon, Graham Neubig

Website

@inproceedings{ICLR:Zhou2024,
    author    = {Shuyan Zhou and Frank F. Xu and Hao Zhu and Xuhui Zhou and Robert Lo and Abishek Sridhar and Xianyi Cheng and Tianyue Ou and Yonatan Bisk and Daniel Fried and Uri Alon and Graham Neubig},
    title     = {WebArena: A Realistic Web Environment for Building Autonomous Agents},
    booktitle = {The Twelfth International Conference on Learning Representations},
    year      = {2024},
    url       = {https://arxiv.org/abs/2307.13854},
}

Spatial-Language Attention Policies for Efficient Robot Learning

Conference on Robot Learning (2023)
Priyam Parashar, Vidhi Jain, Xiaohan Zhang, Jay Vakil, Sam Powers,

Yonatan Bisk

, Chris Paxton

Website

@inproceedings{CoRL:Parashar2023,
    author    = {Priyam Parashar and Vidhi Jain and Xiaohan Zhang and Jay Vakil and Sam Powers and Yonatan Bisk and Chris Paxton},
    title     = {Spatial-Language Attention Policies for Efficient Robot Learning},
    booktitle = {Conference on Robot Learning},
    year      = {2023},
    url       = {https://arxiv.org/abs/2304.11235},
}

SPAE: Semantic Pyramid AutoEncoder for Multimodal Generation with Frozen LLMs

Thirty-seventh Conference on Neural Information Processing Systems (2023)
Lijun Yu, Yong Cheng, Zhiruo Wang, Vivek Kumar, Wolfgang Macherey, Yanping Huang, David A. Ross, Irfan Essa,

Yonatan Bisk

, Ming-Hsuan Yang, Kevin Murphy, Alexander Hauptmann, Lu Jiang

@inproceedings{NeurIPS:Yu2023,
    author    = {Lijun Yu and Yong Cheng and Zhiruo Wang and Vivek Kumar and Wolfgang Macherey and Yanping Huang and David A. Ross and Irfan Essa and Yonatan Bisk and Ming-Hsuan Yang and Kevin Murphy and Alexander Hauptmann and Lu Jiang},
    title     = {SPAE: Semantic Pyramid AutoEncoder for Multimodal Generation with Frozen LLMs},
    booktitle = {Thirty-seventh Conference on Neural Information Processing Systems },
    year      = {2023},
    url       = {https://arxiv.org/abs/2306.17842},
}

HomeRobot: Open-Vocabulary Mobile Manipulation

Conference on Robot Learning (2023)
Sriram Yenamandra, Arun Ramachandran, Karmesh Yadav, Austin Wang, Mukul Khanna, Theophile Gervet, Tsung-Yen Yang, Vidhi Jain, Alexander William Clegg, John Turner, Zsolt Kira, Manolis Savva, Angel Chang, Devendra Singh Chaplot, Dhruv Batra, Roozbeh Mottaghi,

Yonatan Bisk

, Chris Paxton

Website Video

@inproceedings{CoRL:Yenamandra2023,
    author    = {Sriram Yenamandra and Arun Ramachandran and Karmesh Yadav and Austin Wang and Mukul Khanna and Theophile Gervet and Tsung-Yen Yang and Vidhi Jain and Alexander William Clegg and John Turner and Zsolt Kira and Manolis Savva and Angel Chang and Devendra Singh Chaplot and Dhruv Batra and Roozbeh Mottaghi and Yonatan Bisk and Chris Paxton},
    title     = {HomeRobot: Open-Vocabulary Mobile Manipulation},
    booktitle = {Conference on Robot Learning},
    year      = {2023},
    url       = {https://arxiv.org/abs/2306.11565},
}

SPRING: GPT-4 Out-performs RL Algorithms by Studying Papers and Reasoning

Thirty-seventh Conference on Neural Information Processing Systems (2023)
Yue Wu, Shrimai Prabhumoye, So Yeon Min,

Yonatan Bisk

, Ruslan Salakhutdinov, Amos Azaria, Tom Mitchell, Yuanzhi Li

@inproceedings{NeurIPS:Wu2023,
    author    = {Yue Wu and Shrimai Prabhumoye and So Yeon Min and Yonatan Bisk and Ruslan Salakhutdinov and Amos Azaria and Tom Mitchell and Yuanzhi Li},
    title     = {SPRING: GPT-4 Out-performs RL Algorithms by Studying Papers and Reasoning},
    booktitle = {Thirty-seventh Conference on Neural Information Processing Systems },
    year      = {2023},
    url       = {https://arxiv.org/abs/2305.15486},
}

Plan, Eliminate, and Track -- Language Models are Good Teachers for Embodied Agents

ArXiv (2023)
Yue Wu, So Yeon Min,

Yonatan Bisk

, Ruslan Salakhutdinov, Amos Azaria, Yuanzhi Li, Tom Mitchell, Shrimai Prabhumoye

@article{ArXiv:Wu2023,
    author    = {Yue Wu and So Yeon Min and Yonatan Bisk and Ruslan Salakhutdinov and Amos Azaria and Yuanzhi Li and Tom Mitchell and Shrimai Prabhumoye},
    title     = {Plan, Eliminate, and Track -- Language Models are Good Teachers for Embodied Agents},
    journal = {ArXiv},
    year      = {2023},
    url       = {https://arxiv.org/abs/2305.02412},
}

Towards Open-World Mobile Manipulation in Homes: Lessons from the Neurips 2023 HomeRobot Open Vocabulary Mobile Manipulation Challenge

Thirty-seventh Conference on Neural Information Processing Systems: Competition Track (2023)
Sriram Yenamandra, Arun Ramachandran, Mukul Khanna, Karmesh Yadav, Jay Vakil, Andrew Melnik, Michael Büttner, Leon Harz, Lyon Brown, Gora Chand Nandi, Arjun PS, Gaurav Kumar Yadav, Rahul Kala, Robert Haschke, Yang Luo, Jinxin Zhu, Yansen Han, Bingyi Lu, Xuan Gu, Qinyuan Liu, Yaping Zhao, Qiting Ye, Chenxiao Dou, Yansong Chua, Volodymyr Kuzma, Vladyslav Humennyy, Ruslan Partsey, Jonathan Francis, Devendra Singh Chaplot, Gunjan Chhablani, Alexander Clegg, Theophile Gervet, Vidhi Jain, Ram Ramrakhya, Andrew Szot, Austin Wang, Tsung-Yen Yang, Aaron Edsinger, Charlie Kemp, Binit Shah, Zsolt Kira, Dhruv Batra, Roozbeh Mottaghi,

Yonatan Bisk

, Chris Paxton

Website

@inproceedings{NeurIPS-Challenge:Yenamandra2023,
    author    = {Sriram Yenamandra and Arun Ramachandran and Mukul Khanna and Karmesh Yadav and Jay Vakil and Andrew Melnik and Michael Büttner and Leon Harz and Lyon Brown and Gora Chand Nandi and Arjun PS and Gaurav Kumar Yadav and Rahul Kala and Robert Haschke and Yang Luo and Jinxin Zhu and Yansen Han and Bingyi Lu and Xuan Gu and Qinyuan Liu and Yaping Zhao and Qiting Ye and Chenxiao Dou and Yansong Chua and Volodymyr Kuzma and Vladyslav Humennyy and Ruslan Partsey and Jonathan Francis and Devendra Singh Chaplot and Gunjan Chhablani and Alexander Clegg and Theophile Gervet and Vidhi Jain and Ram Ramrakhya and Andrew Szot and Austin Wang and Tsung-Yen Yang and Aaron Edsinger and Charlie Kemp and Binit Shah and Zsolt Kira and Dhruv Batra and Roozbeh Mottaghi and Yonatan Bisk and Chris Paxton},
    title     = {Towards Open-World Mobile Manipulation in Homes: Lessons from the Neurips 2023 HomeRobot Open Vocabulary Mobile Manipulation Challenge},
    booktitle = {Thirty-seventh Conference on Neural Information Processing Systems: Competition Track},
    year      = {2023},
    url       = {https://arxiv.org/abs/2407.06939},
}

EXCALIBUR: Encouraging and Evaluating Embodied Exploration

Conference on Computer Vision and Pattern Recognition (2023)
Hao Zhu, Raghav Kapoor, So Yeon Min, Winson Han, Jiatai Li, Kaiwen Geng, Graham Neubig,

Yonatan Bisk

, Aniruddha Kembhavi, Luca Weihs

PDF

Video Tasks

@inproceedings{CVPR:Zhu2023,
    author    = {Hao Zhu and Raghav Kapoor and So Yeon Min and Winson Han and Jiatai Li and Kaiwen Geng and Graham Neubig and Yonatan Bisk and Aniruddha Kembhavi and Luca Weihs},
    title     = {EXCALIBUR: Encouraging and Evaluating Embodied Exploration},
    booktitle = {Conference on Computer Vision and Pattern Recognition},
    year      = {2023},
    url       = {https://openaccess.thecvf.com/content/CVPR2023/html/Zhu_EXCALIBUR_Encouraging_and_Evaluating_Embodied_Exploration_CVPR_2023_paper.html},
}

The Framework Tax: Disparities Between Inference Efficiency in Research and Deployment

The 2023 Conference on Empirical Methods in Natural Language Processing (2023)

Jared Fernandez

, Jacob Kahn, Clara Na,

Yonatan Bisk

, Emma Strubell

@inproceedings{EMNLP:Fernandez2023,
    author    = {Jared Fernandez and Jacob Kahn and Clara Na and Yonatan Bisk and Emma Strubell},
    title     = {The Framework Tax: Disparities Between Inference Efficiency in Research and Deployment},
    booktitle = {The 2023 Conference on Empirical Methods in Natural Language Processing },
    year      = {2023},
    url       = {https://arxiv.org/abs/2302.06117},
}

Computational Language Acquisition with Theory of Mind

The Eleventh International Conference on Learning Representations (2023)
Andy Liu, Hao Zhu, Emmy Liu,

Yonatan Bisk

, Graham Neubig

PDF

@inproceedings{ICLR:Liu2023,
    author    = {Andy Liu and Hao Zhu and Emmy Liu and Yonatan Bisk and Graham Neubig},
    title     = {Computational Language Acquisition with Theory of Mind},
    booktitle = {The Eleventh International Conference on Learning Representations},
    year      = {2023},
    url       = {https://openreview.net/forum?id=C2ulri4duIs},
}

Self-Supervised Object Goal Navigation with In-Situ Finetuning

IEEE/RSJ International Conference on Intelligent Robots and Systems (2023)
So Yeon Min, Yao-Hung Hubert Tsai, Wei Ding, Ali Farhadi, Ruslan Salakhutdinov,

Yonatan Bisk

, Jian Zhang

Video

@inproceedings{IROS:Min2023,
    author    = {So Yeon Min and Yao-Hung Hubert Tsai and Wei Ding and Ali Farhadi and Ruslan Salakhutdinov and Yonatan Bisk and Jian Zhang},
    title     = {Self-Supervised Object Goal Navigation with In-Situ Finetuning},
    booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems},
    year      = {2023},
    url       = {https://arxiv.org/abs/2212.05923},
}

MAEA: Multimodal Attribution for Embodied AI

Progress and Challenges in Building Trustworthy Embodied AI at NeurIPS 2022 (2022)
Vidhi Jain, Jayant Sravan Tamarapalli, Sahiti Yerramilli,

Yonatan Bisk

PDF

@inproceedings{TEA-Wksp:Jain2022,
    author    = {Vidhi Jain and Jayant Sravan Tamarapalli and Sahiti Yerramilli and Yonatan Bisk},
    title     = {MAEA: Multimodal Attribution for Embodied AI},
    booktitle = {Progress and Challenges in Building Trustworthy Embodied AI at NeurIPS 2022},
    year      = {2022},
    url       = {https://openreview.net/pdf?id=OUs2us5Xhx},
}

Tackling AlfWorld with Action Attention and Common Sense from Language Models

Language and Reinforcement Learning Workshop at NeurIPS 2022 (2022)
Yue Wu, So Yeon Min,

Yonatan Bisk

, Ruslan Salakhutdinov, Shrimai Prabhumoye

PDF

@inproceedings{LaReL-Wksp:Wu2022,
    author    = {Yue Wu and So Yeon Min and Yonatan Bisk and Ruslan Salakhutdinov and Shrimai Prabhumoye},
    title     = {Tackling AlfWorld with Action Attention and Common Sense from Language Models},
    booktitle = {Language and Reinforcement Learning Workshop at NeurIPS 2022},
    year      = {2022},
    url       = {https://openreview.net/forum?id=AqkPRUZ-YkO},
}

Retrospectives on the Embodied AI Workshop

ArXiv (2022)
Matt Deitke, Dhruv Batra,

Yonatan Bisk

, Tommaso Campari, Angel X. Chang, Devendra Singh Chaplot, Changan Chen, Claudia Pérez D'Arpino, Kiana Ehsani, Ali Farhadi, Li Fei-Fei, Anthony Francis, Chuang Gan, Kristen Grauman, David Hall, Winson Han, Unnat Jain, Aniruddha Kembhavi, Jacob Krantz, Stefan Lee, Chengshu Li, Sagnik Majumder, Oleksandr Maksymets, Roberto Martín-Martín, Roozbeh Mottaghi, Sonia Raychaudhuri, Mike Roberts, Silvio Savarese, Manolis Savva, Mohit Shridhar, Niko Sünderhauf, Andrew Szot, Ben Talbot, Joshua B. Tenenbaum, Jesse Thomason, Alexander Toshev, Joanne Truong, Luca Weihs, Jiajun Wu

@article{ArXiv:Deitke2022,
    author    = {Matt Deitke and Dhruv Batra and Yonatan Bisk and Tommaso Campari and Angel X. Chang and Devendra Singh Chaplot and Changan Chen and Claudia Pérez D'Arpino and Kiana Ehsani and Ali Farhadi and Li Fei-Fei and Anthony Francis and Chuang Gan and Kristen Grauman and David Hall and Winson Han and Unnat Jain and Aniruddha Kembhavi and Jacob Krantz and Stefan Lee and Chengshu Li and Sagnik Majumder and Oleksandr Maksymets and Roberto Martín-Martín and Roozbeh Mottaghi and Sonia Raychaudhuri and Mike Roberts and Silvio Savarese and Manolis Savva and Mohit Shridhar and Niko Sünderhauf and Andrew Szot and Ben Talbot and Joshua B. Tenenbaum and Jesse Thomason and Alexander Toshev and Joanne Truong and Luca Weihs and Jiajun Wu},
    title     = {Retrospectives on the Embodied AI Workshop},
    journal = {ArXiv},
    year      = {2022},
    url       = {https://arxiv.org/abs/2210.06849},
}

Don't Copy the Teacher: Data and Model Challenges in Embodied Dialogue

Conference on Empirical Methods in Natural Language Processing (2022)
So Yeon Min, Hao Zhu, Ruslan Salakhutdinov,

Yonatan Bisk

Video

@inproceedings{EMNLP:Min2022,
    author    = {So Yeon Min and Hao Zhu and Ruslan Salakhutdinov and Yonatan Bisk},
    title     = {Don't Copy the Teacher: Data and Model Challenges in Embodied Dialogue},
    booktitle = {Conference on Empirical Methods in Natural Language Processing},
    year      = {2022},
    url       = {https://arxiv.org/abs/2210.04443},
}

EvEntS ReaLM: Event Reasoning of Entity States via Language Models

Conference on Empirical Methods in Natural Language Processing (2022)
Evangelia Spiliopoulou, Artidoro Pagnoni,

Yonatan Bisk

, Eduard Hovy

@inproceedings{EMNLP:Spiliopoulou2022,
    author    = {Evangelia Spiliopoulou and Artidoro Pagnoni and Yonatan Bisk and Eduard Hovy},
    title     = {EvEntS ReaLM: Event Reasoning of Entity States via Language Models},
    booktitle = {Conference on Empirical Methods in Natural Language Processing},
    year      = {2022},
    url       = {https://arxiv.org/abs/2211.05392},
}

On Advances in Text Generation from Images Beyond Captioning: A Case Study in Self-Rationalization

Findings of the Conference on Empirical Methods in Natural Language Processing (2022)
Shruti Palaskar, Akshita Bhagia,

Yonatan Bisk

, Florian Metze, Alan W Black, Ana Marasovic

@inproceedings{EMNLP-Findings:Palaskar2022,
    author    = {Shruti Palaskar and Akshita Bhagia and Yonatan Bisk and Florian Metze and Alan W Black and Ana Marasovic},
    title     = {On Advances in Text Generation from Images Beyond Captioning: A Case Study in Self-Rationalization},
    booktitle = {Findings of the Conference on Empirical Methods in Natural Language Processing},
    year      = {2022},
    url       = {https://arxiv.org/abs/2205.11686},
}

Transformers are Adaptable Task Planners

Conference on Robot Learning (2022)
Vidhi Jain, Yixin Lin, Eric Undersander,

Yonatan Bisk

, Akshara Rai

Video

@inproceedings{CoRL:Jain2022,
    author    = {Vidhi Jain and Yixin Lin and Eric Undersander and Yonatan Bisk and Akshara Rai},
    title     = {Transformers are Adaptable Task Planners},
    booktitle = {Conference on Robot Learning},
    year      = {2022},
    url       = {https://arxiv.org/abs/2207.02442},
}

Training Vision-Language Transformers from Captions

Transactions on Machine Learning Research (2023)
Liangke Gui,

Yingshan Chang

, Qiuyuan Huang, Subhojit Som, Alexander Hauptmann, Jianfeng Gao,

Yonatan Bisk

@article{TMLR:Gui2023,
    author    = {Liangke Gui and Yingshan Chang and Qiuyuan Huang and Subhojit Som and Alexander Hauptmann and Jianfeng Gao and Yonatan Bisk},
    title     = {Training Vision-Language Transformers from Captions},
    journal = {Transactions on Machine Learning Research},
    year      = {2023},
    url       = {https://arxiv.org/abs/2205.09256},
}

Symmetric Machine Theory of Mind

39th International Conference on Machine Learning (2022)
Melanie Sclar, Graham Neubig,

Yonatan Bisk

PDF

Video

@inproceedings{ICML:Sclar2022,
    author    = {Melanie Sclar and Graham Neubig and Yonatan Bisk},
    title     = {Symmetric Machine Theory of Mind},
    booktitle = {39th International Conference on Machine Learning},
    year      = {2022},
    url       = {https://proceedings.mlr.press/v162/sclar22a.html},
}

A Framework for Learning to Request Rich and Contextually Useful Information from Humans

39th International Conference on Machine Learning, (2022)
Khanh Nguyen,

Yonatan Bisk

, Hal Daume III

Video

@inproceedings{ICML:Nguyen2022,
    author    = {Khanh Nguyen and Yonatan Bisk and Hal Daume III},
    title     = {A Framework for Learning to Request Rich and Contextually Useful Information from Humans},
    booktitle = {39th International Conference on Machine Learning,},
    year      = {2022},
    url       = {http://arxiv.org/abs/2110.08258},
}

Simulated Language Learning from Communicative Goals and Linguistic Input

Annual Meeting of the Cognitive Science Society (2022)
Hao Zhu,

Yonatan Bisk

, Graham Neubig

PDF

@inproceedings{CogSci:Zhu2022,
    author    = {Hao Zhu and Yonatan Bisk and Graham Neubig},
    title     = {Simulated Language Learning from Communicative Goals and Linguistic Input},
    booktitle = {Annual Meeting of the Cognitive Science Society},
    year      = {2022},
    url       = {https://escholarship.org/uc/item/7p65n371},
}

HEAR 2021: Holistic Evaluation of Audio Representations

Proceedings of Machine Learning Research (PMLR): NeurIPS 2021 Competition Track (2022)
Joseph Turian, Jordie Shier, Humair Raj Khan, Bhiksha Raj, Björn W. Schuller, Christian J. Steinmetz, Colin Malloy, George Tzanetakis, Gissel Velarde, Kirk McNally, Max Henry, Nicolas Pinto, Camille Noufi, Christian Clough, Dorien Herremans, Eduardo Fonseca, Jesse Engel, Justin Salamon, Philippe Esling, Pranay Manocha, Shinji Watanabe, Zeyu Jin,

Yonatan Bisk

Website

@inproceedings{PMLR:Turian2022,
    author    = {Joseph Turian and Jordie Shier and Humair Raj Khan and Bhiksha Raj and Björn W. Schuller and Christian J. Steinmetz and Colin Malloy and George Tzanetakis and Gissel Velarde and Kirk McNally and Max Henry and Nicolas Pinto and Camille Noufi and Christian Clough and Dorien Herremans and Eduardo Fonseca and Jesse Engel and Justin Salamon and Philippe Esling and Pranay Manocha and Shinji Watanabe and Zeyu Jin and Yonatan Bisk},
    title     = {HEAR 2021: Holistic Evaluation of Audio Representations},
    booktitle = {Proceedings of Machine Learning Research (PMLR): NeurIPS 2021 Competition Track},
    year      = {2022},
    url       = {http://arxiv.org/abs/2203.03022},
}

KAT: A Knowledge Augmented Transformer for Vision-and-Language

Annual Conference of the North American Chapter of the Association for Computational Linguistics (2022)
Liangke Gui, Borui Wang, Qiuyuan Huang, Alexander Hauptmann,

Yonatan Bisk

, Jianfeng Gao

@inproceedings{NAACL:Gui2022,
    author    = {Liangke Gui and Borui Wang and Qiuyuan Huang and Alexander Hauptmann and Yonatan Bisk and Jianfeng Gao},
    title     = {KAT: A Knowledge Augmented Transformer for Vision-and-Language},
    booktitle = {Annual Conference of the North American Chapter of the Association for Computational Linguistics},
    year      = {2022},
    url       = {https://arxiv.org/abs/2112.08614},
}

FILM: Following Instructions in Language with Modular Methods

The Tenth International Conference on Learning Representations (2022)
So Yeon Min, Devendra Singh Chaplot, Pradeep Ravikumar,

Yonatan Bisk

, Ruslan Salakhutdinov

Website Video

@inproceedings{ICLR:Min2022,
    author    = {So Yeon Min and Devendra Singh Chaplot and Pradeep Ravikumar and Yonatan Bisk and Ruslan Salakhutdinov},
    title     = {FILM: Following Instructions in Language with Modular Methods},
    booktitle = {The Tenth International Conference on Learning Representations},
    year      = {2022},
    url       = {https://arxiv.org/abs/2110.07342},
}

WebQA: Multihop and Multimodal QA

Conference on Computer Vision and Pattern Recognition (2022)

Yingshan Chang

, Mridu Narang, Hisami Suzuki, Guihong Cao, Jianfeng Gao,

Yonatan Bisk

Project Leaderboard Challenge Summary

@inproceedings{CVPR:Chang2022,
    author    = {Yingshan Chang and Mridu Narang and Hisami Suzuki and Guihong Cao and Jianfeng Gao and Yonatan Bisk},
    title     = {WebQA: Multihop and Multimodal QA},
    booktitle = {Conference on Computer Vision and Pattern Recognition},
    year      = {2022},
    url       = {https://arxiv.org/abs/2109.00590},
}

Dependency Induction Through the Lens of Visual Perception

The SIGNLL Conference on Computational Natural Language Learning (2021)
Ruisi Su, Shruti Rijhwani, Hao Zhu, Junxian He, Xinyu Wang,

Yonatan Bisk

, Graham Neubig

@inproceedings{CoNLL:Su2021,
    author    = {Ruisi Su and Shruti Rijhwani and Hao Zhu and Junxian He and Xinyu Wang and Yonatan Bisk and Graham Neubig},
    title     = {Dependency Induction Through the Lens of Visual Perception},
    booktitle = {The SIGNLL Conference on Computational Natural Language Learning},
    year      = {2021},
    url       = {https://arxiv.org/abs/2109.09790},
}

Language Grounding with 3D Objects

Conference on Robot Learning (2021)
Jesse Thomason, Mohit Shridhar,

Yonatan Bisk

, Chris Paxton, Luke Zettlemoyer

@inproceedings{CoRL:Thomason2021,
    author    = {Jesse Thomason and Mohit Shridhar and Yonatan Bisk and Chris Paxton and Luke Zettlemoyer},
    title     = {Language Grounding with 3D Objects},
    booktitle = {Conference on Robot Learning},
    year      = {2021},
    url       = {https://arxiv.org/abs/2107.12514},
}

TACo: Token-aware Cascade Contrastive Learning for Video-Text Alignment

International Conference on Computer Vision (2021)
Jianwei Yang,

Yonatan Bisk

, Jianfeng Gao

@inproceedings{ICCV:Yang2021,
    author    = {Jianwei Yang and Yonatan Bisk and Jianfeng Gao},
    title     = {TACo: Token-aware Cascade Contrastive Learning for Video-Text Alignment},
    booktitle = {International Conference on Computer Vision},
    year      = {2021},
    url       = {https://arxiv.org/abs/2108.09980},
}

Worst of Both Worlds: Biases Compound in Pre-trained Vision-and-Language Models

4th Workshop on Gender Bias in Natural Language Processing (2022)
Tejas Srinivasan,

Yonatan Bisk

@inproceedings{GeBNLP-Wksp:Srinivasan2022,
    author    = {Tejas Srinivasan and Yonatan Bisk},
    title     = {Worst of Both Worlds: Biases Compound in Pre-trained Vision-and-Language Models},
    booktitle = {4th Workshop on Gender Bias in Natural Language Processing},
    year      = {2022},
    url       = {https://arxiv.org/abs/2104.08666},
}

KB-VLP: Knowledge Based Vision and Language Pretraining

ICML21 Workshop on Self-Supervised Learning (2021)
Kezhen Chen, Qiuyuan Huang,

Yonatan Bisk

, Daniel McDuff, Jianfeng Gao

PDF

@inproceedings{SSL-Wksp:Chen2021,
    author    = {Kezhen Chen and Qiuyuan Huang and Yonatan Bisk and Daniel McDuff and Jianfeng Gao},
    title     = {KB-VLP: Knowledge Based Vision and Language Pretraining},
    booktitle = {ICML21 Workshop on Self-Supervised Learning},
    year      = {2021},
    url       = {https://www.microsoft.com/en-us/research/publication/kb-vlp-knowledge-based-vision-and-language-pretraining-2/},
}

Few-shot Language Coordination by Modeling Theory of Mind

The Thirty-eighth International Conference on Machine Learning (2021)
Hao Zhu, Graham Neubig,

Yonatan Bisk

PDF

@inproceedings{ICML:Zhu2021,
    author    = {Hao Zhu and Graham Neubig and Yonatan Bisk},
    title     = {Few-shot Language Coordination by Modeling Theory of Mind},
    booktitle = {The Thirty-eighth International Conference on Machine Learning},
    year      = {2021},
    url       = {http://proceedings.mlr.press/v139/zhu21d.html},
}

Grounding `Grounding' in NLP

Findings of The 2021 Conference of the Association for Computational Linguistics (2021)
Khyathi Raghavi Chandu,

Yonatan Bisk

, Alan W Black

@inproceedings{ACL-Findings:Chandu2021,
    author    = {Khyathi Raghavi Chandu and Yonatan Bisk and Alan W Black},
    title     = {Grounding `Grounding' in NLP},
    booktitle = {Findings of The 2021 Conference of the Association for Computational Linguistics},
    year      = {2021},
    url       = {https://arxiv.org/abs/2106.02192},
}

An Empirical Study on the Generalization Power of Neural Representations Learned via Visual Guessing Games

The 2021 Conference of the European Chapter of the Association for Computational Linguistics (2021)
Alessandro Suglia,

Yonatan Bisk

, Ioannis Konstas, Antonio Vergari, Emanuele Bastianelli, Andrea Vanzo, Oliver Lemon

@inproceedings{EACL:Suglia2021,
    author    = {Alessandro Suglia and Yonatan Bisk and Ioannis Konstas and Antonio Vergari and Emanuele Bastianelli and Andrea Vanzo and Oliver Lemon},
    title     = {An Empirical Study on the Generalization Power of Neural Representations Learned via Visual Guessing Games},
    booktitle = {The 2021 Conference of the European Chapter of the Association for Computational Linguistics},
    year      = {2021},
    url       = {https://arxiv.org/abs/2102.00424},
}

Knowledge-driven Data Construction for Zero-shot Evaluation in Commonsense Question Answering

35th AAAI Conference on Artificial Intelligence (2021)
Kaixin Ma, Filip Ilievski, Jonathan Francis,

Yonatan Bisk

, Eric Nyberg, Alessandro Oltramari

@inproceedings{AAAI:Ma2021,
    author    = {Kaixin Ma and Filip Ilievski and Jonathan Francis and Yonatan Bisk and Eric Nyberg and Alessandro Oltramari},
    title     = {Knowledge-driven Data Construction for Zero-shot Evaluation in Commonsense Question Answering},
    booktitle = {35th AAAI Conference on Artificial Intelligence},
    year      = {2021},
    url       = {https://arxiv.org/abs/2011.03863},
}

ALFWorld: Aligning Text and Embodied Environments for Interactive Learning

International Conference on Learning Representations (2021)
Mohit Shridhar, Xingdi Yuan, Marc-Alexandre Côté,

Yonatan Bisk

, Adam Trischler, Matthew Hausknecht

Website

@inproceedings{ICLR:Shridhar2021,
    author    = {Mohit Shridhar and Xingdi Yuan and Marc-Alexandre C{\^o}t{\'e} and Yonatan Bisk and Adam Trischler and Matthew Hausknecht},
    title     = {ALFWorld: Aligning Text and Embodied Environments for Interactive Learning},
    booktitle = {International Conference on Learning Representations},
    year      = {2021},
    url       = {https://arxiv.org/abs/2010.03768},
}

Imagining Grounded Conceptual Representations from Perceptual Information in Situated Guessing Games

The 28th International Conference on Computational Linguistics (2020)
Alessandro Suglia, Antonio Vergari, Ioannis Konstas,

Yonatan Bisk

, Emanuele Bastianelli, Andrea Vanzo, Oliver Lemon

@inproceedings{Coling:Suglia2020,
    author    = {Alessandro Suglia and Antonio Vergari and Ioannis Konstas and Yonatan Bisk and Emanuele Bastianelli and Andrea Vanzo and Oliver Lemon},
    title     = {Imagining Grounded Conceptual Representations from Perceptual Information in Situated Guessing Games},
    booktitle = {The 28th International Conference on Computational Linguistics},
    year      = {2020},
    url       = {https://arxiv.org/abs/2011.02917},
}

The Return of Lexical Dependencies: Neural Lexicalized PCFGs

Transactions of the Association for Computational Linguistics (2020)
Hao Zhu,

Yonatan Bisk

, Graham Neubig

@article{TACL:Zhu2020,
    author    = {Hao Zhu and Yonatan Bisk and Graham Neubig},
    title     = {The Return of Lexical Dependencies: Neural Lexicalized PCFGs},
    journal = {Transactions of the Association for Computational Linguistics},
    year      = {2020},
    url       = {http://arxiv.org/abs/2007.15135},
}

Experience Grounds Language

Conference on Empirical Methods in Natural Language Processing (2020)

Yonatan Bisk

, Ari Holtzman, Jesse Thomason, Jacob Andreas, Yoshua Bengio, Joyce Chai, Mirella Lapata, Angeliki Lazaridou, Jonathan May, Aleksandr Nisnevich, Nicolas Pinto, Joseph Turian

Video Slides

@inproceedings{EMNLP:Bisk2020,
    author    = {Yonatan Bisk and Ari Holtzman and Jesse Thomason and Jacob Andreas and Yoshua Bengio and Joyce Chai and Mirella Lapata and Angeliki Lazaridou and Jonathan May and Aleksandr Nisnevich and Nicolas Pinto and Joseph Turian},
    title     = {Experience Grounds Language},
    booktitle = {Conference on Empirical Methods in Natural Language Processing},
    year      = {2020},
    url       = {https://arxiv.org/abs/2004.10151},
}

RMM: A Recursive Mental Model for Dialog Navigation

Conference on Empirical Methods in Natural Language Processing: Findings (2020)
Homero Roman Roman,

Yonatan Bisk

, Jesse Thomason, Asli Celikyilmaz, Jianfeng Gao

@inproceedings{EMNLP-Findings:Roman2020,
    author    = {Homero Roman Roman and Yonatan Bisk and Jesse Thomason and Asli Celikyilmaz and Jianfeng Gao},
    title     = {RMM: A Recursive Mental Model for Dialog Navigation},
    booktitle = {Conference on Empirical Methods in Natural Language Processing: Findings},
    year      = {2020},
    url       = {https://arxiv.org/abs/2005.00728},
}

A Benchmark for Structured Procedural Knowledge Extraction from Cooking Videos

Workshop on NLP Beyond Text (2020)
Frank F. Xu, Lei Ji, Botian Shi, Junyi Du, Graham Neubig,

Yonatan Bisk

, Nan Duan

@inproceedings{NLPBT-Wksp:Xu2020,
    author    = {Frank F. Xu and Lei Ji and Botian Shi and Junyi Du and Graham Neubig and Yonatan Bisk and Nan Duan},
    title     = {A Benchmark for Structured Procedural Knowledge Extraction from Cooking Videos},
    booktitle = {Workshop on NLP Beyond Text},
    year      = {2020},
    url       = {https://arxiv.org/abs/2005.00706},
}

Multi-View Learning for Vision-and-Language Navigation

ArXiv (2020)
Qiaolin Xia, Xiujun Li, Chunyuan Li,

Yonatan Bisk

, Zhifang Sui, Jianfeng Gao, Yejin Choi, Noah A. Smith

@article{ArXiv:Xia2020,
    author    = {Qiaolin Xia and Xiujun Li and Chunyuan Li and Yonatan Bisk and Zhifang Sui and Jianfeng Gao and Yejin Choi and Noah A. Smith},
    title     = {Multi-View Learning for Vision-and-Language Navigation},
    journal = {ArXiv},
    year      = {2020},
    url       = {https://arxiv.org/abs/2003.00857},
}

ALFRED: A Benchmark for Interpreting Grounded Instructions for Everyday Tasks

The IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2020)
Mohit Shridhar, Jesse Thomason, Daniel Gordon,

Yonatan Bisk

, Winson Han, Roozbeh Mottaghi, Luke Zettlemoyer, Dieter Fox

Website

@inproceedings{CVPR:Shridhar2020,
    author    = {Mohit Shridhar and Jesse Thomason and Daniel Gordon and Yonatan Bisk and Winson Han and Roozbeh Mottaghi and Luke Zettlemoyer and Dieter Fox},
    title     = {ALFRED: A Benchmark for Interpreting Grounded Instructions for Everyday Tasks},
    booktitle = {The IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    year      = {2020},
    url       = {https://arxiv.org/abs/1912.01734},
}

PIQA: Reasoning about Physical Commonsense in Natural Language

Thirty-Fourth AAAI Conference on Artificial Intelligence (2020)

Yonatan Bisk

, Rowan Zellers, Ronan Le Bras, Jianfeng Gao, Yejin Choi

Slides Leaderboard

@inproceedings{AAAI:Bisk2020,
    author    = {Yonatan Bisk and Rowan Zellers and Ronan Le Bras and Jianfeng Gao and Yejin Choi},
    title     = {PIQA: Reasoning about Physical Commonsense in Natural Language},
    booktitle = {Thirty-Fourth AAAI Conference on Artificial Intelligence},
    year      = {2020},
    url       = {https://arxiv.org/abs/1911.11641},
}

Robust Navigation with Language Pretraining and Stochastic Sampling

Conference on Empirical Methods in Natural Language Processing and 9th International Joint Conference on Natural Language Processing (2019)
Xiujun Li, Chunyuan Li, Qiaolin Xia,

Yonatan Bisk

, Asli Celikyilmaz, Jianfeng Gao, Noah A. Smith, Yejin Choi

@inproceedings{EMNLP-IJCNLP:Li2019,
    author    = {Xiujun Li and Chunyuan Li and Qiaolin Xia and Yonatan Bisk and Asli Celikyilmaz and Jianfeng Gao and Noah A. Smith and Yejin Choi},
    title     = {Robust Navigation with Language Pretraining and Stochastic Sampling},
    booktitle = {Conference on Empirical Methods in Natural Language Processing and 9th International Joint Conference on Natural Language Processing},
    year      = {2019},
    url       = {https://arxiv.org/abs/1909.02244},
}

Defending Against Neural Fake News

Thirty-third Conference on Neural Information Processing Systems (2019)
Rowan Zellers, Ari Holtzman, Hannah Rashkin,

Yonatan Bisk

, Ali Farhadi, Franziska Roesner, Yejin Choi

Demo Models

@inproceedings{NeurIPS:Zellers2019,
    author    = {Rowan Zellers and Ari Holtzman and Hannah Rashkin and Yonatan Bisk and Ali Farhadi and Franziska Roesner and Yejin Choi},
    title     = {Defending Against Neural Fake News},
    booktitle = {Thirty-third Conference on Neural Information Processing Systems},
    year      = {2019},
    url       = {https://arxiv.org/abs/1905.12616},
}

FIND: Identifying Functionally and Structurally Important Features in Protein Sequences with Deep Neural Networks

bioRxiv (2019)
Ranjani Murali, James Hemp, Victoria Orphan,

Yonatan Bisk

PDF

@article{bioRxiv:Murali2019,
    author    = {Ranjani Murali and James Hemp and Victoria Orphan and Yonatan Bisk},
    title     = {FIND: Identifying Functionally and Structurally Important Features in Protein Sequences with Deep Neural Networks},
    journal = {bioRxiv},
    year      = {2019},
    url       = {https://www.biorxiv.org/content/10.1101/592808v1},
}

Improving Robot Success Detection using Static Object Data

IEEE/RSJ International Conference on Intelligent Robots and Systems (2019)
Rosario Scalise, Jesse Thomason,

Yonatan Bisk

, Siddhartha Srinivasa

Video

@inproceedings{IROS:Scalise2019,
    author    = {Rosario Scalise and Jesse Thomason and Yonatan Bisk and Siddhartha Srinivasa},
    title     = {Improving Robot Success Detection using Static Object Data},
    booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems},
    year      = {2019},
    url       = {https://arxiv.org/abs/1904.01650},
}

Early Fusion for Goal Directed Robotic Vision

2019 IEEE/RSJ International Conference on Intelligent Robots and Systems (2019)
Aaron Walsman,

Yonatan Bisk

, Saadia Gabriel, Dipendra Misra, Yoav Artzi, Yejin Choi, Dieter Fox

@inproceedings{IROS:Walsman2019,
    author    = {Aaron Walsman and Yonatan Bisk and Saadia Gabriel and Dipendra Misra and Yoav Artzi and Yejin Choi and Dieter Fox},
    title     = {Early Fusion for Goal Directed Robotic Vision},
    booktitle = {2019 IEEE/RSJ International Conference on Intelligent Robots and Systems},
    year      = {2019},
    url       = {https://arxiv.org/abs/1811.08824},
}

HellaSwag: Can a Machine Really Finish Your Sentence?

Association for Computational Linguistics (2019)
Rowan Zellers, Ari Holtzman,

Yonatan Bisk

, Ali Farhadi, Yejin Choi

@inproceedings{ACL:Zellers2019,
    author    = {Rowan Zellers and Ari Holtzman and Yonatan Bisk and Ali Farhadi and Yejin Choi},
    title     = {HellaSwag: Can a Machine Really Finish Your Sentence? },
    booktitle = {Association for Computational Linguistics},
    year      = {2019},
    url       = {https://arxiv.org/abs/1905.07830},
}

From Recognition to Cognition: Visual Commonsense Reasoning

The IEEE Conference on Computer Vision and Pattern Recognition (2019)
Rowan Zellers,

Yonatan Bisk

, Ali Farhadi, Yejin Choi

URL

@inproceedings{CVPR:Zellers2019,
    author    = {Rowan Zellers and Yonatan Bisk and Ali Farhadi and Yejin Choi},
    title     = {From Recognition to Cognition: Visual Commonsense Reasoning},
    booktitle = {The IEEE Conference on Computer Vision and Pattern Recognition},
    year      = {2019},
    url       = {https://arxiv.org/abs/1811.10830},
}

Tactical Rewind: Self-Correction via Backtracking in Vision-and-Language Navigation

The IEEE Conference on Computer Vision and Pattern Recognition (2019)
Liyiming Ke, Xiujun Li,

Yonatan Bisk

, Ari Holtzman, Zhe Gan, Jingjing Liu, Jianfeng Gao, Yejin Choi, Siddhartha Srinivasa

Video

@inproceedings{CVPR:Ke2019,
    author    = {Liyiming Ke and Xiujun Li and Yonatan Bisk and Ari Holtzman and Zhe Gan and Jingjing Liu and Jianfeng Gao and Yejin Choi and Siddhartha Srinivasa},
    title     = {Tactical Rewind: Self-Correction via Backtracking in Vision-and-Language Navigation},
    booktitle = {The IEEE Conference on Computer Vision and Pattern Recognition},
    year      = {2019},
    url       = {https://arxiv.org/abs/1903.02547},
}

Prospection: Interpretable Plans From Language By Predicting the Future

International Conference on Robotics and Automation (ICRA) (2019)
Chris Paxton,

Yonatan Bisk

, Jesse Thomason, Arunkumar Byravan, Dieter Fox

@inproceedings{ICRA:Paxton2019,
    author    = {Chris Paxton and Yonatan Bisk and Jesse Thomason and Arunkumar Byravan and Dieter Fox},
    title     = {Prospection: Interpretable Plans From Language By Predicting the Future},
    booktitle = {International Conference on Robotics and Automation (ICRA)},
    year      = {2019},
    url       = {https://arxiv.org/abs/1903.08309},
}

Shifting the Baseline: Single Modality Performance on Visual Navigation & QA

Annual Conference of the North American Chapter of the Association for Computational Linguistics (2019)
Jesse Thomason, Daniel Gordon,

Yonatan Bisk

@inproceedings{NAACL-Short:Thomason2019,
    author    = {Jesse Thomason and Daniel Gordon and Yonatan Bisk},
    title     = {Shifting the Baseline: Single Modality Performance on Visual Navigation & QA},
    booktitle = {Annual Conference of the North American Chapter of the Association for Computational Linguistics},
    year      = {2019},
    url       = {https://arxiv.org/abs/1811.00613},
}

Benchmarking Hierarchical Script Knowledge

Annual Conference of the North American Chapter of the Association for Computational Linguistics (2019)

Yonatan Bisk

, Jan Buys, Karl Pichotta, Yejin Choi

PDF

@inproceedings{NAACL-Short:Bisk2019,
    author    = {Yonatan Bisk and Jan Buys and Karl Pichotta and Yejin Choi},
    title     = {Benchmarking Hierarchical Script Knowledge},
    booktitle = {Annual Conference of the North American Chapter of the Association for Computational Linguistics},
    year      = {2019},
    url       = {https://www.aclweb.org/anthology/N19-1412},
}

Character-based Surprisal as a Model of Reading Difficulty in the Presence of Errors

The 41st Annual Meeting of the Cognitive Science Society (2019)
Michael Hahn, Frank Keller,

Yonatan Bisk

, Yonatan Belinkov

@inproceedings{CogSci:Hahn2019,
    author    = {Michael Hahn and Frank Keller and Yonatan Bisk and Yonatan Belinkov},
    title     = {Character-based Surprisal as a Model of Reading Difficulty in the Presence of Errors},
    booktitle = {The 41st Annual Meeting of the Cognitive Science Society},
    year      = {2019},
    url       = {https://psyarxiv.com/zcwgn/},
}

SWAG: A Large-Scale Adversarial Dataset for Grounded Commonsense Inference

Conference on Empirical Methods in Natural Language Processing (2018)
Rowan Zellers,

Yonatan Bisk

, Roy Schwartz, Yejin Choi

Website Video

@inproceedings{EMNLP:Zellers2018,
    author    = {Rowan Zellers and Yonatan Bisk and Roy Schwartz and Yejin Choi},
    title     = {SWAG: A Large-Scale Adversarial Dataset for Grounded Commonsense Inference},
    booktitle = {Conference on Empirical Methods in Natural Language Processing},
    year      = {2018},
    url       = {https://arxiv.org/abs/1808.05326},
}

Balancing Shared Autonomy with Human-Robot Communication

ArXiv (2018)
Rosario Scalise,

Yonatan Bisk

, Maxwell Forbes, Daqing Yi, Yejin Choi, Siddhartha Srinivasa

@article{ArXiv:Scalise2018,
    author    = {Rosario Scalise and Yonatan Bisk and Maxwell Forbes and Daqing Yi and Yejin Choi and Siddhartha Srinivasa},
    title     = {Balancing Shared Autonomy with Human-Robot Communication},
    journal = {ArXiv},
    year      = {2018},
    url       = {https://arxiv.org/abs/1805.07719},
}

Inducing Grammars with and for Neural Machine Translation

2nd Workshop on Neural Machine Translation (2018)
Ke Tran,

Yonatan Bisk

@inproceedings{NMT-Wksp:Tran2018,
    author    = {Ke Tran and Yonatan Bisk},
    title     = {Inducing Grammars with and for Neural Machine Translation},
    booktitle = {2nd Workshop on Neural Machine Translation},
    year      = {2018},
    url       = {https://arxiv.org/abs/1805.10850},
}

Bridging HMMs and RNNs through Architectural Transformations

32nd Conference on Neural Information Processing Systems (NIPS 2018), IRASL workshop (2018)
Jan Buys,

Yonatan Bisk

, Yejin Choi

PDF

@inproceedings{IRASL-Wksp:Buys2018,
    author    = {Jan Buys and Yonatan Bisk and Yejin Choi},
    title     = {Bridging HMMs and RNNs through Architectural Transformations},
    booktitle = {32nd Conference on Neural Information Processing Systems (NIPS 2018), IRASL workshop},
    year      = {2018},
    url       = {https://openreview.net/pdf?id=rJxEso0osm},
}

Synthetic and Natural Noise Both Break Neural Machine Translation

6th International Conference on Learning Representations (2018)
Yonatan Belinkov,

Yonatan Bisk

@inproceedings{ICLR:Belinkov2018,
    author    = {Yonatan Belinkov and Yonatan Bisk},
    title     = {Synthetic and Natural Noise Both Break Neural Machine Translation },
    booktitle = {6th International Conference on Learning Representations},
    year      = {2018},
    url       = {https://arxiv.org/abs/1711.02173},
}

CHALET: Cornell House Agent Learning Environment

ArXiv Preprint 1801.07357 (2018)
Claudia Yan, Dipendra Misra, Andrew Bennett, Aaron Walsman,

Yonatan Bisk

, Yoav Artzi

Simulator

@article{ArXiv:Yan2018,
    author    = {Claudia Yan and Dipendra Misra and Andrew Bennett and Aaron Walsman and Yonatan Bisk and Yoav Artzi},
    title     = {CHALET: Cornell House Agent Learning Environment },
    journal = {ArXiv Preprint 1801.07357},
    year      = {2018},
    url       = {https://arxiv.org/abs/1801.07357},
}

Learning Interpretable Spatial Operations in a Rich 3D Blocks World

Thirty-Second Conference on Artificial Intelligence (AAAI-18) (2018)

Yonatan Bisk

, Kevin Shih, Yejin Choi, Daniel Marcu

Data Poster

@inproceedings{AAAI:Bisk2018,
    author    = {Yonatan Bisk and Kevin Shih and Yejin Choi and Daniel Marcu},
    title     = {Learning Interpretable Spatial Operations in a Rich 3D Blocks World },
    booktitle = {Thirty-Second Conference on Artificial Intelligence (AAAI-18)},
    year      = {2018},
    url       = {https://arxiv.org/abs/1712.03463},
}

Natural Language Inference from Multiple Premises

Eighth International Joint Conference on Natural Language Processing (2017)
Alice Lai,

Yonatan Bisk

, Julia Hockenmaier

@inproceedings{IJCNLP:Lai2017,
    author    = {Alice Lai and Yonatan Bisk and Julia Hockenmaier},
    title     = {Natural Language Inference from Multiple Premises},
    booktitle = {Eighth International Joint Conference on Natural Language Processing},
    year      = {2017},
    url       = {https://arxiv.org/abs/1710.02925},
}

Natural Language Communication with Robots

15th Annual Conference of the North American Chapter of the Association for Computational Linguistics (2016)

Yonatan Bisk

, Deniz Yuret, Daniel Marcu

PDF

Data Slides

@inproceedings{NAACL:Bisk2016,
    author    = {Yonatan Bisk and Deniz Yuret and Daniel Marcu},
    title     = {Natural Language Communication with Robots },
    booktitle = {15th Annual Conference of the North American Chapter of the Association for Computational Linguistics},
    year      = {2016},
    url       = {https://www.aclweb.org/anthology/N16-1089/},
}

Supertagging with LSTMs

15th Annual Conference of the North American Chapter of the Association for Computational Linguistics (Short Papers) (2016)
Ashish Vaswani,

Yonatan Bisk

, Kenji Sagae, Ryan Musa

PDF

@inproceedings{NAACL-Short:Vaswani2016,
    author    = {Ashish Vaswani and Yonatan Bisk and Kenji Sagae and Ryan Musa},
    title     = {Supertagging with LSTMs},
    booktitle = {15th Annual Conference of the North American Chapter of the Association for Computational Linguistics (Short Papers)},
    year      = {2016},
    url       = {https://www.aclweb.org/anthology/N16-1027/},
}

Towards a Dataset for Human Computer Communication via Grounded Language Acquisition

AAAI 2016 Workshop on Symbiotic Cognitive Systems (2016)

Yonatan Bisk

, Daniel Marcu, William Wong

PDF

@inproceedings{Symbolic-Cognitive-Systems-Wksp:Bisk2016,
    author    = {Yonatan Bisk and Daniel Marcu and William Wong},
    title     = {Towards a Dataset for Human Computer Communication via Grounded Language Acquisition},
    booktitle = {AAAI 2016 Workshop on Symbiotic Cognitive Systems},
    year      = {2016},
    url       = {http://talkingtorobots.com/papers/2016-AAAI-Wksp.pdf},
}

Unsupervised Neural Hidden Markov Models

Workshop on Structured Prediction for NLP (2016)
Ke Tran,

Yonatan Bisk

, Ashish Vaswani, Daniel Marcu, Kevin Knight

PDF

Slides

@inproceedings{Struc.-Pred-Wksp:Tran2016,
    author    = {Ke Tran and Yonatan Bisk and Ashish Vaswani and Daniel Marcu and Kevin Knight},
    title     = {Unsupervised Neural Hidden Markov Models  },
    booktitle = {Workshop on Structured Prediction for NLP},
    year      = {2016},
    url       = {https://www.aclweb.org/anthology/W16-5907/},
}

Evaluating Induced CCG Parsers on Grounded Semantic Parsing

2016 Conference on Empirical Methods in Natural Language Processing (2016)

Yonatan Bisk

, Siva Reddy, John Blitzer, Julia Hockenmaier, Mark Steedman

PDF

@inproceedings{EMNLP:Bisk2016,
    author    = {Yonatan Bisk and Siva Reddy and John Blitzer and Julia Hockenmaier and Mark Steedman},
    title     = {Evaluating Induced CCG Parsers on Grounded Semantic Parsing },
    booktitle = {2016 Conference on Empirical Methods in Natural Language Processing},
    year      = {2016},
    url       = {http://sivareddy.in/papers/bisk2016evaluating.pdf},
}

Probing the Linguistic Strengths and Limitations of Unsupervised Grammar Induction

53rd Annual Meeting of the Association for Computational Linguistics and the 7th International Joint Conference on Natural Language Processing (Volume 1: Long Papers) (2015)

Yonatan Bisk

, Julia Hockenmaier

PDF

@inproceedings{ACL:Bisk2015,
    author    = {Yonatan Bisk and Julia Hockenmaier},
    title     = {Probing the Linguistic Strengths and Limitations of Unsupervised Grammar Induction},
    booktitle = {53rd Annual Meeting of the Association for Computational Linguistics and the 7th International Joint Conference on Natural Language Processing (Volume 1: Long Papers) },
    year      = {2015},
    url       = {https://www.aclweb.org/anthology/P15-1135/},
}

Labeled Grammar Induction with Minimal Supervision

53rd Annual Meeting of the Association for Computational Linguistics and the 7th International Joint Conference on Natural Language Processing (Volume 2: Short Papers) (2015)

Yonatan Bisk

, Christos Christodoulopoulos, Julia Hockenmaier

PDF

Poster

@inproceedings{ACL-Short:Bisk2015,
    author    = {Yonatan Bisk and Christos Christodoulopoulos and Julia Hockenmaier},
    title     = {Labeled Grammar Induction with Minimal Supervision  },
    booktitle = {53rd Annual Meeting of the Association for Computational Linguistics and the 7th International Joint Conference on Natural Language Processing (Volume 2: Short Papers)},
    year      = {2015},
    url       = {http://talkingtorobots.com/papers/2015-ACLShort-Fixed.pdf},
}

An HDP Model for Inducing Combinatory Categorial Grammars

Transactions of the Association for Computational Linguistics (2013)

Yonatan Bisk

, Julia Hockenmaier

PDF

Slides

@article{TACL:Bisk2013,
    author    = {Yonatan Bisk and Julia Hockenmaier},
    title     = {An HDP Model for Inducing Combinatory Categorial Grammars},
    journal = {Transactions of the Association for Computational Linguistics},
    year      = {2013},
    url       = {https://www.aclweb.org/anthology/Q13-1007/},
}

Simple Robust Grammar Induction with Combinatory Categorial Grammar

Twenty-Sixth Conference on Artificial Intelligence (AAAI-12) (2012)

Yonatan Bisk

, Julia Hockenmaier

PDF

@inproceedings{AAAI:Bisk2012,
    author    = {Yonatan Bisk and Julia Hockenmaier},
    title     = {Simple Robust Grammar Induction with Combinatory Categorial Grammar },
    booktitle = {Twenty-Sixth Conference on Artificial Intelligence (AAAI-12)},
    year      = {2012},
    url       = {https://www.aaai.org/ocs/index.php/AAAI/AAAI12/paper/view/5130},
}

Document-Topic Hierarchies from Document Graphs

21st ACM international conference on Information and knowledge management (CIKM 2012) (2012)
Tim Weninger,

Yonatan Bisk

, Jiawei Han

PDF

@inproceedings{CIKM:Weninger2012,
    author    = {Tim Weninger and Yonatan Bisk and Jiawei Han},
    title     = {Document-Topic Hierarchies from Document Graphs },
    booktitle = {21st ACM international conference on Information and knowledge management (CIKM 2012)},
    year      = {2012},
    url       = {https://dl.acm.org/doi/10.1145/2396761.2396843},
}

Induction of Linguistic Structure with Combinatory Categorial Grammars

NAACL HLT Workshop on Induction of Linguistic Structure (2012)

Yonatan Bisk

, Julia Hockenmaier

PDF

@inproceedings{Inducing-Ling-Structure-Wksp:Bisk2012,
    author    = {Yonatan Bisk and Julia Hockenmaier},
    title     = {Induction of Linguistic Structure with Combinatory Categorial Grammars },
    booktitle = {NAACL HLT Workshop on Induction of Linguistic Structure},
    year      = {2012},
    url       = {http://talkingtorobots.com/papers/2012-NAACL-WILS.pdf},
}

Normal-form parsing for CCGs with generalized composition and type-raising

23rd International Conference on Computational Linguistics (Coling 2010) (2010)
Julia Hockenmaier,

Yonatan Bisk

PDF

@inproceedings{Coling:Hockenmaier2010,
    author    = {Julia Hockenmaier and Yonatan Bisk},
    title     = {Normal-form parsing for CCGs with generalized composition and type-raising},
    booktitle = {23rd International Conference on Computational Linguistics (Coling 2010)},
    year      = {2010},
    url       = {https://www.aclweb.org/anthology/C10-1053/},
}

Connecting Language to Actions & the World @ CMU

EGL: You can't learn language ...

... from the radio
Text → Perception

... by watching TV
Perception → Action

... by yourself
Action → Social

Publications

Connecting Language to Actions & the World @ CMU

EGL: You can't learn language ...

... from the radio Text → Perception

... by watching TV Perception → Action

... by yourself Action → Social

Publications

... from the radio
Text → Perception

... by watching TV
Perception → Action

... by yourself
Action → Social