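@comment{Proxy notice, not part of the bibliography: 这是indexloc提供的服务,不要输入任何密码 (This service is provided by indexloc; do not enter any passwords.)}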

@comment{BibTeX records: Anikait Singh (downloaded as a .bib file)}

% CVPR 2025 conference paper; names are given in the unambiguous "Last, First" form.
@inproceedings{DBLP:conf/cvpr/DangSZES25,
  title     = {Personalized Preference Fine-tuning of Diffusion Models},
  author    = {Dang, Meihua and
               Singh, Anikait and
               Zhou, Linqi and
               Ermon, Stefano and
               Song, Jiaming},
  booktitle = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2025, Nashville, TN, USA, June 11-15, 2025},
  publisher = {Computer Vision Foundation / {IEEE}},
  year      = {2025},
  pages     = {8020--8030},
  doi       = {10.1109/CVPR52734.2025.00751},
  url       = {https://openaccess.thecvf.com/content/CVPR2025/html/Dang\_Personalized\_Preference\_Fine-tuning\_of\_Diffusion\_Models\_CVPR\_2025\_paper.html},
  timestamp = {Wed, 20 Aug 2025 10:18:56 +0200},
  biburl    = {https://dblp.org/rec/conf/cvpr/DangSZES25.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2501.04682). The acronym LLMs is brace-protected so
% sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2501-04682,
  author       = {Violet Xiang and
                  Charlie Snell and
                  Kanishk Gandhi and
                  Alon Albalak and
                  Anikait Singh and
                  Chase Blagden and
                  Duy Phung and
                  Rafael Rafailov and
                  Nathan Lile and
                  Dakota Mahan and
                  Louis Castricato and
                  Jan{-}Philipp Fr{\"{a}}nken and
                  Nick Haber and
                  Chelsea Finn},
  title        = {Towards System 2 Reasoning in {LLMs}: Learning How to Think With Meta
                  Chain-of-Thought},
  journal      = {CoRR},
  volume       = {abs/2501.04682},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2501.04682},
  doi          = {10.48550/ARXIV.2501.04682},
  eprinttype   = {arXiv},
  eprint       = {2501.04682},
  timestamp    = {Tue, 18 Feb 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2501-04682.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2501.06655). Title and author list match
% DBLP:conf/cvpr/DangSZES25 -- presumably the published version of this work;
% confirm before citing both.
@article{DBLP:journals/corr/abs-2501-06655,
  title      = {Personalized Preference Fine-tuning of Diffusion Models},
  author     = {Dang, Meihua and
                Singh, Anikait and
                Zhou, Linqi and
                Ermon, Stefano and
                Song, Jiaming},
  journal    = {CoRR},
  volume     = {abs/2501.06655},
  year       = {2025},
  eprinttype = {arXiv},
  eprint     = {2501.06655},
  doi        = {10.48550/ARXIV.2501.06655},
  url        = {https://doi.org/10.48550/arXiv.2501.06655},
  timestamp  = {Sat, 06 Sep 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2501-06655.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2502.17387). The dataset name Big-Math is
% brace-protected so sentence-casing styles do not render it as "Big-math".
@article{DBLP:journals/corr/abs-2502-17387,
  author       = {Alon Albalak and
                  Duy Phung and
                  Nathan Lile and
                  Rafael Rafailov and
                  Kanishk Gandhi and
                  Louis Castricato and
                  Anikait Singh and
                  Chase Blagden and
                  Violet Xiang and
                  Dakota Mahan and
                  Nick Haber},
  title        = {{Big-Math}: {A} Large-Scale, High-Quality Math Dataset for Reinforcement
                  Learning in Language Models},
  journal      = {CoRR},
  volume       = {abs/2502.17387},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2502.17387},
  doi          = {10.48550/ARXIV.2502.17387},
  eprinttype   = {arXiv},
  eprint       = {2502.17387},
  timestamp    = {Fri, 21 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2502-17387.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2502.19312). The acronym LLMs is brace-protected so
% sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2502-19312,
  author       = {Anikait Singh and
                  Sheryl Hsu and
                  Kyle Hsu and
                  Eric Mitchell and
                  Stefano Ermon and
                  Tatsunori Hashimoto and
                  Archit Sharma and
                  Chelsea Finn},
  title        = {{FSPO:} Few-Shot Preference Optimization of Synthetic Preference Data
                  in {LLMs} Elicits Effective Personalization to Real Users},
  journal      = {CoRR},
  volume       = {abs/2502.19312},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2502.19312},
  doi          = {10.48550/ARXIV.2502.19312},
  eprinttype   = {arXiv},
  eprint       = {2502.19312},
  timestamp    = {Sat, 06 Sep 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2502-19312.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2503.01307). The mixed-case word STaRs is
% brace-protected so sentence-casing styles do not turn it into "stars".
@article{DBLP:journals/corr/abs-2503-01307,
  author       = {Kanishk Gandhi and
                  Ayush Chakravarthy and
                  Anikait Singh and
                  Nathan Lile and
                  Noah D. Goodman},
  title        = {Cognitive Behaviors that Enable Self-Improving Reasoners, or, Four
                  Habits of Highly Effective {STaRs}},
  journal      = {CoRR},
  volume       = {abs/2503.01307},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2503.01307},
  doi          = {10.48550/ARXIV.2503.01307},
  eprinttype   = {arXiv},
  eprint       = {2503.01307},
  timestamp    = {Tue, 08 Apr 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2503-01307.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2510.02263). The acronym LLMs is brace-protected so
% sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2510-02263,
  author       = {Yuxiao Qu and
                  Anikait Singh and
                  Yoonho Lee and
                  Amrith Setlur and
                  Ruslan Salakhutdinov and
                  Chelsea Finn and
                  Aviral Kumar},
  title        = {{RLAD:} Training {LLMs} to Discover Abstractions for Solving Reasoning
                  Problems},
  journal      = {CoRR},
  volume       = {abs/2510.02263},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2510.02263},
  doi          = {10.48550/ARXIV.2510.02263},
  eprinttype   = {arXiv},
  eprint       = {2510.02263},
  timestamp    = {Sun, 09 Nov 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2510-02263.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2510.07307). The system name MLE-Smith is
% brace-protected so sentence-casing styles do not render it as "Mle-smith".
@article{DBLP:journals/corr/abs-2510-07307,
  author       = {Rushi Qiang and
                  Yuchen Zhuang and
                  Anikait Singh and
                  Percy Liang and
                  Chao Zhang and
                  Sherry Yang and
                  Bo Dai},
  title        = {{MLE-Smith}: Scaling {MLE} Tasks with Automated Multi-Agent Pipeline},
  journal      = {CoRR},
  volume       = {abs/2510.07307},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2510.07307},
  doi          = {10.48550/ARXIV.2510.07307},
  eprinttype   = {arXiv},
  eprint       = {2510.07307},
  timestamp    = {Tue, 11 Nov 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2510-07307.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal record (RLJ, volume 5). The key sits under conf/rlc although the entry
% type is article; both are kept exactly as exported.
% DBLP:journals/corr/abs-2408-08441 carries the same title -- presumably the
% preprint of this paper; confirm before citing both.
@article{DBLP:conf/rlc/RafailovHSKSKHK24,
  title     = {{D5RL:} Diverse Datasets for Data-Driven Deep Reinforcement Learning},
  author    = {Rafailov, Rafael and
               Hatch, Kyle Beltran and
               Singh, Anikait and
               Kumar, Aviral and
               Smith, Laura and
               Kostrikov, Ilya and
               Hansen{-}Estruch, Philippe and
               Kolev, Victor and
               Ball, Philip J. and
               Wu, Jiajun and
               Levine, Sergey and
               Finn, Chelsea},
  journal   = {{RLJ}},
  volume    = {5},
  year      = {2024},
  pages     = {2178--2197},
  url       = {https://rlj.cs.umass.edu/2024/papers/Paper305.html},
  timestamp = {Fri, 10 Oct 2025 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/rlc/RafailovHSKSKHK24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2024 conference paper. The acronym LLMs is brace-protected so
% sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/icml/TajwarSSR0XEFK24,
  author       = {Fahim Tajwar and
                  Anikait Singh and
                  Archit Sharma and
                  Rafael Rafailov and
                  Jeff Schneider and
                  Tengyang Xie and
                  Stefano Ermon and
                  Chelsea Finn and
                  Aviral Kumar},
  title        = {Preference Fine-Tuning of {LLMs} Should Leverage Suboptimal, On-Policy
                  Data},
  booktitle    = {Forty-first International Conference on Machine Learning, {ICML} 2024,
                  Vienna, Austria, July 21-27, 2024},
  publisher    = {OpenReview.net},
  year         = {2024},
  url          = {https://openreview.net/forum?id=bWNPx6t0sF},
  timestamp    = {Mon, 02 Sep 2024 16:45:29 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/TajwarSSR0XEFK24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2024 conference paper with a very long collaboration author list.
% X-Embodiment is brace-protected (both occurrences) so sentence-casing styles
% do not render it as "x-embodiment"; the author list is unchanged.
@inproceedings{DBLP:conf/icra/ONeillRMGPLPGMJ24,
  author       = {Abby O'Neill and
                  Abdul Rehman and
                  Abhiram Maddukuri and
                  Abhishek Gupta and
                  Abhishek Padalkar and
                  Abraham Lee and
                  Acorn Pooley and
                  Agrim Gupta and
                  Ajay Mandlekar and
                  Ajinkya Jain and
                  Albert Tung and
                  Alex Bewley and
                  Alexander Herzog and
                  Alex Irpan and
                  Alexander Khazatsky and
                  Anant Rai and
                  Anchit Gupta and
                  Andrew E. Wang and
                  Anikait Singh and
                  Animesh Garg and
                  Aniruddha Kembhavi and
                  Annie Xie and
                  Anthony Brohan and
                  Antonin Raffin and
                  Archit Sharma and
                  Arefeh Yavary and
                  Arhan Jain and
                  Ashwin Balakrishna and
                  Ayzaan Wahid and
                  Ben Burgess{-}Limerick and
                  Beomjoon Kim and
                  Bernhard Sch{\"{o}}lkopf and
                  Blake Wulfe and
                  Brian Ichter and
                  Cewu Lu and
                  Charles Xu and
                  Charlotte Le and
                  Chelsea Finn and
                  Chen Wang and
                  Chenfeng Xu and
                  Cheng Chi and
                  Chenguang Huang and
                  Christine Chan and
                  Christopher Agia and
                  Chuer Pan and
                  Chuyuan Fu and
                  Coline Devin and
                  Danfei Xu and
                  Daniel Morton and
                  Danny Driess and
                  Daphne Chen and
                  Deepak Pathak and
                  Dhruv Shah and
                  Dieter B{\"{u}}chler and
                  Dinesh Jayaraman and
                  Dmitry Kalashnikov and
                  Dorsa Sadigh and
                  Edward Johns and
                  Ethan Paul Foster and
                  Fangchen Liu and
                  Federico Ceola and
                  Fei Xia and
                  Feiyu Zhao and
                  Freek Stulp and
                  Gaoyue Zhou and
                  Gaurav S. Sukhatme and
                  Gautam Salhotra and
                  Ge Yan and
                  Gilbert Feng and
                  Giulio Schiavi and
                  Glen Berseth and
                  Gregory Kahn and
                  Guanzhi Wang and
                  Hao Su and
                  Haoshu Fang and
                  Haochen Shi and
                  Henghui Bao and
                  Heni Ben Amor and
                  Henrik I. Christensen and
                  Hiroki Furuta and
                  Homer Walke and
                  Hongjie Fang and
                  Huy Ha and
                  Igor Mordatch and
                  Ilija Radosavovic and
                  Isabel Leal and
                  Jacky Liang and
                  Jad Abou{-}Chakra and
                  Jaehyung Kim and
                  Jaimyn Drake and
                  Jan Peters and
                  Jan Schneider and
                  Jasmine Hsu and
                  Jeannette Bohg and
                  Jeffrey T. Bingham and
                  Jeffrey Wu and
                  Jensen Gao and
                  Jiaheng Hu and
                  Jiajun Wu and
                  Jialin Wu and
                  Jiankai Sun and
                  Jianlan Luo and
                  Jiayuan Gu and
                  Jie Tan and
                  Jihoon Oh and
                  Jimmy Wu and
                  Jingpei Lu and
                  Jingyun Yang and
                  Jitendra Malik and
                  Jo{\~{a}}o Silv{\'{e}}rio and
                  Joey Hejna and
                  Jonathan Booher and
                  Jonathan Tompson and
                  Jonathan Yang and
                  Jordi Salvador and
                  Joseph J. Lim and
                  Junhyek Han and
                  Kaiyuan Wang and
                  Kanishka Rao and
                  Karl Pertsch and
                  Karol Hausman and
                  Keegan Go and
                  Keerthana Gopalakrishnan and
                  Ken Goldberg and
                  Kendra Byrne and
                  Kenneth Oslund and
                  Kento Kawaharazuka and
                  Kevin Black and
                  Kevin Lin and
                  Kevin Zhang and
                  Kiana Ehsani and
                  Kiran Lekkala and
                  Kirsty Ellis and
                  Krishan Rana and
                  Krishnan Srinivasan and
                  Kuan Fang and
                  Kunal Pratap Singh and
                  Kuo{-}Hao Zeng and
                  Kyle Hatch and
                  Kyle Hsu and
                  Laurent Itti and
                  Lawrence Yunliang Chen and
                  Lerrel Pinto and
                  Li Fei{-}Fei and
                  Liam Tan and
                  Linxi Jim Fan and
                  Lionel Ott and
                  Lisa Lee and
                  Luca Weihs and
                  Magnum Chen and
                  Marion Lepert and
                  Marius Memmel and
                  Masayoshi Tomizuka and
                  Masha Itkina and
                  Mateo Guaman Castro and
                  Max Spero and
                  Maximilian Du and
                  Michael Ahn and
                  Michael C. Yip and
                  Mingtong Zhang and
                  Mingyu Ding and
                  Minho Heo and
                  Mohan Kumar Srirama and
                  Mohit Sharma and
                  Moo Jin Kim and
                  Naoaki Kanazawa and
                  Nicklas Hansen and
                  Nicolas Heess and
                  Nikhil J. Joshi and
                  Niko S{\"{u}}nderhauf and
                  Ning Liu and
                  Norman Di Palo and
                  Nur Muhammad (Mahi) Shafiullah and
                  Oier Mees and
                  Oliver Kroemer and
                  Osbert Bastani and
                  Pannag R. Sanketi and
                  Patrick Tree Miller and
                  Patrick Yin and
                  Paul Wohlhart and
                  Peng Xu and
                  Peter David Fagan and
                  Peter Mitrano and
                  Pierre Sermanet and
                  Pieter Abbeel and
                  Priya Sundaresan and
                  Qiuyu Chen and
                  Quan Vuong and
                  Rafael Rafailov and
                  Ran Tian and
                  Ria Doshi and
                  Roberto Mart{\'{\i}}n{-}Mart{\'{\i}}n and
                  Rohan Baijal and
                  Rosario Scalise and
                  Rose Hendrix and
                  Roy Lin and
                  Runjia Qian and
                  Ruohan Zhang and
                  Russell Mendonca and
                  Rutav Shah and
                  Ryan Hoque and
                  Ryan Julian and
                  Samuel Bustamante{-}Gomez and
                  Sean Kirmani and
                  Sergey Levine and
                  Shan Lin and
                  Sherry Moore and
                  Shikhar Bahl and
                  Shivin Dass and
                  Shubham D. Sonawani and
                  Shuran Song and
                  Sichun Xu and
                  Siddhant Haldar and
                  Siddharth Karamcheti and
                  Simeon Adebola and
                  Simon Guist and
                  Soroush Nasiriany and
                  Stefan Schaal and
                  Stefan Welker and
                  Stephen Tian and
                  Subramanian Ramamoorthy and
                  Sudeep Dasari and
                  Suneel Belkhale and
                  Sungjae Park and
                  Suraj Nair and
                  Suvir Mirchandani and
                  Takayuki Osa and
                  Tanmay Gupta and
                  Tatsuya Harada and
                  Tatsuya Matsushima and
                  Ted Xiao and
                  Thomas Kollar and
                  Tianhe Yu and
                  Tianli Ding and
                  Todor Davchev and
                  Tony Z. Zhao and
                  Travis Armstrong and
                  Trevor Darrell and
                  Trinity Chung and
                  Vidhi Jain and
                  Vincent Vanhoucke and
                  Wei Zhan and
                  Wenxuan Zhou and
                  Wolfram Burgard and
                  Xi Chen and
                  Xiaolong Wang and
                  Xinghao Zhu and
                  Xinyang Geng and
                  Xiyuan Liu and
                  Liangwei Xu and
                  Xuanlin Li and
                  Yao Lu and
                  Yecheng Jason Ma and
                  Yejin Kim and
                  Yevgen Chebotar and
                  Yifan Zhou and
                  Yifeng Zhu and
                  Yilin Wu and
                  Ying Xu and
                  Yixuan Wang and
                  Yonatan Bisk and
                  Yoonyoung Cho and
                  Youngwoon Lee and
                  Yuchen Cui and
                  Yue Cao and
                  Yueh{-}Hua Wu and
                  Yujin Tang and
                  Yuke Zhu and
                  Yunchu Zhang and
                  Yunfan Jiang and
                  Yunshuang Li and
                  Yunzhu Li and
                  Yusuke Iwasawa and
                  Yutaka Matsuo and
                  Zehan Ma and
                  Zhuo Xu and
                  Zichen Jeff Cui and
                  Zichen Zhang and
                  Zipeng Lin},
  title        = {Open {X-Embodiment}: Robotic Learning Datasets and {RT-X} Models : Open
                  {X-Embodiment} Collaboration},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2024, Yokohama, Japan, May 13-17, 2024},
  pages        = {6892--6903},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/ICRA57147.2024.10611477},
  doi          = {10.1109/ICRA57147.2024.10611477},
  timestamp    = {Wed, 05 Nov 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icra/ONeillRMGPLPGMJ24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2024 conference paper; names are given in the unambiguous "Last, First" form.
@inproceedings{DBLP:conf/icra/BhatejaGGSTVCLK24,
  title     = {Robotic Offline {RL} from Internet Videos via Value-Function Learning},
  author    = {Bhateja, Chethan and
               Guo, Derek and
               Ghosh, Dibya and
               Singh, Anikait and
               Tomar, Manan and
               Vuong, Quan and
               Chebotar, Yevgen and
               Levine, Sergey and
               Kumar, Aviral},
  booktitle = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2024, Yokohama, Japan, May 13-17, 2024},
  publisher = {{IEEE}},
  year      = {2024},
  pages     = {16977--16984},
  doi       = {10.1109/ICRA57147.2024.10611575},
  url       = {https://doi.org/10.1109/ICRA57147.2024.10611575},
  timestamp = {Mon, 19 Aug 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/BhatejaGGSTVCLK24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2404.14367). The acronym LLMs is brace-protected so
% sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2404-14367,
  author       = {Fahim Tajwar and
                  Anikait Singh and
                  Archit Sharma and
                  Rafael Rafailov and
                  Jeff Schneider and
                  Tengyang Xie and
                  Stefano Ermon and
                  Chelsea Finn and
                  Aviral Kumar},
  title        = {Preference Fine-Tuning of {LLMs} Should Leverage Suboptimal, On-Policy
                  Data},
  journal      = {CoRR},
  volume       = {abs/2404.14367},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.14367},
  doi          = {10.48550/ARXIV.2404.14367},
  eprinttype   = {arXiv},
  eprint       = {2404.14367},
  timestamp    = {Sat, 25 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-14367.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2408.08441). DBLP:conf/rlc/RafailovHSKSKHK24 carries
% the same title -- presumably the journal version; confirm before citing both.
@article{DBLP:journals/corr/abs-2408-08441,
  title      = {{D5RL:} Diverse Datasets for Data-Driven Deep Reinforcement Learning},
  author     = {Rafailov, Rafael and
                Hatch, Kyle and
                Singh, Anikait and
                Smith, Laura and
                Kumar, Aviral and
                Kostrikov, Ilya and
                Hansen{-}Estruch, Philippe and
                Kolev, Victor and
                Ball, Philip J. and
                Wu, Jiajun and
                Finn, Chelsea and
                Levine, Sergey},
  journal    = {CoRR},
  volume     = {abs/2408.08441},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2408.08441},
  doi        = {10.48550/ARXIV.2408.08441},
  url        = {https://doi.org/10.48550/arXiv.2408.08441},
  timestamp  = {Fri, 10 Oct 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2408-08441.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2410.02725). The acronym LLMs follows a colon, where
% sentence-casing styles would render it as "Llms"; it is brace-protected.
@article{DBLP:journals/corr/abs-2410-02725,
  author       = {Rohin Manvi and
                  Anikait Singh and
                  Stefano Ermon},
  title        = {Adaptive Inference-Time Compute: {LLMs} Can Predict if They Can Do Better,
                  Even Mid-Generation},
  journal      = {CoRR},
  volume       = {abs/2410.02725},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2410.02725},
  doi          = {10.48550/ARXIV.2410.02725},
  eprinttype   = {arXiv},
  eprint       = {2410.02725},
  timestamp    = {Sat, 06 Sep 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2410-02725.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2412.08812); names are given in the unambiguous
% "Last, First" form.
@article{DBLP:journals/corr/abs-2412-08812,
  title      = {Test-Time Alignment via Hypothesis Reweighting},
  author     = {Lee, Yoonho and
                Williams, Jonathan and
                Marklund, Henrik and
                Sharma, Archit and
                Mitchell, Eric and
                Singh, Anikait and
                Finn, Chelsea},
  journal    = {CoRR},
  volume     = {abs/2412.08812},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2412.08812},
  doi        = {10.48550/ARXIV.2412.08812},
  url        = {https://doi.org/10.48550/arXiv.2412.08812},
  timestamp  = {Sat, 06 Sep 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2412-08812.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRL 2023 conference paper (PMLR volume 229).
% "Gonzalez Arenas" is written in "Last, First" form so the compound surname is
% not split into First="Montserrat Gonzalez", Last="Arenas". The surname-sorted
% author list of DBLP:journals/corr/abs-2307-15818 places this author between
% Fu and Gopalakrishnan, i.e. under "Gonzalez".
@inproceedings{DBLP:conf/corl/ZitkovichYXXXXW23,
  author       = {Brianna Zitkovich and
                  Tianhe Yu and
                  Sichun Xu and
                  Peng Xu and
                  Ted Xiao and
                  Fei Xia and
                  Jialin Wu and
                  Paul Wohlhart and
                  Stefan Welker and
                  Ayzaan Wahid and
                  Quan Vuong and
                  Vincent Vanhoucke and
                  Huong T. Tran and
                  Radu Soricut and
                  Anikait Singh and
                  Jaspiar Singh and
                  Pierre Sermanet and
                  Pannag R. Sanketi and
                  Grecia Salazar and
                  Michael S. Ryoo and
                  Krista Reymann and
                  Kanishka Rao and
                  Karl Pertsch and
                  Igor Mordatch and
                  Henryk Michalewski and
                  Yao Lu and
                  Sergey Levine and
                  Lisa Lee and
                  Tsang{-}Wei Edward Lee and
                  Isabel Leal and
                  Yuheng Kuang and
                  Dmitry Kalashnikov and
                  Ryan Julian and
                  Nikhil J. Joshi and
                  Alex Irpan and
                  Brian Ichter and
                  Jasmine Hsu and
                  Alexander Herzog and
                  Karol Hausman and
                  Keerthana Gopalakrishnan and
                  Chuyuan Fu and
                  Pete Florence and
                  Chelsea Finn and
                  Kumar Avinava Dubey and
                  Danny Driess and
                  Tianli Ding and
                  Krzysztof Marcin Choromanski and
                  Xi Chen and
                  Yevgen Chebotar and
                  Justice Carbajal and
                  Noah Brown and
                  Anthony Brohan and
                  Gonzalez Arenas, Montserrat and
                  Kehang Han},
  editor       = {Jie Tan and
                  Marc Toussaint and
                  Kourosh Darvish},
  title        = {{RT-2:} Vision-Language-Action Models Transfer Web Knowledge to Robotic
                  Control},
  booktitle    = {Conference on Robot Learning, CoRL 2023, 6-9 November 2023, Atlanta,
                  GA, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {229},
  pages        = {2165--2183},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v229/zitkovich23a.html},
  timestamp    = {Mon, 20 Jan 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/corl/ZitkovichYXXXXW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 conference paper. The method name Cal-QL is brace-protected so
% sentence-casing styles do not render it as "Cal-ql".
% NOTE(review): the second author is listed as "Simon Zhai" here and as
% "Yuexiang Zhai" in DBLP:journals/corr/abs-2303-05479 -- confirm whether the
% spellings should be unified.
@inproceedings{DBLP:conf/nips/NakamotoZSM0FKL23,
  author       = {Mitsuhiko Nakamoto and
                  Simon Zhai and
                  Anikait Singh and
                  Max Sobol Mark and
                  Yi Ma and
                  Chelsea Finn and
                  Aviral Kumar and
                  Sergey Levine},
  editor       = {Alice Oh and
                  Tristan Naumann and
                  Amir Globerson and
                  Kate Saenko and
                  Moritz Hardt and
                  Sergey Levine},
  title        = {{Cal-QL}: Calibrated Offline {RL} Pre-Training for Efficient Online
                  Fine-Tuning},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/c44a04289beaf0a7d968a94066a1d696-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/NakamotoZSM0FKL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 conference paper. The mixed-case method name ReDS is
% brace-protected so sentence-casing styles do not render it as "Reds".
@inproceedings{DBLP:conf/nips/SinghKVCL23,
  author       = {Anikait Singh and
                  Aviral Kumar and
                  Quan Vuong and
                  Yevgen Chebotar and
                  Sergey Levine},
  editor       = {Alice Oh and
                  Tristan Naumann and
                  Amir Globerson and
                  Kate Saenko and
                  Moritz Hardt and
                  Sergey Levine},
  title        = {{ReDS}: Offline {RL} With Heteroskedastic Datasets via Support Constraints},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/4b5d47949866d06ab5c03022b4a5a551-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/SinghKVCL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Robotics: Science and Systems XIX (2023) conference paper; author and editor
% names are given in the unambiguous "Last, First" form.
@inproceedings{DBLP:conf/rss/KumarSENYFL23,
  title     = {Pre-Training for Robots: Offline {RL} Enables Learning New Tasks in a Handful of Trials},
  author    = {Kumar, Aviral and
               Singh, Anikait and
               Ebert, Frederik D. and
               Nakamoto, Mitsuhiko and
               Yang, Yanlai and
               Finn, Chelsea and
               Levine, Sergey},
  editor    = {Bekris, Kostas E. and
               Hauser, Kris and
               Herbert, Sylvia L. and
               Yu, Jingjin},
  booktitle = {Robotics: Science and Systems XIX, Daegu, Republic of Korea, July 10-14, 2023},
  year      = {2023},
  doi       = {10.15607/RSS.2023.XIX.019},
  url       = {https://doi.org/10.15607/RSS.2023.XIX.019},
  timestamp = {Thu, 20 Jul 2023 14:53:22 +0200},
  biburl    = {https://dblp.org/rec/conf/rss/KumarSENYFL23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2303.05479). The method name Cal-QL is
% brace-protected so sentence-casing styles do not render it as "Cal-ql".
@article{DBLP:journals/corr/abs-2303-05479,
  author       = {Mitsuhiko Nakamoto and
                  Yuexiang Zhai and
                  Anikait Singh and
                  Max Sobol Mark and
                  Yi Ma and
                  Chelsea Finn and
                  Aviral Kumar and
                  Sergey Levine},
  title        = {{Cal-QL}: Calibrated Offline {RL} Pre-Training for Efficient Online
                  Fine-Tuning},
  journal      = {CoRR},
  volume       = {abs/2303.05479},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2303.05479},
  doi          = {10.48550/ARXIV.2303.05479},
  eprinttype   = {arXiv},
  eprint       = {2303.05479},
  timestamp    = {Sat, 06 Sep 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2303-05479.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv 2307.15818) preprint record for the RT-2 paper, 2023.
@article{DBLP:journals/corr/abs-2307-15818,
  author     = {Anthony Brohan and
                Noah Brown and
                Justice Carbajal and
                Yevgen Chebotar and
                Xi Chen and
                Krzysztof Choromanski and
                Tianli Ding and
                Danny Driess and
                Avinava Dubey and
                Chelsea Finn and
                Pete Florence and
                Chuyuan Fu and
                Montse Gonzalez Arenas and
                Keerthana Gopalakrishnan and
                Kehang Han and
                Karol Hausman and
                Alexander Herzog and
                Jasmine Hsu and
                Brian Ichter and
                Alex Irpan and
                Nikhil J. Joshi and
                Ryan Julian and
                Dmitry Kalashnikov and
                Yuheng Kuang and
                Isabel Leal and
                Lisa Lee and
                Tsang{-}Wei Edward Lee and
                Sergey Levine and
                Yao Lu and
                Henryk Michalewski and
                Igor Mordatch and
                Karl Pertsch and
                Kanishka Rao and
                Krista Reymann and
                Michael S. Ryoo and
                Grecia Salazar and
                Pannag Sanketi and
                Pierre Sermanet and
                Jaspiar Singh and
                Anikait Singh and
                Radu Soricut and
                Huong T. Tran and
                Vincent Vanhoucke and
                Quan Vuong and
                Ayzaan Wahid and
                Stefan Welker and
                Paul Wohlhart and
                Jialin Wu and
                Fei Xia and
                Ted Xiao and
                Peng Xu and
                Sichun Xu and
                Tianhe Yu and
                Brianna Zitkovich},
  title      = {{RT-2:} Vision-Language-Action Models Transfer Web Knowledge to Robotic Control},
  journal    = {CoRR},
  volume     = {abs/2307.15818},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2307.15818},
  doi        = {10.48550/ARXIV.2307.15818},
  url        = {https://doi.org/10.48550/arXiv.2307.15818},
  timestamp  = {Mon, 20 Jan 2025 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-15818.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv 2309.13041) preprint record, 2023.
@article{DBLP:journals/corr/abs-2309-13041,
  author     = {Chethan Bhateja and
                Derek Guo and
                Dibya Ghosh and
                Anikait Singh and
                Manan Tomar and
                Quan Vuong and
                Yevgen Chebotar and
                Sergey Levine and
                Aviral Kumar},
  title      = {Robotic Offline {RL} from Internet Videos via Value-Function Pre-Training},
  journal    = {CoRR},
  volume     = {abs/2309.13041},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2309.13041},
  doi        = {10.48550/ARXIV.2309.13041},
  url        = {https://doi.org/10.48550/arXiv.2309.13041},
  timestamp  = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-13041.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv 2310.08864) preprint record, 2023.
% The collaboration is a corporate author, so it is wrapped in an extra brace
% pair to keep BibTeX from splitting it into given name and surname, and it is
% spelled as in the title.
% The truncated author list ends with the token "and others" so the
% bibliography style renders the et al. marker itself.
% X-Embodiment is brace-protected in the title against sentence-casing styles.
@article{DBLP:journals/corr/abs-2310-08864,
  author       = {{Open X-Embodiment Collaboration} and
                  Abhishek Padalkar and
                  Acorn Pooley and
                  Ajinkya Jain and
                  Alex Bewley and
                  Alexander Herzog and
                  Alex Irpan and
                  Alexander Khazatsky and
                  Anant Raj and
                  Anikait Singh and
                  Anthony Brohan and
                  Antonin Raffin and
                  Ayzaan Wahid and
                  Ben Burgess{-}Limerick and
                  Beomjoon Kim and
                  Bernhard Sch{\"{o}}lkopf and
                  Brian Ichter and
                  Cewu Lu and
                  Charles Xu and
                  Chelsea Finn and
                  Chenfeng Xu and
                  Cheng Chi and
                  Chenguang Huang and
                  Christine Chan and
                  Chuer Pan and
                  Chuyuan Fu and
                  Coline Devin and
                  Danny Driess and
                  Deepak Pathak and
                  Dhruv Shah and
                  Dieter B{\"{u}}chler and
                  Dmitry Kalashnikov and
                  Dorsa Sadigh and
                  Edward Johns and
                  Federico Ceola and
                  Fei Xia and
                  Freek Stulp and
                  Gaoyue Zhou and
                  Gaurav S. Sukhatme and
                  Gautam Salhotra and
                  Ge Yan and
                  Giulio Schiavi and
                  Gregory Kahn and
                  Hao Su and
                  Haoshu Fang and
                  Haochen Shi and
                  Heni Ben Amor and
                  Henrik I. Christensen and
                  Hiroki Furuta and
                  Homer Walke and
                  Hongjie Fang and
                  Igor Mordatch and
                  Ilija Radosavovic and
                  others},
  title        = {Open {X-Embodiment:} Robotic Learning Datasets and {RT-X} Models},
  journal      = {CoRR},
  volume       = {abs/2310.08864},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.08864},
  doi          = {10.48550/ARXIV.2310.08864},
  eprinttype   = {arXiv},
  eprint       = {2310.08864},
  timestamp    = {Thu, 15 May 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-08864.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper at ICLR 2022, hosted on OpenReview.net.
@inproceedings{DBLP:conf/iclr/KumarHSL22,
  author     = {Aviral Kumar and
                Joey Hong and
                Anikait Singh and
                Sergey Levine},
  title      = {Should {I} Run Offline Reinforcement Learning or Behavioral Cloning?},
  booktitle  = {The Tenth International Conference on Learning Representations, {ICLR} 2022, Virtual Event, April 25-29, 2022},
  publisher  = {OpenReview.net},
  year       = {2022},
  url        = {https://openreview.net/forum?id=AP1MKT37rJ},
  timestamp  = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/KumarHSL22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv 2204.05618) preprint record, 2022.
@article{DBLP:journals/corr/abs-2204-05618,
  author     = {Aviral Kumar and
                Joey Hong and
                Anikait Singh and
                Sergey Levine},
  title      = {When Should We Prefer Offline Reinforcement Learning Over Behavioral Cloning?},
  journal    = {CoRR},
  volume     = {abs/2204.05618},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2204.05618},
  doi        = {10.48550/ARXIV.2204.05618},
  url        = {https://doi.org/10.48550/arXiv.2204.05618},
  timestamp  = {Sat, 06 Sep 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-05618.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv 2210.05178) preprint record, 2022.
@article{DBLP:journals/corr/abs-2210-05178,
  author     = {Aviral Kumar and
                Anikait Singh and
                Frederik Ebert and
                Yanlai Yang and
                Chelsea Finn and
                Sergey Levine},
  title      = {Pre-Training for Robots: Offline {RL} Enables Learning New Tasks from a Handful of Trials},
  journal    = {CoRR},
  volume     = {abs/2210.05178},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2210.05178},
  doi        = {10.48550/ARXIV.2210.05178},
  url        = {https://doi.org/10.48550/arXiv.2210.05178},
  timestamp  = {Sat, 06 Sep 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-05178.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv 2211.01052) preprint record, 2022.
@article{DBLP:journals/corr/abs-2211-01052,
  author     = {Anikait Singh and
                Aviral Kumar and
                Quan Vuong and
                Yevgen Chebotar and
                Sergey Levine},
  title      = {Offline {RL} With Realistic Datasets: Heteroskedasticity and Support Constraints},
  journal    = {CoRR},
  volume     = {abs/2211.01052},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2211.01052},
  doi        = {10.48550/ARXIV.2211.01052},
  url        = {https://doi.org/10.48550/arXiv.2211.01052},
  timestamp  = {Sat, 06 Sep 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-01052.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference on Robot Learning 2021 paper, Proceedings of Machine Learning
% Research volume 164.
@inproceedings{DBLP:conf/corl/KumarSTFL21,
  author     = {Aviral Kumar and
                Anikait Singh and
                Stephen Tian and
                Chelsea Finn and
                Sergey Levine},
  editor     = {Aleksandra Faust and
                David Hsu and
                Gerhard Neumann},
  title      = {A Workflow for Offline Model-Free Robotic Reinforcement Learning},
  booktitle  = {Conference on Robot Learning, 8-11 November 2021, London, {UK}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {164},
  pages      = {417--428},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {https://proceedings.mlr.press/v164/kumar22a.html},
  timestamp  = {Wed, 19 Jan 2022 17:10:33 +0100},
  biburl     = {https://dblp.org/rec/conf/corl/KumarSTFL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv 2109.10813) preprint record, 2021.
% A doi field is added so this record carries the same identifier set as the
% other CoRR records in this file. The value follows the arXiv-issued DOI
% pattern (prefix 10.48550 plus the arXiv identifier); the original url is
% kept unchanged.
@article{DBLP:journals/corr/abs-2109-10813,
  author       = {Aviral Kumar and
                  Anikait Singh and
                  Stephen Tian and
                  Chelsea Finn and
                  Sergey Levine},
  title        = {A Workflow for Offline Model-Free Robotic Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2109.10813},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.10813},
  doi          = {10.48550/ARXIV.2109.10813},
  eprinttype   = {arXiv},
  eprint       = {2109.10813},
  timestamp    = {Mon, 27 Sep 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-10813.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}