Gorilla: Large Language Model Connected with Massive APIs
Shishir G. Patil, Tianjun Zhang, Xin Wang, Joseph E. Gonzalez
Neural Information Processing Systems (NeurIPS) 2024
[Paper]
[Code]
[Slides]
[Short Video]
[Long Video]
[bibtex]
@inproceedings{patil2023gorilla,
  author    = {Shishir G. Patil and Tianjun Zhang and Xin Wang and Joseph E. Gonzalez},
  title     = {Gorilla: Large Language Model Connected with Massive APIs},
  booktitle = {Advances in Neural Information Processing Systems},
  volume    = {37},
  year      = {2024},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2024/file/e4c61f578ff07830f5c37378dd3ecb0d-Paper-Conference.pdf},
}
The Berkeley Function Calling Leaderboard (BFCL): From Tool Use to Agentic Evaluation of Large Language Models
Shishir G. Patil, Huanzhi Mao, Fanjia Yan, Charlie Ji, Vishnu Suresh, Ion Stoica, Joseph E. Gonzalez
International Conference on Machine Learning (ICML) 2025
[Paper]
[Leaderboard]
[Code]
[bibtex]
@inproceedings{patil2025bfcl,
  author    = {Patil, Shishir G. and Mao, Huanzhi and Yan, Fanjia and Ji, Charlie and Suresh, Vishnu and Stoica, Ion and Gonzalez, Joseph E.},
  title     = {The {Berkeley} Function Calling Leaderboard ({BFCL}): From Tool Use to Agentic Evaluation of Large Language Models},
  booktitle = {International Conference on Machine Learning},
  year      = {2025},
}
GoEX: Perspectives and Designs Towards a Runtime for Autonomous LLM Applications
Shishir G. Patil, Tianjun Zhang, Vivian Fang, Noppapon C., Roy Huang, Aaron Hao, Martin Casado, Joseph E. Gonzalez, Raluca Ada Popa, Ion Stoica
arXiv preprint arXiv:2404.06921
[Paper]
[Code]
[bibtex]
@article{patil2024goex,
  author        = {Shishir G. Patil and Tianjun Zhang and Vivian Fang and Noppapon C. and Roy Huang and Aaron Hao and Martin Casado and Joseph E. Gonzalez and Raluca Ada Popa and Ion Stoica},
  title         = {{GoEX}: Perspectives and Designs Towards a Runtime for Autonomous {LLM} Applications},
  journal       = {arXiv preprint arXiv:2404.06921},
  year          = {2024},
  eprint        = {2404.06921},
  archiveprefix = {arXiv},
}
The Llama 3 Herd of Models
Llama Team
[Paper]
[Model Weights]
[bibtex]
@article{llama3,
  author  = {Dubey, Abhimanyu and Jauhri, Abhinav and Pandey, Abhinav and Kadian, Abhishek and Al-Dahle, Ahmad and Letman, Aiesha and Mathur, Akhil and Schelten, Alan and Yang, Amy and Fan, Angela and others},
  title   = {The Llama 3 Herd of Models},
  journal = {arXiv preprint arXiv:2407.21783},
  year    = {2024},
}
Efficient ML Model Updates for Deeply Embedded Microcontrollers
Shishir G. Patil, Sam Kumar, Prabal Dutta, Joseph E. Gonzalez
EuroSys 2026
[Paper]
[Code]
[bibtex]
@inproceedings{patil2026efficient,
  author    = {Shishir G. Patil and Sam Kumar and Prabal Dutta and Joseph E. Gonzalez},
  title     = {Efficient {ML} Model Updates for Deeply Embedded Microcontrollers},
  booktitle = {Proceedings of the 2026 EuroSys Conference},
  year      = {2026},
  url       = {https://2026.eurosys.org/papers.html},
}
LLMs Can Easily Learn to Reason from Demonstrations Structure, not content, is what matters!
Dacheng Li, Shiyi Cao, Tyler Griggs, Shu Liu, Xiangxi Mo, Eric Tang, Sumanth Hegde, Kourosh Hakhamaneshi, Shishir G. Patil, Matei Zaharia, Joseph E. Gonzalez, Ion Stoica
Empirical Methods in Natural Language Processing (EMNLP) 2025
[Paper]
[Code]
[bibtex]
@inproceedings{skythought,
  author    = {Li, Dacheng and Cao, Shiyi and Griggs, Tyler and Liu, Shu and Mo, Xiangxi and Tang, Eric and Hegde, Sumanth and Hakhamaneshi, Kourosh and Patil, Shishir G. and Zaharia, Matei and Gonzalez, Joseph E. and Stoica, Ion},
  title     = {{LLMs} Can Easily Learn to Reason from Demonstrations Structure, not content, is what matters!},
  booktitle = {Conference on Empirical Methods in Natural Language Processing (EMNLP)},
  year      = {2025},
}
AdvancedIF: Rubric-Based Benchmarking and Reinforcement Learning for Advancing LLM Instruction Following
Llama Team
Association for Computational Linguistics (ACL) 2026
[Paper]
[Model Weights]
[bibtex]
@inproceedings{advancedif2026,
  author     = {Dubey, Abhimanyu and Jauhri, Abhinav and Pandey, Abhinav and Kadian, Abhishek and Al-Dahle, Ahmad and Letman, Aiesha and Mathur, Akhil and Schelten, Alan and Yang, Amy and Fan, Angela and others},
  title      = {{AdvancedIF}: Rubric-Based Benchmarking and Reinforcement Learning for Advancing {LLM} Instruction Following},
  booktitle  = {Annual Meeting of the Association for Computational Linguistics (ACL)},
  year       = {2026},
  reviewnote = {TODO verify: this entry previously reused the citation key, author list, year and arXiv identifier (2407.21783) of The Llama 3 Herd of Models. The key, venue and year were corrected from the listed venue (ACL 2026); the author list is unverified and must be checked against the published paper.},
}
LLoCO: Learning Long Contexts Offline
Sijun Tan, Xiuyu Li, Shishir G. Patil, Ziyang Wu, Tianjun Zhang, Kurt Keutzer, Joseph E. Gonzalez, Raluca Ada Popa
Empirical Methods in Natural Language Processing (EMNLP) 2024
[Paper]
[Code]
[bibtex]
@inproceedings{tan2024lloco,
  author    = {Tan, Sijun and Li, Xiuyu and Patil, Shishir G. and Wu, Ziyang and Zhang, Tianjun and Keutzer, Kurt and Gonzalez, Joseph E. and Popa, Raluca Ada},
  title     = {{LLoCO}: Learning Long Contexts Offline},
  booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
  year      = {2024},
  doi       = {10.18653/v1/2024.emnlp-main.975},
  url       = {https://aclanthology.org/2024.emnlp-main.975/},
}
RAFT: Adapting Language Model to Domain Specific RAG
Tianjun Zhang, Shishir G. Patil, Naman Jain, Sheng Shen, Matei Zaharia, Ion Stoica, Joseph E. Gonzalez
Conference on Language Modeling (COLM) 2024
[Paper]
[Code]
[bibtex]
@inproceedings{zhang2024raft,
  author        = {Tianjun Zhang and Shishir G. Patil and Naman Jain and Sheng Shen and Matei Zaharia and Ion Stoica and Joseph E. Gonzalez},
  title         = {{RAFT}: Adapting Language Model to Domain Specific {RAG}},
  booktitle     = {Conference on Language Modeling (COLM)},
  year          = {2024},
  eprint        = {2403.10131},
  archiveprefix = {arXiv},
}
Nebula: A Privacy-First Platform for Data Backhaul
Jean-Luc Watson, Tess Despres, Alvin Tan, Shishir G. Patil, Prabal Dutta, Raluca Ada Popa
IEEE Symposium on Security and Privacy - IEEE S&P (Oakland) 2024.
[Paper]
[bibtex]
@inproceedings{watson2024nebula,
  author    = {Jean-Luc Watson and Tess Despres and Alvin Tan and Shishir G. Patil and Prabal Dutta and Raluca Ada Popa},
  title     = {Nebula: A Privacy-First Platform for Data Backhaul},
  booktitle = {2024 IEEE Symposium on Security and Privacy (SP)},
  year      = {2024},
}
Revisiting Edge AI: Opportunities and Challenges
Tobias Meuser, Lauri Lovén, Monowar Bhuyan, Shishir G. Patil, Schahram Dustdar, Atakan Aral, Suzan Bayhan, Christian Becker, Eyal de Lara, Aaron Yi Ding, Janick Edinger, James Gross, Nitinder Mohan, Andy D. Pimentel, Etienne Rivière, Henning Schulzrinne, Pieter Simoens, Gürkan Solmaz
IEEE Internet Computing 2024
[Paper]
[bibtex]
@article{revisitingedgeai,
  author  = {Meuser, Tobias and Lov{\'e}n, Lauri and Bhuyan, Monowar and Patil, Shishir G. and Dustdar, Schahram and Aral, Atakan and Bayhan, Suzan and Becker, Christian and de Lara, Eyal and Ding, Aaron Yi and Edinger, Janick and Gross, James and Mohan, Nitinder and Pimentel, Andy D. and Rivi{\`e}re, Etienne and Schulzrinne, Henning and Simoens, Pieter and Solmaz, G{\"u}rkan},
  title   = {Revisiting Edge {AI}: Opportunities and Challenges},
  journal = {IEEE Internet Computing},
  volume  = {28},
  number  = {4},
  pages   = {49--59},
  year    = {2024},
  doi     = {10.1109/MIC.2024.3383758},
}
MemGPT: Towards LLMs as operating systems
Charles Packer, Vivian Fang, Shishir G. Patil, Kevin Lin, Sarah Wooders, Joseph E. Gonzalez
arXiv preprint arXiv:2310.08560
[Paper]
[Code]
[bibtex]
@article{packer2023memgpt,
  author        = {Packer, Charles and Fang, Vivian and Patil, Shishir G. and Lin, Kevin and Wooders, Sarah and Gonzalez, Joseph E.},
  title         = {{MemGPT}: Towards {LLMs} as Operating Systems},
  journal       = {arXiv preprint arXiv:2310.08560},
  year          = {2023},
  eprint        = {2310.08560},
  archiveprefix = {arXiv},
}
Skyplane: Optimizing Transfer Cost and Throughput Using Cloud-Aware Overlays
Paras Jain, Sam Kumar, Sarah Wooders, Shishir G. Patil, Joseph E. Gonzalez, Ion Stoica
USENIX Symposium on Networked Systems Design and Implementation (NSDI) 2023
[Paper]
[Code]
[bibtex]
@inproceedings{jain2022skyplane,
  author    = {Jain, Paras and Kumar, Sam and Wooders, Sarah and Patil, Shishir G and Gonzalez, Joseph E and Stoica, Ion},
  title     = {Skyplane: Optimizing Transfer Cost and Throughput Using Cloud-Aware Overlays},
  booktitle = {20th USENIX Symposium on Networked Systems Design and Implementation (NSDI 23)},
  year      = {2023},
  url       = {https://www.usenix.org/conference/nsdi23/presentation/jain}
}
POET: Training Neural Networks on Tiny Devices with Integrated Rematerialization and Paging
Shishir G. Patil, Paras Jain, Prabal Dutta, Ion Stoica, Joseph E. Gonzalez
[Spotlight] International Conference on Machine Learning (ICML) 2022
[Paper]
[Code]
[Poster]
[Slides]
[Video]
[bibtex]
@inproceedings{patil2022poet,
  author    = {Patil, Shishir G. and Jain, Paras and Dutta, Prabal and Stoica, Ion and Gonzalez, Joseph E.},
  title     = {{POET}: Training Neural Networks on Tiny Devices with Integrated Rematerialization and Paging},
  booktitle = {International Conference on Machine Learning},
  pages     = {17573--17583},
  year      = {2022},
  publisher = {PMLR},
}
Where the Sidewalk Ends: Privacy of Opportunistic Backhaul
Tess Despres, Shishir Patil, Alvin Tan, Jean-Luc Watson, Prabal Dutta
Proceedings of the 15th European Workshop on Systems Security (EuroSec) 2022.
[Paper]
[bibtex]
@inproceedings{sidewalk,
  author    = {Despres, Tess and Patil, Shishir and Tan, Alvin and Watson, Jean-Luc and Dutta, Prabal},
  title     = {Where the sidewalk ends: privacy of opportunistic backhaul},
  booktitle = {Proceedings of the 15th European Workshop on Systems Security},
  year      = {2022},
  pages     = {1--7},
}
Learning Embeddings that Capture Spatial Semantics for Indoor Navigation
Vidhi Jain, Shishir G. Patil, Prakhar Agarwal, Katia Sycara
Neural Information Processing Systems (NeurIPS) 2020 (ORLR Workshop).
[Paper]
[Code]
[Poster]
[bibtex]
@inproceedings{jain2020,
  author    = {Jain, Vidhi and Patil, Shishir and Agarwal, Prakhar and Sycara, Katia},
  title     = {Learning Embeddings that Capture Spatial Semantics for Indoor Navigation},
  booktitle = {NeurIPS 2020, Workshop on Object Representations for Learning and Reasoning},
  year      = {2020},
}
GesturePod: Enabling On-device Gesture-based Interaction for White Cane Users
Shishir G. Patil, Don Dennis, Chirag Pabbaraju, Nadeem Shaheer, Harsha Vardhan Simhadri, Vivek Seshadri, Manik Varma, Prateek Jain
ACM User Interface Software and Technology Symposium (UIST) 2019.
Also available as Microsoft Research Technical Report, MSR-TR-2018-14, May 2018
[Video Preview]
[Poster]
[Paper]
[Gesture Recognition Data set]
[Simulation and Code]
[bibtex]
@inproceedings{patil2019gesturepod,
  author    = {Patil, Shishir G. and Dennis, Don Kurian and Pabbaraju, Chirag and Shaheer, Nadeem and Simhadri, Harsha Vardhan and Seshadri, Vivek and Varma, Manik and Jain, Prateek},
  title     = {{GesturePod}: Enabling On-device Gesture-based Interaction for White Cane Users},
  booktitle = {Proceedings of the 32nd Annual ACM Symposium on User Interface Software and Technology},
  pages     = {403--415},
  year      = {2019},
}
Real-world Demonstration of ML-based Gesture Recognition
Shishir G. Patil, Don Dennis, Harsha Vardhan Simhadri, Prateek Jain
2nd Workshop on Machine Learning on the Phone and
other Consumer Devices (MLPCD), NeurIPS 2018
[Poster]
[bibtex]
@inproceedings{patil2018,
  author    = {Patil, Shishir G and Dennis, Don Kurian and Simhadri, Harsha Vardhan and Jain, Prateek},
  title     = {Real-world Demonstration of ML-based Gesture Recognition},
  booktitle = {Proceedings of the 2nd Workshop on Machine Learning on the Phone and other Consumer Devices (MLPCD) NeurIPS 2018},
  year      = {2018},
}
Characterization and analysis of Transistor Outline TO-254 package for power device applications
Shishir G. Patil, B. Pavithra, M. M. Nayak
IEEE Electron Devices Society, 3rd International Conference on Emerging Electronics (ICEE) 2017
[Paper]
[bibtex]
@inproceedings{8074632,
  author    = {Patil, Shishir G. and Pavithra, B. and Nayak, M. M.},
  title     = {Characterization and analysis of Transistor Outline {TO-254} package for power device applications},
  booktitle = {2016 3rd International Conference on Emerging Electronics (ICEE)},
  year      = {2016},
  pages     = {1--5},
}