% arXiv preprint, 2024.
% The dollar sign in the title is escaped so LaTeX does not enter math mode,
% and only {K} is braced so sentence-casing styles can still recase the rest.
% Fields such as abbr, pdf, code, preprint and bibtex_show are not standard
% BibTeX fields; standard styles ignore them (presumably read by the site template).
@misc{khandelwal2024:100k,
  author        = {Khandelwal, Apoorv and Yun, Tian and Nayak, Nihal V. and Merullo, Jack and Bach, Stephen H. and Sun, Chen and Pavlick, Ellie},
  title         = {\$100{K} or 100 Days: Trade-offs when Pre-Training with Academic Resources},
  year          = {2024},
  eprint        = {2410.23261},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
  journal       = {ArXiv},
  abbr          = {ArXiv},
  pdf           = {https://arxiv.org/pdf/2410.23261},
  code          = {https://github.com/apoorvkh/academic-pretraining},
  preprint      = {true},
  bibtex_show   = {true},
}
Findings
Learning to Generate Instruction Tuning Datasets for Zero-Shot Task Adaptation
% Conference paper in Findings of ACL 2024.
% Fields after `year` are non-standard display metadata that standard styles ignore.
@inproceedings{bonito:aclfindings24,
  author      = {Nayak, Nihal V. and Nan, Yiyang and Trost, Avi and Bach, Stephen H.},
  title       = {Learning to Generate Instruction Tuning Datasets for Zero-Shot Task Adaptation},
  booktitle   = {Findings of the Association for Computational Linguistics: ACL 2024},
  year        = {2024},
  abbr        = {Findings},
  pdf         = {https://arxiv.org/abs/2402.18334},
  code        = {https://github.com/BatsResearch/nayak-arxiv24-code},
  project     = {https://github.com/BatsResearch/bonito},
  blog        = {https://snorkel.ai/how-bonito-helps-fine-tune-specialized-llms-faster-than-ever/},
  selected    = {true},
  preprint    = {false},
  bibtex_show = {true},
}
Findings
Does CLIP Bind Concepts? Probing Compositionality in Large Image Models
% Conference paper in Findings of EACL 2024.
% {CLIP} is braced so sentence-casing styles do not lowercase the acronym.
@inproceedings{lewis:eacl24,
  author      = {Lewis, Martha and Nayak, Nihal V. and Yu, Peilin and Yu, Qinan and Merullo, Jack and Bach, Stephen H. and Pavlick, Ellie},
  title       = {Does {CLIP} Bind Concepts? Probing Compositionality in Large Image Models},
  booktitle   = {Findings of the Association for Computational Linguistics: EACL 2024},
  year        = {2024},
  abbr        = {Findings},
  pdf         = {https://arxiv.org/abs/2212.10537},
  code        = {https://github.com/marthaflinderslewis/clip-binding},
  selected    = {true},
  preprint    = {false},
  bibtex_show = {true},
}
2023
NeurIPS-W
Learning to Generate Instructions to Adapt Language Models to New Tasks
Nihal V. Nayak, Yiyang Nan, Avi Trost, and Stephen Bach
In Workshop on Instruction Tuning and Instruction Following at NeurIPS 2023
% NeurIPS 2023 workshop paper.
% Typed as inproceedings with the workshop name in `booktitle`: standard styles
% do not print a `journal` field on a misc entry, so the venue was being dropped.
% The last author is written as "Bach, Stephen H." to match the other entries.
@inproceedings{nayak:neurips23,
  author      = {Nayak, Nihal V. and Nan, Yiyang and Trost, Avi and Bach, Stephen H.},
  title       = {Learning to Generate Instructions to Adapt Language Models to New Tasks},
  booktitle   = {Workshop on Instruction Tuning and Instruction Following @ NeurIPS 2023},
  year        = {2023},
  abbr        = {NeurIPS-W},
  pdf         = {https://openreview.net/forum?id=tw2w8rgWMV},
  selected    = {false},
  preprint    = {false},
  bibtex_show = {true},
}
ICLR
Learning to Compose Soft Prompts for Compositional Zero-Shot Learning
% ICLR 2023 conference paper.
% abbr, pdf, code, selected and bibtex_show are non-standard display metadata.
@inproceedings{csp:iclr23,
  author      = {Nayak, Nihal V. and Yu, Peilin and Bach, Stephen H.},
  title       = {Learning to Compose Soft Prompts for Compositional Zero-Shot Learning},
  booktitle   = {International Conference on Learning Representations (ICLR)},
  year        = {2023},
  abbr        = {ICLR},
  pdf         = {https://arxiv.org/abs/2204.03574},
  code        = {https://github.com/BatsResearch/csp},
  selected    = {true},
  bibtex_show = {true},
}
2022
ArXiv
BLOOM: A 176B-Parameter Open-Access Multilingual Language Model
Teven Le Scao, Angela Fan, Christopher Akiki, Ellie Pavlick, Suzana Ilić, Daniel Hesslow, Roman Castagné, Alexandra Sasha Luccioni, François Yvon, Matthias Gallé, and others
% arXiv preprint, 2022.
% The first author is entered as "Le Scao, Teven" so the two-word surname is
% parsed as the last name (the previous form made "Scao" the surname).
% {BLOOM} and {176B} are braced to survive sentence-casing styles.
% The eprint id is taken from the arXiv URL in `pdf`.
@article{bloom:arxiv22,
  author        = {Le Scao, Teven and Fan, Angela and Akiki, Christopher and Pavlick, Ellie and Ili{\'c}, Suzana and Hesslow, Daniel and Castagn{\'e}, Roman and Luccioni, Alexandra Sasha and Yvon, Fran{\c{c}}ois and Gall{\'e}, Matthias and others},
  title         = {{BLOOM}: A {176B}-Parameter Open-Access Multilingual Language Model},
  journal       = {ArXiv},
  year          = {2022},
  eprint        = {2211.05100},
  archiveprefix = {arXiv},
  abbr          = {ArXiv},
  pdf           = {https://arxiv.org/abs/2211.05100},
  project       = {https://huggingface.co/bigscience/bloom},
  preprint      = {true},
  bibtex_show   = {true},
}
ArXiv
CEREAL: Few-Sample Clustering Evaluation
Nihal V. Nayak, Ethan R. Elenberg, and Clemens Rosenbaum
% arXiv preprint, 2022.
% {CEREAL} is braced so sentence-casing styles keep the acronym in capitals.
% The eprint id is taken from the arXiv URL in `pdf`.
@article{cereal:arxiv22,
  author        = {Nayak, Nihal V. and Elenberg, Ethan R. and Rosenbaum, Clemens},
  title         = {{CEREAL}: Few-Sample Clustering Evaluation},
  journal       = {ArXiv},
  year          = {2022},
  eprint        = {2210.00064},
  archiveprefix = {arXiv},
  abbr          = {ArXiv},
  pdf           = {https://arxiv.org/abs/2210.00064},
  selected      = {false},
  preprint      = {true},
  bibtex_show   = {true},
}
TMLR
Zero-Shot Learning with Common Sense Knowledge Graphs
% Journal article in Transactions on Machine Learning Research, 2022.
% abbr, pdf, project, code, selected and bibtex_show are non-standard display metadata.
@article{nayak:tmlr22,
  author      = {Nayak, Nihal V. and Bach, Stephen H.},
  title       = {Zero-Shot Learning with Common Sense Knowledge Graphs},
  journal     = {Transactions on Machine Learning Research},
  year        = {2022},
  abbr        = {TMLR},
  pdf         = {https://arxiv.org/abs/2006.10713},
  project     = {https://github.com/BatsResearch/zsl-kg},
  code        = {https://github.com/BatsResearch/nayak-arxiv20-code},
  selected    = {true},
  bibtex_show = {true},
}
ACL
PromptSource: An Integrated Development Environment and Repository for Natural Language Prompts
Stephen H. Bach, Victor Sanh, Zheng-Xin Yong, Albert Webson, Colin Raffel,
Nihal V. Nayak, Abheesht Sharma, Taewoon Kim, M Saiful Bari, Thibault Fevry, Zaid Alyafeai, Manan Dey, Andrea Santilli, Zhiqing Sun, Srulik Ben-David, Canwen Xu, Gunjan Chhablani, Han Wang, Jason Alan Fries, Maged S. Al-shaibani, Shanya Sharma, Urmish Thakker, Khalid Almubarak, Xiangru Tang, Dragomir Radev, Mike Tian-Jian Jiang, and Alexander M. Rush
In Meeting of the Association for Computational Linguistics (ACL) Demonstration 2022
% ACL 2022 demonstration paper.
% The camel-case name is protected as one whole word, {PromptSource}, rather
% than with per-letter braces, which can interfere with kerning and hyphenation.
@inproceedings{bach:acldemo22,
  author      = {Bach, Stephen H. and Sanh, Victor and Yong, Zheng-Xin and Webson, Albert and Raffel, Colin and Nayak, Nihal V. and Sharma, Abheesht and Kim, Taewoon and Bari, M Saiful and Fevry, Thibault and Alyafeai, Zaid and Dey, Manan and Santilli, Andrea and Sun, Zhiqing and Ben-David, Srulik and Xu, Canwen and Chhablani, Gunjan and Wang, Han and Fries, Jason Alan and Al-shaibani, Maged S. and Sharma, Shanya and Thakker, Urmish and Almubarak, Khalid and Tang, Xiangru and Radev, Dragomir and Jiang, Mike Tian-Jian and Rush, Alexander M.},
  title       = {{PromptSource}: {A}n Integrated Development Environment and Repository for Natural Language Prompts},
  booktitle   = {Meeting of the Association for Computational Linguistics (ACL) Demonstration},
  year        = {2022},
  abbr        = {ACL},
  pdf         = {https://arxiv.org/abs/2202.01279},
  project     = {https://github.com/bigscience-workshop/promptsource},
  bibtex_show = {true},
}
ICLR
Multitask Prompted Training Enables Zero-Shot Task Generalization
Victor Sanh, Albert Webson, Colin Raffel, Stephen H. Bach, Lintang Sutawika, Zaid Alyafeai, Antoine Chaffin, Arnaud Stiegler, Teven Le Scao, Arun Raja, Manan Dey, M Saiful Bari, Canwen Xu, Urmish Thakker, Shanya Sharma Sharma, Eliza Szczechla, Taewoon Kim, Gunjan Chhablani,
Nihal V. Nayak, Debajyoti Datta, Jonathan Chang, Mike Tian-Jian Jiang, Han Wang, Matteo Manica, Sheng Shen, Zheng Xin Yong, Harshit Pandey, Rachel Bawden, Thomas Wang, Trishala Neeraj, Jos Rozen, Abheesht Sharma, Andrea Santilli, Thibault Fevry, Jason Alan Fries, Ryan Teehan, Stella Biderman, Leo Gao, Tali Bers, Thomas Wolf, and Alexander M. Rush
In International Conference on Learning Representations (ICLR) 2022
% ICLR 2022 conference paper.
% "Le Scao, Teven" replaces "Scao, Teven Le" so the two-word surname is parsed
% as the last name and sorts and abbreviates correctly.
% NOTE(review): "Sharma, Shanya Sharma" is kept as found; another entry in this
% file lists "Sharma, Shanya" -- confirm whether these are the same person.
@inproceedings{sanh:iclr22,
  author      = {Sanh, Victor and Webson, Albert and Raffel, Colin and Bach, Stephen H. and Sutawika, Lintang and Alyafeai, Zaid and Chaffin, Antoine and Stiegler, Arnaud and Le Scao, Teven and Raja, Arun and Dey, Manan and Bari, M Saiful and Xu, Canwen and Thakker, Urmish and Sharma, Shanya Sharma and Szczechla, Eliza and Kim, Taewoon and Chhablani, Gunjan and Nayak, Nihal V. and Datta, Debajyoti and Chang, Jonathan and Jiang, Mike Tian-Jian and Wang, Han and Manica, Matteo and Shen, Sheng and Yong, Zheng Xin and Pandey, Harshit and Bawden, Rachel and Wang, Thomas and Neeraj, Trishala and Rozen, Jos and Sharma, Abheesht and Santilli, Andrea and Fevry, Thibault and Fries, Jason Alan and Teehan, Ryan and Biderman, Stella and Gao, Leo and Bers, Tali and Wolf, Thomas and Rush, Alexander M.},
  title       = {Multitask Prompted Training Enables Zero-Shot Task Generalization},
  booktitle   = {International Conference on Learning Representations (ICLR)},
  year        = {2022},
  abbr        = {ICLR},
  pdf         = {https://arxiv.org/abs/2110.08207},
  project     = {https://github.com/bigscience-workshop/promptsource},
  code        = {https://github.com/bigscience-workshop/t-zero},
  selected    = {true},
  bibtex_show = {true},
}
MLSys
TAGLETS: A System for Automatic Semi-Supervised Learning with Auxiliary Data
Wasu Piriyakulkij, Cristina Menghini, Ross Briden,
Nihal V. Nayak, Jeffrey Zhu, Elaheh Raisi, and Stephen H. Bach
In Conference on Machine Learning and Systems (MLSys) 2022
% MLSys 2022 conference paper.
% abbr, pdf, project and bibtex_show are non-standard display metadata.
@inproceedings{piriyakulkij:mlsys22,
  author      = {Piriyakulkij, Wasu and Menghini, Cristina and Briden, Ross and Nayak, Nihal V. and Zhu, Jeffrey and Raisi, Elaheh and Bach, Stephen H.},
  title       = {{TAGLETS}: {A} System for Automatic Semi-Supervised Learning with Auxiliary Data},
  booktitle   = {Conference on Machine Learning and Systems (MLSys)},
  year        = {2022},
  abbr        = {MLSys},
  pdf         = {https://arxiv.org/abs/2111.04798},
  project     = {https://github.com/BatsResearch/taglets},
  bibtex_show = {true},
}
2019
RANLP
Study on Unsupervised Statistical Machine Translation for Backtranslation
Anush Kumar,
Nihal V. Nayak, Aditya Chandra, and Mydhili K. Nair
In Proceedings of the International Conference on Recent Advances in Natural Language Processing (RANLP) 2019
% RANLP 2019 conference paper.
% abbr, pdf and bibtex_show are non-standard display metadata.
@inproceedings{kumar:ranlp19,
  author      = {Kumar, Anush and Nayak, Nihal V. and Chandra, Aditya and Nair, Mydhili K.},
  title       = {Study on Unsupervised Statistical Machine Translation for Backtranslation},
  booktitle   = {Proceedings of the International Conference on Recent Advances in Natural Language Processing (RANLP)},
  year        = {2019},
  pages       = {578--582},
  publisher   = {INCOMA Ltd.},
  address     = {Varna, Bulgaria},
  doi         = {10.26615/978-954-452-056-4_068},
  abbr        = {RANLP},
  pdf         = {https://aclanthology.org/R19-1068},
  bibtex_show = {true},
}
AAAI
DEXTER - Data EXTraction & Entity Recognition for Low Resource Datasets
Nihal V. Nayak, Pratheek Mahishi, and Sagar Rao
In AAAI Spring Symposium: Combining Machine Learning with Knowledge Engineering (AAAI-MAKE) 2019
% AAAI Spring Symposium (AAAI-MAKE) 2019 paper.
% {DEXTER} and {EXTraction} are braced so sentence-casing styles keep the
% capitals that spell out the acronym.
@inproceedings{nayak:aaai19,
  author      = {Nayak, Nihal V. and Mahishi, Pratheek and Rao, Sagar},
  title       = {{DEXTER} - Data {EXTraction} \& Entity Recognition for Low Resource Datasets},
  booktitle   = {AAAI Spring Symposium: Combining Machine Learning with Knowledge Engineering (AAAI-MAKE)},
  year        = {2019},
  abbr        = {AAAI},
  pdf         = {http://ceur-ws.org/Vol-2350/paper13.pdf},
  bibtex_show = {true},
}
2018
BEA
Context Based Approach for Second Language Acquisition
Nihal V. Nayak and Arjun R. Rao
In Proceedings of the Thirteenth Workshop on Innovative Use of NLP for Building Educational Applications (BEA) 2018
% ACL 2017 Student Research Workshop paper.
% {Flashcard} is braced as a whole word instead of only its first letter,
% since mid-word braces can interfere with kerning and hyphenation.
@inproceedings{nayak:acl2017,
  author      = {Nayak, Nihal V. and Chinchore, Tanmay and Hanumanth Rao, Aishwarya and Martin, Shane Michael and Simha, Sagar Nagaraj and Lingaraju, G. M. and Jamadagni, H. S.},
  title       = {{V} for Vocab: An Intelligent {Flashcard} Application},
  booktitle   = {Proceedings of {ACL} 2017, Student Research Workshop (ACL-SRW)},
  year        = {2017},
  pages       = {24--29},
  publisher   = {Association for Computational Linguistics},
  abbr        = {ACL-SRW},
  pdf         = {https://aclanthology.org/P17-3005},
  bibtex_show = {true},
}