% GroundCUA paper (2025).
% NOTE(review): no booktitle/eprint is recorded for this entry -- add the venue once confirmed.
@inproceedings{groundcua,
  author = {Nayak, Shravan and Feizi, Aarash and Jian, Xiangru and Lin, Kevin Qinghong and Li, Kaixin and Awal, Rabiul and Lù, Xing Han and Obando-Ceron, Johan and Rodriguez, Juan A. and Chapados, Nicolas and Vazquez, David and Romero-Soriano, Adriana and Rabbany, Reihaneh and Taslakian, Perouz and Pal, Christopher and Gella, Spandana and Rajeswar, Sai},
  title  = {Grounding Computer Use Agents on Human Demonstrations},
  year   = {2025},
}
Pre-print
Value Drifts: Tracing Value Alignment During LLM Post-Training
Mehar Bhatia, Shravan Nayak, Gaurav Kamath, and
3 more authors
% Preprint without a proceedings venue, so it is typed @misc; the acronym in the
% title is braced so sentence-casing styles keep it upper-case.
@misc{valuedrifts,
  author = {Bhatia, Mehar and Nayak, Shravan and Kamath, Gaurav and Mosbach, Marius and Shwartz, Vered and Reddy, Siva},
  title  = {Value Drifts: Tracing Value Alignment During {LLM} Post-Training},
  year   = {2025},
  note   = {Preprint},
}
EMNLP Findings
CulturalFrames: Assessing Cultural Expectation Alignment in Text-to-Image Models and Evaluation Metrics
Shravan Nayak, Mehar Bhatia, Xiaofeng Zhang, and
6 more authors
% EMNLP Findings paper (2025). The camel-case dataset name is braced so styles
% that downcase titles do not flatten it.
@inproceedings{nayak2025culturalframesassessingculturalexpectation,
  author    = {Nayak, Shravan and Bhatia, Mehar and Zhang, Xiaofeng and Rieser, Verena and Hendricks, Lisa Anne and van Steenkiste, Sjoerd and Goyal, Yash and Stańczak, Karolina and Agrawal, Aishwarya},
  title     = {{CulturalFrames}: Assessing Cultural Expectation Alignment in Text-to-Image Models and Evaluation Metrics},
  booktitle = {EMNLP Findings},
  year      = {2025},
}
ICML
UI-Vision: A Desktop-centric GUI Benchmark for Visual Perception and Interaction
Shravan Nayak, Xiangru Jian, Kevin Qinghong Lin, and
11 more authors
% ICML paper (2025). The benchmark name and the GUI acronym are braced to
% survive sentence-casing bibliography styles.
@inproceedings{nayak2025uivisiondesktopcentricguibenchmark,
  author    = {Nayak, Shravan and Jian, Xiangru and Lin, Kevin Qinghong and Rodriguez, Juan A. and Kalsi, Montek and Awal, Rabiul and Chapados, Nicolas and Özsu, M. Tamer and Agrawal, Aishwarya and Vazquez, David and Pal, Christopher and Taslakian, Perouz and Gella, Spandana and Rajeswar, Sai},
  title     = {{UI-Vision}: A Desktop-centric {GUI} Benchmark for Visual Perception and Interaction},
  booktitle = {ICML},
  year      = {2025},
}
ICML
LIVS: A Pluralistic Alignment Dataset for Inclusive Public Spaces
Rashid Mushkani, Shravan Nayak, Hugo Berard, and
3 more authors
% ICML paper (2025). The dataset acronym is braced so it is not lower-cased by
% styles that sentence-case titles.
@inproceedings{mushkani2025livspluralisticalignmentdataset,
  author    = {Mushkani, Rashid and Nayak, Shravan and Berard, Hugo and Cohen, Allison and Koseki, Shin and Bertrand, Hadrien},
  title     = {{LIVS}: A Pluralistic Alignment Dataset for Inclusive Public Spaces},
  booktitle = {ICML},
  year      = {2025},
}
2024
ICLR
BigDocs: An Open and Permissively-Licensed Dataset for Training Multimodal Models on Document and Code Tasks
Juan Rodriguez, Xiangru Jian, Siba Smarak Panigrahi, and
40 more authors
% BigDocs paper, identified by its arXiv eprint (2412.04626).
% NOTE(review): the entry carries no booktitle although it is listed under an
% ICLR label -- confirm the proceedings name and year before adding one.
@inproceedings{rodriguez2024bigdocsopenpermissivelylicenseddataset,
  author        = {Rodriguez, Juan and Jian, Xiangru and Panigrahi, Siba Smarak and Zhang, Tianyu and Feizi, Aarash and Puri, Abhay and Kalkunte, Akshay and Savard, François and Masry, Ahmed and Nayak, Shravan and Awal, Rabiul and Massoud, Mahsa and Abaskohi, Amirhossein and Li, Zichao and Wang, Suyuchen and Noël, Pierre-André and Richter, Mats Leon and Vadacchino, Saverio and Agarwal, Shubbam and Biswas, Sanket and Shanian, Sara and Zhang, Ying and Bolger, Noah and MacDonald, Kurt and Fauvel, Simon and Tejaswi, Sathwik and Sunkara, Srinivas and Monteiro, Joao and Dvijotham, Krishnamurthy DJ and Scholak, Torsten and Chapados, Nicolas and Kharagani, Sepideh and Hughes, Sean and Özsu, M. Tamer and Reddy, Siva and Pedersoli, Marco and Bengio, Yoshua and Pal, Christopher and Laradji, Issam and Gella, Spandana and Taslakian, Perouz and Vazquez, David and Rajeswar, Sai},
  title         = {{BigDocs}: An Open and Permissively-Licensed Dataset for Training Multimodal Models on Document and Code Tasks},
  year          = {2024},
  eprint        = {2412.04626},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
}
EMNLP
Benchmarking Vision Language Models for Cultural Understanding
Shravan Nayak, Kanishk Jain, Rabiul Awal, and
5 more authors
% EMNLP paper (2024) on cultural understanding in vision language models.
@inproceedings{nayak2024benchmarkingvisionlanguagemodels,
  author    = {Nayak, Shravan and Jain, Kanishk and Awal, Rabiul and Reddy, Siva and van Steenkiste, Sjoerd and Hendricks, Lisa Anne and Stańczak, Karolina and Agrawal, Aishwarya},
  title     = {Benchmarking Vision Language Models for Cultural Understanding},
  booktitle = {EMNLP},
  year      = {2024},
}
EMNLP Findings
Towards Adversarially Robust Vision-Language Models: Insights from Design Choices and Prompt Formatting Techniques
Rishika Bhagwatkar, Shravan Nayak, Reza Bayat, and
4 more authors
In EMNLP Findings, TiFA Workshop (Outstanding paper), NextGenAISafety Workshop at ICML, 2024
% EMNLP Findings paper (2024); the booktitle also lists the workshops where it appeared.
@inproceedings{bhagwatkar2024adversariallyrobustvisionlanguagemodels,
  author    = {Bhagwatkar, Rishika and Nayak, Shravan and Bayat, Reza and Roger, Alexis and Kaplan, Daniel Z. and Bashivan, Pouya and Rish, Irina},
  title     = {Towards Adversarially Robust Vision-Language Models: Insights from Design Choices and Prompt Formatting Techniques},
  booktitle = {EMNLP Findings, TiFA Workshop (Outstanding paper), NextGenAISafety Workshop at ICML},
  year      = {2024},
}
ESSV
Can We See Your Response Before You Speak? Exploring Linguistic Information Found in Inter-Utterance Pauses
Christian Schuler, Shravan Nayak, Debjoy Saha, and
1 more author
% Paper in Elektronische Sprachsignalverarbeitung (2024).
@inproceedings{SchulerNayakSahaetal.2024,
  author    = {Schuler, Christian and Nayak, Shravan and Saha, Debjoy and Baumann, Timo},
  title     = {Can We See Your Response Before You Speak? Exploring Linguistic Information Found in Inter-Utterance Pauses},
  booktitle = {Elektronische Sprachsignalverarbeitung},
  year      = {2024},
}
% Workshop paper (Pluralistic Alignment Workshop at NeurIPS 2024), with its OpenReview link.
@inproceedings{nayak2024midspace,
  author    = {Nayak, Shravan and Mushkani, Rashid and Berard, Hugo and Cohen, Allison and Koseki, Shin and Bertrand, Hadrien},
  title     = {{MID}-Space: Aligning Diverse Communities' Needs to Inclusive Public Spaces},
  booktitle = {Pluralistic Alignment Workshop at NeurIPS 2024},
  year      = {2024},
  url       = {https://openreview.net/forum?id=kyfkMRT4Ao},
}
% Workshop paper; the workshop edition in booktitle matches the entry's year (2023).
@inproceedings{nayak2023,
  author    = {Nayak, Shravan and Ranathunga, Surangika and Thillainathan, Sarubi and Hung, Rikki and Rinaldi, Anthony and Wang, Yining and Mackey, Jonah and Ho, Andrew and Lee, En-Shiun Annie},
  title     = {Leveraging Auxiliary Domain Parallel Data in Intermediate Task Fine-tuning for Low-resource Translation},
  booktitle = {ICLR 2023 Workshop on Practical ML for Developing Countries},
  year      = {2023},
}
2022
LREC
Merkel Podcast Corpus: A Multimodal Dataset Compiled from 16 Years of Angela Merkel’s Weekly Video Podcasts
Debjoy Saha, Shravan Nayak, and Timo Baumann
In International Conference on Language Resources and Evaluation, 2022
% LREC paper (2022). The proper nouns in the title are braced so sentence-casing
% styles keep their capitals.
@inproceedings{Saha2022MerkelPC,
  author    = {Saha, Debjoy and Nayak, Shravan and Baumann, Timo},
  title     = {{Merkel} Podcast Corpus: A Multimodal Dataset Compiled from 16 Years of {Angela Merkel}’s Weekly Video Podcasts},
  booktitle = {International Conference on Language Resources and Evaluation},
  year      = {2022},
}
ACL Findings
Pre-Trained Multilingual Sequence-to-Sequence Models: A Hope for Low-Resource Language Translation?
En-Shiun Lee, Sarubi Thillainathan, Shravan Nayak, and
4 more authors
In Findings of the Association for Computational Linguistics: ACL 2022, May 2022
% Findings of ACL 2022 paper, pages 58--67.
@inproceedings{lee-etal-2022-pre,
  author    = {Lee, En-Shiun and Thillainathan, Sarubi and Nayak, Shravan and Ranathunga, Surangika and Adelani, David and Su, Ruisi and McCarthy, Arya},
  title     = {Pre-Trained Multilingual Sequence-to-Sequence Models: A Hope for Low-Resource Language Translation?},
  booktitle = {Findings of the Association for Computational Linguistics: ACL 2022},
  publisher = {Association for Computational Linguistics},
  address   = {Dublin, Ireland},
  month     = may,
  year      = {2022},
  pages     = {58--67},
}
ICMI
A Deep Dive Into Neural Synchrony Evaluation for Audio-visual Translation
Shravan Nayak, Christian Schuler, Debjoy Saha, and
1 more author
International Conference on Multimodal Interaction, May 2022
% Conference paper: the conference name belongs in booktitle of an
% @inproceedings entry, not in the journal field of an @article.
@inproceedings{Nayak2022ADD,
  author    = {Nayak, Shravan and Schuler, Christian and Saha, Debjoy and Baumann, Timo},
  title     = {A Deep Dive Into Neural Synchrony Evaluation for Audio-visual Translation},
  booktitle = {International Conference on Multimodal Interaction},
  year      = {2022},
}
2020
COLING
The Two Shades of Dubbing in Neural Machine Translation
Alina Karakanta, Supratik Bhattacharya, Shravan Nayak, and
3 more authors
In International Conference on Computational Linguistics, May 2020
% COLING paper (2020) on dubbing in neural machine translation.
@inproceedings{Karakanta2020TheTS,
  author    = {Karakanta, Alina and Bhattacharya, Supratik and Nayak, Shravan and Baumann, Timo and Negri, Matteo and Turchi, Marco},
  title     = {The Two Shades of Dubbing in Neural Machine Translation},
  booktitle = {International Conference on Computational Linguistics},
  year      = {2020},
}
% Workshop paper: the venue is a workshop, so it is recorded as booktitle of an
% @inproceedings entry rather than as a journal.
@inproceedings{Nayak2020SeeMS,
  author    = {Nayak, Shravan and Baumann, Timo and Bhattacharya, Supratik and Karakanta, Alina and Negri, Matteo and Turchi, Marco},
  title     = {See me Speaking? Differentiating on Whether Words are Spoken On Screen or Off to Optimize Machine Dubbing},
  booktitle = {Deep Video Understanding Workshop, ICMI},
  year      = {2020},
}
IEEE ISGT
Stochastic Game Frameworks for Efficient Energy Management in Microgrid Networks
Shravan Nayak, Chanakya Ajit Ekbote, Annanya Pratap Singh Chauhan, and
5 more authors
IEEE PES Innovative Smart Grid Technologies Europe (ISGT-Europe), May 2020
% Conference paper (ISGT-Europe 2020): typed @inproceedings with the conference
% in booktitle; the page range uses the en-dash form (double hyphen).
@inproceedings{Nayak2020StochasticGF,
  author    = {Nayak, Shravan and Ekbote, Chanakya Ajit and Chauhan, Annanya Pratap Singh and Diddigi, Raghuram Bharadwaj and Ray, Prishita and Sikdar, Abhinava and Danda, Sai Koti Reddy and Bhatnagar, Shalabh},
  title     = {Stochastic Game Frameworks for Efficient Energy Management in Microgrid Networks},
  booktitle = {IEEE PES Innovative Smart Grid Technologies Europe (ISGT-Europe)},
  year      = {2020},
  pages     = {116--120},
}