% arXiv preprint: the identifier is stored in eprint/archiveprefix rather than in a journal field.
@misc{arnaout2026responsible,
  author        = {Arnaout, Hiba and Goel, Anmol and Schwartz, H. Andrew and Eberhardt, Steffen T. and Atzil-Slonim, Dana and Doherty, Gavin and Schwartz, Brian and Lutz, Wolfgang and Althoff, Tim and De Choudhury, Munmun and others},
  title         = {Responsible Evaluation of {AI} for Mental Health},
  year          = {2026},
  eprint        = {2602.00065},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2602.00065},
}
2025
2025
Do LLMs Suppress Naïve Theories? Investigating Scientific Reasoning and Development in GPT-4o
% Journal article. The accented letter uses a LaTeX escape so classic 8-bit BibTeX handles it;
% acronyms and the model name are braced so sentence-casing styles keep their capitals.
@article{shah2024naivetheories,
  author  = {Gupta, Sneh and Shah, Raj Sanjay and Varma, Sashank},
  title   = {Do {LLMs} Suppress Na{\"i}ve Theories? {Investigating} Scientific Reasoning and Development in {GPT-4o}},
  journal = {Advances in Cognitive Systems},
  year    = {2025},
  url     = {https://openreview.net/pdf?id=mMSxCWDkzP},
}
The World According to LLMs: How Geographic Origin Influences LLMs’ Entity Deduction Capabilities
Harsh Nishant Lalai, Raj Sanjay Shah, Jiaxin Pei, and 3 more authors
% Conference paper; the acronym is braced in both places so sentence-casing styles keep it upper-case.
@inproceedings{lalaiworld,
  author    = {Lalai, Harsh Nishant and Shah, Raj Sanjay and Pei, Jiaxin and Varma, Sashank and Wang, Yi-Chia and Emami, Ali},
  title     = {The World According to {LLMs}: How Geographic Origin Influences {LLMs}' Entity Deduction Capabilities},
  booktitle = {Second Conference on Language Modeling},
  year      = {2025},
  url       = {https://openreview.net/pdf?id=hJtvCfDfs1},
}
Guiding a user to interact with an intelligent computing system using best practices
Michelle Brachman, Zahra Ashktorab, Michael Desmond, and 5 more authors
% Patent application, recorded as a misc entry; the application number is carried in the note field.
@misc{brachman2025guiding,
  author    = {Brachman, Michelle and Ashktorab, Zahra and Desmond, Michael and Do, Hyo Jin and Dugan, Casey and Johnson, James and Pan, Qian and Shah, Raj Sanjay},
  title     = {Guiding a user to interact with an intelligent computing system using best practices},
  publisher = {Google Patents},
  note      = {US Patent App. 18/542,554},
  month     = jun,
  year      = {2025},
}
Can LLM-Simulated Practice and Feedback Upskill Human Counselors? A Randomized Study with 90+ Novice Counselors
Ryan Louie, Raj Sanjay Shah, Ifdita Hasan Orney, and 3 more authors
% arXiv preprint (no journal), so it is a misc entry with the identifier in eprint/archiveprefix.
% The acronym and the word after the question mark are braced to survive sentence-casing.
@misc{louie2025can,
  author        = {Louie, Ryan and Shah, Raj Sanjay and Orney, Ifdita Hasan and Pacheco, Juan Pablo and Brunskill, Emma and Yang, Diyi},
  title         = {Can {LLM}-Simulated Practice and Feedback Upskill Human Counselors? {A} Randomized Study with 90+ Novice Counselors},
  year          = {2025},
  eprint        = {2505.02428},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2505.02428},
}
Helping the Helper: Supporting Peer Counselors via AI-Empowered Practice and Feedback
Shang-Ling Hsu, Raj Sanjay Shah, Prathik Senthil, and 4 more authors
Proceedings of the ACM on Human-Computer Interaction, 2025
% Journal article. The acronym in the title is restored and braced; the publisher's city is
% split out of the publisher field into address.
@article{hsu2025helping,
  author    = {Hsu, Shang-Ling and Shah, Raj Sanjay and Senthil, Prathik and Ashktorab, Zahra and Dugan, Casey and Geyer, Werner and Yang, Diyi},
  title     = {Helping the Helper: Supporting Peer Counselors via {AI}-Empowered Practice and Feedback},
  journal   = {Proceedings of the ACM on Human-Computer Interaction},
  volume    = {9},
  number    = {2},
  pages     = {1--45},
  year      = {2025},
  publisher = {ACM},
  address   = {New York, NY, USA},
  doi       = {10.1145/3710993},
  url       = {https://doi.org/10.1145/3710993},
}
From Intentions to Techniques: A Comprehensive Taxonomy and Challenges in Text Watermarking for Large Language Models
Harsh Nishant Lalai, Aashish Anantha Ramakrishnan, Raj Sanjay Shah, and 1 more author
In Findings of the Association for Computational Linguistics: NAACL 2025, Apr 2025
% Conference paper in the Findings of NAACL 2025 volume; fields are laid out one per line.
@inproceedings{lalai-etal-2025-intentions,
  author    = {Lalai, Harsh Nishant and Anantha Ramakrishnan, Aashish and Shah, Raj Sanjay and Lee, Dongwon},
  title     = {From Intentions to Techniques: A Comprehensive Taxonomy and Challenges in Text Watermarking for Large Language Models},
  booktitle = {Findings of the Association for Computational Linguistics: NAACL 2025},
  editor    = {Chiruzzo, Luis and Ritter, Alan and Wang, Lu},
  pages     = {6162--6175},
  publisher = {Association for Computational Linguistics},
  address   = {Albuquerque, New Mexico},
  month     = apr,
  year      = {2025},
  isbn      = {979-8-89176-195-7},
  doi       = {10.18653/v1/2025.findings-naacl.343},
  url       = {https://aclanthology.org/2025.findings-naacl.343/},
}
TN-Eval: Rubric and Evaluation Protocols for Measuring the Quality of Behavioral Therapy Notes
Raj Sanjay Shah, Lei Xu, Qianchu Liu, and 3 more authors
In Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 6: Industry Track), Jul 2025
% Conference paper in the ACL 2025 industry-track volume; fields are laid out one per line.
@inproceedings{shah-etal-2025-tn,
  author    = {Shah, Raj Sanjay and Xu, Lei and Liu, Qianchu and Burnsky, Jon and Bertagnolli, Andrew and Shivade, Chaitanya},
  title     = {{TN}-Eval: Rubric and Evaluation Protocols for Measuring the Quality of Behavioral Therapy Notes},
  booktitle = {Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 6: Industry Track)},
  editor    = {Rehm, Georg and Li, Yunyao},
  pages     = {179--199},
  publisher = {Association for Computational Linguistics},
  address   = {Vienna, Austria},
  month     = jul,
  year      = {2025},
  isbn      = {979-8-89176-288-6},
  doi       = {10.18653/v1/2025.acl-industry.14},
  url       = {https://aclanthology.org/2025.acl-industry.14/},
}
Findings of the Third BabyLM Challenge: Accelerating Language Modeling Research with Cognitively Plausible Data
Lucas Charpentier, Leshem Choshen, Ryan Cotterell, and 8 more authors
% arXiv preprint (no journal), so it is a misc entry; the eprint id is taken from the entry's existing URL.
% NOTE(review): confirm that this arXiv id belongs to this title.
@misc{charpentier2025babylm,
  author        = {Charpentier, Lucas and Choshen, Leshem and Cotterell, Ryan and Gul, Mustafa Omer and Hu, Michael and Jumelet, Jaap and Linzen, Tal and Liu, Jing and Mueller, Aaron and Ross, Candace and others},
  title         = {Findings of the Third {BabyLM} Challenge: Accelerating Language Modeling Research with Cognitively Plausible Data},
  year          = {2025},
  eprint        = {2502.10645},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2502.10645},
}
The potential–and the pitfalls–of using pre-trained language models as cognitive science theories
% arXiv preprint (no journal), so it is a misc entry with the identifier in eprint/archiveprefix.
@misc{shah2025potential,
  author        = {Shah, Raj Sanjay and Varma, Sashank},
  title         = {The potential--and the pitfalls--of using pre-trained language models as cognitive science theories},
  year          = {2025},
  eprint        = {2501.12651},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2501.12651},
}
The unlearning mirage: A dynamic framework for evaluating LLM unlearning
Raj Sanjay Shah, Jing Huang, Keerthiram Murugesan, and 2 more authors
% Conference paper; the acronym in the title is braced so sentence-casing styles keep it upper-case.
@inproceedings{shah2025unlearning,
  author    = {Shah, Raj Sanjay and Huang, Jing and Murugesan, Keerthiram and Baracaldo, Nathalie and Yang, Diyi},
  title     = {The unlearning mirage: A dynamic framework for evaluating {LLM} unlearning},
  booktitle = {Second Conference on Language Modeling},
  year      = {2025},
  url       = {https://openreview.net/pdf?id=exW2SFJK4H},
}
2024
2024
Multi-Level Feedback Generation with Large Language Models for Empowering Novice Peer Counselors
Alicja Chaszczewicz, Raj Sanjay Shah, Ryan Louie, and 3 more authors
In Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics, 2024
% Conference paper (ACL 2024 proceedings); fields are laid out one per line.
@inproceedings{chaszczewicz2024multi,
  author    = {Chaszczewicz, Alicja and Shah, Raj Sanjay and Louie, Ryan and Arnow, Bruce A. and Kraut, Robert and Yang, Diyi},
  title     = {Multi-Level Feedback Generation with Large Language Models for Empowering Novice Peer Counselors},
  booktitle = {Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics},
  publisher = {Association for Computational Linguistics},
  year      = {2024},
}
Natural Mitigation of Catastrophic Interference: Continual Learning in Power-Law Learning Environments
Raj Sanjay Shah, Atith Gandhi, Vijay Marupudi, and 1 more author
% Conference paper. The entry carries booktitle, which article entries ignore, so the type is
% inproceedings and the venue is actually printed.
@inproceedings{gandhi2024catastrophic,
  author    = {Shah, Raj Sanjay and Gandhi, Atith and Marupudi, Vijay and Varma, Sashank},
  title     = {Natural Mitigation of Catastrophic Interference: Continual Learning in Power-Law Learning Environments},
  booktitle = {{ECAI} 2024},
  year      = {2024},
}
What Makes Digital Support Effective? How Therapeutic Skills Affect Clinical Well-Being
Wenjie Yang, Anna Fang, Raj Sanjay Shah, and 4 more authors
Proceedings of the ACM on Human-Computer Interaction, 2024
% Journal article; the publisher's city is split out of the publisher field into address.
@article{yang2024makes,
  author    = {Yang, Wenjie and Fang, Anna and Shah, Raj Sanjay and Mathur, Yash and Yang, Diyi and Zhu, Haiyi and Kraut, Robert E.},
  title     = {What Makes Digital Support Effective? {How} Therapeutic Skills Affect Clinical Well-Being},
  journal   = {Proceedings of the ACM on Human-Computer Interaction},
  volume    = {8},
  number    = {CSCW1},
  pages     = {1--29},
  year      = {2024},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
LLMs Assist NLP Researchers: Critique Paper (Meta-)Reviewing
Jiangshu Du, Yibo Wang, Wenting Zhao, and 8 more authors
In Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing, 2024
% Conference paper; acronyms in the title are braced so sentence-casing styles keep them upper-case.
@inproceedings{du2024llms,
  author    = {Du, Jiangshu and Wang, Yibo and Zhao, Wenting and Deng, Zhongfen and Liu, Shuaiqi and Lou, Renze and Zou, Henry Peng and Venkit, Pranav Narayanan and Zhang, Nan and Srinath, Mukund and others},
  title     = {{LLMs} Assist {NLP} Researchers: Critique Paper (Meta-)Reviewing},
  booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
  publisher = {Association for Computational Linguistics},
  year      = {2024},
}
How Well Do Deep Learning Models Capture Human Concepts? The Case of the Typicality Effect
Siddhartha K. Vemuri, Raj Sanjay Shah, and Sashank Varma
Proceedings of the 46th Annual Meeting of the Cognitive Science Society, 2024
% Conference paper: the proceedings title belongs in booktitle, not journal.
@inproceedings{vemuri2024well,
  author    = {Vemuri, Siddhartha K. and Shah, Raj Sanjay and Varma, Sashank},
  title     = {How Well Do Deep Learning Models Capture Human Concepts? {The} Case of the Typicality Effect},
  booktitle = {Proceedings of the 46th Annual Meeting of the Cognitive Science Society},
  year      = {2024},
}
Incremental Comprehension of Garden-Path Sentences by Large Language Models: Semantic Interpretation, Syntactic Re-Analysis, and Attention
Andrew Li, Xianle Feng, Siddhant Narang, and 4 more authors
Proceedings of the Annual Meeting of the Cognitive Science Society, 2024
% Conference paper: the proceedings title belongs in booktitle, not journal. The volume number is kept.
@inproceedings{li2024incremental,
  author    = {Li, Andrew and Feng, Xianle and Narang, Siddhant and Peng, Austin and Cai, Tianle and Shah, Raj Sanjay and Varma, Sashank},
  title     = {Incremental Comprehension of Garden-Path Sentences by Large Language Models: Semantic Interpretation, Syntactic Re-Analysis, and Attention},
  booktitle = {Proceedings of the Annual Meeting of the Cognitive Science Society},
  volume    = {46},
  year      = {2024},
}
Development of Cognitive Intelligence in Pre-trained Language Models
Raj Sanjay Shah, Khushi Bhardwaj, and Sashank Varma
Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing, 2024
% Conference paper: the proceedings title belongs in booktitle, not journal.
@inproceedings{shah2024cognitive,
  author    = {Shah, Raj Sanjay and Bhardwaj, Khushi and Varma, Sashank},
  title     = {Development of Cognitive Intelligence in Pre-trained Language Models},
  booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
  publisher = {Association for Computational Linguistics},
  year      = {2024},
}
Understanding Graphical Perception in Data Visualization through Zero-Shot Prompting of Vision-Language Models
Grace Guo*, Jenna Jiayi Kang*, Raj Sanjay Shah*, and 2 more authors
NeurIPS 2024 Workshop on Behavioral Machine Learning, 2024
% Workshop paper: the workshop name belongs in booktitle, not journal.
@inproceedings{shah2024graphperception,
  author    = {Guo, Grace and Kang, Jenna Jiayi and Shah, Raj Sanjay and Pfister, Hanspeter and Varma, Sashank},
  title     = {Understanding Graphical Perception in Data Visualization through Zero-Shot Prompting of Vision-Language Models},
  booktitle = {{NeurIPS} 2024 Workshop on Behavioral Machine Learning},
  year      = {2024},
}
2023
2023
Pre-training LLMs Using a Human-Like Development Data Corpus
Khushi Bhardwaj, Raj Sanjay Shah, and Sashank Varma
Proceedings of the BabyLM Challenge at the 27th Conference on Computational Natural Language Learning, 2023
% Conference paper: the proceedings title belongs in booktitle, not journal.
% The host venue is the Conference on Computational Natural Language Learning (CoNLL).
@inproceedings{bhardwaj2023pre,
  author    = {Bhardwaj, Khushi and Shah, Raj Sanjay and Varma, Sashank},
  title     = {Pre-training {LLMs} Using a Human-Like Development Data Corpus},
  booktitle = {Proceedings of the {BabyLM} Challenge at the 27th Conference on Computational Natural Language Learning},
  year      = {2023},
}
Numeric Magnitude Comparison Effects in Large Language Models
Raj Sanjay Shah, Vijay Marupudi, Reba Koenen, and 2 more authors
In Findings of the Association for Computational Linguistics: ACL 2023, 2023
% Conference paper in the Findings of ACL 2023 volume; fields are laid out one per line.
@inproceedings{shah2023numeric,
  author    = {Shah, Raj Sanjay and Marupudi, Vijay and Koenen, Reba and Bhardwaj, Khushi and Varma, Sashank},
  title     = {Numeric Magnitude Comparison Effects in Large Language Models},
  booktitle = {Findings of the Association for Computational Linguistics: ACL 2023},
  publisher = {Association for Computational Linguistics},
  year      = {2023},
}
2022
2022
Modeling Motivational Interviewing Strategies on an Online Peer-to-Peer Counseling Platform
Raj Sanjay Shah, Faye Holt, Shirley Anugrah Hayati, and 4 more authors
Proceedings of the ACM on Human-Computer Interaction, 2022
% Journal article; the publisher's city is split out of the publisher field into address.
@article{shah2022miti,
  author    = {Shah, Raj Sanjay and Holt, Faye and Hayati, Shirley Anugrah and Agarwal, Aastha and Wang, Yi-Chia and Kraut, Robert and Yang, Diyi},
  title     = {Modeling Motivational Interviewing Strategies on an Online Peer-to-Peer Counseling Platform},
  journal   = {Proceedings of the ACM on Human-Computer Interaction},
  volume    = {6},
  number    = {CSCW2},
  pages     = {1--24},
  year      = {2022},
  publisher = {ACM},
  address   = {New York, NY, USA},
  doi       = {10.1145/3555640},
}
When FLUE Meets FLANG: Benchmarks and Large Pretrained Language Models for the Financial Domain
Raj Sanjay Shah, Kunal Chawla, Dheeraj Eidnani, and 7 more authors
In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, 2022
% Conference paper; the benchmark and model names are braced so sentence-casing styles keep them upper-case.
@inproceedings{shah2022flang,
  author    = {Shah, Raj Sanjay and Chawla, Kunal and Eidnani, Dheeraj and Shah, Agam and Du, Wendi and Chava, Sudheer and Raman, Natraj and Smiley, Charese and Chen, Jiaao and Yang, Diyi},
  title     = {When {FLUE} Meets {FLANG}: Benchmarks and Large Pretrained Language Models for the Financial Domain},
  booktitle = {Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
}
JARVix at SemEval-2022 Task 2: It Takes One to Know One? Idiomaticity Detection Using Zero and One-Shot Learning
Ashwin Pathak, Raj Sanjay Shah, Vaibhav Kumar, and 1 more author
Proceedings of the 16th International Workshop on Semantic Evaluation (SemEval), 2022
% Workshop paper: the proceedings title belongs in booktitle, not journal.
% The system and task names are braced so sentence-casing styles keep their capitals.
@inproceedings{jarvix2022,
  author    = {Pathak, Ashwin and Shah, Raj Sanjay and Kumar, Vaibhav and Jakhotiya, Yash},
  title     = {{JARVix} at {SemEval}-2022 Task 2: It Takes One to Know One? {Idiomaticity} Detection Using Zero and One-Shot Learning},
  booktitle = {Proceedings of the 16th International Workshop on Semantic Evaluation ({SemEval})},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.semeval-1.19/},
}
2021
2021
Bitcoin Data Analytics: Scalable Techniques for Transaction Clustering and Embedding Generation
Raj Sanjay Shah, Ashutosh Bhatia, Atith Gandhi, and 1 more author
In 2021 International Conference on Communication Systems & Networks (COMSNETS), 2021
% Conference paper. The ampersand in the venue name is escaped; a bare one is a LaTeX
% alignment character and breaks typesetting of the bibliography.
@inproceedings{bitcoin2021,
  author    = {Shah, Raj Sanjay and Bhatia, Ashutosh and Gandhi, Atith and Mathur, Shray},
  title     = {{Bitcoin} Data Analytics: Scalable Techniques for Transaction Clustering and Embedding Generation},
  booktitle = {2021 International Conference on Communication Systems \& Networks ({COMSNETS})},
  publisher = {IEEE},
  year      = {2021},
  doi       = {10.1109/COMSNETS51098.2021.9352922},
}
2020
2020
CTI-Twitter: Gathering Cyber Threat Intelligence from Twitter Using Integrated Supervised and Unsupervised Learning
Linn-Mari Kristiansen, Vinti Agarwal, Katrin Franke, and 1 more author
In 2020 IEEE International Conference on Big Data (BigData), 2020
% Conference paper; the system name, platform name and venue acronyms are braced so
% sentence-casing styles keep their capitals.
@inproceedings{cti2020,
  author    = {Kristiansen, Linn-Mari and Agarwal, Vinti and Franke, Katrin and Shah, Raj Sanjay},
  title     = {{CTI-Twitter}: Gathering Cyber Threat Intelligence from {Twitter} Using Integrated Supervised and Unsupervised Learning},
  booktitle = {2020 {IEEE} International Conference on Big Data ({BigData})},
  publisher = {IEEE},
  year      = {2020},
  doi       = {10.1109/BigData50022.2020.9378393},
}