Publications | Raj S. Shah

2026

Responsible Evaluation of AI for Mental Health

Hiba Arnaout, Anmol Goel, H. Andrew Schwartz, and 8 more authors

arXiv preprint arXiv:2602.00065, 2026

@misc{arnaout2026responsible,
  title         = {Responsible Evaluation of {AI} for Mental Health},
  author        = {Arnaout, Hiba and Goel, Anmol and Schwartz, H. Andrew and Eberhardt, Steffen T. and Atzil-Slonim, Dana and Doherty, Gavin and Schwartz, Brian and Lutz, Wolfgang and Althoff, Tim and De Choudhury, Munmun and others},
  year          = {2026},
  eprint        = {2602.00065},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2602.00065},
}

2025

Do LLMs Suppress Naïve Theories? Investigating Scientific Reasoning and Development in GPT-4o

Sneh Gupta, Raj Sanjay Shah, and Sashank Varma

Advances in Cognitive Systems, 2025

Bib PDF

@article{shah2024naivetheories,
  title   = {Do {LLMs} Suppress Na{\"i}ve Theories? {Investigating} Scientific Reasoning and Development in {GPT-4o}},
  author  = {Gupta, Sneh and Shah, Raj Sanjay and Varma, Sashank},
  journal = {Advances in Cognitive Systems},
  year    = {2025},
  url     = {https://openreview.net/pdf?id=mMSxCWDkzP},
}

The World According to LLMs: How Geographic Origin Influences LLMs’ Entity Deduction Capabilities

Harsh Nishant Lalai, Raj Sanjay Shah, Jiaxin Pei, and 3 more authors

In Second Conference on Language Modeling, 2025

Bib PDF

@inproceedings{lalaiworld,
  title     = {The World According to {LLMs}: How Geographic Origin Influences {LLMs'} Entity Deduction Capabilities},
  author    = {Lalai, Harsh Nishant and Shah, Raj Sanjay and Pei, Jiaxin and Varma, Sashank and Wang, Yi-Chia and Emami, Ali},
  booktitle = {Second Conference on Language Modeling},
  year      = {2025},
  url       = {https://openreview.net/pdf?id=hJtvCfDfs1},
}

Guiding a user to interact with an intelligent computing system using best practices

Michelle Brachman, Zahra Ashktorab, Michael Desmond, and 5 more authors

Jun 2025

US Patent App. 18/542,554

Bib

@misc{brachman2025guiding,
  author    = {Brachman, Michelle and Ashktorab, Zahra and Desmond, Michael and Do, Hyo Jin and Dugan, Casey and Johnson, James and Pan, Qian and Shah, Raj Sanjay},
  title     = {Guiding a user to interact with an intelligent computing system using best practices},
  publisher = {Google Patents},
  note      = {US Patent App. 18/542,554},
  month     = jun,
  year      = {2025},
}

Can LLM-simulated practice and feedback upskill human counselors? A randomized study with 90+ novice counselors

Ryan Louie, Raj Sanjay Shah, Ifdita Hasan Orney, and 3 more authors

2025

arXiv Bib PDF

@misc{louie2025can,
  title         = {Can {LLM}-Simulated Practice and Feedback Upskill Human Counselors? {A} Randomized Study with 90+ Novice Counselors},
  author        = {Louie, Ryan and Shah, Raj Sanjay and Orney, Ifdita Hasan and Pacheco, Juan Pablo and Brunskill, Emma and Yang, Diyi},
  year          = {2025},
  eprint        = {2505.02428},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2505.02428},
}

Helping the helper: Supporting peer counselors via AI-empowered practice and feedback

Shang-Ling Hsu, Raj Sanjay Shah, Prathik Senthil, and 4 more authors

Proceedings of the ACM on Human-Computer Interaction, 2025

DOI Bib PDF

@article{hsu2025helping,
  title     = {Helping the Helper: Supporting Peer Counselors via {AI}-Empowered Practice and Feedback},
  author    = {Hsu, Shang-Ling and Shah, Raj Sanjay and Senthil, Prathik and Ashktorab, Zahra and Dugan, Casey and Geyer, Werner and Yang, Diyi},
  journal   = {Proceedings of the ACM on Human-Computer Interaction},
  volume    = {9},
  number    = {2},
  pages     = {1--45},
  year      = {2025},
  publisher = {ACM},
  address   = {New York, NY, USA},
  doi       = {10.1145/3710993},
  url       = {https://doi.org/10.1145/3710993},
}

From Intentions to Techniques: A Comprehensive Taxonomy and Challenges in Text Watermarking for Large Language Models

Harsh Nishant Lalai, Aashish Anantha Ramakrishnan, Raj Sanjay Shah, and 1 more author

In Findings of the Association for Computational Linguistics: NAACL 2025, Apr 2025

DOI Bib PDF

@inproceedings{lalai-etal-2025-intentions,
  author    = {Lalai, Harsh Nishant and Anantha Ramakrishnan, Aashish and Shah, Raj Sanjay and Lee, Dongwon},
  title     = {From Intentions to Techniques: A Comprehensive Taxonomy and Challenges in Text Watermarking for Large Language Models},
  booktitle = {Findings of the Association for Computational Linguistics: NAACL 2025},
  editor    = {Chiruzzo, Luis and Ritter, Alan and Wang, Lu},
  pages     = {6162--6175},
  publisher = {Association for Computational Linguistics},
  address   = {Albuquerque, New Mexico},
  month     = apr,
  year      = {2025},
  isbn      = {979-8-89176-195-7},
  doi       = {10.18653/v1/2025.findings-naacl.343},
  url       = {https://aclanthology.org/2025.findings-naacl.343/},
}

TN-Eval: Rubric and Evaluation Protocols for Measuring the Quality of Behavioral Therapy Notes

Raj Sanjay Shah, Lei Xu, Qianchu Liu, and 3 more authors

In Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 6: Industry Track), Jul 2025

DOI Bib PDF

@inproceedings{shah-etal-2025-tn,
  author    = {Shah, Raj Sanjay and Xu, Lei and Liu, Qianchu and Burnsky, Jon and Bertagnolli, Andrew and Shivade, Chaitanya},
  title     = {{TN}-Eval: Rubric and Evaluation Protocols for Measuring the Quality of Behavioral Therapy Notes},
  booktitle = {Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 6: Industry Track)},
  editor    = {Rehm, Georg and Li, Yunyao},
  pages     = {179--199},
  publisher = {Association for Computational Linguistics},
  address   = {Vienna, Austria},
  month     = jul,
  year      = {2025},
  isbn      = {979-8-89176-288-6},
  doi       = {10.18653/v1/2025.acl-industry.14},
  url       = {https://aclanthology.org/2025.acl-industry.14/},
}

Findings of the Third BabyLM Challenge: Accelerating Language Modeling Research with Cognitively Plausible Data

Lucas Charpentier, Leshem Choshen, Ryan Cotterell, and 8 more authors

2025

arXiv Bib PDF

@misc{charpentier2025babylm,
  title         = {Findings of the Third {BabyLM} Challenge: Accelerating Language Modeling Research with Cognitively Plausible Data},
  author        = {Charpentier, Lucas and Choshen, Leshem and Cotterell, Ryan and Gul, Mustafa Omer and Hu, Michael and Jumelet, Jaap and Linzen, Tal and Liu, Jing and Mueller, Aaron and Ross, Candace and others},
  year          = {2025},
  eprint        = {2502.10645},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2502.10645},
}

The potential—and the pitfalls—of using pre-trained language models as cognitive science theories

Raj Sanjay Shah and Sashank Varma

2025

arXiv Bib PDF

@misc{shah2025potential,
  title         = {The Potential---and the Pitfalls---of Using Pre-trained Language Models as Cognitive Science Theories},
  author        = {Shah, Raj Sanjay and Varma, Sashank},
  year          = {2025},
  eprint        = {2501.12651},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2501.12651},
}

The unlearning mirage: A dynamic framework for evaluating LLM unlearning

Raj Sanjay Shah, Jing Huang, Keerthiram Murugesan, and 2 more authors

In Second Conference on Language Modeling, 2025

Bib PDF

@inproceedings{shah2025unlearning,
  title     = {The Unlearning Mirage: A Dynamic Framework for Evaluating {LLM} Unlearning},
  author    = {Shah, Raj Sanjay and Huang, Jing and Murugesan, Keerthiram and Baracaldo, Nathalie and Yang, Diyi},
  booktitle = {Second Conference on Language Modeling},
  year      = {2025},
  url       = {https://openreview.net/pdf?id=exW2SFJK4H},
}

2024

Multi-Level Feedback Generation with Large Language Models for Empowering Novice Peer Counselors

Alicja Chaszczewicz, Raj Sanjay Shah, Ryan Louie, and 3 more authors

In Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics, 2024

arXiv Bib PDF

@inproceedings{chaszczewicz2024multi,
  author    = {Chaszczewicz, Alicja and Shah, Raj Sanjay and Louie, Ryan and Arnow, Bruce A. and Kraut, Robert and Yang, Diyi},
  title     = {Multi-Level Feedback Generation with Large Language Models for Empowering Novice Peer Counselors},
  booktitle = {Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics},
  publisher = {Association for Computational Linguistics},
  year      = {2024},
}

Natural Mitigation of Catastrophic Interference: Continual Learning in Power-Law Learning Environments

Raj Sanjay Shah, Atith Gandhi, Vijay Marupudi, and 1 more author

2024

arXiv Bib PDF

@inproceedings{gandhi2024catastrophic,
  title     = {Natural Mitigation of Catastrophic Interference: Continual Learning in Power-Law Learning Environments},
  author    = {Shah, Raj Sanjay and Gandhi, Atith and Marupudi, Vijay and Varma, Sashank},
  booktitle = {{ECAI} 2024},
  year      = {2024},
}

What Makes Digital Support Effective? How Therapeutic Skills Affect Clinical Well-Being

Wenjie Yang, Anna Fang, Raj Sanjay Shah, and 4 more authors

Proceedings of the ACM on Human-Computer Interaction, 2024

Bib PDF

@article{yang2024makes,
  title     = {What Makes Digital Support Effective? {How} Therapeutic Skills Affect Clinical Well-Being},
  author    = {Yang, Wenjie and Fang, Anna and Shah, Raj Sanjay and Mathur, Yash and Yang, Diyi and Zhu, Haiyi and Kraut, Robert E.},
  journal   = {Proceedings of the ACM on Human-Computer Interaction},
  volume    = {8},
  number    = {CSCW1},
  pages     = {1--29},
  year      = {2024},
  publisher = {ACM},
  address   = {New York, NY, USA},
}

LLMs Assist NLP Researchers: Critique Paper (Meta-)Reviewing

Jiangshu Du, Yibo Wang, Wenting Zhao, and 8 more authors

In Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing, 2024

arXiv Bib PDF

@inproceedings{du2024llms,
  title     = {{LLMs} Assist {NLP} Researchers: Critique Paper (Meta-)Reviewing},
  author    = {Du, Jiangshu and Wang, Yibo and Zhao, Wenting and Deng, Zhongfen and Liu, Shuaiqi and Lou, Renze and Zou, Henry Peng and Venkit, Pranav Narayanan and Zhang, Nan and Srinath, Mukund and others},
  booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
  year      = {2024},
  publisher = {Association for Computational Linguistics},
}

How Well Do Deep Learning Models Capture Human Concepts? The Case of the Typicality Effect

Siddhartha K. Vemuri, Raj Sanjay Shah, and Sashank Varma

Proceedings of the 46th Annual Meeting of the Cognitive Science Society, 2024

Bib PDF

@inproceedings{vemuri2024well,
  title     = {How Well Do Deep Learning Models Capture Human Concepts? {The} Case of the Typicality Effect},
  author    = {Vemuri, Siddhartha K. and Shah, Raj Sanjay and Varma, Sashank},
  booktitle = {Proceedings of the 46th Annual Meeting of the Cognitive Science Society},
  year      = {2024},
}

Incremental Comprehension of Garden-Path Sentences by Large Language Models: Semantic Interpretation, Syntactic Re-Analysis, and Attention

Andrew Li, Xianle Feng, Siddhant Narang, and 4 more authors

Proceedings of the Annual Meeting of the Cognitive Science Society, 2024

arXiv Bib PDF

@article{li2024incremental,
  author  = {Li, Andrew and Feng, Xianle and Narang, Siddhant and Peng, Austin and Cai, Tianle and Shah, Raj Sanjay and Varma, Sashank},
  title   = {Incremental Comprehension of Garden-Path Sentences by Large Language Models: Semantic Interpretation, Syntactic Re-Analysis, and Attention},
  journal = {Proceedings of the Annual Meeting of the Cognitive Science Society},
  volume  = {46},
  year    = {2024},
}

Development of Cognitive Intelligence in Pre-trained Language Models

Raj Sanjay Shah, Khushi Bhardwaj, and Sashank Varma

Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing, 2024

arXiv Bib PDF

@inproceedings{shah2024cognitive,
  title     = {Development of Cognitive Intelligence in Pre-trained Language Models},
  author    = {Shah, Raj Sanjay and Bhardwaj, Khushi and Varma, Sashank},
  booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
  year      = {2024},
  publisher = {Association for Computational Linguistics},
}

Understanding Graphical Perception in Data Visualization through Zero-Shot Prompting of Vision-Language Models

Grace Guo*, Jenna Jiayi Kang*, Raj Sanjay Shah*, and 2 more authors

NeurIPS 2024 Workshop on Behavioral Machine Learning, 2024

arXiv Bib PDF

@inproceedings{shah2024graphperception,
  title     = {Understanding Graphical Perception in Data Visualization through Zero-Shot Prompting of Vision-Language Models},
  author    = {Guo, Grace and Kang, Jenna Jiayi and Shah, Raj Sanjay and Pfister, Hanspeter and Varma, Sashank},
  booktitle = {{NeurIPS} 2024 Workshop on Behavioral Machine Learning},
  year      = {2024},
}

2023

Pre-training LLMs Using a Human-Like Development Data Corpus

Khushi Bhardwaj, Raj Sanjay Shah, and Sashank Varma

Proceedings of the BabyLM Challenge at the 27th Conference on Computational Natural Language Learning, 2023

arXiv Bib PDF

@inproceedings{bhardwaj2023pre,
  title     = {Pre-training {LLMs} Using a Human-Like Development Data Corpus},
  author    = {Bhardwaj, Khushi and Shah, Raj Sanjay and Varma, Sashank},
  booktitle = {Proceedings of the {BabyLM} Challenge at the 27th Conference on Computational Natural Language Learning},
  year      = {2023},
}

Numeric Magnitude Comparison Effects in Large Language Models

Raj Sanjay Shah, Vijay Marupudi, Reba Koenen, and 2 more authors

In Findings of the Association for Computational Linguistics: ACL 2023, 2023

arXiv Bib PDF

@inproceedings{shah2023numeric,
  author    = {Shah, Raj Sanjay and Marupudi, Vijay and Koenen, Reba and Bhardwaj, Khushi and Varma, Sashank},
  title     = {Numeric Magnitude Comparison Effects in Large Language Models},
  booktitle = {Findings of the Association for Computational Linguistics: ACL 2023},
  publisher = {Association for Computational Linguistics},
  year      = {2023},
}

2022

Modeling Motivational Interviewing Strategies on an Online Peer-to-Peer Counseling Platform

Raj Sanjay Shah, Faye Holt, Shirley Anugrah Hayati, and 4 more authors

Proceedings of the ACM on Human-Computer Interaction, 2022

DOI arXiv Bib PDF

@article{shah2022miti,
  title     = {Modeling Motivational Interviewing Strategies on an Online Peer-to-Peer Counseling Platform},
  author    = {Shah, Raj Sanjay and Holt, Faye and Hayati, Shirley Anugrah and Agarwal, Aastha and Wang, Yi-Chia and Kraut, Robert and Yang, Diyi},
  journal   = {Proceedings of the ACM on Human-Computer Interaction},
  volume    = {6},
  number    = {CSCW2},
  pages     = {1--24},
  year      = {2022},
  publisher = {ACM},
  address   = {New York, NY, USA},
  doi       = {10.1145/3555640},
}

When FLUE Meets FLANG: Benchmarks and Large Pretrained Language Models for the Financial Domain

Raj Sanjay Shah, Kunal Chawla, Dheeraj Eidnani, and 7 more authors

In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, 2022

arXiv Bib PDF

@inproceedings{shah2022flang,
  title     = {When {FLUE} Meets {FLANG}: Benchmarks and Large Pretrained Language Models for the Financial Domain},
  author    = {Shah, Raj Sanjay and Chawla, Kunal and Eidnani, Dheeraj and Shah, Agam and Du, Wendi and Chava, Sudheer and Raman, Natraj and Smiley, Charese and Chen, Jiaao and Yang, Diyi},
  booktitle = {Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing},
  year      = {2022},
  publisher = {Association for Computational Linguistics},
}

JARVix at SemEval-2022 Task 2: It Takes One to Know One? Idiomaticity Detection Using Zero and One-Shot Learning

Ashwin Pathak, Raj Sanjay Shah, Vaibhav Kumar, and 1 more author

Proceedings of the 16th International Workshop on Semantic Evaluation (SemEval), 2022

Bib PDF

@inproceedings{jarvix2022,
  title     = {{JARVix} at {SemEval-2022} Task 2: It Takes One to Know One? {Idiomaticity} Detection Using Zero and One-Shot Learning},
  author    = {Pathak, Ashwin and Shah, Raj Sanjay and Kumar, Vaibhav and Jakhotiya, Yash},
  booktitle = {Proceedings of the 16th International Workshop on Semantic Evaluation ({SemEval})},
  year      = {2022},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2022.semeval-1.19/},
}

2021

Bitcoin Data Analytics: Scalable Techniques for Transaction Clustering and Embedding Generation

Raj Sanjay Shah, Ashutosh Bhatia, Atith Gandhi, and 1 more author

In 2021 International Conference on Communication Systems & Networks (COMSNETS), 2021

DOI Bib PDF

@inproceedings{bitcoin2021,
  title     = {{Bitcoin} Data Analytics: Scalable Techniques for Transaction Clustering and Embedding Generation},
  author    = {Shah, Raj Sanjay and Bhatia, Ashutosh and Gandhi, Atith and Mathur, Shray},
  booktitle = {2021 International Conference on Communication Systems \& Networks ({COMSNETS})},
  year      = {2021},
  publisher = {IEEE},
  doi       = {10.1109/COMSNETS51098.2021.9352922},
}

2020

CTI-Twitter: Gathering Cyber Threat Intelligence from Twitter Using Integrated Supervised and Unsupervised Learning

Linn-Mari Kristiansen, Vinti Agarwal, Katrin Franke, and 1 more author

In 2020 IEEE International Conference on Big Data (BigData), 2020

DOI Bib PDF

@inproceedings{cti2020,
  title     = {{CTI-Twitter}: Gathering Cyber Threat Intelligence from {Twitter} Using Integrated Supervised and Unsupervised Learning},
  author    = {Kristiansen, Linn-Mari and Agarwal, Vinti and Franke, Katrin and Shah, Raj Sanjay},
  booktitle = {2020 {IEEE} International Conference on Big Data ({BigData})},
  year      = {2020},
  publisher = {IEEE},
  doi       = {10.1109/BigData50022.2020.9378393},
}