% arXiv preprint: the identifier is stored in the eprint fields rather than in a journal field.
@misc{rai2024practical,
  author        = {Rai, Daking and Zhou, Yilun and Feng, Shi and Saparov, Abulhair and Yao, Ziyu},
  title         = {A Practical Review of Mechanistic Interpretability for Transformer-Based Language Models},
  year          = {2024},
  eprint        = {2407.02646},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2407.02646},
}
Assistant Professor, GMU CS
PhD Student, GMU CS