% arXiv preprint: the identifier lives in eprint/archiveprefix (not in a journal field) so styles can format and link it.
@misc{makelov2024towards,
  author        = {Makelov, Aleksandar and Lange, George and Nanda, Neel},
  title         = {Towards principled evaluations of sparse autoencoders for interpretability and control},
  year          = {2024},
  eprint        = {2405.08366},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2405.08366},
}