% Conference paper in the NeurIPS 2024 proceedings.
% The citation key is left unchanged so that existing \cite commands keep resolving.
% Given names are stored as initials only; expand them once the full names are verified.
% The url field holds a single link; the repository copy is recorded in the note.
@inproceedings{inproceedings,
  author    = {Stolfo, A. and Wu, B. and Gurnee, W. and Belinkov, Y. and Song, X. and Sachan, M. and Nanda, N.},
  title     = {Confidence Regulation Neurons in Language Models},
  booktitle = {Advances in Neural Information Processing Systems},
  publisher = {NeurIPS},
  year      = {2024},
  month     = dec,
  url       = {https://neurips.cc/virtual/2024/poster/96903},
  note      = {Accessed on 2025/11/23. Also available at https://eprints.whiterose.ac.uk/id/eprint/222011},
}