% arXiv preprint arXiv:2505.13787 (primary class cs.LG).
@misc{cundy2025preferencelearningliedetectors,
  author        = {Chris Cundy and Adam Gleave},
  title         = {Preference Learning with Lie Detectors can Induce Honesty or Evasion},
  year          = {2025},
  eprint        = {2505.13787},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  url           = {https://arxiv.org/abs/2505.13787},
}