% arXiv preprint (no journal venue recorded). The arXiv identifier is stored
% in the dedicated eprint/archiveprefix fields rather than in a journal field,
% so eprint-aware styles can format and link it. The url is derived from the
% same identifier for styles that only understand url.
% NOTE(review): primaryclass (the arXiv subject class) is not recorded here;
% add it once confirmed against the arXiv listing.
@misc{aremu2026robust,
  author        = {Aremu, Toluwani and Ognev, Daniil and Poppi, Samuele and Lukas, Nils},
  title         = {Robust Safety Monitoring of Language Models via Activation Watermarking},
  year          = {2026},
  eprint        = {2603.23171},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2603.23171},
}
