% IJCAI-25 main-track paper. Acronyms in the title are brace-protected against
% style recasing; month uses the standard three-letter BibTeX macro.
@inproceedings{ijcai2025p56,
  author    = {Pu, Rui and Li, Chaozhuo and Ha, Rui and Chen, Zejian and Zhang, Litian and Liu, Zheng and Qiu, Lirong and Ye, Zaisheng},
  title     = {Feint and Attack: Jailbreaking and Protecting {LLMs} via Attention Distribution Modeling},
  booktitle = {Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence, {IJCAI-25}},
  editor    = {Kwok, James},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {493--501},
  year      = {2025},
  month     = aug,
  note      = {Main Track},
  doi       = {10.24963/ijcai.2025/56},
  url       = {https://doi.org/10.24963/ijcai.2025/56},
}