@comment{IJCAI-24 main-track paper. The month is given as the standard
  unquoted macro so each style can render it, and the editor uses the same
  "Last, First" form as the authors. The url is the DOI resolver link for
  the doi field.}
@inproceedings{ijcai2024p0443,
  author    = {Gao, Shiqing and Ding, Jiaxin and Fu, Luoyi and Wang, Xinbing and Zhou, Chenghu},
  title     = {Exterior Penalty Policy Optimization with Penalty Metric Network under Constraints},
  booktitle = {Proceedings of the Thirty-Third International Joint Conference on Artificial Intelligence, {IJCAI-24}},
  editor    = {Larson, Kate},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {4007--4015},
  year      = {2024},
  month     = aug,
  note      = {Main Track},
  doi       = {10.24963/ijcai.2024/443},
  url       = {https://doi.org/10.24963/ijcai.2024/443},
}