% ICML 2024 conference paper. Braces around {Nesterov} and {ICML} keep their
% capitalisation under bibliography styles that sentence-case titles.
@inproceedings{chen2024accelerated,
  author    = {Chen, Yen-Ju and Huang, Nai-Chieh and Lee, Ching-pei and Hsieh, Ping-Chun},
  title     = {Accelerated Policy Gradient: On the Convergence Rates of the {Nesterov} Momentum for Reinforcement Learning},
  booktitle = {International Conference on Machine Learning ({ICML})},
  year      = {2024},
}
PPO-Clip Attains Global Optimality: Towards Deeper Understandings of Clipping
Nai-Chieh Huang, Ping-Chun Hsieh, Kuo-Hao Ho, and I-Chen Wu
In Proceedings of the AAAI Conference on Artificial Intelligence, 2024
% AAAI 2024 conference paper. Braces around {PPO-Clip} and {AAAI} keep their
% capitalisation under bibliography styles that sentence-case titles.
@inproceedings{huang2024ppo,
  author    = {Huang, Nai-Chieh and Hsieh, Ping-Chun and Ho, Kuo-Hao and Wu, I-Chen},
  title     = {{PPO-Clip} Attains Global Optimality: Towards Deeper Understandings of Clipping},
  booktitle = {Proceedings of the {AAAI} Conference on Artificial Intelligence},
  volume    = {38},
  number    = {11},
  pages     = {12600--12607},
  year      = {2024},
}