% ICLR 2026 poster entry. The acronyms LoRA-MoE and GRPO are brace-protected in
% the title so that sentence-casing bibliography styles keep their capitals.
@inproceedings{ma_balancing_2026,
  author    = {Ma, Changlian and Huang, Zizheng and Zeng, Xiangyu and Wang, Yi and Liang, Cheng and Tian, Kun and Zhao, Xinhai and Wang, Limin},
  title     = {Balancing the Experts: Unlocking {LoRA-MoE} for {GRPO} via Mechanism-Aware Rewards},
  booktitle = {The Fourteenth International Conference on Learning Representations},
  date      = {2026-04-24},
  year      = {2026},
  url       = {https://iclr.cc/virtual/2026/poster/10007126},
}