% LocMoE conference paper, IJCAI-24 proceedings (Main Track).
% Braced words in the title keep their capitalisation under sentence-casing styles;
% month uses the standard three-letter macro so each style can render it.
@inproceedings{ijcai2024p705,
  author    = {Li, Jing and Sun, Zhijie and He, Xuan and Zeng, Li and Lin, Yi and Li, Entong and Zheng, Binfan and Zhao, Rongqian and Chen, Xin},
  title     = {{LocMoE}: A Low-overhead {MoE} for Large Language Model Training},
  booktitle = {Proceedings of the Thirty-Third International Joint Conference on Artificial Intelligence, {IJCAI-24}},
  editor    = {Larson, Kate},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {6377--6387},
  year      = {2024},
  month     = aug,
  note      = {Main Track},
  doi       = {10.24963/ijcai.2024/705},
  url       = {https://doi.org/10.24963/ijcai.2024/705},
}