% Conference paper (ICS '23) by Singh and Bhatele.
% The year field holds only the four-digit year; the publication-status
% qualifier ("to appear") lives in the note field so that styles can sort and
% build labels from a clean year.
@inproceedings{singh:ics2023,
  author    = {Singh, Siddharth and Bhatele, Abhinav},
  title     = {A Novel Tensor-Expert Hybrid Parallelism Approach to Scale Mixture-of-Experts Training},
  booktitle = {Proceedings of the International Conference on Supercomputing},
  series    = {ICS '23},
  year      = {2023},
  month     = jun,
  note      = {To appear},
}