@inproceedings{f4b37b4e44fa450a98d2f4084e9a2c0c,
title = "Quartet: A Holistic Hybrid Parallel Framework for Training Large Language Models",
abstract = "Hybrid parallelism is popular in training large language models (LLMs). However, existing efforts have focused on optimizing individual strategies in hybrid parallelism, such as pipeline scheduling, device assignment, etc., which limits the overall training efficiency. This paper explores the intricate dependencies among four pivotal strategies-model scaling, model splitting, pipeline scheduling, and device assignment-and proposes Quartet, a holistic hybrid parallel framework for joint optimization. The novelty lies upon the formulation of parameterized pipeline scheduling and device assignment, alongside a pioneering analysis of model scaling{\textquoteright}s impact on the throughput. These provide the basis for orchestrating four strategies within a unified framework to maximize the overall training throughput efficiently. Evaluation results show that: for representative LLMs , Quartet improves the training throughput by up to 2.16× over the state-of-the-art synchronous hybrid parallel approaches.",
keywords = "Distributed Training, Hybrid Parallelism, Large Language Models",
author = "Weigang Zhang and Biyu Zhou and Xing Wu and Chaochen Gao and Zhibing Liu and Xuehai Tang and Ruixuan Li and Jizhong Han and Songlin Hu",
note = "Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2024.; 30th International Conference on Parallel and Distributed Computing, Euro-Par 2024 ; Conference date: 26-08-2024 Through 30-08-2024",
year = "2024",
doi = "10.1007/978-3-031-69766-1\_29",
language = "英语",
isbn = "9783031697654",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "424--438",
editor = "Jesus Carretero and Javier Garcia-Blas and Sameer Shende and Ivona Brandic and Katzalin Olcoz and Martin Schreiber",
booktitle = "Euro-Par 2024",
address = "德国",
}