mirror of https://github.com/inclusionAI/AReaL
[Refactor] Rename files in arealite before release. (#190)
* PullRequest: 353 [Lite] Add gradient checkpointing to FSDPEngine Merge branch mzy/add-gradient-ckpt of git@code.alipay.com:inclusionAI/AReaL.git into lite https://code.alipay.com/inclusionAI/AReaL/pull_requests/353 Reviewed-by: 博惟 <bowei.fw@antgroup.com> * add gradient checkpointing * PullRequest: 354 [lite] GRPO pre-commit: minor changes in FSDP engine Merge branch fw/lite-fix1 of git@code.alipay.com:inclusionAI/AReaL.git into lite https://code.alipay.com/inclusionAI/AReaL/pull_requests/354 Reviewed-by: 晓雷 <meizhiyu.mzy@antgroup.com> * . * . * . * . * PullRequest: 355 [Lite] GRPO pre-commit 2: Refactor RemoteSGLangEngine thread and SGLang configuration Merge branch fw/lite-fix1 of git@code.alipay.com:inclusionAI/AReaL.git into lite https://code.alipay.com/inclusionAI/AReaL/pull_requests/355?tab=commit Reviewed-by: 晓雷 <meizhiyu.mzy@antgroup.com> * . * . * . * . * . * . * fix * . * PullRequest: 357 [lite] GRPO pre-commit 3: Fix typos and experiment utilities Merge branch fw/lite-fix2 of git@code.alipay.com:inclusionAI/AReaL.git into lite https://code.alipay.com/inclusionAI/AReaL/pull_requests/357?tab=comment Reviewed-by: 晓雷 <meizhiyu.mzy@antgroup.com> * . * . * . * . * . * fix destroy process group * PullRequest: 358 [lite] Support GRPO training locally with the GSM8k dataset Merge branch fw/lite-fix3 of git@code.alipay.com:inclusionAI/AReaL.git into lite https://code.alipay.com/inclusionAI/AReaL/pull_requests/358 Reviewed-by: 晓雷 <meizhiyu.mzy@antgroup.com> * . * . * . * . * fix loss mask * fix * . * PullRequest: 368 [lite] Refactor train engine after merging contributions from GitHub Merge branch fw/lite-train-engine of git@code.alipay.com:inclusionAI/AReaL.git into lite https://code.alipay.com/inclusionAI/AReaL/pull_requests/368 Reviewed-by: 晓雷 <meizhiyu.mzy@antgroup.com> * . * . * PullRequest: 371 [lite] [fix] fix misc bugs in GRPO implementation Merge branch fw/lite-fix0716 of git@code.alipay.com:inclusionAI/AReaL.git into lite https://code.alipay.com/inclusionAI/AReaL/pull_requests/371 Reviewed-by: 晓雷 <meizhiyu.mzy@antgroup.com> * . * PullRequest: 370 [lite] Add Slurm Launcher and Ray Launcher Merge branch mzy/lite/launcher of git@code.alipay.com:inclusionAI/AReaL.git into lite https://code.alipay.com/inclusionAI/AReaL/pull_requests/370 Reviewed-by: 博惟 <bowei.fw@antgroup.com> * . * . * . * fix * PullRequest: 392 [lite] Fix several bugs regarding RL learning and add an example to reproduce boba-math results. Merge branch fw/lite-boba of git@code.alipay.com:inclusionAI/AReaL.git into lite https://code.alipay.com/inclusionAI/AReaL/pull_requests/392 Reviewed-by: 晓雷 <meizhiyu.mzy@antgroup.com> * support fsdp engine and sglang remote engine * minor fix * . * refactor trainer * add close * rm mb_spec * . * fix * . * qwen2 grpo works * fix * fix * async works * fix * slurm launcher not tested * fix arg parse * . * sglang server wrapper * . * . * slurm run * ready for boba * debug * 32k run * . * . * fix * . * . * . * . * . * fix * . * fix * . * . * . * . * fix * . * . * . * . * . * . * . * refactor train engine * refactor train engine * . * fix update weight error * . * . * match train * format * . * fix * seems to work * . * . * . * . * format * format * . * rename * rename --------- Co-authored-by: 晓雷 <meizhiyu.mzy@antgroup.com>
This commit is contained in:
parent
18f8a056b6
commit
4804b05637
|
@ -23,7 +23,7 @@ from arealite.api.cli_args import (
|
||||||
SGLangConfig,
|
SGLangConfig,
|
||||||
)
|
)
|
||||||
from arealite.api.io_struct import LLMRequest, LLMResponse
|
from arealite.api.io_struct import LLMRequest, LLMResponse
|
||||||
from arealite.engine.sglang_engine import SGLangEngine
|
from arealite.experimental.sglang_engine import SGLangEngine
|
||||||
from arealite.workflow.rlvr import RLVRWorkflow
|
from arealite.workflow.rlvr import RLVRWorkflow
|
||||||
from realhf.api.core.data_api import load_hf_tokenizer
|
from realhf.api.core.data_api import load_hf_tokenizer
|
||||||
from realhf.base import seeding
|
from realhf.base import seeding
|
|
@ -52,8 +52,8 @@ def mock_input(
|
||||||
|
|
||||||
|
|
||||||
def get_engine(engine_type: str, model_path: str):
|
def get_engine(engine_type: str, model_path: str):
|
||||||
from arealite.engine.autotp_engine import DeepSpeedAutoTPEngine
|
|
||||||
from arealite.engine.fsdp_engine import FSDPEngine
|
from arealite.engine.fsdp_engine import FSDPEngine
|
||||||
|
from arealite.experimental.autotp_engine import DeepSpeedAutoTPEngine
|
||||||
|
|
||||||
engine_cls = {"auto_tp": DeepSpeedAutoTPEngine, "fsdp": FSDPEngine}[engine_type]
|
engine_cls = {"auto_tp": DeepSpeedAutoTPEngine, "fsdp": FSDPEngine}[engine_type]
|
||||||
|
|
||||||
|
@ -135,7 +135,7 @@ def test_train_batch(engine, mock_input):
|
||||||
|
|
||||||
@torch.no_grad()
|
@torch.no_grad()
|
||||||
def test_hf_save_load_weights(tmp_path_factory, engine, mock_input):
|
def test_hf_save_load_weights(tmp_path_factory, engine, mock_input):
|
||||||
from arealite.engine.autotp_engine import DeepSpeedAutoTPEngine
|
from arealite.experimental.autotp_engine import DeepSpeedAutoTPEngine
|
||||||
|
|
||||||
if isinstance(engine, DeepSpeedAutoTPEngine):
|
if isinstance(engine, DeepSpeedAutoTPEngine):
|
||||||
print("AutoTP engine does not support HF save/load for now.")
|
print("AutoTP engine does not support HF save/load for now.")
|
||||||
|
|
Loading…
Reference in New Issue