From 6ccc34c33e856321d5d6fa185808d917d8c68050 Mon Sep 17 00:00:00 2001 From: robo-cmh Date: Fri, 12 Sep 2025 16:04:16 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BF=AE=E6=94=B9=E6=96=87=E4=BB=B6=E6=8B=BC?= =?UTF-8?q?=E5=86=99=E9=94=99=E8=AF=AF?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- cli/train_dapo.py | 2 +- cli/train_grpo.py | 4 ++-- cli/train_ppo.py | 4 ++-- mindspeed_rl/workers/__init__.py | 4 ++-- mindspeed_rl/workers/integrated_worker.py | 4 ++-- .../workers/{reference_woker.py => reference_worker.py} | 0 mindspeed_rl/workers/{reward_woker.py => reward_worker.py} | 0 mindspeed_rl/workers/scheduler/launcher.py | 4 ++-- tests/ut/workers/scheduler/test_launcher.py | 4 ++-- 9 files changed, 13 insertions(+), 13 deletions(-) rename mindspeed_rl/workers/{reference_woker.py => reference_worker.py} (100%) rename mindspeed_rl/workers/{reward_woker.py => reward_worker.py} (100%) diff --git a/cli/train_dapo.py b/cli/train_dapo.py index 2b48bc2f..f6ffc2ee 100644 --- a/cli/train_dapo.py +++ b/cli/train_dapo.py @@ -31,7 +31,7 @@ from mindspeed_rl.datasets.build_dataset import build_train_valid_test_datasets from mindspeed_rl.workers.dynamic_sampling import DynamicSampling from mindspeed_rl.workers.rule_reward import RuleReward from mindspeed_rl.workers.actor_hybrid_worker import ActorHybridWorker -from mindspeed_rl.workers.reward_woker import RewardWorker +from mindspeed_rl.workers.reward_worker import RewardWorker from mindspeed_rl.workers.integrated_worker import IntegratedWorker from mindspeed_rl.trainer.dapo_trainer_hybrid import RayDAPOTrainer diff --git a/cli/train_grpo.py b/cli/train_grpo.py index e2de0e8a..00166cb9 100644 --- a/cli/train_grpo.py +++ b/cli/train_grpo.py @@ -31,8 +31,8 @@ from mindspeed_rl.datasets.dataloader import PromptDataLoader from mindspeed_rl.workers.rule_reward import RuleReward from mindspeed_rl.trainer.grpo_trainer_hybrid import RayGRPOTrainer from mindspeed_rl.workers.actor_hybrid_worker import ActorHybridWorker -from mindspeed_rl.workers.reference_woker import ReferenceWorker -from mindspeed_rl.workers.reward_woker import RewardWorker +from mindspeed_rl.workers.reference_worker import ReferenceWorker +from mindspeed_rl.workers.reward_worker import RewardWorker from mindspeed_rl.workers.integrated_worker import IntegratedWorker cur_file_dir = Path(__file__).absolute().parent.parent diff --git a/cli/train_ppo.py b/cli/train_ppo.py index 162389cb..d28098df 100644 --- a/cli/train_ppo.py +++ b/cli/train_ppo.py @@ -32,8 +32,8 @@ from mindspeed_rl.workers.rule_reward import RuleReward from mindspeed_rl.trainer.ppo_trainer_hybrid import RayPPOTrainer from mindspeed_rl.workers.scheduler.launcher import RayActorGroup from mindspeed_rl.workers.actor_hybrid_worker import ActorHybridWorker -from mindspeed_rl.workers.reference_woker import ReferenceWorker -from mindspeed_rl.workers.reward_woker import RewardWorker +from mindspeed_rl.workers.reference_worker import ReferenceWorker +from mindspeed_rl.workers.reward_worker import RewardWorker from mindspeed_rl.workers.integrated_worker import IntegratedWorker from mindspeed_rl.workers.critic_worker import CriticWorker from mindspeed_rl.workers.scheduler.launcher import construct_colocate_placement_groups diff --git a/mindspeed_rl/workers/__init__.py b/mindspeed_rl/workers/__init__.py index d0f3d57c..8fc052fa 100644 --- a/mindspeed_rl/workers/__init__.py +++ b/mindspeed_rl/workers/__init__.py @@ -1,8 +1,8 @@ # coding=utf-8 # Copyright (c) 2025, HUAWEI CORPORATION. All rights reserved. -from .reference_woker import ReferenceWorker -from .reward_woker import RewardWorker +from .reference_worker import ReferenceWorker +from .reward_worker import RewardWorker from .actor_hybrid_worker import ActorHybridWorker from .scheduler import RayActorGroup from .resharding.megatron_sharding_manager import MegatronShardingManager diff --git a/mindspeed_rl/workers/integrated_worker.py b/mindspeed_rl/workers/integrated_worker.py index 0c3a231a..9d24ce7f 100644 --- a/mindspeed_rl/workers/integrated_worker.py +++ b/mindspeed_rl/workers/integrated_worker.py @@ -18,8 +18,8 @@ from mindspeed_rl.utils.utils import mstx_timer_decorator, profiler_start, profi from mindspeed_rl.utils.utils import MsProbe from mindspeed_rl.workers.actor_hybrid_worker import ActorHybridWorkerBase -from mindspeed_rl.workers.reference_woker import ReferenceWorkerBase -from mindspeed_rl.workers.reward_woker import RewardWorkerBase +from mindspeed_rl.workers.reference_worker import ReferenceWorkerBase +from mindspeed_rl.workers.reward_worker import RewardWorkerBase from mindspeed_rl.models.reference import Reference from mindspeed_rl.models.reward import Reward diff --git a/mindspeed_rl/workers/reference_woker.py b/mindspeed_rl/workers/reference_worker.py similarity index 100% rename from mindspeed_rl/workers/reference_woker.py rename to mindspeed_rl/workers/reference_worker.py diff --git a/mindspeed_rl/workers/reward_woker.py b/mindspeed_rl/workers/reward_worker.py similarity index 100% rename from mindspeed_rl/workers/reward_woker.py rename to mindspeed_rl/workers/reward_worker.py diff --git a/mindspeed_rl/workers/scheduler/launcher.py b/mindspeed_rl/workers/scheduler/launcher.py index f9fb57fe..74b6153a 100644 --- a/mindspeed_rl/workers/scheduler/launcher.py +++ b/mindspeed_rl/workers/scheduler/launcher.py @@ -34,8 +34,8 @@ from mindspeed_rl.config_cls.mindstudio_config import ProfilerConfig, MsprobeCon from mindspeed_rl.utils.tokenizer import BaseTokenizer from mindspeed_rl.workers.base_worker import BaseWorker from mindspeed_rl.workers.actor_hybrid_worker import ActorHybridWorker -from mindspeed_rl.workers.reference_woker import ReferenceWorker -from mindspeed_rl.workers.reward_woker import RewardWorker +from mindspeed_rl.workers.reference_worker import ReferenceWorker +from mindspeed_rl.workers.reward_worker import RewardWorker from mindspeed_rl.workers.integrated_worker import IntegratedWorker from mindspeed_rl.workers.critic_worker import CriticWorker from mindspeed_rl.workers.vit_worker import VitWorker diff --git a/tests/ut/workers/scheduler/test_launcher.py b/tests/ut/workers/scheduler/test_launcher.py index 3e0b6663..d38c5a24 100644 --- a/tests/ut/workers/scheduler/test_launcher.py +++ b/tests/ut/workers/scheduler/test_launcher.py @@ -6,8 +6,8 @@ import pytest import mindspeed_rl from mindspeed_rl.workers.scheduler.launcher import RayActorGroup from mindspeed_rl.workers.actor_hybrid_worker import ActorHybridWorker -from mindspeed_rl.workers.reference_woker import ReferenceWorker -from mindspeed_rl.workers.reward_woker import RewardWorker +from mindspeed_rl.workers.reference_worker import ReferenceWorker +from mindspeed_rl.workers.reward_worker import RewardWorker from mindspeed_rl.config_cls.megatron_config import MegatronConfig from mindspeed_rl.config_cls.rl_config import RLConfig from mindspeed_rl.config_cls.generate_config import GenerateConfig -- Gitee