diff --git a/applications/ColossalChat/coati/trainer/__init__.py b/applications/ColossalChat/coati/trainer/__init__.py
index 6d0900153..0c85f7d3d 100755
--- a/applications/ColossalChat/coati/trainer/__init__.py
+++ b/applications/ColossalChat/coati/trainer/__init__.py
@@ -5,6 +5,7 @@ from .orpo import ORPOTrainer
 from .ppo import PPOTrainer
 from .rm import RewardModelTrainer
 from .sft import SFTTrainer
+from .prm import ProcessRewardModelTrainer
 
 __all__ = [
     "SLTrainer",
@@ -15,4 +16,5 @@ __all__ = [
     "DPOTrainer",
     "ORPOTrainer",
     "KTOTrainer",
+    "ProcessRewardModelTrainer"
 ]