diff --git a/tuning/config/acceleration_configs/acceleration_framework_config.py b/tuning/config/acceleration_configs/acceleration_framework_config.py index 7da11a5de..a5a685897 100644 --- a/tuning/config/acceleration_configs/acceleration_framework_config.py +++ b/tuning/config/acceleration_configs/acceleration_framework_config.py @@ -97,7 +97,7 @@ class AccelerationFrameworkConfig: path="training.moe", key="scattermoe", standalone=True, - experimental=False, + experimental=True, required_packages=["moe"], ), ] = None diff --git a/tuning/config/acceleration_configs/fast_moe.py b/tuning/config/acceleration_configs/fast_moe.py index 2da74f158..14a44f929 100644 --- a/tuning/config/acceleration_configs/fast_moe.py +++ b/tuning/config/acceleration_configs/fast_moe.py @@ -25,12 +25,6 @@ class FastMoe: ep_degree: int = 1 - def post_init(self): - assert self.world_size % self.ep_degree == 0, ( - f"world size ({self.world_size}) " - f"not divisible by ep_size ({self.ep_degree})." - ) - @dataclass class FastMoeConfig: