From 5f810d9c9ce0f826d31c5ff4bed177a2c77ae545 Mon Sep 17 00:00:00 2001 From: Eric Tang Date: Fri, 29 May 2026 20:42:22 +0000 Subject: [PATCH] make empty cuda cache default true for megatron --- skyrl/train/config/config.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/skyrl/train/config/config.py b/skyrl/train/config/config.py index e4ac7bb655..45604f641e 100644 --- a/skyrl/train/config/config.py +++ b/skyrl/train/config/config.py @@ -188,7 +188,7 @@ class MegatronConfig(BaseConfig): transformer_config_kwargs: Dict[str, Any] = field( default_factory=lambda: copy.deepcopy(DEFAULT_TRANSFORMER_CONFIG_KWARGS) ) - empty_cuda_cache: Optional[bool] = None + empty_cuda_cache: Optional[bool] = True model_config_kwargs: dict = field(default_factory=dict) dist_ckpt_optim_fully_reshardable: bool = False freeze_moe_router: bool = False