NovaSky-AI · erictang000 · May 29, 2026 · May 29, 2026 · gemini-code-assist · May 29, 2026
diff --git a/skyrl/train/config/config.py b/skyrl/train/config/config.py
@@ -188,7 +188,7 @@ class MegatronConfig(BaseConfig):
     transformer_config_kwargs: Dict[str, Any] = field(
         default_factory=lambda: copy.deepcopy(DEFAULT_TRANSFORMER_CONFIG_KWARGS)
     )
-    empty_cuda_cache: Optional[bool] = None
+    empty_cuda_cache: Optional[bool] = True
-    empty_cuda_cache: Optional[bool] = True
+    empty_cuda_cache: bool = True
-    empty_cuda_cache: Optional[bool] = True
+    empty_cuda_cache: bool = True
     model_config_kwargs: dict = field(default_factory=dict)
     dist_ckpt_optim_fully_reshardable: bool = False
     freeze_moe_router: bool = False