@@ -197,6 +197,7 @@ def get_ft_env(
197197 # Select timeout based on operation type
198198 timeout_map = {
199199 "data_processing" : FT_RD_SETTING .data_processing_timeout ,
200+ "debug_data_processing" : FT_RD_SETTING .debug_data_processing_timeout ,
200201 "micro_batch" : FT_RD_SETTING .micro_batch_timeout ,
201202 "full_training" : FT_RD_SETTING .full_timeout ,
202203 }
@@ -229,6 +230,7 @@ def get_ft_env(
229230
230231def get_data_processing_env (
231232 enable_cache : bool | None = None ,
233+ is_debug : bool = False ,
232234) -> tuple [Env , dict ]:
233235 """Get environment for data processing scripts with LLM API access.
234236
@@ -239,13 +241,14 @@ def get_data_processing_env(
239241
240242 Args:
241243 enable_cache: Whether to enable Docker caching
244+ is_debug: Whether running in debug mode (shorter timeout, default 20 min vs 1 hour)
242245
243246 Returns:
244247 Tuple of (env, env_vars) where env_vars contains LLM API keys
245248 to be passed to env.run() as the env parameter
246249 """
247250 env = get_ft_env (
248- operation = "data_processing" ,
251+ operation = "debug_data_processing" if is_debug else " data_processing" ,
249252 enable_cache = enable_cache ,
250253 )
251254
0 commit comments