File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -142,29 +142,6 @@ def destroy_parallel_state():
142142 except ImportError :
143143 pass
144144
145- # Reset the third global async_calls instance in base strategy module
146- try :
147- import megatron .core .dist_checkpointing .strategies .base as base_strategy
148- from megatron .core .dist_checkpointing .strategies .async_utils import (
149- AsyncCallsQueue ,
150- )
151-
152- # Clean up and reset the global async_calls in base strategy
153- old_call_idx = getattr (base_strategy .async_calls , "call_idx" , None )
154- num_unfinalized = base_strategy .async_calls .get_num_unfinalized_calls ()
155- if num_unfinalized > 0 :
156- print (
157- f"[WARNING] Resetting base strategy async_calls with { num_unfinalized } unfinalized calls"
158- )
159- try :
160- base_strategy .async_calls .close ()
161- except :
162- pass
163- base_strategy .async_calls = AsyncCallsQueue ()
164- print (f"[DEBUG] Reset base strategy async_calls (old call_idx: { old_call_idx } )" )
165- except ImportError :
166- pass
167-
168145
169146def setup_distributed () -> None :
170147 """Handle NCCL settings, dtype mapping, and basic config setup."""
You can’t perform that action at this time.
0 commit comments