File tree: 2 files changed, +10 -4
lines changed Original file line number Diff line number Diff line change @@ -34,6 +34,12 @@ class Profiling:
3434    profile_freq : int  =  10 
3535    """How often to collect profile traces, in iterations""" 
3636
37+     profiler_active : int  =  1 
38+     """The number of steps the profiler is active for in each profiling cycle""" 
39+ 
40+     profiler_warmup : int  =  3 
41+     """The number of warmup steps before the active step in each profiling cycle""" 
42+ 
3743    enable_memory_snapshot : bool  =  False 
3844    """Whether to dump memory snapshot""" 
3945
Original file line number Diff line number Diff line change 1414from  torchtitan .config  import  Profiling  as  ProfilingConfig 
1515from  torchtitan .tools .logging  import  logger 
1616
17- # the number of warmup steps before the active step in each profiling cycle 
18- WARMUP  =  3 
19- 
2017# how much memory allocation/free ops to record in memory snapshots 
2118MEMORY_SNAPSHOT_MAX_ENTRIES  =  100000 
2219
@@ -58,7 +55,10 @@ def trace_handler(prof):
5855        if  not  os .path .exists (trace_dir ):
5956            os .makedirs (trace_dir , exist_ok = True )
6057
61-         warmup , active  =  WARMUP , 1 
58+         warmup , active  =  (
59+             profiling_config .profiler_warmup ,
60+             profiling_config .profiler_active ,
61+         )
6262        wait  =  profile_freq  -  (active  +  warmup )
6363        assert  (
6464            wait  >=  0 
    
 
   
 
     
   
   
          
     
  
    
     
 
    
      
     
 
     
    You can’t perform that action at this time.
  
 
    
  
     
    
      
        
     
 
       
      
     
   
 
    
    
  
 
  
 
     
    
0 commit comments