File tree Expand file tree Collapse file tree 1 file changed +3
-3
lines changed Expand file tree Collapse file tree 1 file changed +3
-3
lines changed Original file line number Diff line number Diff line change @@ -131,7 +131,7 @@ def __init__(self, job_config: JobConfig):
131
131
print ("Must use pytorch from unlanded https://github.com/pytorch/pytorch/pull/160282, e.g. torchtitan_conda_prod:5e4101faa448c2ee6b62ddd76ee08e8c" )
132
132
raise
133
133
134
- # Configs from Ruisi
134
+ # Configs from Ruisi
135
135
136
136
# Set to 0.1 to make bucketing more efficient with mixed-dtype collectives.
137
137
torch ._inductor .config .simplefsdp .relax_ratio = 0
@@ -140,10 +140,10 @@ def __init__(self, job_config: JobConfig):
140
140
torch ._inductor .config .simplefsdp .estimate_verbose = False
141
141
torch ._inductor .config .simplefsdp .save_estimation_path = "/mnt/mffuse/cache_ruisi/estimation_mast_" + job_config .model .flavor + ".pkl"
142
142
# Set to True after the first communication estimation results have been saved; this reduces decision-making time.
143
- torch ._inductor .config .simplefsdp .load_cache = False
143
+ torch ._inductor .config .simplefsdp .load_cache = False
144
144
torch ._inductor .config .simplefsdp .enable_bucket_ir = True
145
145
torch ._inductor .config .simplefsdp .enable_reorder_ir = True
146
- torch ._inductor .config .simplefsdp .simplefsdp_only = True # False for 2d True for 1d
146
+ torch ._inductor .config .simplefsdp .simplefsdp_only = False # False for 2d True for 1d
147
147
torch ._inductor .config .simplefsdp .peak_memory_offset = 0
148
148
torch ._inductor .config .simplefsdp .bucketing_type = "auto"
149
149
You can’t perform that action at this time.
0 commit comments