Skip to content

Commit b87496a

Browse files
authored
[hotfix] fix auto policy of test_sharded_optim_v2 (#2157)
1 parent 16335cb commit b87496a

File tree

4 files changed: +3 additions, −13 deletions

colossalai/gemini/memory_tracer/chunk_memstats_collector.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -33,4 +33,4 @@ def record_model_data_volume(self) -> None:
3333

3434
@property
3535
def cuda_margin_mem(self) -> float:
36-
return colo_device_memory_capacity(get_current_device()) - self._memstats.max_overall_cuda('cuda')
36+
return colo_device_memory_capacity(get_current_device()) - self._memstats.max_overall_cuda

colossalai/gemini/memory_tracer/memory_stats.py

Lines changed: 0 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -107,14 +107,6 @@ def max_non_model_data(self, device_type: str) -> float:
107107
else:
108108
raise TypeError
109109

110-
def max_overall_cuda(self, device_type: str) -> float:
111-
if device_type == 'cuda':
112-
return max(self._overall_cuda_list)
113-
elif device_type == 'cpu':
114-
return max(self._overall_cpu_list)
115-
else:
116-
raise TypeError
117-
118110
def clear(self):
119111
self._model_data_cuda_list = []
120112
self._overall_cuda_list = []

colossalai/gemini/memory_tracer/memstats_collector.py

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -79,9 +79,7 @@ def record_model_data_volume(self) -> None:
7979
if self._start_flag and not self.use_outside_memstats:
8080
# The following code work for ZeroInitContext, which is deprecated in v0.1.12
8181
cuda_mem = StatefulTensor.GST_MGR.total_mem['cuda']
82-
cpu_mem = StatefulTensor.GST_MGR.total_mem['cpu']
83-
self._memstats.append_model_data('cuda', cuda_mem)
84-
self._memstats.append_model_data('cpu', cpu_mem)
82+
self._memstats.record_max_cuda_model_data(cuda_mem)
8583

8684
def sample_overall_data(self) -> None:
8785
"""

tests/test_zero/test_sharded_optim_v2.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -64,7 +64,7 @@ def _run_test_sharded_optim_v2(cpu_offload, shard_strategy_class, use_cpuadam, g
6464
zero_model = ShardedModelV2(
6565
zero_model,
6666
shard_strategy,
67-
tensor_placement_policy='cpu' if cpu_offload else 'cuda',
67+
tensor_placement_policy='cpu' if cpu_offload else 'auto',
6868
reuse_fp16_shard=use_cpuadam,
6969
)
7070

0 commit comments

Comments (0)