@@ -120,7 +120,8 @@ def load_gen(
120120 callback : Callable [[int , int ], None ] | None = None ,
121121 generator : bool = True ,
122122 tp_dev_limits : dict | None = None ,
123- tp_backend : str = "native"
123+ tp_backend : str = "native" ,
124+ verbose : bool = False
124125 ):
125126 """
126127 Load model, generator function. For regular function, call load() with the same arguments
@@ -197,6 +198,9 @@ def load_gen(
197198
198199 :param tp_backend:
199200 str, either "nccl" or "native" (default)
201+
202+ :param verbose:
203+ bool, provide more info while loading, including the full TP split
200204 """
201205
202206 free_mem ()
@@ -214,7 +218,7 @@ def load_gen(
214218 "Cannot specify reserve_per_device or use_per_device when loading to single device."
215219 assert not tensor_p , \
216220 "Cannot use tensor_p when loading to single device."
217- self ._load_single (progressbar , device , self .config , self .modules )
221+ self ._load_single (progressbar , device , self .config , self .modules , verbose )
218222
219223 # Use/reserve
220224 else :
@@ -264,6 +268,7 @@ def load_gen(
264268 generator ,
265269 self .config ,
266270 self .modules ,
271+ verbose ,
267272 )
268273 self .output_device = self .modules [- 1 ].device
269274
@@ -290,6 +295,7 @@ def load_gen(
290295 self .modules ,
291296 tp_dev_limits ,
292297 tp_backend ,
298+ verbose ,
293299 )
294300 self .output_device = tp_output_device
295301
0 commit comments