@@ -7,7 +7,7 @@ use operators::{
77 nvidia_gpu:: Gpu ,
88 random_sample:: nvidia_gpu:: Operator as RandomSampleGpu ,
99 rearrange:: nvidia_gpu:: Operator as Rearrange ,
10- ByteOf , QueueOf , TopoNode ,
10+ Blob , ByteOf , QueueOf , TopoNode ,
1111} ;
1212use std:: {
1313 cell:: { RefCell , RefMut } ,
@@ -207,9 +207,7 @@ impl<'blk> Weights<'blk> {
207207 . as_ref ( )
208208 . map ( |_| Vec :: with_capacity ( model. meta . nblk ) ) ;
209209 for blk in & model. blocks {
210- let blk = blk. distribute ( & model. meta , range. clone ( ) , count, |len| {
211- ctx. malloc_host :: < u8 > ( len)
212- } ) ;
210+ let blk = blk. distribute ( & model. meta , range. clone ( ) , count, Blob :: new) ;
213211 let loader = loader
214212 . get_or_insert_with ( || blk. as_ref ( ) . map ( |s| H2DLoader :: new ( s. len ( ) , & stream) ) ) ;
215213
@@ -240,20 +238,20 @@ impl<'blk> Weights<'blk> {
240238
241239struct H2DLoader < ' ctx > {
242240 event : Event < ' ctx > ,
243- host : HostMem < ' ctx > ,
241+ host : Blob ,
244242 dev : DevMem < ' ctx > ,
245243}
246244
247245impl < ' ctx > H2DLoader < ' ctx > {
248246 fn new ( size : usize , stream : & Stream < ' ctx > ) -> Self {
249247 Self {
250248 event : stream. record ( ) ,
251- host : stream . ctx ( ) . malloc_host :: < u8 > ( size) ,
249+ host : Blob :: new ( size) ,
252250 dev : stream. malloc :: < u8 > ( size) ,
253251 }
254252 }
255253
256- fn load ( & mut self , host : Contiguous < HostMem < ' ctx > > , stream : & Stream < ' ctx > ) -> DevMem < ' ctx > {
254+ fn load ( & mut self , host : Contiguous < Blob > , stream : & Stream < ' ctx > ) -> DevMem < ' ctx > {
257255 self . event . synchronize ( ) ;
258256 match host {
259257 Contiguous :: Borrowed ( host) => self . host . copy_from_slice ( host) ,
0 commit comments