@@ -294,25 +294,23 @@ __mlu_func__ void genIndiceOutLast(int32_t *nram_output, int32_t *nram_input,
294294 o_w = output_space .o_w ;
295295 int32_t o_hw = o_h * o_w , o_dhw = o_d * o_h * o_w ;
296296 __bang_write_value ((int32_t * )nram_aux + 4 * deal_num , deal_num , int (o_dhw ));
297- __cn_vector_div_s32 ( deal_num , (int32_t * )nram_aux , (int32_t * )nram_input ,
298- (int32_t * )nram_aux + 4 * deal_num );
297+ __bang_div ( (int32_t * )nram_aux , (int32_t * )nram_input ,
298+ (int32_t * )nram_aux + 4 * deal_num , deal_num );
299299 __bang_mul_scalar ((int32_t * )nram_output , (int32_t * )nram_aux , (int )o_dhw ,
300300 deal_num );
301301 __bang_sub ((int32_t * )nram_input , (int32_t * )nram_input , (int * )nram_output ,
302302 deal_num );
303303 __bang_write_value ((int32_t * )nram_aux + 4 * deal_num , deal_num , int (o_hw ));
304- __cn_vector_div_s32 (deal_num , (int32_t * )nram_aux + deal_num ,
305- (int32_t * )nram_input ,
306- (int32_t * )nram_aux + 4 * deal_num );
304+ __bang_div ((int32_t * )nram_aux + deal_num , (int32_t * )nram_input ,
305+ (int32_t * )nram_aux + 4 * deal_num , deal_num );
307306 __bang_mul_scalar ((int32_t * )nram_output , (int32_t * )nram_aux + deal_num ,
308307 (int )o_hw , deal_num );
309308 __bang_sub ((int32_t * )nram_input , (int32_t * )nram_input ,
310309 (int32_t * )nram_output , deal_num );
311310
312311 __bang_write_value ((int32_t * )nram_aux + 4 * deal_num , deal_num , int (o_w ));
313- __cn_vector_div_s32 (deal_num , (int32_t * )nram_aux + 2 * deal_num ,
314- (int32_t * )nram_input ,
315- (int32_t * )nram_aux + 4 * deal_num );
312+ __bang_div ((int32_t * )nram_aux + 2 * deal_num , (int32_t * )nram_input ,
313+ (int32_t * )nram_aux + 4 * deal_num , deal_num );
316314 __bang_mul_scalar ((int32_t * )nram_output , (int32_t * )nram_aux + 2 * deal_num ,
317315 (int )o_w , deal_num );
318316 __bang_sub ((int32_t * )nram_aux + 3 * deal_num , (int32_t * )nram_input ,
0 commit comments