@@ -276,12 +276,15 @@ bool test_printf_multistream(uint32_t num_blocks,
276276 hipLaunchKernelGGL (kernel_complex_opX, dim3 (num_blocks, 1 , 1 ),
277277 dim3 (threads_per_block, 1 , 1 ),
278278 0 , stream[i], Ad, Bd, iterCount);
279+ HIP_CHECK (hipGetLastError ());
279280 hipLaunchKernelGGL (kernel_complex_opY, dim3 (1 , num_blocks, 1 ),
280281 dim3 (1 , threads_per_block, 1 ),
281282 0 , stream[i], Ad, Bd, iterCount);
283+ HIP_CHECK (hipGetLastError ());
282284 hipLaunchKernelGGL (kernel_complex_opZ, dim3 (1 , 1 , num_blocks),
283285 dim3 (1 , 1 , threads_per_block),
284286 0 , stream[i], Ad, Bd, iterCount);
287+ HIP_CHECK (hipGetLastError ());
285288 }
286289 HIP_CHECK (hipDeviceSynchronize ());
287290 for (int i = 0 ; i < NUM_STREAM; i++) {
@@ -368,12 +371,15 @@ bool test_printf_multigpu(int gpu,
368371 hipLaunchKernelGGL (kernel_complex_opX, dim3 (num_blocks, 1 , 1 ),
369372 dim3 (threads_per_block, 1 , 1 ),
370373 0 , 0 , Ad, Bd, iterCount);
374+ HIP_CHECK (hipGetLastError ());
371375 hipLaunchKernelGGL (kernel_complex_opY, dim3 (1 , num_blocks, 1 ),
372376 dim3 (1 , threads_per_block, 1 ),
373377 0 , 0 , Ad, Bd, iterCount);
378+ HIP_CHECK (hipGetLastError ());
374379 hipLaunchKernelGGL (kernel_complex_opZ, dim3 (1 , 1 , num_blocks),
375380 dim3 (1 , 1 , threads_per_block),
376381 0 , 0 , Ad, Bd, iterCount);
382+ HIP_CHECK (hipGetLastError ());
377383 HIP_CHECK (hipDeviceSynchronize ());
378384 std::ifstream CapturedData = captured.getCapturedData ();
379385 char *buffer = new char [CHUNK_SIZE];
0 commit comments