@@ -666,7 +666,10 @@ int mca_pml_bfo_ft_event( int state )
666666 if (OPAL_CRS_CHECKPOINT == state ) {
667667 if ( opal_cr_timing_barrier_enabled ) {
668668 OPAL_CR_SET_TIMER (OPAL_CR_TIMER_CRCPBR1 );
669- opal_pmix .fence (NULL , 0 );
669+ if (OMPI_SUCCESS != (ret = opal_pmix .fence (NULL , 0 ))) {
670+ opal_output (0 , "pml:bfo: ft_event(Restart): Failed to fence complete" );
671+ return ret ;
672+ }
670673 }
671674
672675 OPAL_CR_SET_TIMER (OPAL_CR_TIMER_P2P0 );
@@ -677,7 +680,10 @@ int mca_pml_bfo_ft_event( int state )
677680 if ( !first_continue_pass ) {
678681 if ( opal_cr_timing_barrier_enabled ) {
679682 OPAL_CR_SET_TIMER (OPAL_CR_TIMER_COREBR0 );
680- opal_pmix .fence (NULL , 0 );
683+ if (OMPI_SUCCESS != (ret = opal_pmix .fence (NULL , 0 ))) {
684+ opal_output (0 , "pml:bfo: ft_event(Restart): Failed to fence complete" );
685+ return ret ;
686+ }
681687 }
682688 OPAL_CR_SET_TIMER (OPAL_CR_TIMER_P2P2 );
683689 }
@@ -777,7 +783,10 @@ int mca_pml_bfo_ft_event( int state )
777783 if ( !first_continue_pass ) {
778784 if ( opal_cr_timing_barrier_enabled ) {
779785 OPAL_CR_SET_TIMER (OPAL_CR_TIMER_P2PBR1 );
780- opal_pmix .fence (NULL , 0 );
786+ if (OMPI_SUCCESS != (ret = opal_pmix .fence (NULL , 0 ))) {
787+ opal_output (0 , "pml:bfo: ft_event(Restart): Failed to fence complete" );
788+ return ret ;
789+ }
781790 }
782791 OPAL_CR_SET_TIMER (OPAL_CR_TIMER_P2P3 );
783792 }
@@ -787,7 +796,10 @@ int mca_pml_bfo_ft_event( int state )
787796 * Exchange the modex information once again.
788797 * BTLs will have republished their modex information.
789798 */
790- opal_pmix .fence (NULL , 0 );
799+ if (OMPI_SUCCESS != (ret = opal_pmix .fence (NULL , 0 ))) {
800+ opal_output (0 , "pml:bfo: ft_event(Restart): Failed to fence complete" );
801+ return ret ;
802+ }
791803
792804 /*
793805 * Startup the PML stack now that the modex is running again
@@ -799,7 +811,10 @@ int mca_pml_bfo_ft_event( int state )
799811 }
800812
801813 /* Is this barrier necessary ? JJH */
802- opal_pmix .fence (NULL , 0 );
814+ if (OMPI_SUCCESS != (ret = opal_pmix .fence (NULL , 0 ))) {
815+ opal_output (0 , "pml:bfo: ft_event(Restart): Failed to fence complete" );
816+ return ret ;
817+ }
803818
804819 if ( NULL != procs ) {
805820 for (p = 0 ; p < (int )num_procs ; ++ p ) {
@@ -812,7 +827,10 @@ int mca_pml_bfo_ft_event( int state )
812827 if ( !first_continue_pass ) {
813828 if ( opal_cr_timing_barrier_enabled ) {
814829 OPAL_CR_SET_TIMER (OPAL_CR_TIMER_P2PBR2 );
815- opal_pmix .fence (NULL , 0 );
830+ if (OMPI_SUCCESS != (ret = opal_pmix .fence (NULL , 0 ))) {
831+ opal_output (0 , "pml:bfo: ft_event(Restart): Failed to fence complete" );
832+ return ret ;
833+ }
816834 }
817835 OPAL_CR_SET_TIMER (OPAL_CR_TIMER_CRCP1 );
818836 }
@@ -825,7 +843,10 @@ int mca_pml_bfo_ft_event( int state )
825843 * Exchange the modex information once again.
826844 * BTLs will have republished their modex information.
827845 */
828- opal_pmix .fence (NULL , 0 );
846+ if (OMPI_SUCCESS != (ret = opal_pmix .fence (NULL , 0 ))) {
847+ opal_output (0 , "pml:bfo: ft_event(Restart): Failed to fence complete" );
848+ return ret ;
849+ }
829850
830851 /*
831852 * Startup the PML stack now that the modex is running again
@@ -837,7 +858,10 @@ int mca_pml_bfo_ft_event( int state )
837858 }
838859
839860 /* Is this barrier necessary ? JJH */
840- opal_pmix .fence (NULL , 0 );
861+ if (OMPI_SUCCESS != (ret = opal_pmix .fence (NULL , 0 ))) {
862+ opal_output (0 , "pml:bfo: ft_event(Restart): Failed to fence complete" );
863+ return ret ;
864+ }
841865
842866 if ( NULL != procs ) {
843867 for (p = 0 ; p < (int )num_procs ; ++ p ) {
0 commit comments