diff --git a/PW/src/print_clock_pw.f90 b/PW/src/print_clock_pw.f90
index ef9f02101..25e857e86 100644
--- a/PW/src/print_clock_pw.f90
+++ b/PW/src/print_clock_pw.f90
@@ -92,7 +92,8 @@ SUBROUTINE print_clock_pw()
    !
    WRITE( stdout, '(/5x,"Called by c_bands:")' )
    CALL print_clock( 'init_us_2' )
-   CALL print_clock( 'init_us_2_gpu' )
+   CALL print_clock( 'init_us_2:cpu' )
+   CALL print_clock( 'init_us_2:gpu' )
    IF ( isolve == 0 ) THEN
       CALL print_clock( 'regterg' ) ; CALL print_clock( 'cegterg' )
    ELSE IF (isolve == 1) THEN
diff --git a/upflib/init_us_2_base.f90 b/upflib/init_us_2_base.f90
index a8b121daa..f35c40c2e 100644
--- a/upflib/init_us_2_base.f90
+++ b/upflib/init_us_2_base.f90
@@ -67,6 +67,9 @@ SUBROUTINE init_us_2_base( npw_, npwx, igk_, q_, nat, tau, ityp, &
   INTEGER, PARAMETER :: blocksize = 256
   INTEGER :: iblock, numblock, realblocksize
   !
   IF (lmaxkb < 0) RETURN
   !
+  ! start timing only after the early-exit guard, so that every start_clock
+  CALL start_clock( 'init_us_2:cpu' )  ! is paired with the stop_clock below
+  !
   ! setting cache blocking size
@@ -205,6 +208,8 @@ SUBROUTINE init_us_2_base( npw_, npwx, igk_, q_, nat, tau, ityp, &
   !
   IF (spline_ps) DEALLOCATE( xdata )
   !
+  CALL stop_clock( 'init_us_2:cpu' )
+  !
   RETURN
   !
 END SUBROUTINE init_us_2_base
diff --git a/upflib/init_us_2_base_gpu.f90 b/upflib/init_us_2_base_gpu.f90
index 09b24ee17..cc6ab519d 100644
--- a/upflib/init_us_2_base_gpu.f90
+++ b/upflib/init_us_2_base_gpu.f90
@@ -81,6 +81,8 @@ SUBROUTINE init_us_2_base_gpu( npw_, npwx, igk__d, q_, nat, tau, ityp, &
   attributes(PINNED) :: qg_h, vq_h
 #endif
   !
   !
   if (lmaxkb<0) return
+  ! start timing only after the early-exit guard, so that every start_clock
+  CALL start_clock( 'init_us_2:gpu' )  ! is paired with the stop_clock below

@@ -242,5 +244,7 @@ SUBROUTINE init_us_2_base_gpu( npw_, npwx, igk__d, q_, nat, tau, ityp, &
     deallocate ( qg_h, vq_h )
   END IF
   !
+  CALL stop_clock( 'init_us_2:gpu' )
+  !
   return
 end subroutine init_us_2_base_gpu