263 lines
		
	
	
		
			7.2 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
		
		
			
		
	
	
			263 lines
		
	
	
		
			7.2 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
module timer_impl
  !
  ! Implementations that can be attached to the `timer` procedure pointer of
  ! timer_module:
  !
  !   * default_timer          - accumulates wall-clock time per named code
  !                              region and writes a call-tree report;
  !   * timer_callback_wrapper - forwards every timer event to a callback
  !                              registered from C through C_init_timer.
  !
  ! init_timer installs default_timer, fini_timer installs null_timer.
  !
  !$ use omp_lib
  use, intrinsic :: iso_c_binding, only: c_ptr
  use, intrinsic :: iso_fortran_env, only: int64, real64
  use timer_module, only: timer_callback
  implicit none

  private

  public :: init_timer, fini_timer
  public :: C_init_timer

  ! Trace control read by default_timer: a negative value turns every call
  ! into a no-op; otherwise an event is traced to the output unit while the
  ! running event count is below limtrace.
  integer, public :: limtrace=0

  integer, parameter :: MAXCALL=100        ! capacity of the timer tables
  integer, parameter :: DEFAULT_LU=6       ! output unit when no file is open
  real, parameter :: EPS=0.000001          ! initial accumulated time of an entry
  character(len=8), parameter :: space='        '  ! marks a rolled-up entry

  character(len=*), parameter :: FMT_TRACE = "(i8,': ',a8,3i5)"
  character(len=*), parameter :: FMT_HEADER = &
       "(/' Name                 Time  Frac     dTime'," // &
       "' dFrac    Calls'/58('-'))"
  character(len=*), parameter :: FMT_ROW = "(a16,2(f10.3,f6.2),i9)"
  character(len=*), parameter :: FMT_TOTALS = "(58('-')/32x,f10.3,f6.2)"

  integer :: lu=DEFAULT_LU                 ! unit the report and trace go to
  integer :: nmax=0                        ! number of table entries in use
  integer :: ncall(MAXCALL)                ! number of starts per entry
  integer :: nlevel(MAXCALL)               ! nesting level (-1 after recursion)
  integer :: nparent(MAXCALL)              ! index of the enclosing entry, 0 = none
  character(len=8) :: name(MAXCALL)        ! region name per entry
  logical :: on(MAXCALL)                   ! .true. between start and stop
  real :: ut(MAXCALL)                      ! accumulated seconds per entry
  integer(int64) :: tick0(MAXCALL)         ! system_clock count at the last start
  real :: total                            ! ut(1), denominator of the fractions
  real :: sum_self, sum_self_frac          ! totals accumulated by print_root
  logical :: table_full_reported=.false.   ! overflow is reported only once
  !$ integer :: ntid(MAXCALL)              ! OpenMP thread number owning an entry

  !
  ! C interoperable callback setup
  !
  ! NOTE(review): this interface is not bind(C) and passes a character(len=8)
  ! dummy, so the calling convention seen by the C function is presumably
  ! compiler dependent - confirm against the C side before changing it.
  !
  abstract interface
     subroutine C_timer_callback (context, dname, k)
       use, intrinsic :: iso_c_binding, only: c_ptr
       implicit none
       type(c_ptr), intent(in) :: context
       character(len=8), intent(in) :: dname
       integer, intent(in) :: k
     end subroutine C_timer_callback
  end interface
  type(c_ptr), private :: the_context
  procedure(C_timer_callback), pointer, private :: the_C_callback => null()

contains

  !
  ! Timer implementation that forwards (dname, k) together with the stored
  ! context to the callback registered by C_init_timer. Does nothing while no
  ! callback has been registered.
  !
  subroutine timer_callback_wrapper (dname, k)
    implicit none
    character(len=8), intent(in) :: dname
    integer, intent(in) :: k
    if (associated (the_C_callback)) call the_C_callback (the_context, dname, k)
  end subroutine timer_callback_wrapper

  !
  ! Stores the context and callback supplied by the caller and makes
  ! timer_callback_wrapper the active timer.
  !
  subroutine C_init_timer (context, callback) bind(C)
    use, intrinsic :: iso_c_binding, only: c_ptr, c_funptr, c_f_procpointer
    ! c_to_f_string is not referenced here; the use is retained from the
    ! original source.
    use iso_c_utilities, only: c_to_f_string
    use timer_module, only: timer
    implicit none
    type(c_ptr), intent(in) :: context
    type(c_funptr), intent(in) :: callback
    the_context=context
    call c_f_procpointer (callback, the_C_callback)
    timer => timer_callback_wrapper
  end subroutine C_init_timer

  !
  ! default Fortran implementation which is thread safe using OpenMP
  !
  subroutine default_timer (dname, k)

    ! Times the region called dname between a call with k=0 (start) and a
    ! call with k=1 (stop) and accumulates the elapsed wall-clock seconds in
    ! ut. A call with k>1 writes the statistics and resets the tables; with
    ! k>100 the call counts and times are first divided by k-100.
    ! Also traces all calls (for debugging purposes) if limtrace.gt.0
    !
    ! An entry is identified by its name, its parent entry and, under
    ! OpenMP, the thread number. The whole body runs inside the named
    ! critical section "timer".
    !
    ! If this is used with OpenMP then the /timer_private/ common
    ! block must be copied into each thread of a thread team by using
    ! the copyin() clause on the !$omp parallel directive that creates
    ! the team.
    !
    ! NOTE(review): level and onlevel come from timer_common.inc, which is
    ! not visible here; the nesting depth is presumably limited by the size
    ! of onlevel - confirm.

    implicit none

    character(len=8), intent(in) :: dname
    integer, intent(in) :: k

    integer, save :: ntrace=0              ! events seen since the last report
    integer :: i,n,ndiv
    integer(int64) :: tick,rate
    !$ integer :: tid,j,l,m
    include 'timer_common.inc'

    !$omp critical(timer)
    if (limtrace.ge.0) then
       if (k.gt.1) then

          ! Write out the timer statistics

          write(lu,FMT_HEADER)

          !$ !walk backwards through the database rolling up thread data by call chain
          !$ do i=nmax,1,-1
          !$    do j=1,i-1
          !$       l=j
          !$       m=i
          !$       do while (name(l).eq.name(m))
          !$          !a self-parented entry (direct recursion) would never reach 0
          !$          if (nparent(l).eq.l.or.nparent(m).eq.m) exit
          !$          l=nparent(l)
          !$          m=nparent(m)
          !$          if (l.eq.0.or.m.eq.0) exit
          !$       end do
          !$       if (l.eq.0.and.m.eq.0) then
          !$          !same call chain so roll up data
          !$          ncall(j)=ncall(j)+ncall(i)
          !$          ut(j)=ut(j)+ut(i)
          !$          do n=1,nmax
          !$            if (nparent(n).eq.i) nparent(n)=j
          !$          end do
          !$          name(i)=space
          !$          exit
          !$       end if
          !$    end do
          !$ end do

          if (k.gt.100) then
             ndiv=k-100
             ncall(1:nmax)=ncall(1:nmax)/ndiv
             ut(1:nmax)=ut(1:nmax)/ndiv
          end if

          ! Fractions are relative to the first entry; with an empty table
          ! print_root writes nothing and total is never used.
          if (nmax.ge.1) then
             total=ut(1)
          else
             total=EPS
          end if
          sum_self=0.
          sum_self_frac=0.
          call print_root(1)
          write(lu,FMT_TOTALS) sum_self,sum_self_frac

          ! Start over with empty tables.
          nmax=0
          ntrace=0
          level=0
          onlevel(0)=0
          table_full_reported=.false.

       else

          onlevel(0)=0
          !$ tid=omp_get_thread_num()

          ! Check for existing name/parent[/thread]. A running timer sits at
          ! the current level, so its parent is one level up; a stopped one
          ! is looked up as a child of the current level.
          n=0
          search: do i=1,nmax
             if (name(i).ne.dname) cycle search
             !$ if (ntid(i).ne.tid) cycle search
             if (on(i)) then
                if (level.lt.1) cycle search
                if (nparent(i).ne.onlevel(level-1)) cycle search
             else
                if (nparent(i).ne.onlevel(level)) cycle search
             end if
             n=i
             exit search
          end do search

          if (n.eq.0) then
             if (nmax.lt.MAXCALL) then
                nmax=nmax+1                !This is a new one
                n=nmax
                !$ ntid(n)=tid
                ncall(n)=0
                nlevel(n)=0
                nparent(n)=0
                on(n)=.false.
                ut(n)=EPS
                name(n)=dname
             else if (.not.table_full_reported) then
                print*,'Error in timer: more than ',MAXCALL, &
                     ' timers; ',dname,' and later new timers are ignored.'
                table_full_reported=.true.
             end if
          end if

          if (n.ne.0) then
             if (k.eq.0) then              !Get start times (k=0)
                if (on(n)) then
                   print*,'Error in timer: ',dname,' already on.'
                end if
                level=level+1              !Increment the level
                on(n)=.true.
                call system_clock(count=tick0(n))

                ncall(n)=ncall(n)+1
                if (ncall(n).gt.1.and.nlevel(n).ne.level) then
                   !recursion is happening
                   !
                   !TODO: somehow need to account for this deeper call at the
                   !shallowest instance in the call chain and this needs to be
                   !done without incrementing anything here other than counters
                   !and timers
                   !
                   nlevel(n)=-1
                else
                   nlevel(n)=level
                end if
                nparent(n)=onlevel(level-1)
                onlevel(level)=n

             else if (k.eq.1) then         !Get stop times and accumulate sums. (k=1)
                if (on(n)) then
                   on(n)=.false.
                   call system_clock(count=tick,count_rate=rate)
                   if (rate.gt.0) then
                      ut(n)=ut(n)+real(real(tick-tick0(n),real64)/real(rate,real64))
                   end if
                end if
                ! The level also drops for a timer that is already off (the
                ! unwinding of a direct recursion relies on it) but never
                ! below zero, which would index onlevel out of bounds.
                level=max(level-1,0)
             end if

             ntrace=ntrace+1
             if (ntrace.lt.limtrace) write(lu,FMT_TRACE) ntrace,dname,k,level,nparent(n)
          end if

       end if

       flush(lu)
    end if
    !$omp end critical(timer)

  end subroutine default_timer

  !
  ! Writes the report line of entry i and then, recursively, the lines of all
  ! entries whose parent is i. Columns: indented name, accumulated time and
  ! its fraction of total, time left after subtracting the direct children
  ! (clamped at zero) and its fraction, number of calls. The two "left over"
  ! columns are added to sum_self and sum_self_frac.
  !
  recursive subroutine print_root(i)
    implicit none
    integer, intent(in) :: i
    character(len=16) :: sname
    real :: dut, dutf, utf
    integer :: j

    if (i.gt.nmax) return
    if (name(i).eq.space) return           ! entry was rolled up into another

    ! The scans start at i+1 so that an entry which is its own parent
    ! (direct recursion) is neither subtracted from itself nor re-entered.
    dut=ut(i)
    do j=i+1,nmax
       if (name(j).ne.space.and.nparent(j).eq.i) dut=dut-ut(j)
    end do
    dut=max(dut,0.0)

    utf=ut(i)/total
    dutf=dut/total
    sum_self=sum_self+dut
    sum_self_frac=sum_self_frac+dutf

    ! One blank of indentation per nesting level; nlevel is -1 after a
    ! recursion, which is printed without indentation.
    sname=repeat(' ',max(nlevel(i),0))//name(i)
    write(lu,FMT_ROW) sname,ut(i),utf,dut,dutf,ncall(i)

    do j=i+1,nmax
       if (nparent(j).eq.i) call print_root(j)
    end do
  end subroutine print_root

  !
  ! Closes the output file if one is open and falls back to DEFAULT_LU.
  !
  subroutine close_output ()
    implicit none
    if (lu.ne.DEFAULT_LU) then
       close (lu)
       lu=DEFAULT_LU
    end if
  end subroutine close_output

  !
  ! Opens the output file (filename, or 'timer.out' when filename is absent)
  ! and makes default_timer the active timer. A file left open by an earlier
  ! call is closed first. If the file cannot be opened, a message is printed
  ! and output goes to unit DEFAULT_LU.
  !
  subroutine init_timer (filename)
    use timer_module, only: timer
    implicit none
    character(len=*), optional, intent(in) :: filename
    integer :: new_lu, ios
    include 'timer_common.inc'
    data level/0/, onlevel/11 * 0/

    call close_output ()
    if (present (filename)) then
       open (newunit=new_lu, file=filename, status='unknown', iostat=ios)
    else
       open (newunit=new_lu, file='timer.out', status='unknown', iostat=ios)
    end if
    if (ios.eq.0) then
       lu=new_lu
    else
       print*,'Error in timer: cannot open the timer output file, using unit ',DEFAULT_LU
    end if
    timer => default_timer
  end subroutine init_timer

  !
  ! Makes null_timer the active timer and closes the output file, if any.
  !
  subroutine fini_timer ()
    use timer_module, only: timer, null_timer
    implicit none
    timer => null_timer
    call close_output ()
  end subroutine fini_timer

end module timer_impl