SUBROUTINE GSTATS(KNUM,KSWITCH)

!**** *GSTATS*  - Gather timing statistics

!     PURPOSE.
!     --------
!       To gather timings for subsequent output by routine STATS_OUTPUT.
!       When LHOOK is set, events typed TRS/MP-/MPL/OMP/BAR are also
!       forwarded to DR_HOOK; for the first NSTATS_MEM MPI tasks memory
!       usage is traced to unit 0.

!**   INTERFACE.
!     ----------
!       *CALL* *GSTATS(KNUM,KSWITCH)*

!        EXPLICIT ARGUMENTS
!        --------------------
!        KNUM    - timing event number, must lie in 0..JPMAXSTAT
!                  (for list of already defined events see routine
!                  STATS_OUTPUT); ABOR1 is called otherwise
!        KSWITCH - KSWITCH=0 - switch on timer
!                  KSWITCH=1 - switch off timer
!                  KSWITCH=2 - suspend timer
!                  KSWITCH=3 - resume timer
!                  Any other value, or a call sequence where on/off calls
!                  do not alternate for the event, ends in ABOR1.

!        IMPLICIT ARGUMENTS
!        --------------------
!        Module YOMGSTATS (counters, accumulated times, switches)

!     METHOD.
!     -------
!        Nothing is done unless LSTATS is set. Threads for which
!        OML_MY_THREAD() > 1 return immediately. The number of on/off
!        calls per event (NCALLS) is used to check that the calls for an
!        event are correctly paired.

!     EXTERNALS.   USER_CLOCK  - timing routine
!     ----------   DR_HOOK     - Dr.Hook instrumentation (if LHOOK)
!                  ABOR1       - abort on invalid event number/sequence
!                  GETRSS, GETHWM, GETSTK, GETCURHEAP, GETPAG
!                              - memory/paging queries for the memory trace
!                  MPL_BARRIER - synchronization of processors
!                                (call currently commented out)

!     REFERENCE.
!     ----------
!        ECMWF Research Department documentation of the IFS

!     AUTHOR.
!     -------
!        Mats Hamrud ECMWF

!     MODIFICATIONS.
!     --------------
!        ORIGINAL : 98-11-15
!        D.Salmond: 02-02-25 Return if not master thread when called from a
!                            parallel region.
!        J.Hague:   03-06-11 Memory tracing (for NSTATS_MEM MPI tasks)
!     ------------------------------------------------------------------

USE PARKIND1  ,ONLY : JPIM     ,JPRB     ,JPIB
USE YOMHOOK   ,ONLY : LHOOK,   DR_HOOK

USE YOMGSTATS
!USE MPL_MODULE   ! MPL 28.11.08
USE YOMOML

IMPLICIT NONE

INTEGER(KIND=JPIM),INTENT(IN) :: KNUM
INTEGER(KIND=JPIM),INTENT(IN) :: KSWITCH

INTEGER(KIND=JPIM) :: IMOD,ICALL
! Memory/paging values seen at the previous memory-trace sample
INTEGER(KIND=JPIM),SAVE :: IIMEM, IIPAG, IIMEMC
INTEGER(KIND=JPIB) :: IMEM, IMEMH, IMEMS, IMEMC, IPAG, INUM
INTEGER(KIND=JPIB) :: GETRSS, GETHWM, GETSTK, GETCURHEAP, GETPAG
EXTERNAL GETRSS, GETHWM, GETSTK, GETCURHEAP, GETPAG
REAL(KIND=JPRB) :: ZTIMED,ZCLOCK,ZTIME,ZTCPU,ZVCPU
REAL(KIND=JPRB),SAVE :: ZLAST_PAR_TIME
! First-call flags (SAVE made explicit; initialisation implied it already)
LOGICAL,SAVE :: LLFIRST=.TRUE.
LOGICAL,SAVE :: LLMFIRST=.TRUE.
CHARACTER(LEN=32), SAVE :: CCDESC_DRHOOK(JPMAXSTAT)
CHARACTER(LEN=32), SAVE :: CCDESC_BARR(JPMAXSTAT)

INTEGER(KIND=JPIM),SAVE :: NUM_THREADS
! Dr.Hook handles must survive between the switch-on and switch-off calls
REAL(KIND=JPRB),ALLOCATABLE,SAVE :: ZHOOK_HANDLE(:)
REAL(KIND=JPRB),SAVE :: ZHOOK_HANDLE_COMMS, ZHOOK_HANDLE_COMMS1
REAL(KIND=JPRB),SAVE :: ZHOOK_HANDLE_TRANS
REAL(KIND=JPRB),SAVE :: ZHOOK_HANDLE_BARR
CHARACTER(LEN=4) :: CC

INTERFACE
#include "user_clock.h"
END INTERFACE

!     ------------------------------------------------------------------

! Statistics gathering disabled: nothing to do
IF (.NOT.LSTATS) RETURN

IF (.NOT.ALLOCATED(ZHOOK_HANDLE)) THEN
  NUM_THREADS=OML_MAX_THREADS()
  ALLOCATE(ZHOOK_HANDLE(NUM_THREADS))
ENDIF

! Build the Dr.Hook labels once, each time LGSTATS_LABEL is raised
IF (LGSTATS_LABEL) THEN
  DO INUM=1,JPMAXSTAT
    WRITE(CC,'(I4)')INUM
    CCDESC_BARR(INUM)='>BAR-'//CCDESC(INUM)(1:21)//'('//CC//')'
    IF(CCTYPE(INUM) == "TRS".OR.CCTYPE(INUM) == 'MP-'.OR.CCTYPE(INUM) == 'MPL'&
     & .OR.CCTYPE(INUM) == 'BAR'.OR.CCTYPE(INUM) == 'OMP') THEN
      CCDESC_DRHOOK(INUM)='>'//CCTYPE(INUM)//'-'//CCDESC(INUM)(1:21)//'('//CC//')'
    ENDIF
  ENDDO
  LGSTATS_LABEL=.FALSE.
ENDIF
!     ------------------------------------------------------------------

!J  IF((KNUM > 1000 .AND.KNUM < 2001).AND.(.NOT.LSTATS_OMP))RETURN
!J  IF((KNUM > 500 .AND.KNUM < 1001).AND.(.NOT.LSTATS_COMMS))RETURN

! Only the master thread gathers statistics
IF (OML_MY_THREAD() > 1) RETURN

! Validate the event number before it is used as an array index below
IF (KNUM < 0.OR. KNUM > JPMAXSTAT) CALL ABOR1('GSTATS')

!J  IF(KNUM/=0) THEN
!J    IF(LSYNCSTATS .AND.(KSWITCH==0.OR. KSWITCH==2)) THEN
!J      IF(.NOT.OML_IN_PARALLEL().AND. KNUM < 500 )THEN
!J        IF(LHOOK)CALL DR_HOOK(CCDESC_BARR(KNUM),0,ZHOOK_HANDLE_BARR)
!J        CALL MPL_BARRIER(CDSTRING='GSTATS:')
!J        IF(LHOOK)CALL DR_HOOK(CCDESC_BARR(KNUM),1,ZHOOK_HANDLE_BARR)
!J      ENDIF
!J    ENDIF
!J  ENDIF

! Forward on/off calls of typed events to Dr.Hook
IF (LHOOK .AND. (KSWITCH == 0 .OR. KSWITCH == 1)) THEN
  IF (CCTYPE(KNUM) == "TRS") THEN
    CALL DR_HOOK(CCDESC_DRHOOK(KNUM),KSWITCH,ZHOOK_HANDLE_TRANS)
  ELSEIF (CCTYPE(KNUM) == 'MP-') THEN
    CALL DR_HOOK(CCDESC_DRHOOK(KNUM),KSWITCH,ZHOOK_HANDLE_COMMS)
  ELSEIF (CCTYPE(KNUM) == 'MPL'.AND.KNUM /= 682) THEN
    CALL DR_HOOK(CCDESC_DRHOOK(KNUM),KSWITCH,ZHOOK_HANDLE_COMMS1)
  ELSEIF (CCTYPE(KNUM) == 'OMP') THEN
    ! MPL 1.12.08: passing the whole ZHOOK_HANDLE array failed to compile
    ! because the DR_HOOK key argument is a scalar. A scratch local (ZTIME)
    ! was used instead, but it is neither SAVEd nor left untouched between
    ! the on and off calls, so the key was lost. Only the master thread
    ! reaches this point, hence the first (saved) element is used.
    CALL DR_HOOK(CCDESC_DRHOOK(KNUM),KSWITCH,ZHOOK_HANDLE(1))
  ELSEIF (CCTYPE(KNUM) == 'BAR') THEN
    CALL DR_HOOK(CCDESC_DRHOOK(KNUM),KSWITCH,ZHOOK_HANDLE_BARR)
  ENDIF
ENDIF

! Sample the clocks; CPU times only when requested or for event 0
CALL USER_CLOCK(PELAPSED_TIME=ZCLOCK)
IF (LSTATSCPU.OR.KNUM==0) THEN
  CALL USER_CLOCK(PTOTAL_CP=ZTCPU,PVECTOR_CP=ZVCPU)
ELSE
  ZTCPU = 0.0_JPRB
  ZVCPU = 0.0_JPRB
ENDIF

! One-off initialisation of the accumulators on the first call
IF (LLFIRST) THEN
  NCALLS(:) = 0
  TIMESUM(:) = 0.0_JPRB
  TIMESQSUM(:) = 0.0_JPRB
  TIMEMAX(:) = 0.0_JPRB
  TIMESUMB(:) = 0.0_JPRB
  TTCPUSUM(:) = 0.0_JPRB
  TVCPUSUM(:) = 0.0_JPRB
  TIMELCALL(:) = ZCLOCK
  CCDESC=""
  CCTYPE=""
  NTMEM = 0
  NTMEM(:,5) = 99999999
  IIMEM=0
  IIPAG=0
  IIMEMC=0
  TIME_LAST_CALL = ZCLOCK
  ZLAST_PAR_TIME=ZCLOCK
  LLFIRST = .FALSE.
ENDIF

! NCALLS counts on+off calls: odd while the event is running, even once
! it has been switched off. Any other combination is a pairing error.
IF (KSWITCH == 0.OR. KSWITCH == 1) THEN
  NCALLS(KNUM) = NCALLS(KNUM)+1
ENDIF
IMOD = MOD(NCALLS(KNUM),2)
IF (.NOT.((KSWITCH == 0.AND. IMOD == 1) .OR.&
       &(KSWITCH == 2.AND. IMOD == 1) .OR.&
       &(KSWITCH == 3.AND. IMOD == 1) .OR.&
       &(KSWITCH == 1.AND. IMOD == 0))) THEN
  WRITE(JPERR,*) 'KNUM,KSWITCH,IMOD,NCALLS(KNUM)',&
   &KNUM,KSWITCH,IMOD,NCALLS(KNUM)
  CALL ABOR1('GSTATS')
ENDIF

IF ( KSWITCH == 0 ) THEN
  ! Start timing event
  IF (KNUM < 500) THEN
    ZTIMED = ZCLOCK-TIME_LAST_CALL
  ELSE
    ZTIMED = ZCLOCK - ZLAST_PAR_TIME
  ENDIF
  TIMESUMB(KNUM) = TIMESUMB(KNUM)+ZTIMED
  THISTIME(KNUM) = 0.0_JPRB
  TIMELCALL(KNUM) = ZCLOCK
  TTCPULCALL(KNUM) = ZTCPU
  TVCPULCALL(KNUM) = ZVCPU
  THISTCPU(KNUM) = 0.0_JPRB
  THISVCPU(KNUM) = 0.0_JPRB
  IF (MYPROC_STATS <= NSTATS_MEM.AND.MYPROC_STATS /= 0) THEN
    ! IMEM must be sampled here: it is compared, printed and stored below
    ! (its assignment had been commented out, leaving it undefined).
    IMEM = GETRSS()/1024
    IPAG = GETPAG()
    IMEMH = GETHWM()/1024
    IMEMS = GETSTK()/1024
    IMEMC = 0
    IF (LSTATS_ALLOC) IMEMC = GETCURHEAP()/1024
    IF (IMEM > IIMEM.OR.IPAG > IIPAG.OR.(LSTATS_ALLOC.AND.(IMEMC /= IIMEMC))) THEN
      IF (LLMFIRST) THEN
        ! Explanatory banner, written once before the first trace line
        WRITE(0,*) ".---------------------------------------------------------"
        WRITE(0,*) "| Memory trace details"
        WRITE(0,*) "| --------------------"
        WRITE(0,*) "| Memory examined at each GSTATS call if NSTATS_MEM>0."
        WRITE(0,*) "| Header for each trace line is:"
        WRITE(0,*) "|"
        WRITE(0,*) "| RSS_INC: Increase in RSS_MAX (KB)"
        WRITE(0,*) "| RSS_MAX: Maximum real working set so far (KB)"
        WRITE(0,*) "| HEAP_MX: High Water Mark for heap so far (KB)"
        WRITE(0,*) "| STK: Current Stack usage (KB)"
        WRITE(0,*) "| PGS: Page faults w I/O since last trace line"
        WRITE(0,*) "| CALL: Number of gstats call"
        WRITE(0,*) "| HEAP: Current malloc'd total (KB)"
        WRITE(0,*) "|"
        WRITE(0,*) "| Trace line written for NSTATS_MEM MPI tasks if RSS_MAX"
        WRITE(0,*) "| RSS_MAX increases, PGS>0, or HEAP changed"
        WRITE(0,*) "| (if LTATS_ALLOC=.TRUE.)"
        WRITE(0,*) "`---------------------------------------------------------"
        WRITE(0,*) ""
        WRITE(0,'(A10,A5,21X,A7,2A8,A7,A5,A5,A8)') &
         & "MEMORY "," KNUM","RSS_INC"," RSS_MAX"," HEAP_MX"," STK", &
         & " PGS"," CALL"," HEAP"
        LLMFIRST=.FALSE.
      ENDIF
      WRITE(0,'(A10,I5,1X,A20,1X,I6,2(1X,I7),1X,I6,1X,I4,1X,I4,1X,I7)') &
       & "MEMORY bfr",KNUM,CCDESC(KNUM),IMEM-IIMEM,IMEM,IMEMH,IMEMS, &
       & IPAG-IIPAG,(NCALLS(KNUM)+1)/2,IMEMC
    ENDIF
    ! Remember the RSS at event start so the switch-off call can diff it
    NTMEM(KNUM,2)=IMEM
    IIMEM=IMEM
    IIPAG=IPAG
    IIMEMC=IMEMC
  ENDIF
ELSEIF ( KSWITCH == 1 ) THEN
  ! Finish timing event
  ZTIME = THISTIME(KNUM)+(ZCLOCK-TIMELCALL(KNUM))
  TIMESUM(KNUM) = TIMESUM(KNUM)+ZTIME
  TIMESQSUM(KNUM) = TIMESQSUM(KNUM)+ZTIME**2
  TIMEMAX(KNUM) = MAX(TIMEMAX(KNUM),ZTIME)
  TTCPUSUM(KNUM) = TTCPUSUM(KNUM)+THISTCPU(KNUM)+ZTCPU-TTCPULCALL(KNUM)
  TVCPUSUM(KNUM) = TVCPUSUM(KNUM)+THISVCPU(KNUM)+ZVCPU-TVCPULCALL(KNUM)
  IF (MYPROC_STATS <= NSTATS_MEM.AND.MYPROC_STATS /= 0) THEN
    IMEM = GETRSS()/1024
    IPAG = GETPAG()
    IMEMH = GETHWM()/1024
    IMEMS = GETSTK()/1024
    IMEMC = 0
    IF (LSTATS_ALLOC) IMEMC = GETCURHEAP()/1024
    IF (IMEM > IIMEM.OR.IPAG > IIPAG.OR.(LSTATS_ALLOC.AND.(IMEMC /= IIMEMC))) THEN
      WRITE(0,'(A10,I5,1X,A20,1X,I6,2(1X,I7),1X,I6,1X,I4,1X,I4,1X,I7)') &
       & "MEMORY aft ",KNUM,CCDESC(KNUM),IMEM-IIMEM,IMEM,IMEMH,IMEMS, &
       & IPAG-IIPAG,NCALLS(KNUM)/2,IMEMC
    ENDIF
    IIMEM=IMEM
    IIPAG=IPAG
    IIMEMC=IMEMC
    ! From here on IMEM holds the RSS change over this event instance
    IMEM=IMEM-NTMEM(KNUM,2)
    NTMEM(KNUM,4)=NTMEM(KNUM,4)+IMEM
    IF (IMEM > NTMEM(KNUM,1)) THEN
      NTMEM(KNUM,1)=IMEM
      NTMEM(KNUM,3)=NCALLS(KNUM)
    ENDIF
    IF (IMEM < NTMEM(KNUM,5)) NTMEM(KNUM,5)=IMEM
  ENDIF
ELSEIF ( KSWITCH == 2 ) THEN
  ! Suspend timing event
  ZTIMED = ZCLOCK-TIMELCALL(KNUM)
  THISTIME(KNUM) = THISTIME(KNUM)+ZTIMED
  THISTCPU(KNUM) = THISTCPU(KNUM)+ZTCPU-TTCPULCALL(KNUM)
  THISVCPU(KNUM) = THISVCPU(KNUM)+ZVCPU-TVCPULCALL(KNUM)
ELSEIF ( KSWITCH == 3 ) THEN
  ! Resume timing event
  TIMELCALL(KNUM) = ZCLOCK
  TTCPULCALL(KNUM) = ZTCPU
  TVCPULCALL(KNUM) = ZVCPU
ENDIF

TIME_LAST_CALL = ZCLOCK
IF (KNUM > 500.OR.KNUM == 102.OR.KNUM == 103) ZLAST_PAR_TIME = ZCLOCK

! Trace stats: record time and encoded (switch,event) of the first
! NTRACE_STATS calls
NCALLS_TOTAL = NCALLS_TOTAL+1
IF (LTRACE_STATS .AND. NCALLS_TOTAL <= NTRACE_STATS) THEN
  ICALL = NCALLS_TOTAL
  TIME_TRACE(ICALL) = ZCLOCK
  NCALL_TRACE(ICALL) = (JPMAXSTAT+1)*KSWITCH+KNUM
ENDIF

END SUBROUTINE GSTATS