-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcp_external_control.F
229 lines (199 loc) · 10.6 KB
/
cp_external_control.F
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
!--------------------------------------------------------------------------------------------------!
! CP2K: A general program to perform molecular dynamics simulations !
! Copyright (C) 2000 - 2020 CP2K developers group !
!--------------------------------------------------------------------------------------------------!
! **************************************************************************************************
!> \brief Routines to handle the external control of CP2K
!> \par History
!> - Moved from MODULE termination to here (18.02.2011,MK)
!> - add communication control (20.02.2013 Mandes)
!> \author Marcella Iannuzzi (10.03.2005,MI)
! **************************************************************************************************
MODULE cp_external_control
USE cp_files, ONLY: close_file,&
open_file
USE cp_log_handling, ONLY: cp_get_default_logger,&
cp_logger_get_default_unit_nr,&
cp_logger_type
USE global_types, ONLY: global_environment_type
USE kinds, ONLY: default_string_length,&
dp
USE machine, ONLY: m_walltime
USE message_passing, ONLY: mp_bcast,&
mp_probe
#include "./base/base_uses.f90"
IMPLICIT NONE
PRIVATE
CHARACTER(len=*), PARAMETER, PRIVATE :: moduleN = 'cp_external_control'
PUBLIC :: external_control
PUBLIC :: set_external_comm
INTEGER, SAVE :: external_comm = -1
INTEGER, SAVE :: external_master_id = -1
INTEGER, SAVE :: scf_energy_message_tag = -1
INTEGER, SAVE :: exit_tag = -1
CONTAINS
! **************************************************************************************************
!> \brief set the communicator to an external source or destination,
!> to send messages (e.g. intermediate energies during scf) or
!> reveive commands (e.g. aborting the calculation)
!> \param comm ...
!> \param in_external_master_id ...
!> \param in_scf_energy_message_tag ...
!> \param in_exit_tag ...
!> \author Mandes 02.2013
! **************************************************************************************************
SUBROUTINE set_external_comm(comm, in_external_master_id, &
in_scf_energy_message_tag, in_exit_tag)
INTEGER, INTENT(IN) :: comm, in_external_master_id
INTEGER, INTENT(IN), OPTIONAL :: in_scf_energy_message_tag, in_exit_tag
CHARACTER(LEN=*), PARAMETER :: routineN = 'set_external_comm', &
routineP = moduleN//':'//routineN
CPASSERT(in_external_master_id .GE. 0)
external_comm = comm
external_master_id = in_external_master_id
IF (PRESENT(in_scf_energy_message_tag)) &
scf_energy_message_tag = in_scf_energy_message_tag
IF (PRESENT(in_exit_tag)) THEN
! the exit tag should be different from the mp_probe tag default
CPASSERT(in_exit_tag .NE. -1)
exit_tag = in_exit_tag
END IF
END SUBROUTINE set_external_comm
! **************************************************************************************************
!> \brief External manipulations during a run : when the <PROJECT_NAME>.EXIT_$runtype
!> command is sent the program stops at the level of $runtype
!> when a general <PROJECT_NAME>.EXIT command is sent the program is stopped
!> at all levels (at least those that call this function)
!> if the file WAIT exists, the program waits here till it disappears
!> \param should_stop ...
!> \param flag ...
!> \param globenv ...
!> \param target_time ...
!> \param start_time ...
!> \author MI (10.03.2005)
! **************************************************************************************************
SUBROUTINE external_control(should_stop, flag, globenv, target_time, start_time)
LOGICAL, INTENT(OUT) :: should_stop
CHARACTER(LEN=*), INTENT(IN) :: flag
TYPE(global_environment_type), OPTIONAL, POINTER :: globenv
REAL(dp), OPTIONAL :: target_time, start_time
CHARACTER(LEN=*), PARAMETER :: routineN = 'external_control', &
routineP = moduleN//':'//routineN
CHARACTER(LEN=default_string_length) :: exit_fname, exit_fname_level, &
exit_gname, exit_gname_level
INTEGER :: handle, i, tag, unit_number
LOGICAL :: should_wait
LOGICAL, SAVE :: check_always = .FALSE.
REAL(KIND=dp) :: my_start_time, my_target_time, t1, t2, &
time_check
REAL(KIND=dp), SAVE :: t_last_file_check = 0.0_dp
TYPE(cp_logger_type), POINTER :: logger
CALL timeset(routineN, handle)
logger => cp_get_default_logger()
should_stop = .FALSE.
exit_gname = "EXIT"
exit_gname_level = TRIM(exit_gname)//"_"//TRIM(flag)
exit_fname = TRIM(logger%iter_info%project_name)//"."//TRIM(exit_gname)
exit_fname_level = TRIM(logger%iter_info%project_name)//"."//TRIM(exit_gname_level)
! check for incomming messages and if it is tagged with the exit tag
IF (exit_tag .NE. -1) THEN
i = external_master_id
CALL mp_probe(source=i, comm=external_comm, tag=tag)
IF (tag .EQ. exit_tag) should_stop = .TRUE.
END IF
IF (logger%para_env%ionode) THEN
! files will only be checked every 20 seconds, or if the clock wraps/does not exist,
! otherwise 64 waters on 64 cores can spend up to 10% of time here, on lustre
! however, if should_stop has been true, we should always check
! (at each level scf, md, ... the file must be there to guarantee termination)
t1 = m_walltime()
IF (t1 > t_last_file_check + 20.0_dp .OR. t1 <= t_last_file_check .OR. check_always) THEN
t_last_file_check = t1
! allows for halting execution for a while
! this is useful to copy a consistent snapshot of the output
! while a simulation is running
INQUIRE (FILE="WAIT", EXIST=should_wait)
IF (should_wait) THEN
CALL open_file(file_name="WAITING", file_status="UNKNOWN", &
file_form="FORMATTED", file_action="WRITE", &
unit_number=unit_number)
WRITE (UNIT=cp_logger_get_default_unit_nr(logger), FMT="(/,T2,A,/)") &
"*** waiting till the file WAIT has been removed ***"
DO
! sleep a bit (to save the file system)
t1 = m_walltime()
DO I = 1, 100000000
t2 = m_walltime()
IF (t2 - t1 > 1.0_dp) EXIT
ENDDO
! and ask again
INQUIRE (FILE="WAIT", EXIST=should_wait)
IF (.NOT. should_wait) EXIT
ENDDO
CALL close_file(unit_number=unit_number, file_status="DELETE")
ENDIF
! EXIT control sequence
! Check for <PROJECT_NAME>.EXIT_<FLAG>
IF (.NOT. should_stop) THEN
INQUIRE (FILE=exit_fname_level, EXIST=should_stop)
IF (should_stop) THEN
CALL open_file(file_name=exit_fname_level, unit_number=unit_number)
CALL close_file(unit_number=unit_number, file_status="DELETE")
WRITE (UNIT=cp_logger_get_default_unit_nr(logger), FMT="(/,T2,A,/)") &
"*** "//flag//" run terminated by external request ***"
END IF
END IF
! Check for <PROJECT_NAME>.EXIT
IF (.NOT. should_stop) THEN
INQUIRE (FILE=exit_fname, EXIST=should_stop)
IF (should_stop) THEN
WRITE (UNIT=cp_logger_get_default_unit_nr(logger), FMT="(/,T2,A,/)") &
"*** "//TRIM(flag)//" run terminated by external request ***"
ENDIF
END IF
! Check for EXIT_<FLAG>
IF (.NOT. should_stop) THEN
INQUIRE (FILE=exit_gname_level, EXIST=should_stop)
IF (should_stop) THEN
CALL open_file(file_name=exit_gname_level, unit_number=unit_number)
CALL close_file(unit_number=unit_number, file_status="DELETE")
WRITE (UNIT=cp_logger_get_default_unit_nr(logger), FMT="(/,T2,A,/)") &
"*** "//flag//" run terminated by external request ***"
END IF
END IF
! Check for EXIT
IF (.NOT. should_stop) THEN
INQUIRE (FILE=exit_gname, EXIST=should_stop)
IF (should_stop) THEN
WRITE (UNIT=cp_logger_get_default_unit_nr(logger), FMT="(/,T2,A,/)") &
"*** "//TRIM(flag)//" run terminated by external request ***"
ENDIF
END IF
ENDIF
IF (PRESENT(target_time)) THEN
my_target_time = target_time
my_start_time = start_time
ELSEIF (PRESENT(globenv)) THEN
my_target_time = globenv%cp2k_target_time
my_start_time = globenv%cp2k_start_time
ELSE
! If none of the two arguments is present abort.. This routine should always check about time.
CPABORT("")
END IF
IF ((.NOT. should_stop) .AND. (my_target_time > 0.0_dp)) THEN
! Check for execution time
time_check = m_walltime() - my_start_time
IF (time_check .GT. my_target_time) THEN
should_stop = .TRUE.
WRITE (UNIT=cp_logger_get_default_unit_nr(logger), FMT="(/,T2,A,f12.3,A)") &
"*** "//TRIM(flag)//" run terminated - exceeded requested execution time:", &
my_target_time, " seconds.", &
"*** Execution time now: ", time_check, " seconds."
END IF
END IF
END IF
CALL mp_bcast(should_stop, logger%para_env%source, logger%para_env%group)
check_always = should_stop
CALL timestop(handle)
END SUBROUTINE external_control
END MODULE cp_external_control