New URL for NEMO forge!   http://forge.nemo-ocean.eu

Since March 2022, along with the NEMO 4.2 release, code development has moved to a self-hosted GitLab.
This forge is now archived and remains online for historical reference.
trusting_func.sh in branches/2015/dev_r5092_CNRS_SETTE/NEMOGCM/TRUST – NEMO

source: branches/2015/dev_r5092_CNRS_SETTE/NEMOGCM/TRUST/trusting_func.sh @ 5669

Last change on this file since 5669 was 5669, checked in by nicolasmartin, 9 years ago

dev_r5092_CNRS_SETTE Corrections in trusting.sh to recompile NEMO from scratch & find all gz archives

  • Property eol-style set to native
  • Property svn:executable set to *
  • Property svn:keywords set to Author Date Id Rev URL
File size: 9.7 KB
Line 
#!/bin/bash


## Messenger filenames.
## Each file holds one field of the trusting summary; mesg_make joins them
## with `paste`, relying on the glob sort order given by the numeric prefix.
FILE_DATE="mesg_01_date_${PATTERNAME}.txt"
FILE_STAT="mesg_02_status_${PATTERNAME}.txt"
FILE_RESU="mesg_03_result_${PATTERNAME}.txt"
FILE_NEMO="mesg_04_nemogcm_${PATTERNAME}.txt"
FILE_XIOS="mesg_05_xios_${PATTERNAME}.txt"
FILE_COMP="mesg_06_compiler_${PATTERNAME}.txt"
FILE_MPIN="mesg_07_mpi_${PATTERNAME}.txt"
FILE_NCDF="mesg_08_netcdf_${PATTERNAME}.txt"
FILE_INPT="mesg_09_inputs_${PATTERNAME}.txt"
FILE_CPUT="mesg_10_cputime_${PATTERNAME}.txt"
FILE_COMM="mesg_11_comments_${PATTERNAME}.txt"

## Trusting summary & archive timestamped filenames
FILE_TRUS="trusting_${DATE}_${PATTERNAME}.txt"
FILE_ARCH="trusting_${DATE}_${PATTERNAME}.tar.gz"
14
## Print a step banner followed by a message on stdout.
##   $1: message. Backslash escapes in it are still interpreted (%b), but it
##       is no longer used as the printf format, so a '%' is printed as-is.
print_step() { printf '\nStep.....\n%b\n' "$1"; }
16
## (Re)create every messenger file with its column title on the first line.
## Globals read: FILE_DATE FILE_STAT FILE_RESU FILE_NEMO FILE_XIOS FILE_COMP
##               FILE_MPIN FILE_NCDF FILE_INPT FILE_CPUT FILE_COMM ST
## The status and result files also get a default second line, which
## get_out later overwrites in place (it edits line 2 of both files).
init_files() {
    echo 'Date'             > "${FILE_DATE}"
    echo 'Status'           > "${FILE_STAT}"
    echo 'Result'           > "${FILE_RESU}"
    echo 'NEMOGCM rev.'     > "${FILE_NEMO}"
    echo 'XIOS rev.'        > "${FILE_XIOS}"
    echo 'Fortran compiler' > "${FILE_COMP}"
    echo 'MPI libs'         > "${FILE_MPIN}"
    echo 'NetCDF libs'      > "${FILE_NCDF}"
    echo 'Input files'      > "${FILE_INPT}"
    echo 'Real CPU time'    > "${FILE_CPUT}"
    echo 'Comments'         > "${FILE_COMM}"

    # Current status (value of $ST) with 'Unknown error' by default
    printf '%s\n' "${ST}"  >> "${FILE_STAT}"
    echo 'Unknown error'   >> "${FILE_RESU}"
}
28
## Append the run date, reformatted as "YYYY-MM-DD HH:MM TZ" in UTC, to
## ${FILE_DATE}.
## Globals read: DATE (any string accepted by `date -d`), FILE_DATE
## A line is always appended, even if `date` fails, so the messenger file
## keeps the same number of rows as the others.
get_date() {
    local dat

    # ${DATE} is quoted so a value containing blanks stays a single operand
    dat=$( date -ud "${DATE}" +"%F %R %Z" )

    printf '%s\n' "${dat}" >> "${FILE_DATE}"
}
34
## Print the last-changed revision of the svn working copy given as $1.
## The "Last Changed Rev:" label is preferred; if it is absent from the
## output, the last field of line 9 is used, as the code did before.
_svn_last_changed_rev() {
    svn info "$1" | awk '
        /^Last Changed Rev:/ { by_label = $NF }
        NR == 9              { by_line  = $NF }
        END                  { print (by_label != "" ? by_label : by_line) }'
}

## Run an svn command on the NEMO directories, then record revisions.
## Globals read: NEMO_VERS, NEMO_ARCH NEMO_CONF NEMO_ENGI NEMO_EIOI NEMO_EFCM
##               NEMO_TCMP NEMO_TRBD, DIR_XIOS, FILE_XIOS, FILE_NEMO
## Outputs     : each NEMO directory name and the svn output on stdout;
##               'XIOS <rev>' then 'NEMOGCM <rev>' appended to model.log;
##               one HTML changeset link appended to FILE_XIOS and FILE_NEMO.
## The NEMOGCM revision is the highest revision found over the NEMO
## directories. XIOS is only queried, never updated.
get_nemo_rev() {
    local dir rev_loc
    local rev=0 svn_opt='status'
    local re_date='\{[0-9]{4}-[0-9]{2}-[0-9]{2}\}'
    local -a svn_cmd

    ## If -v|--version option has been set, modify svn command
    if   [[ ${NEMO_VERS} == *HEAD* || ${NEMO_VERS} == *up* ]]; then
        svn_cmd=( svn update -r HEAD )
    elif [[ ${NEMO_VERS} =~ ${re_date} ]]; then
        # Date form, e.g. {2015-06-01}
        svn_cmd=( svn update -r "${BASH_REMATCH[0]}" )
    elif [[ ${NEMO_VERS} =~ [0-9]+ ]]; then
        # Plain revision number (first run of digits)
        svn_cmd=( svn update -r "${BASH_REMATCH[0]}" )
    else
        svn_cmd=( svn "${svn_opt}" )
    fi

    for dir in "${NEMO_ARCH}" "${NEMO_CONF}" "${NEMO_ENGI}" \
               "${NEMO_EIOI}" "${NEMO_EFCM}"               \
               "${NEMO_TCMP}" "${NEMO_TRBD}"               \
               "${DIR_XIOS}"; do

        # Unset directories are skipped
        [[ -n ${dir} ]] || continue

        ## For time being, just get revision number from XIOS
        if [[ ${dir} == "${DIR_XIOS}" ]]; then
            rev_loc=$( _svn_last_changed_rev "${dir}" )
            echo "XIOS ${rev_loc}" >> model.log
            echo "<a href=\"https://forge.ipsl.jussieu.fr/ioserver/changeset/${rev_loc}\" target=\"_blank\">${rev_loc}</a>" \
                >> "${FILE_XIOS}"
            continue
        fi

        echo "${dir}"
        "${svn_cmd[@]}" "${dir}"
        rev_loc=$( _svn_last_changed_rev "${dir}" )

        # Only compare real revision numbers (svn info may have failed)
        [[ ${rev_loc} =~ ^[0-9]+$ ]] && (( rev_loc >= rev )) && rev=${rev_loc}
    done

    echo "NEMOGCM ${rev}" >> model.log
    echo "<a href=\"https://forge.ipsl.jussieu.fr/nemo/changeset/${rev}\" target=\"_blank\">${rev}</a>" \
        >> "${FILE_NEMO}"
}
74
## Record the release of CDO, the compiler, MPI and NetCDF.
## Globals read: CDO COMPILER MPI NETCDF (name patterns), I_MODULE,
##               LOADEDMODULES or PATH, FILE_COMP FILE_MPIN FILE_NCDF
## Outputs     : one '<name> <release>' line per software appended to
##               model.log; lines 4, 5 and 6 of model.log are then copied to
##               FILE_COMP, FILE_MPIN and FILE_NCDF.
## NOTE(review): the copy is positional, so it assumes model.log holds
## exactly two lines before this call and that all four names are set.
get_soft_rel() {
    local soft soft_rel

    # Left unquoted on purpose: an unset name is skipped, as before
    for soft in ${CDO} ${COMPILER} ${MPI} ${NETCDF}; do
        soft_rel=''

        # -n ... p: print only when the pattern matched, so software that is
        # not found yields an empty release instead of the whole input string
        if (( I_MODULE == 1 )); then
            soft_rel=$( printf '%s\n' "${LOADEDMODULES}" \
                        | sed -n "s/.*${soft}\/\([0-9.a-z_]*\).*/\1/ip" )
        else
            soft_rel=$( printf '%s\n' "${PATH}" \
                        | sed -n "s/.*${soft}\([0-9.a-z_]*\).*/\1/ip" )
        fi

        # The compiler reports its own release
        [ "${soft}" == "${COMPILER}" ] \
            && soft_rel=$( "${soft}" --version | grep -m1 -oe '\<[0-9. ]*\>' )

        ## Cleaning characters string to display proper soft name
        soft=$( printf '%s\n' "${soft}" | sed 's#\\##g; s#[/-]$##' )

        # Unquoted on purpose: folds any multi-line release onto one line so
        # that each software occupies exactly one line of model.log
        echo ${soft} ${soft_rel} >> model.log
    done

    sed -n 4p model.log >> "${FILE_COMP}"
    sed -n 5p model.log >> "${FILE_MPIN}"
    sed -n 6p model.log >> "${FILE_NCDF}"
}
94
## List the input files into inputs_list.txt, then bring them into the
## current directory.
## Globals read: NEMO_FORC (input directory), NEMO_TARF (archive name inside
##               NEMO_FORC; empty means "copy the plain files instead")
## Returns     : status of the listing, or of the extraction/copy.
## The commands are written out directly instead of being stored in strings:
## the former "\cp ..." string kept its backslash after expansion and so
## tried to run a command literally named '\cp'.
get_inputs() {
    if [ -z "${NEMO_TARF}" ]; then
        # `command` bypasses any cp alias/function (e.g. cp -i)
        ls "${NEMO_FORC}"/* > inputs_list.txt \
            && command cp "${NEMO_FORC}"/* . > /dev/null
    else
        tar -tvf "${NEMO_FORC}/${NEMO_TARF}" > inputs_list.txt \
            && tar -vxf "${NEMO_FORC}/${NEMO_TARF}" > /dev/null
    fi
}
101
## Compare the input list, namelists and XML files of the current directory
## with their counterparts in ${REFE_DIR}.
## Globals read: REFE_DIR, FILE_INPT, FILE_COMM
## Outputs     : 'Same' or the `diff -q` messages on stdout;
##               'Same'/'Different' appended to FILE_INPT;
##               names of differing files appended to temp_${FILE_COMM}.
## A file with no reference counterpart marks the inputs as 'Different'
## without being listed. A glob that matches nothing locally is skipped.
diff_inputs() {
    local dif file
    local files_list='' mesg='Same'

    for file in inputs_list.txt namelist_* *.xml; do
        # An unmatched glob stays literal; there is nothing to compare then
        [ -e "${file}" ] || continue

        if [ -e "${REFE_DIR}/${file}" ]; then
            dif=$( diff -q "${file}" "${REFE_DIR}/${file}" )
        else
            dif=0   # sentinel: no reference file
        fi

        if [ -n "${dif}" ]; then
            mesg='Different'
            [ "${dif}" != '0' ] && echo "${dif}" && files_list+="${file} "
        fi
    done

    [ "${mesg}" == 'Same' ] && echo "${mesg}"
    echo "${mesg}" >> "${FILE_INPT}"

    [ -n "${files_list}" ] && echo "Inputs  : ${files_list}differ<br>" >> "temp_${FILE_COMM}"
}
122
## Wait until the submitted job leaves the queue or the time limit is hit.
## Globals read   : JOB_LIST (queue listing command), JOB_INFO (job detail
##                  command), JOB_DELE (job deletion command), JOB_ID,
##                  TIME_LIMI (limit in seconds)
## Globals written: TIME_LIMI is converted to whole hours on timeout, for
##                  the message built by `get_out 6`.
## Outputs        : job details appended to computation.log every 30 s.
## On timeout the job is deleted and get_out 6 is called.
job_pending() {
    local time_elapsed=0 time_increment=30

    sleep "${time_increment}"

    # JOB_LIST / JOB_INFO / JOB_DELE hold a command plus options and are
    # therefore expanded unquoted; the job id is matched as a fixed string.
    while [[ -n ${JOB_ID} && -n $( ${JOB_LIST} | grep -F -- "${JOB_ID}" ) \
             && ${time_elapsed} -lt ${TIME_LIMI} ]]; do
        printf "\n####################################################\n" >> computation.log
        ${JOB_INFO} "${JOB_ID}"                                           >> computation.log
        sleep "${time_increment}"
        time_elapsed=$(( time_elapsed + time_increment ))
    done

    sleep "${time_increment}"

    # '>=' rather than '==': the counter moves in 30 s steps and would jump
    # over any limit that is not a multiple of 30
    if (( time_elapsed >= TIME_LIMI )); then
        ${JOB_DELE} "${JOB_ID}" &> /dev/null
        TIME_LIMI=$(( TIME_LIMI / 3600 ))
        get_out 6
    fi
}
143
## Compare ocean.output and the *.stat files with those in ${REFE_DIR}.
## Globals read   : REFE_DIR, FILE_COMM
## Globals written: ST is exported as 'FAILED' on any difference
## Outputs        : `diff -q` messages on stdout; names of differing files
##                  appended to temp_${FILE_COMM}.
## A file present here but absent from the reference ends the run through
## `get_out 7`. A file missing here (including an unmatched *.stat glob) is
## reported as differing.
diff_results() {
    local file
    local files_list=''

    for file in ocean.output *.stat; do
        if [ ! -e "${file}" ]; then
            export ST='FAILED'
            files_list+="${file} "
            continue
        fi

        [ ! -e "${REFE_DIR}/${file}" ] && export ST='FAILED' && get_out 7

        if ! diff -q "${file}" "${REFE_DIR}/${file}"; then
            export ST='FAILED'
            files_list+="${file} "
        fi
    done

    [ -n "${files_list}" ] && echo "Results : ${files_list}differ<br>" >> "temp_${FILE_COMM}"
}
155
## Rebuild the restart files of the last time step and compare them, record
## by record, with the reference restarts in ${REFE_DIR}.
## Globals read   : REFE_DIR, NEMO_TRBD (directory holding rebuild_nemo),
##                  NPROC, CDO (cdo command), FILE_COMM
## Globals written: TIME_STEP (read from ${REFE_DIR}/time.step);
##                  ST exported as 'FAILED' on any problem
## Outputs        : progress on stdout; differing restarts and the total
##                  number of differing records appended to
##                  temp_${FILE_COMM}.
## Exits through get_out 7 when a reference file is missing and through
## get_out 8 when a restart component has no domain files.
diff_restart() {
    local base_name comp diff_rcd file first_match nb_dom nb_rcd
    local dif=0 files_list=''

    [ ! -e "${REFE_DIR}/time.step" ] && export ST='FAILED' && get_out 7

    # The character class is quoted so the shell cannot glob-expand it
    TIME_STEP=$( tr -d '[:space:]' < "${REFE_DIR}/time.step" )
    echo "Last time step of standard run: ${TIME_STEP}"

    first_match=$( find . -regex ".*_0+${TIME_STEP}_restart.*\.nc" -print -quit )

    if [ -n "${first_match}" ]; then
        # Keep everything up to and including '<time step>_'
        base_name=$( printf '%s\n' "${first_match}" | awk -F/ '{print $NF}' \
                     | sed "s/^\(.*\)${TIME_STEP}_restart.*/\1${TIME_STEP}_/" )

        for comp in restart restart_ice restart_trc; do
            file=${base_name}${comp}

            nb_dom=$( find . -name "${file}_[0-9]*.nc" | wc -l | awk '{print $1}' )
            if   [ "${nb_dom}" -gt 1 ]; then
                # Domain files are removed only after a successful rebuild
                if "${NEMO_TRBD}/rebuild_nemo" -t "${NPROC}" "${file}" "${nb_dom}" > /dev/null; then
                    rm -f -- "${file}"_[0-9]*.nc > /dev/null
                fi
            elif [ "${nb_dom}" -eq 0 ]; then
                export ST='FAILED' && get_out 8
            fi

            if [ -e "${REFE_DIR}/${file}.nc" ]; then
                ## UNIX `cmp` not suitable (filename & timestamp in .nc file)
                # ${CDO} is left unquoted in case it carries options
                diff_rcd=$( ${CDO} diffn "${file}.nc" "${REFE_DIR}/${file}.nc" 2> /dev/null \
                            | awk '/records/ {print $0}' | sed 's/differ$/differ,/' | tr -d '\n' )
                # First field of the summary is the number of differing records
                nb_rcd=$( printf '%s\n' "${diff_rcd}" | awk '{print $1}' )

                if [[ -n ${diff_rcd} && ${nb_rcd} -ne 0 ]]; then
                    export ST='FAILED'
                    files_list+="${file} "
                    dif=$(( dif + nb_rcd ))
                    echo "${file}.nc: ${diff_rcd}"
                else
                    echo 'identical'
                fi

            else
                export ST='FAILED' && get_out 7
            fi

        done

        [ -n "${files_list}" ] && echo "Restarts: ${files_list}${dif} record(s) differ<br>" >> "temp_${FILE_COMM}"
    else
        # No restart file found for the reference time step
        export ST='FAILED'
    fi

}
206
## Evaluate the ${JOB_TIME} command line and record its output.
## Globals read: JOB_TIME (shell command line, run through eval), FILE_CPUT
## Outputs     : the result on stdout and appended to FILE_CPUT.
get_cpu_time() {
    local real_cpu_time

    # Quoted so eval receives the command line verbatim; unquoted, the shell
    # re-splits it first and collapses blanks inside its quoted arguments
    real_cpu_time=$( eval "${JOB_TIME}" )

    # Unquoted on purpose: folds the output onto a single line
    echo ${real_cpu_time} | tee -a "${FILE_CPUT}"
}
212
## Extract the first block of ocean.output matching a keyword and record it
## as a comment.
##   $1: keyword. 'E R R O R' is searched anywhere in a line (4 lines of
##       context, and TIME_STEP is read from time.step); any other keyword
##       must follow one leading blank (2 lines of context).
## Globals read   : FILE_COMM
## Globals written: TIME_STEP (exported, 0 by default), line
## Outputs        : the block, blanks squeezed, on stdout; the raw block
##                  followed by '<br>' appended to temp_${FILE_COMM}.
comments() {
    local state=$1
    local IFS=$' \t\n'
    local -a words
    export TIME_STEP=0

    # Reset so a previous call cannot leak its text when ocean.output is absent
    line=''

    if [ "${state}" == 'E R R O R' ]; then
        [ -e time.step ]    && export TIME_STEP=$( tr -d ' ' < time.step )
        [ -e ocean.output ] && line=$( grep -m1 -A4 -e "${state}"   ocean.output | tr -d '\n' )
    else
        [ -e ocean.output ] && line=$( grep -m1 -A2 -e "^ ${state}" ocean.output | tr -d '\n' )
    fi

    # Squeeze blanks for the terminal without letting the shell glob the text
    read -r -a words <<< "${line}"
    printf '%s\n' "${words[*]}"

    # The text is data, never the printf format ('%' may appear in it)
    printf '%s<br>' "${line}" >> "temp_${FILE_COMM}"
}
227
## Build the trusting summary from the messenger files.
## Globals read: FILE_COMM, FILE_TRUS
## Outputs     : the collected comments (newlines and final '<br>' removed)
##               appended to FILE_COMM; all mesg_*.txt files of the current
##               directory joined column-wise with ';', on stdout and in
##               FILE_TRUS.
mesg_make() {
    ## Format comments for web
    [ -e "temp_${FILE_COMM}" ] \
        && tr -d '\n' < "temp_${FILE_COMM}" | sed 's/<br>$//' >> "${FILE_COMM}"

    paste -d ';' mesg_*.txt | tee "${FILE_TRUS}"
}
234
## Publish the trusting summary and, on failure, notify by mail.
## Globals read: PUBLISH (1 to publish), REFE_DIR, PATTERNAME, FILE_TRUS,
##               FILE_ARCH, EMAIL, ST, ERR, USER, REFE_CONF, TEST_DIR,
##               NEMO_HPCC, NEMO_BRAN
## Outputs     : ${REFE_DIR}/trusting_${PATTERNAME}.txt receives the whole
##               summary when it is created, only its last line afterwards;
##               trusting.mail is written in the current directory and sent
##               when EMAIL is set and ST is 'FAILED'.
mesg_publish() {
    local summary

    if [ "${PUBLISH:-0}" -eq 1 ]; then

        summary="${REFE_DIR}/trusting_${PATTERNAME}.txt"

        # Header + result for a new file, result line only otherwise
        if [ -f "${summary}" ]; then
            tail -n 1 "${FILE_TRUS}" >> "${summary}"
        else
            cat "${FILE_TRUS}"       >> "${summary}"
        fi

        ## Send mail only when FAILED
        if [[ -n ${EMAIL} && "${ST}" == 'FAILED' ]]; then
            cat << END_MAIL > trusting.mail
XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX

Dear $USER,

The trusting sequence for ${REFE_CONF} has failed.
Directory: ${TEST_DIR}
Archive created: ${FILE_ARCH} in ${REFE_DIR}

XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX

END_MAIL
            [ -e "${TEST_DIR}/${FILE_TRUS}" ] && cat "${TEST_DIR}/${FILE_TRUS}" >> trusting.mail
            # ${EMAIL} stays unquoted: it may list several recipients — TODO confirm
            mail -s "[NEMO Trusting ${NEMO_HPCC} ${REFE_CONF} ${NEMO_BRAN}] ${ST} ${ERR}" ${EMAIL} < trusting.mail
        fi

    fi
}
264
## Finalise the trusting sequence and leave the script.
##   $1: error code (1-8), translated to a message when ST is 'FAILED';
##       otherwise it is recorded as given.
## Globals read   : ST, TEST_DIR, TIME_STEP, TIME_LIMI, FILE_STAT, FILE_RESU,
##                  PUBLISH, DEBUG, REFE_DIR, FILE_ARCH, NEMO_CONF, TEST_CONF
## Globals written: ERR (exported when ST is 'FAILED')
## Outputs        : line 2 of FILE_STAT and FILE_RESU replaced by the status
##                  and the message; an archive of the test directory under
##                  REFE_DIR on failure when publishing outside debug mode.
## Calls mesg_make and mesg_publish, then exits with status 0. It exits
## with status 1 if TEST_DIR cannot be entered.
get_out() {
    local st_esc err_esc

    ERR=$1

    cd "${TEST_DIR}" || { printf 'get_out: cannot cd to %s\n' "${TEST_DIR}" >&2; exit 1; }

    if [ "${ST}" == 'FAILED' ]; then

        ## Error identification
        case ${ERR} in
            ## Compilation
            1) ERR='XIOS compilation failed'               ;;
            2) ERR='NEMO compilation failed'               ;;
            ## Submission
            3) ERR='Missing input files'                   ;;
            4) ERR='Job submission error'                  ;;
            ## Running
            5) ERR='Crashed at time step '${TIME_STEP}     ;;
            6) ERR='Exceeded time limit '${TIME_LIMI}'h'   ;;
            ## Results
            7) ERR='Missing previous outputs'              ;;
            8) ERR='New outputs differ'                    ;;
            ## Undefined
            *) ERR='Unknown error'                         ;;
        esac

        export ERR
    fi

    # Escape what is special in a sed replacement (\, / and &) so that any
    # status or message text is written verbatim
    st_esc=$(  printf '%s' "${ST}"  | sed 's|[\\/&]|\\&|g' )
    err_esc=$( printf '%s' "${ERR}" | sed 's|[\\/&]|\\&|g' )
    sed -i "2 s/.*/${st_esc}/" "${FILE_STAT}" && sed -i "2 s/.*/${err_esc}/" "${FILE_RESU}"

    ## Save tested configuration if trusting failed
    if [[ "${ST}" == 'FAILED' && ${PUBLISH} -eq 1 && ${DEBUG} -eq 0 ]]; then
        echo "Creating archive ${FILE_ARCH} under ${REFE_DIR}"
        tar -czf "${REFE_DIR}/${FILE_ARCH}" * \
            "${TEST_DIR}/${NEMO_CONF}/${TEST_CONF}"/cpp_* \
            "${TEST_DIR}/${NEMO_CONF}/${TEST_CONF}/MY_SRC" \
            "${TEST_DIR}/${NEMO_CONF}/${TEST_CONF}/WORK"
    fi

    mesg_make
    mesg_publish

    exit 0
}
Note: See TracBrowser for help on using the repository browser.