New URL for NEMO forge!   http://forge.nemo-ocean.eu

Since March 2022, along with the NEMO 4.2 release, code development has moved to a self-hosted GitLab.
This forge is now archived and remains online for historical reference.
trusting_func.sh in branches/2015/dev_r5092_CNRS_SETTE/NEMOGCM/TRUST – NEMO

source: branches/2015/dev_r5092_CNRS_SETTE/NEMOGCM/TRUST/trusting_func.sh @ 5644

Last change on this file since 5644 was 5644, checked in by nicolasmartin, 9 years ago

dev_r5092_CNRS_SETTE Wide modifications on trusting_func.sh for clearness & other significant changes on different names

  • Property eol-style set to native
  • Property svn:executable set to *
  • Property svn:keywords set to Author Date Id Rev URL
File size: 9.2 KB
Line 
1#!/bin/bash
2
3
## Messenger filenames: one text file per reported field. The numeric part of
## each name fixes the order in which the `mesg_*.txt` glob lists them.
FILE_DATE="mesg_01_date_${PATTERNAME}.txt"
FILE_STAT="mesg_02_status_${PATTERNAME}.txt"
FILE_RESU="mesg_03_result_${PATTERNAME}.txt"
FILE_NEMO="mesg_04_nemogcm_${PATTERNAME}.txt"
FILE_XIOS="mesg_05_xios_${PATTERNAME}.txt"
FILE_COMP="mesg_06_compiler_${PATTERNAME}.txt"
FILE_MPIN="mesg_07_mpi_${PATTERNAME}.txt"
FILE_NCDF="mesg_08_netcdf_${PATTERNAME}.txt"
FILE_INPT="mesg_09_inputs_${PATTERNAME}.txt"
FILE_CPUT="mesg_10_cputime_${PATTERNAME}.txt"
FILE_COMM="mesg_11_comments_${PATTERNAME}.txt"

## Names of the assembled report and of the archive for this run
FILE_TRUS="trusting_${DATE}_${PATTERNAME}.txt"
FILE_ARCH="trusting_${DATE}_${PATTERNAME}.tar.gz"
14
## Print a step banner followed by a message on stdout.
##   $1: message text. Backslash escapes (e.g. \n) are still interpreted, but
##       the text is no longer used as the printf format, so a literal '%'
##       is printed as-is instead of being parsed as a conversion.
print_step() { printf '\nStep.....\n%b\n' "$1"; }
16
## (Re)create every messenger file with its column title as the only line.
## Globals read: FILE_DATE FILE_STAT FILE_RESU FILE_NEMO FILE_XIOS FILE_COMP
##               FILE_MPIN FILE_NCDF FILE_INPT FILE_CPUT FILE_COMM
## Any previous content of these files is truncated.
init_files() {
    ## Targets are quoted so that a name containing whitespace does not end
    ## in an "ambiguous redirect" error.
    echo 'Date'             > "${FILE_DATE}"
    echo 'Status'           > "${FILE_STAT}"
    echo 'Result'           > "${FILE_RESU}"
    echo 'NEMOGCM rev.'     > "${FILE_NEMO}"
    echo 'XIOS rev.'        > "${FILE_XIOS}"
    echo 'Fortran compiler' > "${FILE_COMP}"
    echo 'MPI libs'         > "${FILE_MPIN}"
    echo 'NetCDF libs'      > "${FILE_NCDF}"
    echo 'Input files'      > "${FILE_INPT}"
    echo 'Real CPU time'    > "${FILE_CPUT}"
    echo 'Comments'         > "${FILE_COMM}"
}
25
## Append the run date, reformatted as "YYYY-MM-DD HH:MM TZ" in UTC, to the
## date messenger file.
## Globals read: DATE (any string accepted by `date -d`), FILE_DATE
## If `date` rejects ${DATE}, an empty line is appended so that the file
## still gets one row for this run.
get_date() {
    local dat

    ## ${DATE} is quoted: a value such as "2015-06-01 12:30" must reach
    ## `date` as a single argument.
    dat=$( date -ud "${DATE}" +"%F %R %Z" )

    echo "$dat" >> "${FILE_DATE}"
}
31
## Run `svn status` (default) or `svn update -r <rev>` on every NEMO source
## directory, then record the highest revision found plus the XIOS revision.
## Globals read: NEMO_VERS (HEAD|up|update, a '{YYYY-MM-DD}' date or a number),
##               NEMO_ARCH NEMO_CONF NEMO_ENGI NEMO_EIOI NEMO_EFCM NEMO_TCMP
##               NEMO_TRBD DIR_XIOS, FILE_XIOS FILE_NEMO
## Outputs: svn output on stdout; 'XIOS <rev>' and 'NEMOGCM <rev>' appended to
##          model.log; HTML changeset links appended to FILE_XIOS / FILE_NEMO.
get_nemo_rev() {
    local dir rev_loc
    local rev=0
    local re_date='\{[0-9]{4}-[0-9]{2}-[0-9]{2}\}'
    local re_numb='[0-9]+'
    ## Kept as an array so the command is run without re-splitting a string
    local -a svn_cmd=( svn status )

    ## If -v|--version option has been set, modify svn command
    if   [[ ${NEMO_VERS} =~ HEAD|up|update ]]; then
        svn_cmd=( svn update -r HEAD )
    elif [[ ${NEMO_VERS} =~ ${re_date} ]]; then
        svn_cmd=( svn update -r "${BASH_REMATCH[0]}" )
    elif [[ ${NEMO_VERS} =~ ${re_numb} ]]; then
        svn_cmd=( svn update -r "${BASH_REMATCH[0]}" )
    fi

    ## The list is left unquoted on purpose: an empty variable is skipped
    for dir in ${NEMO_ARCH} ${NEMO_CONF} ${NEMO_ENGI} \
               ${NEMO_EIOI} ${NEMO_EFCM}              \
               ${NEMO_TCMP} ${NEMO_TRBD}              \
               ${DIR_XIOS}                            ; do

        ## NOTE(review): the revision is read as the last field of line 9 of
        ## `svn info`; that layout may depend on the svn client version.
        rev_loc=$( svn info "$dir" | awk '(NR == 9) {print $NF}' )

        ## For time being, just get revision number from XIOS
        if [ "$dir" == "${DIR_XIOS}" ]; then
            echo 'XIOS '${rev_loc} >> model.log
            echo "<a href=\"https://forge.ipsl.jussieu.fr/ioserver/changeset/${rev_loc}\" target=\"_blank\">${rev_loc}</a>" \
                >> "${FILE_XIOS}"
            continue
        fi

        echo $dir
        "${svn_cmd[@]}" "$dir"

        ## Keep the highest revision; a missing or non-numeric value is
        ## ignored instead of raising an arithmetic syntax error.
        if [[ ${rev_loc} =~ ^[0-9]+$ ]] && (( 10#${rev_loc} >= rev )); then
            rev=${rev_loc}
        fi
    done

    echo 'NEMOGCM '$rev   >> model.log
    echo "<a href=\"https://forge.ipsl.jussieu.fr/nemo/changeset/$rev\" target=\"_blank\">$rev</a>" \
        >> "${FILE_NEMO}"
}
71
## Work out the release of CDO, the Fortran compiler, MPI and NetCDF, append
## one '<name> <release>' line per tool to model.log, then copy the compiler,
## MPI and NetCDF lines to their messenger files.
## Globals read: CDO COMPILER MPI NETCDF (names usable inside a sed pattern),
##               I_MODULE LOADEDMODULES PATH, FILE_COMP FILE_MPIN FILE_NCDF
## Lines 4-6 of model.log are used, i.e. the two revision lines written by
## get_nemo_rev and the CDO line are expected to come first.
get_soft_rel() {
    local soft soft_rel

    ## Unquoted on purpose: an empty variable produces no entry
    for soft in $CDO $COMPILER $MPI $NETCDF; do
        soft_rel=''
        ## First look in the loaded modules, then fall back on $PATH
        (( I_MODULE == 1 ))        && soft_rel=$( echo "$LOADEDMODULES" | sed "s/.*$soft\/\([0-9.a-z_]*\).*/\1/i" )
        [    -z "${soft_rel}"    ] && soft_rel=$( echo "$PATH"          | sed "s/.*$soft\([0-9.a-z_]*\).*/\1/i"   )
        ## The compiler is asked directly for its version
        [ "$soft" == "$COMPILER" ] && soft_rel=$( $soft --version       | grep -m1 -oe '\<[0-9. ]*\>'             )
        ## Cleaning characters string to display proper soft name
        soft=$( printf '%s\n' "$soft" | sed 's#\\##g; s#[/-]$##' )
        ## Unquoted on purpose: squeezes repeated blanks in the release string
        echo $soft ${soft_rel} >> model.log
    done

    ## Append (not overwrite) so the column title written by init_files is
    ## kept, as done by the other functions feeding the messenger files.
    sed -n 4p model.log >> "${FILE_COMP}"
    sed -n 5p model.log >> "${FILE_MPIN}"
    sed -n 6p model.log >> "${FILE_NCDF}"
}
87
## List the input files into inputs_list.txt, then bring them into the
## current directory.
## Globals read: NEMO_FORC (directory), NEMO_TARF (tar file name, may be empty)
##   - NEMO_TARF set  : list, then extract ${NEMO_FORC}/${NEMO_TARF}
##   - NEMO_TARF empty: list, then copy every entry of ${NEMO_FORC}
## The second step only runs if the listing succeeded; the status of the
## last command run is returned.
get_inputs() {
    if [ -z "${NEMO_TARF}" ]; then
        ## `\cp` bypasses a possible `cp -i` alias
        ls "${NEMO_FORC}"/* > inputs_list.txt && \cp "${NEMO_FORC}"/* . > /dev/null
    else
        tar -tvf "${NEMO_FORC}/${NEMO_TARF}" > inputs_list.txt \
            && tar -vxf "${NEMO_FORC}/${NEMO_TARF}" > /dev/null
    fi
}
94
## Compare inputs_list.txt, the namelist_* files and the *.xml files of the
## current directory with their counterparts in the reference directory.
## Globals read: REFE_DIR, FILE_COMM, FILE_INPT
## Outputs: 'Same' or 'Different' on stdout and appended to FILE_INPT; each
##          `diff -q` message is printed and appended to FILE_COMM.
## A file without reference counterpart counts as 'Different' (no comment).
diff_inputs() {
    local file dif
    local mesg='Same'

    ## Globs replace the former `ls` parsing so names with blanks stay whole
    for file in inputs_list.txt namelist_* *.xml; do
        ## A pattern without any match is left as-is by the shell: skip it
        [[ $file == inputs_list.txt || -e $file || -L $file ]] || continue

        if [ -e "${REFE_DIR}/$file" ]; then
            dif=$( diff -q "$file" "${REFE_DIR}/$file" )
        else
            ## '0' flags a missing reference file
            dif=0
        fi

        if [ -n "$dif" ]; then
            mesg='Different'
            [ "$dif" != '0' ] && printf '%s\n' "$dif" | tee -a "${FILE_COMM}"
        fi
    done

    echo $mesg | tee -a "${FILE_INPT}"
}
107
## Wait for the submitted job to leave the scheduler list, polling every 30 s
## and logging the job information to computation.log at each poll.
## Globals read: JOB_LIST JOB_INFO JOB_DELE (commands, may carry options),
##               JOB_ID, TIME_LIMI (limit in seconds)
## Globals set : TIME_LIMIT (limit in whole hours) when the limit is reached
## When the elapsed time reaches the limit, the job is deleted and
## `get_out 6` is called.
job_pending() {
    local time_elapsed=0 time_increment=30

    sleep ${time_increment}

    ## Command variables are left unquoted so their options are split
    while [[ -n $( ${JOB_LIST} | grep "${JOB_ID}" ) && ${time_elapsed} -lt ${TIME_LIMI} ]]; do
        printf "\n####################################################\n" >> computation.log
        ${JOB_INFO} "${JOB_ID}"                                           >> computation.log
        sleep ${time_increment}
        time_elapsed=$(( time_elapsed + time_increment ))
    done

    sleep ${time_increment}

    ## '-ge' rather than '-eq': the counter moves by steps of 30 s and jumps
    ## over a limit that is not a multiple of the increment.
    if [ "${time_elapsed}" -ge "${TIME_LIMI}" ]; then
        ${JOB_DELE} "${JOB_ID}" &> /dev/null
        TIME_LIMIT=$(( TIME_LIMI / 3600 ))
#       export TIME_LIMIT
        get_out 6
    fi
}
129
## Compare ocean.output and every *.stat file of the current directory with
## the reference ones.
## Globals read: REFE_DIR, FILE_COMM
## Globals set : ST is exported as 'FAILED' when a file differs or cannot be
##               compared; `get_out 7` is called when a reference is missing.
## Outputs: `diff -q` messages on stdout and appended to FILE_COMM.
diff_results() {
    local file

    for file in ocean.output *.stat; do
        ## A pattern without any match is left as-is by the shell: skip it
        [[ $file == ocean.output || -e $file || -L $file ]] || continue

        if [ ! -e "${REFE_DIR}/$file" ]; then
            export ST='FAILED'
            get_out 7
        fi

        diff -q "$file" "${REFE_DIR}/$file" | tee -a "${FILE_COMM}"
        ## $? would be the status of `tee`; the one of `diff` is needed
        if (( PIPESTATUS[0] != 0 )); then
            export ST='FAILED'
        fi
    done
}
137
## Compare the restart files of the last time step (ocean, ice, tracers)
## with the reference ones, rebuilding them first when split per domain.
## Globals read: REFE_DIR, NEMO_TRBD (location of rebuild_nemo), NPROC,
##               CDO (command run as `$CDO diffn`)
## Globals set : LAST_TIME_STEP (content of ${REFE_DIR}/time.step without
##               blanks); ST exported as 'FAILED' on any mismatch
## Exits through get_out: 9 (reference time.step or restart missing),
##                        10 (no new restart file found for a component)
## Outputs: one '<file>.nc: identical' or '<file>.nc: <CDO> <records line>'
##          line per component on stdout.
diff_restart() {
    local base_name comp file nb_dom diff_rcd first_rst

    if [ ! -e "${REFE_DIR}/time.step" ]; then
        export ST='FAILED'
        get_out 9
    fi

    ## The character class is quoted: unquoted, [:space:] is a glob that a
    ## file named e.g. 'a' or 's' in the current directory would replace.
#    export LAST_TIME_STEP=$( cat ${REFE_DIR}/time.step | tr -d [:space:] )
    LAST_TIME_STEP=$( tr -d '[:space:]' < "${REFE_DIR}/time.step" )
    echo 'Last time step of standard run: '${LAST_TIME_STEP}

    ## First restart file found for the last time step, whatever the component
    first_rst=$( find . -regex ".*_0+${LAST_TIME_STEP}_restart.*\.nc" -print -quit )

    if [ -n "${first_rst}" ]; then
        ## Keep the file name up to and including '<last time step>_'
        base_name=$( printf '%s\n' "${first_rst}" | awk -F/ '{print $NF}' \
                     | sed "s/^\(.*\)${LAST_TIME_STEP}_restart.*/\1${LAST_TIME_STEP}_/" )

        for comp in restart restart_ice restart_trc; do
            file=${base_name}${comp}
            printf '%s.nc: ' "$file"

            ## Number of per-domain files '<file>_<digits>.nc'
            nb_dom=$( find . -name "${file}_[0-9]*.nc" | wc -l | awk '{print $1}' )
            if   [ "${nb_dom}" -gt 1 ]; then
                ## Per-domain files are removed only if the rebuild succeeded
                if "${NEMO_TRBD}/rebuild_nemo" -t $NPROC "$file" "${nb_dom}" > /dev/null; then
                    rm -f "${base_name}${comp}"_[0-9]*.nc > /dev/null
                fi
            elif [ "${nb_dom}" -eq 0 ]; then
                export ST='FAILED' && get_out 10
            fi

            if [ -e "${REFE_DIR}/$file.nc" ]; then
                ## UNIX `cmp` not suitable (filename & timestamp in .nc file)
                diff_rcd=$( $CDO diffn "$file.nc" "${REFE_DIR}/$file.nc" 2> /dev/null \
                            | awk '/records/ {print $0}'                              )

                ## First field of the 'records' line: number of differing records.
                ## ${diff_rcd} is unquoted on purpose to flatten it to one line.
                if [[ -n ${diff_rcd} && $( echo ${diff_rcd} | awk '{print $1}' ) -ne 0 ]]; then
                    export ST='FAILED'
                    echo $CDO $( echo ${diff_rcd} | sed 's/differ$/differ,/' | tr -d '\n' )
                else
                    echo 'identical'
                fi

            else
                export ST='FAILED' && get_out 9
            fi

        done

    else
        export ST='FAILED'
    fi

}
190
## Evaluate the site-specific command giving the real CPU time of the job,
## print its result and append it to the CPU time messenger file.
## Globals read: JOB_TIME (shell command line, run through `eval`), FILE_CPUT
## NOTE(review): `eval` runs whatever JOB_TIME holds; it must only come from
## trusted configuration.
get_cpu_time() {
    local real_cpu_time

    ## Quoted so that blanks inside the quoted arguments of the command
    ## (e.g. an awk pattern) reach `eval` untouched.
    real_cpu_time=$( eval "${JOB_TIME}" )

    ## Unquoted on purpose: a multi-line result is flattened to a single row
    echo ${real_cpu_time} | tee -a "${FILE_CPUT}"
}
196
## Extract from ocean.output the first message matching a given state and
## print it on a single line.
##   $1: state searched for; 'E R R O R' is handled specially, any other
##       value is searched at the start of a line after one blank
## Globals read: FILE_COMM
## Globals set : LAST_TIME_STEP (content of time.step without blanks), only
##               for the 'E R R O R' state and if time.step exists
## For 'E R R O R' the message is also appended to FILE_COMM.
## An empty line is printed when ocean.output is missing.
comments() {
    local state=$1
    ## Local and reset: a value left by a previous call must not be reported
    local line=''

    if [ "$state" == 'E R R O R' ]; then
        [ -e time.step ] && LAST_TIME_STEP=$( tr -d ' ' < time.step )
#       export LAST_TIME_STEP
        [ -e ocean.output ] && line=$( grep -m1 -A4 -e "$state"   ocean.output | tr -d '\n' )
        echo $line >> "${FILE_COMM}"
    else
        [ -e ocean.output ] && line=$( grep -m1 -A2 -e "^ $state" ocean.output | tr -d '\n' )
    fi

    ## Unquoted on purpose: squeezes the blanks left by the joined lines
    echo $line
}
211
## Assemble the messenger files side by side, one ';'-separated column per
## file, into the trusting report and print the result.
## Globals read: FILE_TRUS
## Inputs: every mesg_*.txt file of the current directory, in glob order.
mesg_make() {
    ## Target quoted: a report name with blanks must not break the redirect
    paste -d ';' mesg_*.txt > "${FILE_TRUS}"
    cat                       "${FILE_TRUS}"
}
216
## Publish the trusting report when PUBLISH equals 1: append it to the
## history file of the reference directory and, on failure, mail it.
## Globals read: PUBLISH, REFE_DIR, PATTERNAME, FILE_TRUS, EMAIL, ST, ERR,
##               USER, REFE_CONF, TEST_DIR, FILE_ARCH, BRANCH
## History file: ${REFE_DIR}/trusting_${PATTERNAME}.txt. If it already exists
## only the last line of the report is appended, else the whole report.
## A mail (body written to ./trusting.mail) is sent only if EMAIL is not
## empty and ST is 'FAILED'.
mesg_publish() {
    local hist_file="${REFE_DIR}/trusting_${PATTERNAME}.txt"

    ## An unset or empty PUBLISH counts as 0 instead of raising a test error
    if [[ ${PUBLISH:-0} -eq 1 ]]; then

        if [ -f "${hist_file}" ]; then
            tail -n 1 "${FILE_TRUS}" >> "${hist_file}"
        else
            cat       "${FILE_TRUS}" >> "${hist_file}"
        fi

        ## Send mail only when FAILED
        if [[ -n $EMAIL && "$ST" == 'FAILED' ]]; then
            cat << END_MAIL > trusting.mail
XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX

Dear $USER,

The trusting sequence for ${REFE_CONF} has failed.
Directory: ${TEST_DIR}
Archive created: ${FILE_ARCH} in ${REFE_DIR}

XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX

END_MAIL
            [ -e "${TEST_DIR}/${FILE_TRUS}" ] && cat "${TEST_DIR}/${FILE_TRUS}" >> trusting.mail
            ## $EMAIL is unquoted on purpose: it may hold several addresses
            mail -s "[trusting ${REFE_CONF} $BRANCH] $ST $ERR" $EMAIL < trusting.mail
        fi

    fi
}
246
## Close the trusting sequence: record status and result, archive the tested
## configuration on failure, build and publish the report, then exit.
##   $1: error code (1-10) when ST is 'FAILED', translated to a message;
##       otherwise the value is written unchanged as the result
## Globals read: TEST_DIR, ST, FILE_STAT, FILE_RESU, LAST_TIME_STEP,
##               TIME_LIMIT / TIME_LIMI, DEBUG, REFE_DIR, FILE_ARCH
## Globals set : ERR (exported when ST is 'FAILED')
## Always terminates the shell with status 0.
get_out() {
    ERR=$1

    cd "${TEST_DIR}"
    echo "$ST" >> "${FILE_STAT}"

    if [ "$ST" == 'FAILED' ]; then

        ## Error identification
        case $ERR in
            ## Compilation
            1)  ERR='XIOS compilation failed'                ;;
            2)  ERR='NEMO compilation failed'                ;;
            ## Submission
            3)  ERR='Missing input files'                    ;;
            4)  ERR='Job submission error'                   ;;
            ## Running
            5)  ERR='Crashed at time step '${LAST_TIME_STEP} ;;
            ## The limit is reported in hours: TIME_LIMIT when job_pending
            ## has set it, else TIME_LIMI (seconds) converted here.
            6)  ERR='Exceeded time limit '${TIME_LIMIT:-$(( ${TIME_LIMI:-0} / 3600 ))}'h' ;;
            ## Results
            7)  ERR='Missing previous outputs '              ;;
            8)  ERR='New outputs  differ/missing'            ;;
            9)  ERR='Missing previous restarts'              ;;
            10) ERR='New restarts differ/missing'            ;;
            ## Undefined
            *)  ERR='Unknown error'                          ;;
        esac

        export ERR
    fi

    ## Unquoted on purpose: squeezes the padding blanks of the messages
    echo $ERR >> "${FILE_RESU}"

    ## Save tested configuration if trusting failed
    if [[ "$ST" == 'FAILED' && $DEBUG -eq 0 ]]; then
        echo 'Creating archive '${FILE_ARCH}' under '${REFE_DIR}
        tar -czf "${REFE_DIR}/${FILE_ARCH}" ../*
    fi

    mesg_make
    mesg_publish

    exit 0
}
Note: See TracBrowser for help on using the repository browser.