Changeset 1220 for trunk


Ignore:
Timestamp:
08/25/15 16:46:24 (9 years ago)
Author:
sdipsl
Message:
  • Any post-processing errors will stop the computing jobs when SpaceName=PROD. See #260
  • This feature was removed some years ago because post-processing errors were legion. Post-processing is more robust now.
Location:
trunk/libIGCM
Files:
2 edited

Legend:

Unmodified
Added
Removed
  • trunk/libIGCM/libIGCM_config/libIGCM_config.ksh

    r1214 r1220  
    311311    fi 
    312312 
    313     #Test state of run in run.card 
    314     IGCM_card_DefineVariableFromOption ${SUBMIT_DIR}/run.card Configuration PeriodState 
    315  
    316     if ( [ ${run_Configuration_PeriodState} != "Start" ] && [ ${run_Configuration_PeriodState} != "Running" ] && [ ${run_Configuration_PeriodState} != "OnQueue" ] && [ ${run_Configuration_PeriodState} != "Continue" ] ) ; then 
    317       echo 
    318       IGCM_debug_Print 1 "!! Error in run.card with PeriodState : " ${run_Configuration_PeriodState} "!!" 
    319       IGCM_debug_Print 1 "Check post-processing jobs carefully by running ${libIGCM}/RunChecker.job -p ${SUBMIT_DIR}" 
    320       IGCM_debug_Print 1 "Then try running ${libIGCM}/clean_month.job to rerun one period" 
    321       IGCM_debug_Print 1 "Then try running ${libIGCM}/clean_year.job to rerun more." 
    322       IGCM_debug_Exit 
    323       IGCM_debug_Verif_Exit 
    324     fi 
     313    # Test state of run in run.card. Will schedule an exit if another process setted it to "Fatal" 
     314    IGCM_config_StateCheck 
     315 
     316    # And EXIT if not OK 
     317    IGCM_debug_Verif_Exit 
    325318  fi 
    326319 
     
    455448} 
    456449 
     450#=================================== 
     451function IGCM_config_StateCheck 
     452{ 
     453  IGCM_debug_PushStack "IGCM_config_StateCheck" 
     454 
     455    #Test state of run in run.card 
     456    IGCM_card_DefineVariableFromOption ${SUBMIT_DIR}/run.card Configuration PeriodState 
     457 
     458    if [ ${run_Configuration_PeriodState} = "Fatal" ] ; then 
     459      echo 
     460      IGCM_debug_Print 1 "!! Error in run.card with PeriodState : " ${run_Configuration_PeriodState} "!!" 
     461      IGCM_debug_Print 1 "Check post-processing jobs carefully by running ${libIGCM}/RunChecker.job -p ${SUBMIT_DIR}" 
     462      IGCM_debug_Print 1 "Then try running ${libIGCM}/clean_month.job to rerun one period" 
     463      IGCM_debug_Print 1 "Then try running ${libIGCM}/clean_year.job to rerun more." 
     464      IGCM_debug_Exit 
     465    fi 
     466 
     467  IGCM_debug_PopStack "IGCM_config_StateCheck" 
     468} 
    457469 
    458470#=================================== 
     
    598610    #================================================# 
    599611 
    600     #Test state of run in run.card 
    601     IGCM_card_DefineVariableFromOption ${SUBMIT_DIR}/run.card Configuration PeriodState 
    602     if ( [ ${run_Configuration_PeriodState} != "Running" ] && [ ${run_Configuration_PeriodState} != "OnQueue" ] && [ ${run_Configuration_PeriodState} != "Continue" ] ) ; then 
    603       echo 
    604       IGCM_debug_Print 1 "!! Error in run.card with PeriodState : " ${run_Configuration_PeriodState} "!!" 
    605       IGCM_debug_Print 1 "Try running ${libIGCM}/clean_month.job to fix this" 
    606       echo 
    607       IGCM_debug_Exit 
    608       IGCM_debug_Verif_Exit 
    609     fi 
     612    # Test state of run in run.card. Will schedule an exit if another process setted it to "Fatal" 
     613    IGCM_config_StateCheck 
     614    # And EXIT if not OK 
     615    IGCM_debug_Verif_Exit 
    610616 
    611617    #===================================# 
     
    659665    IGCM_debug_Verif_Exit 
    660666 
     667    # Test state of run in run.card. Will schedule an exit if another process setted it to "Fatal" 
     668    IGCM_config_StateCheck 
     669    # And EXIT if not OK 
     670    IGCM_debug_Verif_Exit 
     671 
     672    # We can say we are "Running" now. 
    661673    IGCM_card_WriteOption ${SUBMIT_DIR}/run.card Configuration PeriodState "Running" 
    662674  fi 
     
    12501262  echo 
    12511263 
     1264  # Test state of run in run.card. Will schedule an exit if another process setted it to "Fatal" 
     1265  IGCM_config_StateCheck 
     1266 
     1267  # And EXIT if not OK 
     1268  IGCM_debug_Verif_Exit 
     1269 
    12521270  if [ ${SimulationLengthInDays} -ge ${ExperienceLengthInDays} ] ; then 
    12531271    #==========================# 
  • trunk/libIGCM/libIGCM_debug/libIGCM_debug.ksh

    r1216 r1220  
    737737      # If SpaceName is PROD then we stop when post_processing failed 
    738738      if [ X${config_UserChoices_SpaceName} = XPROD ] ; then 
    739         echo "                        EXIT THE JOB." 
     739        echo "                        EXIT THE POST-PROCESSING JOB." 
    740740        echo 
    741741        IGCM_debug_CallStack 
     742 
     743        # Notify the computing job that something wrong happened. 
     744        IGCM_card_WriteOption ${SUBMIT_DIR}/run.card Configuration PeriodState "Fatal" 
    742745 
    743746        # Mail notification? 
Note: See TracChangeset for help on using the changeset viewer.