#PBS -N hmon%NUM%_hycom_post_%CYC%
#PBS -j oe
#PBS -S /bin/bash
#PBS -q %QUEUE%
#PBS -A %PROJ%-%PROJENVIR%
#PBS -l walltime=02:40:00
#PBS -l place=shared,select=1:ncpus=24:mpiprocs=24:mem=8GB
#PBS -l debug=true

# Batch wrapper for the HMON HYCOM post job (ocean component post-processing
# for coupled runs, per the manual section at the bottom of this file).
# It sets the cycle, date and storm-number environment from suite variables,
# loads the required modules, and then runs the JHMON_HYCOM_POST J-job.

# Trace every command into the job log.
set -x

model=hmon
export cyc=%CYC%
export PDY=%PDY:""%

# Task count = number of lines in the scheduler-provided node file.
# The :? guard makes the expansion fail loudly when PBS_NODEFILE is unset.
export TOTAL_TASKS=$(wc -l "${PBS_NODEFILE:?}" | cut -f 1 -d " ")

# NOTE(review): the two include directives below carry no target in this copy
# of the file; the header names appear to have been lost. Restore them from
# the suite's include directory before deploying.
%include
%include

export storm_num="%NUM%"

# Module versions are not defined in this file; presumably they come from one
# of the included headers or a version file -- TODO confirm.
module load "PrgEnv-intel/${PrgEnv_intel_ver}"
module load "intel/${intel_ver}"
module load "craype/${craype_ver}"
module load "cray-mpich/${cray_mpich_ver}"
module load "cray-pals/${cray_pals_ver}"
#module load atp/${atp_ver}
module load "hdf5/${hdf5_ver}"
module load "netcdf/${netcdf_ver}"
module load "cfp/${cfp_ver}"
module load "python/${python_ver}"

# Hand off to the J-job, which does the actual post-processing work.
"${HOMEhmon}/jobs/JHMON_HYCOM_POST"

# NOTE(review): this include directive is also missing its target header.
%include

%manual
PURPOSE:
  Ocean component post-processing for coupled runs.

TROUBLESHOOTING

Most failures of this job fall in three categories:
 - model failed
 - operator error
 - system issues

If this job failed, check the model first.  If the model is stuck or
failed, that is why this job failed.

What do I mean by "operator error?"

 * ALWAYS KILL AND REQUEUE THE fcst FAMILY AND post FAMILY to rerun the
   forecast model.  Never, under ANY circumstances, rerun just the model!
%end