From e1d6d3c19cfb40a27a63dfe6f29a2c583b05befb Mon Sep 17 00:00:00 2001 From: Parallel Works app-run user Date: Thu, 3 Nov 2022 21:21:18 +0000 Subject: [PATCH 1/6] update vx maxtries --- ush/config_defaults.yaml | 52 ++++++++++++++++++++-------------------- 1 file changed, 26 insertions(+), 26 deletions(-) diff --git a/ush/config_defaults.yaml b/ush/config_defaults.yaml index 56806fdb06..57236e06ed 100644 --- a/ush/config_defaults.yaml +++ b/ush/config_defaults.yaml @@ -658,7 +658,7 @@ workflow: VX_TN: "run_vx" VX_ENSGRID_TN: "run_ensgridvx" VX_ENSGRID_PROB_REFC_TN: "run_ensgridvx_prob_refc" - MAXTRIES_VX_ENSGRID_PROB_REFC: 1 + MAXTRIES_VX_ENSGRID_PROB_REFC: 2 #---------------------------- # NCO specific variables @@ -1803,7 +1803,7 @@ task_run_vx_gridstat: NNODES_VX_GRIDSTAT: 1 PPN_VX_GRIDSTAT: 1 WTIME_VX_GRIDSTAT: 02:00:00 - MAXTRIES_VX_GRIDSTAT: 1 + MAXTRIES_VX_GRIDSTAT: 2 #---------------------------- # VX_GRIDSTAT_REFC config parameters @@ -1813,7 +1813,7 @@ task_run_vx_gridstat_refc: NNODES_VX_GRIDSTAT: 1 PPN_VX_GRIDSTAT: 1 WTIME_VX_GRIDSTAT: 02:00:00 - MAXTRIES_VX_GRIDSTAT_REFC: 1 + MAXTRIES_VX_GRIDSTAT_REFC: 2 #---------------------------- # VX_GRIDSTAT_RETOP config parameters @@ -1823,7 +1823,7 @@ task_run_vx_gridstat_retop: NNODES_VX_GRIDSTAT: 1 PPN_VX_GRIDSTAT: 1 WTIME_VX_GRIDSTAT: 02:00:00 - MAXTRIES_VX_GRIDSTAT_RETOP: 1 + MAXTRIES_VX_GRIDSTAT_RETOP: 2 #---------------------------- # VX_GRIDSTAT_03h config parameters @@ -1833,7 +1833,7 @@ task_run_vx_gridstat_03h: NNODES_VX_GRIDSTAT: 1 PPN_VX_GRIDSTAT: 1 WTIME_VX_GRIDSTAT: 02:00:00 - MAXTRIES_VX_GRIDSTAT_03h: 1 + MAXTRIES_VX_GRIDSTAT_03h: 2 #---------------------------- # VX_GRIDSTAT_06h config parameters @@ -1843,7 +1843,7 @@ task_run_vx_gridstat_06h: NNODES_VX_GRIDSTAT: 1 PPN_VX_GRIDSTAT: 1 WTIME_VX_GRIDSTAT: 02:00:00 - MAXTRIES_VX_GRIDSTAT_06h: 1 + MAXTRIES_VX_GRIDSTAT_06h: 2 #---------------------------- # VX_GRIDSTAT_24h config parameters @@ -1853,7 +1853,7 @@ task_run_vx_gridstat_24h: NNODES_VX_GRIDSTAT: 1 PPN_VX_GRIDSTAT: 1 WTIME_VX_GRIDSTAT: 02:00:00 - MAXTRIES_VX_GRIDSTAT_24h: 1 + MAXTRIES_VX_GRIDSTAT_24h: 2 #---------------------------- # VX_POINTSTAT config parameters @@ -1863,26 +1863,26 @@ task_run_vx_pointstat: NNODES_VX_POINTSTAT: 1 PPN_VX_POINTSTAT: 1 WTIME_VX_POINTSTAT: 01:00:00 - MAXTRIES_VX_POINTSTAT: 1 + MAXTRIES_VX_POINTSTAT: 2 #---------------------------- # VX_ENSGRID config parameters #----------------------------- task_run_vx_ensgrid: VX_ENSGRID_03h_TN: "run_ensgridvx_03h" - MAXTRIES_VX_ENSGRID_03h: 1 + MAXTRIES_VX_ENSGRID_03h: 2 VX_ENSGRID_06h_TN: "run_ensgridvx_06h" - MAXTRIES_VX_ENSGRID_06h: 1 + MAXTRIES_VX_ENSGRID_06h: 2 VX_ENSGRID_24h_TN: "run_ensgridvx_24h" - MAXTRIES_VX_ENSGRID_24h: 1 + MAXTRIES_VX_ENSGRID_24h: 2 VX_ENSGRID_RETOP_TN: "run_ensgridvx_retop" - MAXTRIES_VX_ENSGRID_RETOP: 1 + MAXTRIES_VX_ENSGRID_RETOP: 2 VX_ENSGRID_PROB_RETOP_TN: "run_ensgridvx_prob_retop" - MAXTRIES_VX_ENSGRID_PROB_RETOP: 1 + MAXTRIES_VX_ENSGRID_PROB_RETOP: 2 NNODES_VX_ENSGRID: 1 PPN_VX_ENSGRID: 1 WTIME_VX_ENSGRID: 01:00:00 - MAXTRIES_VX_ENSGRID: 1 + MAXTRIES_VX_ENSGRID: 2 #---------------------------- @@ -1893,7 +1893,7 @@ task_run_vx_ensgrid_refc: NNODES_VX_ENSGRID: 1 PPN_VX_ENSGRID: 1 WTIME_VX_ENSGRID: 01:00:00 - MAXTRIES_VX_ENSGRID_REFC: 1 + MAXTRIES_VX_ENSGRID_REFC: 2 #---------------------------- # VX_ENSGRID_MEAN config parameters @@ -1903,7 +1903,7 @@ task_run_vx_ensgrid_mean: NNODES_VX_ENSGRID_MEAN: 1 PPN_VX_ENSGRID_MEAN: 1 WTIME_VX_ENSGRID_MEAN: 01:00:00 - MAXTRIES_VX_ENSGRID_MEAN: 1 + MAXTRIES_VX_ENSGRID_MEAN: 2 #---------------------------- # VX_ENSGRID_MEAN_03h config parameters @@ -1913,7 +1913,7 @@ task_run_vx_ensgrid_mean_03h: NNODES_VX_ENSGRID_MEAN: 1 PPN_VX_ENSGRID_MEAN: 1 WTIME_VX_ENSGRID_MEAN: 01:00:00 - MAXTRIES_VX_ENSGRID_MEAN_03h: 1 + MAXTRIES_VX_ENSGRID_MEAN_03h: 2 #---------------------------- # VX_ENSGRID_MEAN_06h config parameters @@ -1923,7 +1923,7 @@ task_run_vx_ensgrid_mean_06h: NNODES_VX_ENSGRID_MEAN: 1 PPN_VX_ENSGRID_MEAN: 1 WTIME_VX_ENSGRID_MEAN: 01:00:00 - MAXTRIES_VX_ENSGRID_MEAN_06h: 1 + MAXTRIES_VX_ENSGRID_MEAN_06h: 2 #---------------------------- # VX_ENSGRID_MEAN_24h config parameters @@ -1933,7 +1933,7 @@ task_run_vx_ensgrid_mean_24h: NNODES_VX_ENSGRID_MEAN: 1 PPN_VX_ENSGRID_MEAN: 1 WTIME_VX_ENSGRID_MEAN: 01:00:00 - MAXTRIES_VX_ENSGRID_MEAN_24h: 1 + MAXTRIES_VX_ENSGRID_MEAN_24h: 2 #---------------------------- # VX_ENSGRID_PROB config parameters @@ -1943,7 +1943,7 @@ task_run_vx_ensgrid_prob: NNODES_VX_ENSGRID_PROB: 1 PPN_VX_ENSGRID_PROB: 1 WTIME_VX_ENSGRID_PROB: 01:00:00 - MAXTRIES_VX_ENSGRID_PROB: 1 + MAXTRIES_VX_ENSGRID_PROB: 2 #---------------------------- # VX_ENSGRID_PROB_03h config parameters @@ -1953,7 +1953,7 @@ task_run_vx_ensgrid_prob_03h: NNODES_VX_ENSGRID_PROB: 1 PPN_VX_ENSGRID_PROB: 1 WTIME_VX_ENSGRID_PROB: 01:00:00 - MAXTRIES_VX_ENSGRID_PROB_03h: 1 + MAXTRIES_VX_ENSGRID_PROB_03h: 2 #---------------------------- # VX_ENSGRID_PROB_06h config parameters @@ -1963,7 +1963,7 @@ task_run_vx_ensgrid_prob_06h: NNODES_VX_ENSGRID_PROB: 1 PPN_VX_ENSGRID_PROB: 1 WTIME_VX_ENSGRID_PROB: 01:00:00 - MAXTRIES_VX_ENSGRID_PROB_06h: 1 + MAXTRIES_VX_ENSGRID_PROB_06h: 2 #---------------------------- # VX_ENSGRID_PROB_24h config parameters @@ -1973,7 +1973,7 @@ task_run_vx_ensgrid_prob_24h: NNODES_VX_ENSGRID_PROB: 1 PPN_VX_ENSGRID_PROB: 1 WTIME_VX_ENSGRID_PROB: 01:00:00 - MAXTRIES_VX_ENSGRID_PROB_24h: 1 + MAXTRIES_VX_ENSGRID_PROB_24h: 2 #---------------------------- # VX_ENSPOINT config parameters @@ -1983,7 +1983,7 @@ task_run_vx_enspoint: NNODES_VX_ENSPOINT: 1 PPN_VX_ENSPOINT: 1 WTIME_VX_ENSPOINT: 01:00:00 - MAXTRIES_VX_ENSPOINT: 1 + MAXTRIES_VX_ENSPOINT: 2 #---------------------------- # VX_ENSPOINT_MEAN config parameters @@ -1993,7 +1993,7 @@ task_run_vx_enspoint_mean: NNODES_VX_ENSPOINT_MEAN: 1 PPN_VX_ENSPOINT_MEAN: 1 WTIME_VX_ENSPOINT_MEAN: 01:00:00 - MAXTRIES_VX_ENSPOINT_MEAN: 1 + MAXTRIES_VX_ENSPOINT_MEAN: 2 #---------------------------- # VX_ENSPOINT_PROB config parameters @@ -2003,7 +2003,7 @@ task_run_vx_enspoint_prob: NNODES_VX_ENSPOINT_PROB: 1 PPN_VX_ENSPOINT_PROB: 1 WTIME_VX_ENSPOINT_PROB: 01:00:00 - MAXTRIES_VX_ENSPOINT_PROB: 1 + MAXTRIES_VX_ENSPOINT_PROB: 2 #---------------------------- From 085618bb826e50e38292812b12ca9b489836573a Mon Sep 17 00:00:00 2001 From: Parallel Works app-run user Date: Thu, 3 Nov 2022 21:21:49 +0000 Subject: [PATCH 2/6] update met/metplus locations --- ush/machine/noaacloud.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/ush/machine/noaacloud.yaml b/ush/machine/noaacloud.yaml index 32246aae54..940b57a622 100644 --- a/ush/machine/noaacloud.yaml +++ b/ush/machine/noaacloud.yaml @@ -5,9 +5,9 @@ platform: CCPA_OBS_DIR: /contrib/EPIC/UFS_SRW_App/develop/obs_data/ccpa/proc MRMS_OBS_DIR: /contrib/EPIC/UFS_SRW_App/develop/obs_data/mrms/proc NDAS_OBS_DIR: /contrib/EPIC/UFS_SRW_App/develop/obs_data/ndas/proc - METPLUS_PATH: /contrib/EPIC/spack-stack/envs/ufs-srw-dev.intel/install/intel/2021.3.0/metplus-4.1.0-t4mkmbg + METPLUS_PATH: /contrib/EPIC/spack-stack/envs/srw-develop-intel/install/intel/2021.3.0/metplus MET_BIN_EXEC: bin - MET_INSTALL_DIR: /contrib/EPIC/spack-stack/envs/ufs-srw-dev.intel/install/intel/2021.3.0/met-10.1.0-mqwqjxt + MET_INSTALL_DIR: /contrib/EPIC/spack-stack/envs/srw-develop-intel/install/intel/2021.3.0/met RUN_CMD_FCST: mpiexec -np ${PE_MEMBER01} RUN_CMD_POST: mpiexec -np $nprocs RUN_CMD_SERIAL: time From 91191a87ab7c743f9d7aae2a43cbdef401707fe5 Mon Sep 17 00:00:00 2001 From: Parallel Works app-run user Date: Thu, 3 Nov 2022 21:22:15 +0000 Subject: [PATCH 3/6] add vx task file --- modulefiles/tasks/noaacloud/run_vx.local.lua | 1 + 1 file changed, 1 insertion(+) create mode 100644 modulefiles/tasks/noaacloud/run_vx.local.lua diff --git a/modulefiles/tasks/noaacloud/run_vx.local.lua b/modulefiles/tasks/noaacloud/run_vx.local.lua new file mode 100644 index 0000000000..d371c08301 --- /dev/null +++ b/modulefiles/tasks/noaacloud/run_vx.local.lua @@ -0,0 +1 @@ +load("miniconda_regional_workflow") From 5b552d8e1176814640d64798fda72c36d39ed28d Mon Sep 17 00:00:00 2001 From: Parallel Works app-run user Date: Thu, 3 Nov 2022 21:42:20 +0000 Subject: [PATCH 4/6] add time fix for aws --- ush/machine/noaacloud.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ush/machine/noaacloud.yaml b/ush/machine/noaacloud.yaml index 940b57a622..6f2137b1fd 100644 --- a/ush/machine/noaacloud.yaml +++ b/ush/machine/noaacloud.yaml @@ -13,7 +13,7 @@ platform: RUN_CMD_SERIAL: time RUN_CMD_UTILS: mpiexec -np $nprocs SCHED_NATIVE_CMD: --export=NONE - PRE_TASK_CMDS: '{ ulimit -s unlimited; ulimit -a; }' + PRE_TASK_CMDS: '{ ulimit -s unlimited; ulimit -a; sudo yum -y install time; }' TEST_EXTRN_MDL_SOURCE_BASEDIR: /contrib/EPIC/UFS_SRW_App/develop/input_model_data TEST_PREGEN_BASEDIR: /contrib/EPIC/UFS_SRW_App/develop/FV3LAM_pregen TEST_ALT_EXTRN_MDL_SYSBASEDIR_ICS: /contrib/EPIC/UFS_SRW_App/develop/dummy_FV3GFS_sys_dir From 6e7d71a51d68b11574cfd7818deee3adc0ac3d12 Mon Sep 17 00:00:00 2001 From: Parallel Works app-run user Date: Mon, 7 Nov 2022 16:44:35 +0000 Subject: [PATCH 5/6] added path for time --- modulefiles/build_noaacloud_intel.lua | 1 + modulefiles/wflow_noaacloud.lua | 1 + 2 files changed, 2 insertions(+) diff --git a/modulefiles/build_noaacloud_intel.lua b/modulefiles/build_noaacloud_intel.lua index 6f99a415cf..7cff9b6cb5 100644 --- a/modulefiles/build_noaacloud_intel.lua +++ b/modulefiles/build_noaacloud_intel.lua @@ -7,6 +7,7 @@ whatis([===[Loads libraries needed for building the UFS SRW App on NOAA cloud ]= prepend_path("MODULEPATH", "/contrib/EPIC/spack-stack/envs/srw-develop-intel/install/modulefiles/Core") prepend_path("MODULEPATH", "/apps/modules/modulefiles") +prepend_path("PATH", "/contrib/EPIC/bin") load("intel/2021.3.0") load("impi/2021.3.0") load("stack-intel") diff --git a/modulefiles/wflow_noaacloud.lua b/modulefiles/wflow_noaacloud.lua index 45444a9eb2..80501f5075 100644 --- a/modulefiles/wflow_noaacloud.lua +++ b/modulefiles/wflow_noaacloud.lua @@ -14,6 +14,7 @@ load(pathJoin("miniconda3", os.getenv("miniconda3_ver") or "4.12.0")) setenv("PROJ_LIB","/contrib/EPIC/miniconda3/4.12.0/envs/regional_workflow/share/proj") setenv("OPT","/contrib/EPIC/hpc-modules") append_path("PATH","/contrib/EPIC/miniconda3/4.12.0/envs/regional_workflow/bin") +prepend_path("PATH","/contrib/EPIC/bin") if mode() == "load" then LmodMsgRaw([===[Please do the following to activate conda: From 4ba6fdbb7513a71244826d0b8fc9b5542243a24c Mon Sep 17 00:00:00 2001 From: Parallel Works app-run user Date: Mon, 7 Nov 2022 16:44:58 +0000 Subject: [PATCH 6/6] remove time install --- ush/machine/noaacloud.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ush/machine/noaacloud.yaml b/ush/machine/noaacloud.yaml index 6f2137b1fd..940b57a622 100644 --- a/ush/machine/noaacloud.yaml +++ b/ush/machine/noaacloud.yaml @@ -13,7 +13,7 @@ platform: RUN_CMD_SERIAL: time RUN_CMD_UTILS: mpiexec -np $nprocs SCHED_NATIVE_CMD: --export=NONE - PRE_TASK_CMDS: '{ ulimit -s unlimited; ulimit -a; sudo yum -y install time; }' + PRE_TASK_CMDS: '{ ulimit -s unlimited; ulimit -a; }' TEST_EXTRN_MDL_SOURCE_BASEDIR: /contrib/EPIC/UFS_SRW_App/develop/input_model_data TEST_PREGEN_BASEDIR: /contrib/EPIC/UFS_SRW_App/develop/FV3LAM_pregen TEST_ALT_EXTRN_MDL_SYSBASEDIR_ICS: /contrib/EPIC/UFS_SRW_App/develop/dummy_FV3GFS_sys_dir