Skip to content

Commit

Permalink
change: set btl_vader_single_copy_mechanism to none to avoid Read -1 Warning messages (#95)
Browse files Browse the repository at this point in the history
  • Loading branch information
karan6181 authored Feb 2, 2021
1 parent a14e8f8 commit 0523a42
Show file tree
Hide file tree
Showing 2 changed files with 9 additions and 0 deletions.
3 changes: 3 additions & 0 deletions src/sagemaker_training/smdataparallel.py
Original file line number Diff line number Diff line change
Expand Up @@ -129,6 +129,9 @@ def _get_mpirun_command(
"orte_abort_on_non_zero_status",
"1",
"-mca",
"btl_vader_single_copy_mechanism",
"none",
"-mca",
"plm_rsh_num_concurrent",
str(num_hosts),
"-x",
Expand Down
6 changes: 6 additions & 0 deletions test/unit/test_smdataparallel.py
Original file line number Diff line number Diff line change
Expand Up @@ -90,6 +90,9 @@ def test_smdataparallel_run_multi_node_python(
"orte_abort_on_non_zero_status",
"1",
"-mca",
"btl_vader_single_copy_mechanism",
"none",
"-mca",
"plm_rsh_num_concurrent",
str(num_hosts),
"-x",
Expand Down Expand Up @@ -189,6 +192,9 @@ def test_smdataparallel_run_single_node_python(
"orte_abort_on_non_zero_status",
"1",
"-mca",
"btl_vader_single_copy_mechanism",
"none",
"-mca",
"plm_rsh_num_concurrent",
str(num_hosts),
"-x",
Expand Down

0 comments on commit 0523a42

Please sign in to comment.