Skip to content

Commit

Permalink
Change mpirun flag from -quiet to -mca orte_allowed_exit_without_sync 1
Browse files (browse the repository at this point in the history)
  • Loading branch information
siddharth9820 committed Jan 27, 2024
1 parent f191f58 commit b20a401
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions .github/workflows/nvidia-rtx-3090-tests.yaml
Original file line number | Diff line number | Diff line change
Expand Up @@ -31,7 +31,7 @@ jobs:
export G_data=$(( 2 / G_inter ))
export memopt=${{ matrix.memopt }}
echo "training with G_inter = ${G_inter}, G_data = $(( 2 / G_inter )) ${{ matrix.memopt }}"
- mpirun -quiet -n 2 pytest --with-mpi ./axonn/tests/test_vit.py
+ mpirun -mca orte_allowed_exit_without_sync 1 -n 2 pytest --with-mpi ./axonn/tests/test_vit.py
- name: Uninstall AxoNN
run: |
pip uninstall --yes axonn
Expand All @@ -47,10 +47,10 @@ jobs:
pip install -r requirements.txt
- name: Run intra-layer FC unit tests
run: |
- mpirun -quiet -n 2 pytest --with-mpi ./axonn/tests/test_intra_layer_fc.py
+ mpirun -mca orte_allowed_exit_without_sync 1 -n 2 pytest --with-mpi ./axonn/tests/test_intra_layer_fc.py
- name: Run intra-layer Conv unit tests
run: |
- mpirun -quiet -n 2 pytest --with-mpi ./axonn/tests/test_intra_layer_conv.py
+ mpirun -mca orte_allowed_exit_without_sync 1 -n 2 pytest --with-mpi ./axonn/tests/test_intra_layer_conv.py
- name: Uninstall AxoNN
run: |
pip uninstall --yes axonn

0 comments on commit b20a401

Please sign in to comment.