Skip to content

Test K100-AI #72331

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Open
wants to merge 15 commits into
base: develop
Choose a base branch
from
Open
8 changes: 5 additions & 3 deletions paddle/scripts/paddle_build.sh
Original file line number Diff line number Diff line change
Expand Up @@ -1556,7 +1556,8 @@ function card_test() {
# 2 card for P800 ci
CUDA_DEVICE_COUNT=2
elif [[ "${WITH_ROCM}" == "ON" ]]; then
CUDA_DEVICE_COUNT=$(rocm-smi -i | grep DCU | wc -l)
CUDA_DEVICE_COUNT=`echo $HIP_VISIBLE_DEVICES | tr ',' '\n' | wc -l`
IFS=',' read -ra DEVICE_ARRAY <<< "$HIP_VISIBLE_DEVICES"
elif [[ "${WITH_IPU}" == "ON" ]]; then
CUDA_DEVICE_COUNT=1
else
Expand Down Expand Up @@ -1586,6 +1587,7 @@ function card_test() {
trap 'caught_error' CHLD
tmpfile_rand=`date +%s%N`
NUM_PROC=$[CUDA_DEVICE_COUNT/$cardnumber]
export parallel_job=2
echo "****************************************************************"
echo "***These unittests run $parallel_job job each time with $cardnumber GPU***"
echo "****************************************************************"
Expand Down Expand Up @@ -1617,7 +1619,7 @@ function card_test() {
(ctest -I $i,,$NUM_PROC -R "($testcases)" -E "($disable_ut_quickly)" ${run_label_mode} -V --timeout 120 -j $parallel_job | tee $tmpfile; test ${PIPESTATUS[0]} -eq 0) &
else
if [[ "$WITH_ROCM" == "ON" ]]; then
(env HIP_VISIBLE_DEVICES=$cuda_list ctest -I $i,,$NUM_PROC -R "($testcases)" -E "($disable_ut_quickly)" ${run_label_mode} --timeout 120 -V -j $parallel_job | tee $tmpfile; test ${PIPESTATUS[0]} -eq 0) &
(env HIP_VISIBLE_DEVICES=${DEVICE_ARRAY[$i]} ctest -I $i,,$NUM_PROC -R "($testcases)" -E "($disable_ut_quickly)" ${run_label_mode} --timeout 120 -V -j $parallel_job | tee $tmpfile; test ${PIPESTATUS[0]} -eq 0) &
elif [[ "$WITH_XPU" == "ON" ]]; then
(env XPU_VISIBLE_DEVICES=$cuda_list_str ctest -I $i,,$NUM_PROC -R "($testcases)" -E "($disable_ut_quickly)" ${run_label_mode} --timeout 120 -V -j $parallel_job | tee $tmpfile; test ${PIPESTATUS[0]} -eq 0) &
else
Expand All @@ -1629,7 +1631,7 @@ function card_test() {
(ctest -I $i,,$NUM_PROC -R "($testcases)" -E "($disable_ut_quickly)" ${run_label_mode} --timeout 120 --output-on-failure -j $parallel_job | tee $tmpfile; test ${PIPESTATUS[0]} -eq 0) &
else
if [[ "$WITH_ROCM" == "ON" ]]; then
(env HIP_VISIBLE_DEVICES=$cuda_list ctest -I $i,,$NUM_PROC -R "($testcases)" -E "($disable_ut_quickly)" ${run_label_mode} --timeout 120 --output-on-failure -j $parallel_job | tee $tmpfile; test ${PIPESTATUS[0]} -eq 0) &
(env HIP_VISIBLE_DEVICES=${DEVICE_ARRAY[$i]} ctest -I $i,,$NUM_PROC -R "($testcases)" -E "($disable_ut_quickly)" ${run_label_mode} --timeout 120 --output-on-failure -j $parallel_job | tee $tmpfile; test ${PIPESTATUS[0]} -eq 0) &
elif [[ "$WITH_XPU" == "ON" ]]; then
(env XPU_VISIBLE_DEVICES=$cuda_list_str ctest -I $i,,$NUM_PROC -R "($testcases)" -E "($disable_ut_quickly)" ${run_label_mode} --timeout 120 --output-on-failure -j $parallel_job | tee $tmpfile; test ${PIPESTATUS[0]} -eq 0) &
else
Expand Down
Loading