sync (ROCm fork --> TF repo) the dockerfile+scripts used for ROCm CI

This commit is contained in:
Deven Desai 2019-12-18 20:23:16 +00:00
parent 522eb8fb92
commit 262cbe7827
5 changed files with 94 additions and 25 deletions

View File

@ -16,8 +16,7 @@ RUN sh -c "echo deb [arch=amd64] $DEB_ROCM_REPO xenial main > /etc/apt/sources.
RUN apt-get update --allow-insecure-repositories && \
DEBIAN_FRONTEND=noninteractive apt-get install -y --allow-unauthenticated \
rocm-dev rocm-libs hipcub rocm-utils rocm-cmake \
rocfft miopen-hip miopengemm rocblas hipblas rocrand rccl \
rocm-profiler cxlactivitylogger && \
rocfft miopen-hip miopengemm rocblas hipblas rocrand rccl && \
apt-get clean && \
rm -rf /var/lib/apt/lists/*

View File

@ -58,8 +58,7 @@ RUN apt-get update --allow-insecure-repositories && DEBIAN_FRONTEND=noninteracti
RUN apt-get update --allow-insecure-repositories && \
DEBIAN_FRONTEND=noninteractive apt-get install -y --allow-unauthenticated \
rocm-dev rocm-libs hipcub rocm-utils rocm-cmake \
rocfft miopen-hip miopengemm rocblas hipblas rocrand rccl \
rocm-profiler cxlactivitylogger && \
rocfft miopen-hip miopengemm rocblas hipblas rocrand rccl && \
apt-get clean && \
rm -rf /var/lib/apt/lists/*

View File

@ -35,10 +35,33 @@ export TF_GPU_COUNT=${N_GPUS}
yes "" | $PYTHON_BIN_PATH configure.py
# Run bazel test command. Double test timeouts to avoid flakes.
bazel test --config=rocm --test_tag_filters=-no_oss,-oss_serial,-no_gpu,-no_rocm,-benchmark-test -k \
--test_lang_filters=cc --jobs=${N_JOBS} --test_timeout 300,450,1200,3600 \
--build_tests_only --test_output=errors --local_test_jobs=${TF_GPU_COUNT} --config=opt \
--test_sharding_strategy=disabled \
--test_size_filters=small,medium \
--run_under=//tensorflow/tools/ci_build/gpu_build:parallel_gpu_execute -- \
//tensorflow/... -//tensorflow/compiler/... -//tensorflow/contrib/...
# Two chained bazel invocations for the ROCm C++ test run:
#   1. All small/medium C++ tests under //tensorflow/..., excluding
#      //tensorflow/compiler/... and the TFLite GPU gl/cl delegates, and
#      skipping anything tagged no_oss, oss_serial, no_gpu, no_rocm,
#      benchmark-test, rocm_multi_gpu or v1only. Up to ${TF_GPU_COUNT} tests
#      run at once, each launched via --run_under=parallel_gpu_execute.
#   2. //tensorflow/core/nccl:nccl_manager_test on its own, one test at a
#      time (--local_test_jobs=1), without --run_under and with timeouts of
#      600,900,2400,7200.
#      NOTE(review): presumably run separately because it needs access to
#      several GPUs at once -- confirm.
# The second invocation only runs if the first one exits successfully (&&).
#
# Keep a space before every trailing backslash: backslash-newline is removed
# outright by the shell, so without the space a flag fuses with whatever
# starts the next line.
bazel test \
--config=rocm \
-k \
--test_tag_filters=-no_oss,-oss_serial,-no_gpu,-no_rocm,-benchmark-test,-rocm_multi_gpu,-v1only \
--test_lang_filters=cc \
--jobs=${N_JOBS} \
--local_test_jobs=${TF_GPU_COUNT} \
--test_timeout 300,450,1200,3600 \
--build_tests_only \
--test_output=errors \
--test_sharding_strategy=disabled \
--test_size_filters=small,medium \
--run_under=//tensorflow/tools/ci_build/gpu_build:parallel_gpu_execute \
-- \
//tensorflow/... \
-//tensorflow/compiler/... \
-//tensorflow/lite/delegates/gpu/gl/... \
-//tensorflow/lite/delegates/gpu/cl/... \
&& bazel test \
--config=rocm \
-k \
--test_tag_filters=-no_gpu,-no_rocm,-v1only \
--jobs=${N_JOBS} \
--local_test_jobs=1 \
--test_timeout 600,900,2400,7200 \
--build_tests_only \
--test_output=errors \
--test_sharding_strategy=disabled \
-- \
//tensorflow/core/nccl:nccl_manager_test

View File

@ -35,9 +35,18 @@ export TF_GPU_COUNT=${N_GPUS}
yes "" | $PYTHON_BIN_PATH configure.py
# Run bazel test command. Double test timeouts to avoid flakes.
bazel test --config=rocm --test_tag_filters=-no_oss,-oss_serial,-no_gpu,-no_rocm,-benchmark-test -k \
--test_lang_filters=py --jobs=${N_JOBS} --test_timeout 600,900,2400,7200 \
--build_tests_only --test_output=errors --local_test_jobs=${TF_GPU_COUNT} --config=opt \
--test_sharding_strategy=disabled \
--run_under=//tensorflow/tools/ci_build/gpu_build:parallel_gpu_execute -- \
//tensorflow/... -//tensorflow/compiler/... -//tensorflow/contrib/...
# ROCm Python test run: builds and runs only the Python tests
# (--test_lang_filters=py) under //tensorflow/..., excluding
# //tensorflow/compiler/..., and skipping anything tagged no_oss, oss_serial,
# no_gpu, no_rocm, benchmark-test, rocm_multi_gpu or v1only.
# Up to ${TF_GPU_COUNT} tests run at once, each launched via
# --run_under=parallel_gpu_execute; -k keeps going after individual failures.
bazel test \
--config=rocm \
-k \
--test_tag_filters=-no_oss,-oss_serial,-no_gpu,-no_rocm,-benchmark-test,-rocm_multi_gpu,-v1only \
--test_lang_filters=py \
--jobs=${N_JOBS} \
--local_test_jobs=${TF_GPU_COUNT} \
--test_timeout 600,900,2400,7200 \
--build_tests_only \
--test_output=errors \
--test_sharding_strategy=disabled \
--run_under=//tensorflow/tools/ci_build/gpu_build:parallel_gpu_execute \
-- \
//tensorflow/... \
-//tensorflow/compiler/...

View File

@ -27,6 +27,7 @@ echo ""
# Run configure.
export PYTHON_BIN_PATH=`which python3`
export CC_OPT_FLAGS='-mavx'
export TF_NEED_ROCM=1
export TF_GPU_COUNT=${N_GPUS}
@ -34,12 +35,50 @@ export TF_GPU_COUNT=${N_GPUS}
yes "" | $PYTHON_BIN_PATH configure.py
echo "build --distinct_host_configuration=false" >> .tf_configure.bazelrc
bazel clean
# Run bazel test command. Double test timeouts to avoid flakes.
bazel test --config=rocm --test_tag_filters=-no_gpu,-benchmark-test,-no_oss,-no_rocm -k \
--jobs=${N_JOBS} --test_timeout 600,900,2400,7200 \
--build_tests_only --test_output=errors --local_test_jobs=${TF_GPU_COUNT} \
--test_sharding_strategy=disabled \
--run_under=//tensorflow/tools/ci_build/gpu_build:parallel_gpu_execute \
--config=xla -- \
//tensorflow/compiler/...
# ROCm XLA test run, split into two chained bazel invocations that share the
# same configs (rocm + xla), tag filters, timeouts and --run_under wrapper:
#   1. Everything under //tensorflow/compiler/... except the nine targets
#      listed with a leading '-'.
#   2. Exactly those nine targets, re-run with --test_env=TF2_BEHAVIOR=0.
#      NOTE(review): presumably these tests only pass with TF2 behavior
#      disabled -- confirm.
# The two target lists must be kept in sync: a target removed from one list
# but not the other is either run twice or not run at all.
# Because of the '&&', the second batch is skipped whenever the first
# invocation exits non-zero.
bazel test \
--config=rocm \
--config=xla \
-k \
--test_tag_filters=-no_oss,-oss_serial,-no_gpu,-no_rocm,-benchmark-test,-rocm_multi_gpu,-v1only \
--jobs=${N_JOBS} \
--local_test_jobs=${TF_GPU_COUNT} \
--test_timeout 600,900,2400,7200 \
--build_tests_only \
--test_output=errors \
--test_sharding_strategy=disabled \
--run_under=//tensorflow/tools/ci_build/gpu_build:parallel_gpu_execute \
-- \
//tensorflow/compiler/... \
-//tensorflow/compiler/tests:dense_layer_test \
-//tensorflow/compiler/tests:dense_layer_test_gpu \
-//tensorflow/compiler/tests:jit_test \
-//tensorflow/compiler/tests:jit_test_gpu \
-//tensorflow/compiler/tests:matrix_triangular_solve_op_test \
-//tensorflow/compiler/tests:tensor_array_ops_test \
-//tensorflow/compiler/tests:xla_ops_test \
-//tensorflow/compiler/xla/client/lib:svd_test \
-//tensorflow/compiler/tests:lstm_test \
&& bazel test \
--config=rocm \
--config=xla \
-k \
--test_tag_filters=-no_oss,-oss_serial,-no_gpu,-no_rocm,-benchmark-test,-rocm_multi_gpu,-v1only \
--jobs=${N_JOBS} \
--local_test_jobs=${TF_GPU_COUNT} \
--test_timeout 600,900,2400,7200 \
--build_tests_only \
--test_output=errors \
--test_sharding_strategy=disabled \
--test_env=TF2_BEHAVIOR=0 \
--run_under=//tensorflow/tools/ci_build/gpu_build:parallel_gpu_execute \
-- \
//tensorflow/compiler/tests:dense_layer_test \
//tensorflow/compiler/tests:dense_layer_test_gpu \
//tensorflow/compiler/tests:jit_test \
//tensorflow/compiler/tests:jit_test_gpu \
//tensorflow/compiler/tests:matrix_triangular_solve_op_test \
//tensorflow/compiler/tests:tensor_array_ops_test \
//tensorflow/compiler/tests:xla_ops_test \
//tensorflow/compiler/xla/client/lib:svd_test \
//tensorflow/compiler/tests:lstm_test