@@ -43,67 +43,23 @@ export TF_PYTHON_VERSION=$PYTHON_VERSION
43 43 export TF_NEED_ROCM=1
44 44 export ROCM_PATH=$ROCM_INSTALL_DIR
45 45
46- if [ -f /usertools/rocm.bazelrc ]; then
47- # Use the bazelrc files in /usertools if available
48- if [ ! -d /tf ]; then
49- # The bazelrc files in /usertools expect /tf to exist
50- mkdir /tf
51- fi
52- bazel \
53- --bazelrc=/usertools/rocm.bazelrc \
54- test \
55- --local_test_jobs=${N_TEST_JOBS} \
56- --jobs=30 \
57- --local_ram_resources=60000 \
58- --local_cpu_resources=15 \
59- --config=sigbuild_local_cache \
60- --config=rocm \
61- --config=nonpip_multi_gpu \
62- --action_env=TF_PYTHON_VERSION=$PYTHON_VERSION
63- else
64- # Legacy style: run configure then build
65- yes "" | $PYTHON_BIN_PATH configure.py
66-
67- # Run bazel test command. Double test timeouts to avoid flakes.
68- bazel test \
69- --config=rocm \
70- -k \
71- --test_tag_filters=-no_gpu,-cuda-only \
72- --jobs=30 \
73- --local_ram_resources=60000 \
74- --local_cpu_resources=15 \
75- --local_test_jobs=${N_TEST_JOBS} \
76- --test_timeout 920,2400,7200,9600 \
77- --build_tests_only \
78- --test_output=errors \
79- --test_sharding_strategy=disabled \
80- --test_size_filters=small,medium,large \
81- --cache_test_results=no \
82- --test_env=TF_PER_DEVICE_MEMORY_LIMIT_MB=2048 \
83- --test_env=TF_PYTHON_VERSION=$PYTHON_VERSION \
84- -- \
85- //tensorflow/core/nccl:nccl_manager_test_2gpu \
86- //tensorflow/python/distribute/integration_test:mwms_peer_failure_test_2gpu \
87- //tensorflow/python/distribute:checkpoint_utils_test_2gpu \
88- //tensorflow/python/distribute:checkpointing_test_2gpu \
89- //tensorflow/python/distribute:collective_all_reduce_strategy_test_xla_2gpu \
90- //tensorflow/python/distribute:custom_training_loop_gradient_test_2gpu \
91- //tensorflow/python/distribute:custom_training_loop_input_test_2gpu \
92- //tensorflow/python/distribute:distribute_utils_test_2gpu \
93- //tensorflow/python/distribute:input_lib_test_2gpu \
94- //tensorflow/python/distribute:input_lib_type_spec_test_2gpu \
95- //tensorflow/python/distribute:metrics_v1_test_2gpu \
96- //tensorflow/python/distribute:mirrored_variable_test_2gpu \
97- //tensorflow/python/distribute:parameter_server_strategy_test_2gpu \
98- //tensorflow/python/distribute:ps_values_test_2gpu \
99- //tensorflow/python/distribute:random_generator_test_2gpu \
100- //tensorflow/python/distribute:test_util_test_2gpu \
101- //tensorflow/python/distribute:tf_function_test_2gpu \
102- //tensorflow/python/distribute:vars_test_2gpu \
103- //tensorflow/python/distribute:warm_starting_util_test_2gpu \
104- //tensorflow/python/training:saver_test_2gpu
46+ if [ ! -d /tf ]; then
47+ # The bazelrc files in /usertools expect /tf to exist
48+ mkdir /tf
105 49 fi
106 50
51+ bazel --bazelrc=tensorflow/tools/tf_sig_build_dockerfiles/devel.usertools/rocm.bazelrc test \
52+ --local_test_jobs=${N_TEST_JOBS} \
53+ --jobs=30 \
54+ --local_ram_resources=60000 \
55+ --local_cpu_resources=15 \
56+ --verbose_failures \
57+ --config=rocm \
58+ --config=nonpip_multi_gpu \
59+ --config=sigbuild_local_cache \
60+ --action_env=TF_PYTHON_VERSION=$PYTHON_VERSION \
61+ --repo_env="ROCM_PATH=$ROCM_PATH" \
62+
107 63
108 64 # Started failing with 210906 sync
109 65 # FAILED : //tensorflow/core/kernels:collective_nccl_test_2gpu \
0 commit comments