Skip to content

Commit fb6ddfb

Browse files
authored
Add MIOPEN_FIND_ENFORCE For ROCm 7 for convolution gemms (#312)
* Add MIOPEN_FIND_ENFORCE For ROCm 7 for convolution gemms * Exclude failing CollectiveOpsE2E tests
1 parent c424ad9 commit fb6ddfb

2 files changed

Lines changed: 9 additions & 0 deletions

File tree

build_tools/rocm/run_xla.sh

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -107,6 +107,8 @@ bazel \
107107
--action_env=XLA_FLAGS=--xla_gpu_enable_llvm_module_compilation_parallelism=true \
108108
--run_under=//build_tools/ci:parallel_gpu_execute \
109109
--test_filter=-$(IFS=: ; echo "${EXCLUDED_TESTS[*]}") \
110+
--test_env=MIOPEN_FIND_ENFORCE=5 \
111+
--test_env=MIOPEN_FIND_MODE=1 \
110112
-- //xla/... \
111113

112114
# clean up bazel disk_cache

build_tools/rocm/run_xla_multi_gpu.sh

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -77,6 +77,12 @@ GPU_NAME=${GPU_NAME[1]}
7777
BAZEL_DISK_CACHE_SIZE=100G
7878
BAZEL_DISK_CACHE_DIR="/tf/disk_cache/rocm-jaxlib-v0.6.0"
7979

80+
EXCLUDED_TESTS=(
81+
CollectiveOpsTestE2E.MemcpyP2pLargeMessage
82+
RaggedAllToAllTest/RaggedAllToAllTest.RaggedAllToAll_8GPUs_2ReplicasPerGroups/sync_decomposer
83+
RaggedAllToAllTest/RaggedAllToAllTest.RaggedAllToAll_8GPUs_2ReplicasPerGroups/async_decomposer
84+
)
85+
8086
bazel \
8187
test \
8288
--define xnn_enable_avxvnniint8=false \
@@ -99,6 +105,7 @@ bazel \
99105
--action_env=XLA_FLAGS=--xla_gpu_force_compilation_parallelism=16 \
100106
--action_env=XLA_FLAGS=--xla_gpu_enable_llvm_module_compilation_parallelism=true \
101107
--action_env=NCCL_MAX_NCHANNELS=1 \
108+
--test_filter=-$(IFS=: ; echo "${EXCLUDED_TESTS[*]}") \
102109
-- //xla/tests:collective_ops_e2e_test \
103110
//xla/tests:collective_ops_test \
104111
//xla/tests:collective_pipeline_parallelism_test \

0 commit comments

Comments
 (0)