|
2 | 2 | // everything on the same thread. |
3 | 3 | // RUN: mlir-opt %s -test-vector-warp-distribute=rewrite-warp-ops-to-scf-if -canonicalize | \ |
4 | 4 | // RUN: mlir-opt -convert-vector-to-scf -convert-scf-to-cf -convert-cf-to-llvm -convert-vector-to-llvm -convert-arith-to-llvm \ |
5 | | -// RUN: -test-lower-to-nvvm | \ |
| 5 | +// RUN: -gpu-kernel-outlining |\ |
| 6 | +// RUN: mlir-opt -pass-pipeline='builtin.module(gpu.module(strip-debuginfo,convert-gpu-to-nvvm,reconcile-unrealized-casts,gpu-to-cubin))' |\ |
| 7 | +// RUN: mlir-opt -gpu-to-llvm -reconcile-unrealized-casts |\ |
6 | 8 | // RUN: mlir-cpu-runner -e main -entry-point-result=void \ |
7 | 9 | // RUN: -shared-libs=%mlir_cuda_runtime \ |
8 | 10 | // RUN: -shared-libs=%mlir_c_runner_utils \ |
|
13 | 15 | // RUN: mlir-opt %s -test-vector-warp-distribute="hoist-uniform distribute-transfer-write" \ |
14 | 16 | // RUN: -test-vector-warp-distribute=rewrite-warp-ops-to-scf-if -canonicalize | \ |
15 | 17 | // RUN: mlir-opt -convert-vector-to-scf -convert-scf-to-cf -convert-cf-to-llvm -convert-vector-to-llvm -convert-arith-to-llvm \ |
16 | | -// RUN: -test-lower-to-nvvm | \ |
| 18 | +// RUN: -gpu-kernel-outlining |\ |
| 19 | +// RUN: mlir-opt -pass-pipeline='builtin.module(gpu.module(strip-debuginfo,convert-gpu-to-nvvm,reconcile-unrealized-casts,gpu-to-cubin))' |\ |
| 20 | +// RUN: mlir-opt -gpu-to-llvm -reconcile-unrealized-casts |\ |
17 | 21 | // RUN: mlir-cpu-runner -e main -entry-point-result=void \ |
18 | 22 | // RUN: -shared-libs=%mlir_cuda_runtime \ |
19 | 23 | // RUN: -shared-libs=%mlir_c_runner_utils \ |
|
23 | 27 | // RUN: mlir-opt %s -test-vector-warp-distribute="hoist-uniform distribute-transfer-write propagate-distribution" \ |
24 | 28 | // RUN: -test-vector-warp-distribute=rewrite-warp-ops-to-scf-if -canonicalize | \ |
25 | 29 | // RUN: mlir-opt -convert-vector-to-scf -convert-scf-to-cf -convert-cf-to-llvm -convert-vector-to-llvm -convert-arith-to-llvm \ |
26 | | -// RUN: -test-lower-to-nvvm | \ |
| 30 | +// RUN: -gpu-kernel-outlining |\ |
| 31 | +// RUN: mlir-opt -pass-pipeline='builtin.module(gpu.module(strip-debuginfo,convert-gpu-to-nvvm,reconcile-unrealized-casts,gpu-to-cubin))' |\ |
| 32 | +// RUN: mlir-opt -gpu-to-llvm -reconcile-unrealized-casts |\ |
27 | 33 | // RUN: mlir-cpu-runner -e main -entry-point-result=void \ |
28 | 34 | // RUN: -shared-libs=%mlir_cuda_runtime \ |
29 | 35 | // RUN: -shared-libs=%mlir_c_runner_utils \ |
|
0 commit comments