|
2 | 2 | // everything on the same thread.
|
3 | 3 | // RUN: mlir-opt %s -test-vector-warp-distribute=rewrite-warp-ops-to-scf-if -canonicalize | \
|
4 | 4 | // RUN: mlir-opt -convert-vector-to-scf -convert-scf-to-cf -convert-cf-to-llvm -convert-vector-to-llvm -convert-arith-to-llvm \
|
5 |
| -// RUN: -gpu-kernel-outlining |\ |
6 |
| -// RUN: mlir-opt -pass-pipeline='builtin.module(gpu.module(strip-debuginfo,convert-gpu-to-nvvm,reconcile-unrealized-casts,gpu-to-cubin))' |\ |
7 |
| -// RUN: mlir-opt -gpu-to-llvm -reconcile-unrealized-casts |\ |
| 5 | +// RUN: -test-lower-to-nvvm | \ |
8 | 6 | // RUN: mlir-cpu-runner -e main -entry-point-result=void \
|
9 | 7 | // RUN: -shared-libs=%mlir_cuda_runtime \
|
10 | 8 | // RUN: -shared-libs=%mlir_c_runner_utils \
|
|
15 | 13 | // RUN: mlir-opt %s -test-vector-warp-distribute="hoist-uniform distribute-transfer-write" \
|
16 | 14 | // RUN: -test-vector-warp-distribute=rewrite-warp-ops-to-scf-if -canonicalize | \
|
17 | 15 | // RUN: mlir-opt -convert-vector-to-scf -convert-scf-to-cf -convert-cf-to-llvm -convert-vector-to-llvm -convert-arith-to-llvm \
|
18 |
| -// RUN: -gpu-kernel-outlining |\ |
19 |
| -// RUN: mlir-opt -pass-pipeline='builtin.module(gpu.module(strip-debuginfo,convert-gpu-to-nvvm,reconcile-unrealized-casts,gpu-to-cubin))' |\ |
20 |
| -// RUN: mlir-opt -gpu-to-llvm -reconcile-unrealized-casts |\ |
| 16 | +// RUN: -test-lower-to-nvvm | \ |
21 | 17 | // RUN: mlir-cpu-runner -e main -entry-point-result=void \
|
22 | 18 | // RUN: -shared-libs=%mlir_cuda_runtime \
|
23 | 19 | // RUN: -shared-libs=%mlir_c_runner_utils \
|
|
27 | 23 | // RUN: mlir-opt %s -test-vector-warp-distribute="hoist-uniform distribute-transfer-write propagate-distribution" \
|
28 | 24 | // RUN: -test-vector-warp-distribute=rewrite-warp-ops-to-scf-if -canonicalize | \
|
29 | 25 | // RUN: mlir-opt -convert-vector-to-scf -convert-scf-to-cf -convert-cf-to-llvm -convert-vector-to-llvm -convert-arith-to-llvm \
|
30 |
| -// RUN: -gpu-kernel-outlining |\ |
31 |
| -// RUN: mlir-opt -pass-pipeline='builtin.module(gpu.module(strip-debuginfo,convert-gpu-to-nvvm,reconcile-unrealized-casts,gpu-to-cubin))' |\ |
32 |
| -// RUN: mlir-opt -gpu-to-llvm -reconcile-unrealized-casts |\ |
| 26 | +// RUN: -test-lower-to-nvvm | \ |
33 | 27 | // RUN: mlir-cpu-runner -e main -entry-point-result=void \
|
34 | 28 | // RUN: -shared-libs=%mlir_cuda_runtime \
|
35 | 29 | // RUN: -shared-libs=%mlir_c_runner_utils \
|
|
0 commit comments