|
| 1 | +// RUN: mlir-opt %s -split-input-file -convert-gpu-to-rocdl | FileCheck %s --check-prefixes=ROCDL |
| 2 | +// RUN: mlir-opt %s -split-input-file -convert-gpu-to-nvvm | FileCheck %s --check-prefixes=NVVM |
| 3 | + |
| 4 | +gpu.module @kernel { |
| 5 | + gpu.func @gpu_global_id() -> (index) { |
| 6 | + %global_id_x = gpu.global_id x |
| 7 | + gpu.return %global_id_x : index |
| 8 | + } |
| 9 | +} |
| 10 | + |
| 11 | +// ROCDL-LABEL: llvm.func @gpu_global_id() -> i64 { |
| 12 | +// ROCDL: %[[WORKGROUP_0:.*]] = rocdl.workgroup.id.x : i32 |
| 13 | +// ROCDL: %[[SEXT_0:.*]] = llvm.sext %[[WORKGROUP_0]] : i32 to i64 |
| 14 | +// ROCDL: %[[WORKGROUP_1:.*]] = rocdl.workgroup.dim.x : i32 |
| 15 | +// ROCDL: %[[SEXT_1:.*]] = llvm.sext %[[WORKGROUP_1]] : i32 to i64 |
| 16 | +// ROCDL: %[[MUL_0:.*]] = llvm.mul %[[SEXT_0]], %[[SEXT_1]] : i64 |
| 17 | +// ROCDL: %[[WORKITEM_0:.*]] = rocdl.workitem.id.x : i32 |
| 18 | +// ROCDL: %[[SEXT_2:.*]] = llvm.sext %[[WORKITEM_0]] : i32 to i64 |
| 19 | +// ROCDL: %[[ADD_0:.*]] = llvm.add %[[SEXT_2]], %[[MUL_0]] : i64 |
| 20 | +// ROCDL: llvm.return %[[ADD_0]] : i64 |
| 21 | +// ROCDL: } |
| 22 | + |
| 23 | +// NVVM-LABEL: llvm.func @gpu_global_id() -> i64 { |
| 24 | +// NVVM: %[[READ_0:.*]] = nvvm.read.ptx.sreg.ctaid.x : i32 |
| 25 | +// NVVM: %[[SEXT_0:.*]] = llvm.sext %[[READ_0]] : i32 to i64 |
| 26 | +// NVVM: %[[READ_1:.*]] = nvvm.read.ptx.sreg.ntid.x : i32 |
| 27 | +// NVVM: %[[SEXT_1:.*]] = llvm.sext %[[READ_1]] : i32 to i64 |
| 28 | +// NVVM: %[[MUL_0:.*]] = llvm.mul %[[SEXT_0]], %[[SEXT_1]] : i64 |
| 29 | +// NVVM: %[[READ_2:.*]] = nvvm.read.ptx.sreg.tid.x : i32 |
| 30 | +// NVVM: %[[SEXT_2:.*]] = llvm.sext %[[READ_2]] : i32 to i64 |
| 31 | +// NVVM: %[[ADD_0:.*]] = llvm.add %[[SEXT_2]], %[[MUL_0]] : i64 |
| 32 | +// NVVM: llvm.return %[[ADD_0]] : i64 |
| 33 | +// NVVM: } |
0 commit comments