
Replace some more nvvm.annotations with function attributes, auto-upgrading the annotations as needed. The new attributes are more idiomatic and more compile-time efficient than the annotations:
- !"maxntid[xyz]" -> "nvvm.maxntid"
- !"reqntid[xyz]" -> "nvvm.reqntid"
- !"cluster_dim_[xyz]" -> "nvvm.cluster_dim"
24 lines
824 B
LLVM
24 lines
824 B
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
|
|
; RUN: llc < %s -mtriple=nvptx64 -mcpu=sm_80 | FileCheck -check-prefixes=CHECK80 %s
|
|
; RUN: llc < %s -mtriple=nvptx64 -mcpu=sm_90 | FileCheck -check-prefixes=CHECK90 %s
|
|
; RUN: %if ptxas-12.0 %{ llc < %s -mtriple=nvptx64 -mcpu=sm_90 | %ptxas-verify -arch=sm_90 %}
|
|
|
|
; Empty ptx_kernel tagged with the "nvvm.cluster_dim"="3,5,7" function
; attribute. Two sets of expectations follow, one per FileCheck prefix used by
; the llc invocations at the top of the file:
;   - the CHECK80 set (sm_80) lists only the function body;
;   - the CHECK90 set (sm_90) additionally expects the .explicitcluster and
;     .reqnctapercluster 3, 5, 7 directives ahead of the opening brace.
; The assertions below are autogenerated (see the NOTE line at the top of the
; file), so regenerate them with the script instead of editing them by hand.
; NOTE(review): the lone `|` lines look like extraction residue rather than
; LLVM IR; confirm against the upstream test file.
define ptx_kernel void @kernel_func_clusterxyz() "nvvm.cluster_dim"="3,5,7" {
|
|
; CHECK80-LABEL: kernel_func_clusterxyz(
|
|
; CHECK80: {
|
|
; CHECK80-EMPTY:
|
|
; CHECK80-EMPTY:
|
|
; CHECK80-NEXT: // %bb.0:
|
|
; CHECK80-NEXT: ret;
|
|
;
|
|
; CHECK90-LABEL: kernel_func_clusterxyz(
|
|
; CHECK90: .explicitcluster
|
|
; CHECK90-NEXT: .reqnctapercluster 3, 5, 7
|
|
; CHECK90-NEXT: {
|
|
; CHECK90-EMPTY:
|
|
; CHECK90-EMPTY:
|
|
; CHECK90-NEXT: // %bb.0:
|
|
; CHECK90-NEXT: ret;
|
|
ret void
|
|
}
|