@@ -15,7 +15,7 @@ declare i64 @llvm.ctlz.i64(i64, i1) nounwind readnone
15
15
declare <2 x i64 > @llvm.ctlz.v2i64 (<2 x i64 >, i1 ) nounwind readnone
16
16
declare <4 x i64 > @llvm.ctlz.v4i64 (<4 x i64 >, i1 ) nounwind readnone
17
17
18
- declare i32 @llvm.r600.read.tidig .x () nounwind readnone
18
+ declare i32 @llvm.amdgcn.workitem.id .x () nounwind readnone
19
19
20
20
define amdgpu_kernel void @s_ctlz_i32 (i32 addrspace (1 )* noalias %out , i32 %val ) nounwind {
21
21
; SI-LABEL: s_ctlz_i32:
@@ -120,7 +120,7 @@ define amdgpu_kernel void @v_ctlz_i32(i32 addrspace(1)* noalias %out, i32 addrsp
120
120
; EG-NEXT: CNDE_INT T0.X, T0.X, literal.x, PV.W,
121
121
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.y,
122
122
; EG-NEXT: 32(4.484155e-44), 2(2.802597e-45)
123
- %tid = call i32 @llvm.r600.read.tidig .x ()
123
+ %tid = call i32 @llvm.amdgcn.workitem.id .x ()
124
124
%in.gep = getelementptr i32 , i32 addrspace (1 )* %valptr , i32 %tid
125
125
%val = load i32 , i32 addrspace (1 )* %in.gep , align 4
126
126
%ctlz = call i32 @llvm.ctlz.i32 (i32 %val , i1 false ) nounwind readnone
@@ -195,7 +195,7 @@ define amdgpu_kernel void @v_ctlz_v2i32(<2 x i32> addrspace(1)* noalias %out, <2
195
195
; EG-NEXT: CNDE_INT T0.X, T0.X, literal.x, PV.W,
196
196
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.y,
197
197
; EG-NEXT: 32(4.484155e-44), 2(2.802597e-45)
198
- %tid = call i32 @llvm.r600.read.tidig .x ()
198
+ %tid = call i32 @llvm.amdgcn.workitem.id .x ()
199
199
%in.gep = getelementptr <2 x i32 >, <2 x i32 > addrspace (1 )* %valptr , i32 %tid
200
200
%val = load <2 x i32 >, <2 x i32 > addrspace (1 )* %in.gep , align 8
201
201
%ctlz = call <2 x i32 > @llvm.ctlz.v2i32 (<2 x i32 > %val , i1 false ) nounwind readnone
@@ -288,7 +288,7 @@ define amdgpu_kernel void @v_ctlz_v4i32(<4 x i32> addrspace(1)* noalias %out, <4
288
288
; EG-NEXT: CNDE_INT T0.X, T0.X, literal.x, PV.W,
289
289
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.y,
290
290
; EG-NEXT: 32(4.484155e-44), 2(2.802597e-45)
291
- %tid = call i32 @llvm.r600.read.tidig .x ()
291
+ %tid = call i32 @llvm.amdgcn.workitem.id .x ()
292
292
%in.gep = getelementptr <4 x i32 >, <4 x i32 > addrspace (1 )* %valptr , i32 %tid
293
293
%val = load <4 x i32 >, <4 x i32 > addrspace (1 )* %in.gep , align 16
294
294
%ctlz = call <4 x i32 > @llvm.ctlz.v4i32 (<4 x i32 > %val , i1 false ) nounwind readnone
@@ -576,7 +576,7 @@ define amdgpu_kernel void @v_ctlz_i64(i64 addrspace(1)* noalias %out, i64 addrsp
576
576
; EG-NEXT: ADD_INT * T0.W, KC0[2].Y, T0.W,
577
577
; EG-NEXT: LSHR * T1.X, PV.W, literal.x,
578
578
; EG-NEXT: 2(2.802597e-45), 0(0.000000e+00)
579
- %tid = call i32 @llvm.r600.read.tidig .x ()
579
+ %tid = call i32 @llvm.amdgcn.workitem.id .x ()
580
580
%in.gep = getelementptr i64 , i64 addrspace (1 )* %in , i32 %tid
581
581
%out.gep = getelementptr i64 , i64 addrspace (1 )* %out , i32 %tid
582
582
%val = load i64 , i64 addrspace (1 )* %in.gep
@@ -663,7 +663,7 @@ define amdgpu_kernel void @v_ctlz_i64_trunc(i32 addrspace(1)* noalias %out, i64
663
663
; EG-NEXT: ADD_INT * T0.W, KC0[2].Y, PV.Z,
664
664
; EG-NEXT: LSHR * T1.X, PV.W, literal.x,
665
665
; EG-NEXT: 2(2.802597e-45), 0(0.000000e+00)
666
- %tid = call i32 @llvm.r600.read.tidig .x ()
666
+ %tid = call i32 @llvm.amdgcn.workitem.id .x ()
667
667
%in.gep = getelementptr i64 , i64 addrspace (1 )* %in , i32 %tid
668
668
%out.gep = getelementptr i32 , i32 addrspace (1 )* %out , i32 %tid
669
669
%val = load i64 , i64 addrspace (1 )* %in.gep
@@ -729,7 +729,7 @@ define amdgpu_kernel void @v_ctlz_i32_sel_eq_neg1(i32 addrspace(1)* noalias %out
729
729
; EG-NEXT: CNDE_INT T0.X, T0.X, literal.x, PV.W,
730
730
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.y,
731
731
; EG-NEXT: -1(nan), 2(2.802597e-45)
732
- %tid = call i32 @llvm.r600.read.tidig .x ()
732
+ %tid = call i32 @llvm.amdgcn.workitem.id .x ()
733
733
%in.gep = getelementptr i32 , i32 addrspace (1 )* %valptr , i32 %tid
734
734
%val = load i32 , i32 addrspace (1 )* %in.gep
735
735
%ctlz = call i32 @llvm.ctlz.i32 (i32 %val , i1 false ) nounwind readnone
@@ -795,7 +795,7 @@ define amdgpu_kernel void @v_ctlz_i32_sel_ne_neg1(i32 addrspace(1)* noalias %out
795
795
; EG-NEXT: CNDE_INT T0.X, T0.X, literal.x, PV.W,
796
796
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.y,
797
797
; EG-NEXT: -1(nan), 2(2.802597e-45)
798
- %tid = call i32 @llvm.r600.read.tidig .x ()
798
+ %tid = call i32 @llvm.amdgcn.workitem.id .x ()
799
799
%in.gep = getelementptr i32 , i32 addrspace (1 )* %valptr , i32 %tid
800
800
%val = load i32 , i32 addrspace (1 )* %in.gep
801
801
%ctlz = call i32 @llvm.ctlz.i32 (i32 %val , i1 false ) nounwind readnone
@@ -872,7 +872,7 @@ define amdgpu_kernel void @v_ctlz_i32_sel_eq_bitwidth(i32 addrspace(1)* noalias
872
872
; EG-NEXT: CNDE_INT T0.X, PV.W, T0.W, literal.x,
873
873
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.y,
874
874
; EG-NEXT: -1(nan), 2(2.802597e-45)
875
- %tid = call i32 @llvm.r600.read.tidig .x ()
875
+ %tid = call i32 @llvm.amdgcn.workitem.id .x ()
876
876
%in.gep = getelementptr i32 , i32 addrspace (1 )* %valptr , i32 %tid
877
877
%val = load i32 , i32 addrspace (1 )* %in.gep
878
878
%ctlz = call i32 @llvm.ctlz.i32 (i32 %val , i1 false ) nounwind readnone
@@ -948,7 +948,7 @@ define amdgpu_kernel void @v_ctlz_i32_sel_ne_bitwidth(i32 addrspace(1)* noalias
948
948
; EG-NEXT: CNDE_INT T0.X, PV.W, literal.x, T0.W,
949
949
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.y,
950
950
; EG-NEXT: -1(nan), 2(2.802597e-45)
951
- %tid = call i32 @llvm.r600.read.tidig .x ()
951
+ %tid = call i32 @llvm.amdgcn.workitem.id .x ()
952
952
%in.gep = getelementptr i32 , i32 addrspace (1 )* %valptr , i32 %tid
953
953
%val = load i32 , i32 addrspace (1 )* %in.gep
954
954
%ctlz = call i32 @llvm.ctlz.i32 (i32 %val , i1 false ) nounwind readnone
@@ -1017,7 +1017,7 @@ define amdgpu_kernel void @v_ctlz_i32_sel_ne_bitwidth(i32 addrspace(1)* noalias
1017
1017
; EG-NEXT: MOV * T0.Z, 0.0,
1018
1018
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.x,
1019
1019
; EG-NEXT: 2(2.802597e-45), 0(0.000000e+00)
1020
- %tid = call i32 @llvm.r600.read.tidig .x ()
1020
+ %tid = call i32 @llvm.amdgcn.workitem.id .x ()
1021
1021
%valptr.gep = getelementptr i8 , i8 addrspace (1 )* %valptr , i32 %tid
1022
1022
%val = load i8 , i8 addrspace (1 )* %valptr.gep
1023
1023
%ctlz = call i8 @llvm.ctlz.i8 (i8 %val , i1 false ) nounwind readnone
@@ -1160,7 +1160,7 @@ define amdgpu_kernel void @v_ctlz_i7_sel_eq_neg1(i7 addrspace(1)* noalias %out,
1160
1160
; EG-NEXT: MOV * T0.Z, 0.0,
1161
1161
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.x,
1162
1162
; EG-NEXT: 2(2.802597e-45), 0(0.000000e+00)
1163
- %tid = call i32 @llvm.r600.read.tidig .x ()
1163
+ %tid = call i32 @llvm.amdgcn.workitem.id .x ()
1164
1164
%valptr.gep = getelementptr i7 , i7 addrspace (1 )* %valptr , i32 %tid
1165
1165
%val = load i7 , i7 addrspace (1 )* %valptr.gep
1166
1166
%ctlz = call i7 @llvm.ctlz.i7 (i7 %val , i1 false ) nounwind readnone
0 commit comments