; write_image_impl.ll
; Module-wide data layout: little-endian ("e") with 32-bit pointers ("p:32:32").
target datalayout = "e-p:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64"

; Opaque image handle types; this file only ever passes pointers to them.
%opencl.image2d_t = type opaque
%opencl.image3d_t = type opaque

; Resource-id lookups: take an image handle pointer in addrspace(1) and return
; an i32. Declared readnone, so a call has no side effects on memory.
declare i32 @llvm.OpenCL.image.get.resource.id.2d(%opencl.image2d_t addrspace(1)*) nounwind readnone
declare i32 @llvm.OpenCL.image.get.resource.id.3d(%opencl.image3d_t addrspace(1)*) nounwind readnone

; Typed store intrinsic taking a 4-lane colour, a 4-lane coordinate and an
; i32 id. NOTE(review): presumably writes %color at %coord into the RAT
; selected by %rat_id - confirm against the backend's intrinsic definition.
declare void @llvm.r600.rat.store.typed(
    <4 x i32> %color,
    <4 x i32> %coord,
    i32 %rat_id)
; __clc_write_imageui_2d(img, coord, color)
;
;   %img   - pointer (addrspace 1) to an opaque 2D image handle
;   %coord - 2-lane i32 coordinate
;   %color - 4-lane i32 value handed to the store intrinsic
;
; Looks up the image's resource id, adds 1 to form the id passed to the store,
; widens the coordinate to four lanes (upper two lanes zero) and calls
; @llvm.r600.rat.store.typed. Returns nothing.
define void @__clc_write_imageui_2d(
    %opencl.image2d_t addrspace(1)* nocapture %img,
    <2 x i32> %coord, <4 x i32> %color) #0 {
  ; Resource id of the image, offset by one to obtain the RAT id.
  ; NOTE(review): the +1 presumably skips a RAT slot reserved for something
  ; else - confirm against the runtime's resource numbering.
  %res.id = call i32 @llvm.OpenCL.image.get.resource.id.2d(
      %opencl.image2d_t addrspace(1)* %img)
  %rat.idx = add i32 %res.id, 1

  ; int2 -> int4: mask indices 0-1 select the lanes of %coord, indices 2-3
  ; select lanes of the zero vector, giving <x, y, 0, 0>.
  %coord.xy00 = shufflevector <2 x i32> %coord, <2 x i32> zeroinitializer,
                              <4 x i32> <i32 0, i32 1, i32 2, i32 3>

  ; Issue the typed store.
  call void @llvm.r600.rat.store.typed(
      <4 x i32> %color, <4 x i32> %coord.xy00, i32 %rat.idx)
  ret void
}
; __clc_write_imagei_2d(img, coord, color)
;
; Forwards all three arguments unchanged to @__clc_write_imageui_2d; the
; <4 x i32> colour needs no conversion because both entry points take the
; same IR type.
define void @__clc_write_imagei_2d(
    %opencl.image2d_t addrspace(1)* nocapture %img,
    <2 x i32> %coord, <4 x i32> %color) #0 {
  call void @__clc_write_imageui_2d(%opencl.image2d_t addrspace(1)* nocapture %img, <2 x i32> %coord, <4 x i32> %color)
  ret void
}
; __clc_write_imagef_2d(img, coord, color)
;
; Reinterprets the four float lanes of %color as i32 bit patterns (a bitcast,
; not a numeric conversion) and forwards to @__clc_write_imageui_2d.
define void @__clc_write_imagef_2d(
    %opencl.image2d_t addrspace(1)* nocapture %img,
    <2 x i32> %coord, <4 x float> %color) #0 {
  ; Same bits, viewed as <4 x i32>.
  %color.bits = bitcast <4 x float> %color to <4 x i32>
  call void @__clc_write_imageui_2d(%opencl.image2d_t addrspace(1)* nocapture %img, <2 x i32> %coord, <4 x i32> %color.bits)
  ret void
}
; Attribute group #0, attached to every function defined in this file:
; alwaysinline asks the inliner to inline these functions into their callers.
attributes #0 = { alwaysinline }