1 | // RUN: %clang_cc1 -O0 -triple spir -emit-llvm %s -o - | FileCheck %s |
2 | // RUN: %clang_cc1 -O0 -triple spir64 -emit-llvm %s -o - | FileCheck %s |
3 | |
4 | // This file tests that using the _Float16 type with the spir target will not |
5 | // use the llvm intrinsics but instead will use the half arithmetic |
6 | // instructions directly. |
7 | |
8 | // Previously attempting to use a constant _Float16 with a comparison |
9 | // instruction when the target is spir or spir64 lead to an assert being hit. |
10 | bool fcmp_const() { |
11 | _Float16 a = 0.0f16; |
12 | const _Float16 b = 1.0f16; |
13 | |
14 | // CHECK-NOT: llvm.convert.to.fp16 |
15 | // CHECK-NOT: llvm.convert.from.fp16 |
16 | |
17 | // CHECK: [[REG1:%.*]] = load half, half* %a, align 2 |
18 | // CHECK-NEXT: fcmp olt half [[REG1]], 0xH3C00 |
19 | |
20 | // CHECK: [[REG2:%.*]] = load half, half* %a, align 2 |
21 | // CHECK-NEXT: fcmp olt half [[REG2]], 0xH4000 |
22 | |
23 | // CHECK: [[REG3:%.*]] = load half, half* %a, align 2 |
24 | // CHECK-NEXT: fcmp ogt half [[REG3]], 0xH3C00 |
25 | |
26 | // CHECK: [[REG4:%.*]] = load half, half* %a, align 2 |
27 | // CHECK-NEXT: fcmp ogt half [[REG4]], 0xH4200 |
28 | |
29 | // CHECK: [[REG5:%.*]] = load half, half* %a, align 2 |
30 | // CHECK-NEXT: fcmp oeq half [[REG5]], 0xH3C00 |
31 | |
32 | // CHECK: [[REG7:%.*]] = load half, half* %a, align 2 |
33 | // CHECK-NEXT: fcmp oeq half [[REG7]], 0xH4400 |
34 | |
35 | // CHECK: [[REG8:%.*]] = load half, half* %a, align 2 |
36 | // CHECK-NEXT: fcmp une half [[REG8]], 0xH3C00 |
37 | |
38 | // CHECK: [[REG9:%.*]] = load half, half* %a, align 2 |
39 | // CHECK-NEXT: fcmp une half [[REG9]], 0xH4500 |
40 | |
41 | // CHECK: [[REG10:%.*]] = load half, half* %a, align 2 |
42 | // CHECK-NEXT: fcmp ole half [[REG10]], 0xH3C00 |
43 | |
44 | // CHECK: [[REG11:%.*]] = load half, half* %a, align 2 |
45 | // CHECK-NEXT: fcmp ole half [[REG11]], 0xH4600 |
46 | |
47 | // CHECK: [[REG12:%.*]] = load half, half* %a, align 2 |
48 | // CHECK-NEXT: fcmp oge half [[REG12]], 0xH3C00 |
49 | |
50 | // CHECK: [[REG13:%.*]] = load half, half* %a, align 2 |
51 | // CHECK-NEXT: fcmp oge half [[REG13]], 0xH4700 |
52 | return a < b || a < 2.0f16 || a > b || a > 3.0f16 || a == b || a == 4.0f16 || |
53 | a != b || a != 5.0f16 || a <= b || a <= 6.0f16 || a >= b || |
54 | a >= 7.0f16; |
55 | } |
56 | |
57 | bool fcmp() { |
58 | _Float16 a = 0.0f16; |
59 | _Float16 b = 1.0f16; |
60 | |
61 | // CHECK-NOT: llvm.convert.to.fp16 |
62 | // CHECK-NOT: llvm.convert.from.fp16 |
63 | // CHECK: [[REG1:%.*]] = load half, half* %a, align 2 |
64 | // CHECK-NEXT: [[REG2:%.*]] = load half, half* %b, align 2 |
65 | // CHECK-NEXT: fcmp olt half [[REG1]], [[REG2]] |
66 | |
67 | // CHECK: [[REG3:%.*]] = load half, half* %a, align 2 |
68 | // CHECK-NEXT: [[REG4:%.*]] = load half, half* %b, align 2 |
69 | // CHECK-NEXT: fcmp ogt half [[REG3]], [[REG4]] |
70 | |
71 | // CHECK: [[REG5:%.*]] = load half, half* %a, align 2 |
72 | // CHECK-NEXT: [[REG6:%.*]] = load half, half* %b, align 2 |
73 | // CHECK-NEXT: fcmp oeq half [[REG5]], [[REG6]] |
74 | |
75 | // CHECK: [[REG7:%.*]] = load half, half* %a, align 2 |
76 | // CHECK-NEXT: [[REG8:%.*]] = load half, half* %b, align 2 |
77 | // CHECK-NEXT: fcmp une half [[REG7]], [[REG8]] |
78 | |
79 | // CHECK: [[REG7:%.*]] = load half, half* %a, align 2 |
80 | // CHECK-NEXT: [[REG8:%.*]] = load half, half* %b, align 2 |
81 | // CHECK-NEXT: fcmp ole half [[REG7]], [[REG8]] |
82 | |
83 | // CHECK: [[REG7:%.*]] = load half, half* %a, align 2 |
84 | // CHECK-NEXT: [[REG8:%.*]] = load half, half* %b, align 2 |
85 | // CHECK-NEXT: fcmp oge half [[REG7]], [[REG8]] |
86 | return a < b || a > b || a == b || a != b || a <= b || a >= b; |
87 | } |
88 | |
89 | _Float16 fadd() { |
90 | _Float16 a = 1.0f16; |
91 | const _Float16 b = 2.0f16; |
92 | |
93 | // CHECK-NOT: llvm.convert.to.fp16 |
94 | // CHECK-NOT: llvm.convert.from.fp16 |
95 | |
96 | // CHECK: [[REG1:%.*]] = load half, half* %a, align 2 |
97 | // CHECK-NEXT: [[REG2:%.*]] = fadd half [[REG1]], 0xH4000 |
98 | // CHECK-NEXT: [[REG3:%.*]] = fadd half [[REG2]], 0xH4200 |
99 | // CHECK-NEXT: ret half [[REG3]] |
100 | return a + b + 3.0f16; |
101 | } |
102 | |
103 | _Float16 fsub() { |
104 | _Float16 a = 1.0f16; |
105 | const _Float16 b = 2.0f16; |
106 | |
107 | // CHECK-NOT: llvm.convert.to.fp16 |
108 | // CHECK-NOT: llvm.convert.from.fp16 |
109 | |
110 | // CHECK: [[REG1:%.*]] = load half, half* %a, align 2 |
111 | // CHECK-NEXT: [[REG2:%.*]] = fsub half [[REG1]], 0xH4000 |
112 | // CHECK-NEXT: [[REG3:%.*]] = fsub half [[REG2]], 0xH4200 |
113 | // CHECK-NEXT: ret half [[REG3]] |
114 | return a - b - 3.0f16; |
115 | } |
116 | |
117 | // CHECK: define spir_func half @_Z4fmulDF16_(half %arg) |
118 | _Float16 fmul(_Float16 arg) { |
119 | _Float16 a = 1.0f16; |
120 | const _Float16 b = 2.0f16; |
121 | |
122 | // CHECK-NOT: llvm.convert.to.fp16 |
123 | // CHECK-NOT: llvm.convert.from.fp16 |
124 | |
125 | // CHECK: [[REG1:%.*]] = load half, half* %a, align 2 |
126 | // CHECK-NEXT: [[REG2:%.*]] = load half, half* %arg.addr, align 2 |
127 | // CHECK-NEXT: [[REG3:%.*]] = fmul half [[REG1]], [[REG2]] |
128 | // CHECK-NEXT: [[REG4:%.*]] = fmul half [[REG3]], 0xH4000 |
129 | // CHECK-NEXT: [[REG5:%.*]] = fmul half [[REG4]], 0xH4200 |
130 | // CHECK-NEXT: ret half [[REG5]] |
131 | return a * arg * b * 3.0f16; |
132 | } |
133 | |
134 | _Float16 fdiv() { |
135 | _Float16 a = 1.0f16; |
136 | const _Float16 b = 2.0f16; |
137 | |
138 | // CHECK-NOT: llvm.convert.to.fp16 |
139 | // CHECK-NOT: llvm.convert.from.fp16 |
140 | |
141 | // CHECK: [[REG1:%.*]] = load half, half* %a, align 2 |
142 | // CHECK-NEXT: [[REG2:%.*]] = fdiv half [[REG1]], 0xH4000 |
143 | // CHECK-NEXT: [[REG3:%.*]] = fdiv half [[REG2]], 0xH4200 |
144 | // CHECK-NEXT: ret half [[REG3]] |
145 | return a / b / 3.0f16; |
146 | } |
147 | |