Jakob Stoklund Olesen | c4b3bcc | 2010-07-10 16:30:25 +0000 | [diff] [blame] | 1 | ; RUN: llc < %s -mtriple=i386-apple-darwin | FileCheck %s |
Chris Lattner | 9e07537 | 2008-03-09 08:49:15 +0000 | [diff] [blame] | 2 | |
Jakob Stoklund Olesen | c4b3bcc | 2010-07-10 16:30:25 +0000 | [diff] [blame] | 3 | ; There should be no stack manipulations between the inline asm and ret. |
| 4 | ; CHECK: test1 |
| 5 | ; CHECK: InlineAsm End |
| 6 | ; CHECK-NEXT: ret |
; Returns, as x86_fp80, whatever the side-effecting inline asm "fld0" produces.
; The "={st(0)}" constraint pins that output to x87 register st(0).
define x86_fp80 @test1() {
  %st0 = call x86_fp80 asm sideeffect "fld0", "={st(0)}"()
  ret x86_fp80 %st0
}
| 11 | |
Jakob Stoklund Olesen | c4b3bcc | 2010-07-10 16:30:25 +0000 | [diff] [blame] | 12 | ; CHECK: test2 |
| 13 | ; CHECK: InlineAsm End |
| 14 | ; CHECK-NEXT: ret |
; Same shape as test1, but the asm output in st(0) is typed and returned as
; double instead of x86_fp80.
define double @test2() {
  %st0 = call double asm sideeffect "fld0", "={st(0)}"()
  ret double %st0
}
| 19 | |
Jakob Stoklund Olesen | c4b3bcc | 2010-07-10 16:30:25 +0000 | [diff] [blame] | 20 | ; Setting up argument in st(0) should be a single fld. |
| 21 | ; CHECK: test3 |
| 22 | ; CHECK: fld |
| 23 | ; CHECK-NEXT: InlineAsm Start |
| 24 | ; Asm consumes stack, nothing should be popped. |
| 25 | ; CHECK: InlineAsm End |
| 26 | ; CHECK-NOT: fstp |
| 27 | ; CHECK: ret |
; Hands the x86_fp80 argument %X to the inline asm in st(0). st is also named
; in the clobber list, so the asm is expected to consume the value itself.
define void @test3(x86_fp80 %X) {
  call void asm sideeffect "frob ", "{st(0)},~{st},~{dirflag},~{fpsr},~{flags}"(x86_fp80 %X)
  ret void
}
| 32 | |
Jakob Stoklund Olesen | c4b3bcc | 2010-07-10 16:30:25 +0000 | [diff] [blame] | 33 | ; CHECK: test4 |
| 34 | ; CHECK: fld |
| 35 | ; CHECK-NEXT: InlineAsm Start |
| 36 | ; CHECK: InlineAsm End |
| 37 | ; CHECK-NOT: fstp |
| 38 | ; CHECK: ret |
; Same as test3 with a double argument: %X goes to the asm in st(0), and st is
; in the clobber list.
define void @test4(double %X) {
  call void asm sideeffect "frob ", "{st(0)},~{st},~{dirflag},~{fpsr},~{flags}"(double %X)
  ret void
}
| 43 | |
Jakob Stoklund Olesen | c4b3bcc | 2010-07-10 16:30:25 +0000 | [diff] [blame] | 44 | ; Same as test3/4, but using value from fadd. |
| 45 | ; The fadd can be done in xmm or x87 regs - we don't test that. |
| 46 | ; CHECK: test5 |
| 47 | ; CHECK: InlineAsm End |
| 48 | ; CHECK-NOT: fstp |
| 49 | ; CHECK: ret |
; Variant of test3/test4 in which the asm operand is the result of an fadd
; rather than a plain function argument. The sum is passed in st(0), with st
; in the clobber list.
define void @test5(double %X) {
  %sum = fadd double %X, 1.230000e+02
  call void asm sideeffect "frob ", "{st(0)},~{st},~{dirflag},~{fpsr},~{flags}"(double %sum)
  ret void
}
| 55 | |
Jakob Stoklund Olesen | c4b3bcc | 2010-07-10 16:30:25 +0000 | [diff] [blame] | 56 | ; CHECK: test6 |
; Four inline asm statements that take their operands through the generic 'f'
; constraint (no fixed stack slot, st not clobbered). The directives in front
; of each statement pin how many fstp instructions may follow it.
define void @test6(double %A, double %B, double %C, double %D, double %E) nounwind {
entry:
; %A feeds both operands, so a single fstp is expected after the asm.
; CHECK: foo
; CHECK: InlineAsm End
; CHECK-NEXT: fstp
; CHECK-NOT: fstp
  tail call void asm sideeffect "foo $0 $1", "f,f,~{dirflag},~{fpsr},~{flags}"(double %A, double %A) nounwind
; %B and %C are distinct values: they should sit in st(0)/st(1) and both be
; popped afterwards.
; CHECK: bar
; CHECK: InlineAsm End
; CHECK-NEXT: fstp
; CHECK-NEXT: fstp
  tail call void asm sideeffect "bar $0 $1", "f,f,~{dirflag},~{fpsr},~{flags}"(double %B, double %C) nounwind
; %D and %E are distinct values, but %D is used again below and is therefore
; not killed here; it must not be popped after this asm.
; CHECK: baz
; CHECK: InlineAsm End
; CHECK-NEXT: fstp
; CHECK-NOT: fstp
  tail call void asm sideeffect "baz $0 $1", "f,f,~{dirflag},~{fpsr},~{flags}"(double %D, double %E) nounwind
; Final use of %D, so it should be popped once this asm is done.
; CHECK: baz
; CHECK: InlineAsm End
; CHECK-NEXT: fstp
; CHECK-NOT: fstp
; CHECK: ret
  tail call void asm sideeffect "baz $0", "f,~{dirflag},~{fpsr},~{flags}"(double %D) nounwind
  ret void
}
Chris Lattner | 9e07537 | 2008-03-09 08:49:15 +0000 | [diff] [blame] | 88 | |
Jakob Stoklund Olesen | f689760 | 2011-06-27 17:27:37 +0000 | [diff] [blame] | 89 | ; PR4185 |
| 90 | ; Passing a non-killed value to asm in {st}. |
| 91 | ; Make sure it is duped before. |
| 92 | ; asm kills st(0), so we shouldn't pop anything |
| 93 | ; CHECK: testPR4185 |
| 94 | ; CHECK: fld %st(0) |
| 95 | ; CHECK: fistpl |
| 96 | ; CHECK-NOT: fstp |
| 97 | ; CHECK: fistpl |
| 98 | ; CHECK-NOT: fstp |
| 99 | ; CHECK: ret |
| 100 | ; A valid alternative would be to remat the constant pool load before each |
| 101 | ; inline asm. |
; PR4185: the same double constant is passed in {st} to two consecutive asm
; statements, each of which also lists st as clobbered.
define void @testPR4185() {
return:
  call void asm sideeffect "fistpl $0", "{st},~{st}"(double 1.0e+06)
  call void asm sideeffect "fistpl $0", "{st},~{st}"(double 1.0e+06)
  ret void
}
| 108 | |
Jakob Stoklund Olesen | 7297e7e | 2011-06-28 18:32:28 +0000 | [diff] [blame] | 109 | ; Passing a non-killed value through asm in {st}. |
| 110 | ; Make sure it is not duped before. |
| 111 | ; Second asm kills st(0), so we shouldn't pop anything |
| 112 | ; CHECK: testPR4185b |
| 113 | ; CHECK-NOT: fld %st(0) |
| 114 | ; CHECK: fistl |
| 115 | ; CHECK-NOT: fstp |
| 116 | ; CHECK: fistpl |
| 117 | ; CHECK-NOT: fstp |
| 118 | ; CHECK: ret |
| 119 | ; A valid alternative would be to remat the constant pool load before each |
| 120 | ; inline asm. |
; Companion to testPR4185: the first asm ("fistl") takes the constant in {st}
; without clobbering st, and only the second asm ("fistpl") lists st as
; clobbered.
define void @testPR4185b() {
return:
  call void asm sideeffect "fistl $0", "{st}"(double 1.0e+06)
  call void asm sideeffect "fistpl $0", "{st},~{st}"(double 1.0e+06)
  ret void
}
| 127 | |
Jakob Stoklund Olesen | f689760 | 2011-06-27 17:27:37 +0000 | [diff] [blame] | 128 | ; PR4459 |
| 129 | ; The return value from ceil must be duped before being consumed by asm. |
| 130 | ; CHECK: testPR4459 |
| 131 | ; CHECK: ceil |
| 132 | ; CHECK: fld %st(0) |
| 133 | ; CHECK-NOT: fxch |
| 134 | ; CHECK: fistpl |
| 135 | ; CHECK-NOT: fxch |
| 136 | ; CHECK: fstpt |
| 137 | ; CHECK: test |
; PR4459: the value returned by @ceil is used twice: first by an asm that
; takes it in {st} and clobbers st, then as the argument of the call to @test3.
define void @testPR4459(x86_fp80 %a) {
entry:
  %rounded = call x86_fp80 @ceil(x86_fp80 %a)
  call void asm sideeffect "fistpl $0", "{st},~{st}"(x86_fp80 %rounded)
  call void @test3(x86_fp80 %rounded)
  ret void
}

; External function called by testPR4459; only its signature is given here.
declare x86_fp80 @ceil(x86_fp80)
| 146 | |
| 147 | ; PR4484 |
| 148 | ; test1 leaves a value on the stack that is needed after the asm. |
| 149 | ; CHECK: testPR4484 |
| 150 | ; CHECK: test1 |
| 151 | ; CHECK-NOT: fstp |
; Load %a from stack after the call to test1.
| 153 | ; CHECK: fldt |
| 154 | ; CHECK-NOT: fxch |
| 155 | ; CHECK: fistpl |
| 156 | ; CHECK-NOT: fstp |
| 157 | ; Set up call to test. |
| 158 | ; CHECK: fstpt |
| 159 | ; CHECK: test |
; PR4484: the x86_fp80 returned by @test1 has to stay alive across an asm that
; takes a different value (%a) in {st} and clobbers st; the @test1 result is
; only consumed afterwards, by the call to @test3.
define void @testPR4484(x86_fp80 %a) {
entry:
  %kept = call x86_fp80 @test1()
  call void asm sideeffect "fistpl $0", "{st},~{st}"(x86_fp80 %a)
  call void @test3(x86_fp80 %kept)
  ret void
}
| 167 | |
| 168 | ; PR4485 |
| 169 | ; CHECK: testPR4485 |
; PR4485: two identical load / fmul / fmul sequences, each followed by an asm
; that takes the product in {st} and clobbers st. The two x86_fp80 hex
; constants decode to 180.0 and 1.0e6.
define void @testPR4485(x86_fp80* %a) {
entry:
  %first.val = load x86_fp80* %a, align 16
  %first.scaled = fmul x86_fp80 %first.val, 0xK4006B400000000000000
  %first.prod = fmul x86_fp80 %first.scaled, 0xK4012F424000000000000
  tail call void asm sideeffect "fistpl $0", "{st},~{st}"(x86_fp80 %first.prod)
  %second.val = load x86_fp80* %a, align 16
  %second.scaled = fmul x86_fp80 %second.val, 0xK4006B400000000000000
  %second.prod = fmul x86_fp80 %second.scaled, 0xK4012F424000000000000
  tail call void asm sideeffect "fistpl $0", "{st},~{st}"(x86_fp80 %second.prod)
  ret void
}
Jakob Stoklund Olesen | 7297e7e | 2011-06-28 18:32:28 +0000 | [diff] [blame] | 182 | |
| 183 | ; An input argument in a fixed position is implicitly popped by the asm only if |
| 184 | ; the input argument is tied to an output register, or it is in the clobber list. |
| 185 | ; The clobber list case is tested above. |
| 186 | ; |
| 187 | ; This doesn't implicitly pop the stack: |
| 188 | ; |
| 189 | ; void fist1(long double x, int *p) { |
| 190 | ; asm volatile ("fistl %1" : : "t"(x), "m"(*p)); |
| 191 | ; } |
| 192 | ; |
| 193 | ; CHECK: fist1 |
| 194 | ; CHECK: fldt |
| 195 | ; CHECK: fistl (%e |
| 196 | ; CHECK: fstp |
| 197 | ; CHECK: ret |
; IR form of the fist1 C snippet quoted in the preceding comment: %x is passed
; in {st} and %p as an indirect memory operand ("*m"). st is not in the clobber
; list and no output is tied to it.
define void @fist1(x86_fp80 %x, i32* %p) nounwind ssp {
entry:
  tail call void asm sideeffect "fistl $1", "{st},*m,~{memory},~{dirflag},~{fpsr},~{flags}"(x86_fp80 %x, i32* %p) nounwind
  ret void
}
| 203 | |
; Here, the input operand is tied to an output, which means that it is
; implicitly popped (and then the output is implicitly pushed).
| 206 | ; |
| 207 | ; long double fist2(long double x, int *p) { |
| 208 | ; long double y; |
| 209 | ; asm ("fistl %1" : "=&t"(y) : "0"(x), "m"(*p) : "memory"); |
| 210 | ; return y; |
| 211 | ; } |
| 212 | ; |
| 213 | ; CHECK: fist2 |
| 214 | ; CHECK: fldt |
| 215 | ; CHECK: fistl (%e |
| 216 | ; CHECK-NOT: fstp |
| 217 | ; CHECK: ret |
; IR form of the fist2 C snippet quoted in the preceding comment: the asm has
; an early-clobber output in {st} ("=&{st}") and %x is tied to that output via
; the "0" constraint; %p is an indirect memory operand. The asm result is
; returned.
define x86_fp80 @fist2(x86_fp80 %x, i32* %p) nounwind ssp {
entry:
  %y = tail call x86_fp80 asm "fistl $2", "=&{st},0,*m,~{memory},~{dirflag},~{fpsr},~{flags}"(x86_fp80 %x, i32* %p) nounwind
  ret x86_fp80 %y
}
| 223 | |
| 224 | ; An 'f' constraint is never implicitly popped: |
| 225 | ; |
| 226 | ; void fucomp1(long double x, long double y) { |
| 227 | ; asm volatile ("fucomp %1" : : "t"(x), "f"(y) : "st"); |
| 228 | ; } |
| 229 | ; CHECK: fucomp1 |
| 230 | ; CHECK: fldt |
| 231 | ; CHECK: fldt |
| 232 | ; CHECK: fucomp %st |
| 233 | ; CHECK: fstp |
| 234 | ; CHECK-NOT: fstp |
| 235 | ; CHECK: ret |
; IR form of the fucomp1 C snippet quoted in the preceding comment: %x is
; passed in {st} (and st is clobbered), while %y uses the generic 'f'
; constraint.
define void @fucomp1(x86_fp80 %x, x86_fp80 %y) nounwind ssp {
entry:
  tail call void asm sideeffect "fucomp $1", "{st},f,~{st},~{dirflag},~{fpsr},~{flags}"(x86_fp80 %x, x86_fp80 %y) nounwind
  ret void
}
| 241 | |
| 242 | ; The 'u' constraint is only popped implicitly when clobbered: |
| 243 | ; |
| 244 | ; void fucomp2(long double x, long double y) { |
| 245 | ; asm volatile ("fucomp %1" : : "t"(x), "u"(y) : "st"); |
| 246 | ; } |
| 247 | ; |
| 248 | ; void fucomp3(long double x, long double y) { |
| 249 | ; asm volatile ("fucompp %1" : : "t"(x), "u"(y) : "st", "st(1)"); |
| 250 | ; } |
| 251 | ; |
| 252 | ; CHECK: fucomp2 |
| 253 | ; CHECK: fldt |
| 254 | ; CHECK: fldt |
| 255 | ; CHECK: fucomp %st(1) |
| 256 | ; CHECK: fstp |
| 257 | ; CHECK-NOT: fstp |
| 258 | ; CHECK: ret |
| 259 | ; |
| 260 | ; CHECK: fucomp3 |
| 261 | ; CHECK: fldt |
| 262 | ; CHECK: fldt |
| 263 | ; CHECK: fucompp %st(1) |
| 264 | ; CHECK-NOT: fstp |
| 265 | ; CHECK: ret |
; IR form of the fucomp2 C snippet quoted in the preceding comment: %x is
; passed in {st} and %y in {st(1)}; only st appears in the clobber list.
define void @fucomp2(x86_fp80 %x, x86_fp80 %y) nounwind ssp {
entry:
  tail call void asm sideeffect "fucomp $1", "{st},{st(1)},~{st},~{dirflag},~{fpsr},~{flags}"(x86_fp80 %x, x86_fp80 %y) nounwind
  ret void
}
; IR form of the fucomp3 C snippet quoted in the preceding comment: %x is
; passed in {st} and %y in {st(1)}, and both st and st(1) appear in the
; clobber list.
define void @fucomp3(x86_fp80 %x, x86_fp80 %y) nounwind ssp {
entry:
  tail call void asm sideeffect "fucompp $1", "{st},{st(1)},~{st},~{st(1)},~{dirflag},~{fpsr},~{flags}"(x86_fp80 %x, x86_fp80 %y) nounwind
  ret void
}
| 276 | |
| 277 | ; One input, two outputs, one dead output. |
; Two-float aggregate used as the result type of the two-output "sincos" asm
; statements in the sincos tests.
%complex = type { float, float }
; CHECK: sincos1
; CHECK: flds
; CHECK-NOT: fxch
; CHECK: sincos
; CHECK-NOT: fstp
; CHECK: fstp %st(1)
; CHECK-NOT: fstp
; CHECK: ret
; The asm has outputs in {st} (element 0) and {st(1)} (element 1), with %x
; tied to the {st} output. Only element 0 is extracted and returned, so the
; {st(1)} output is dead.
define float @sincos1(float %x) nounwind ssp {
entry:
  %both = tail call %complex asm "sincos", "={st},={st(1)},0,~{dirflag},~{fpsr},~{flags}"(float %x) nounwind
  %from.st0 = extractvalue %complex %both, 0
  ret float %from.st0
}
| 293 | |
| 294 | ; Same thing, swapped output operands. |
| 295 | ; CHECK: sincos2 |
| 296 | ; CHECK: flds |
| 297 | ; CHECK-NOT: fxch |
| 298 | ; CHECK: sincos |
| 299 | ; CHECK-NOT: fstp |
| 300 | ; CHECK: fstp %st(1) |
| 301 | ; CHECK-NOT: fstp |
| 302 | ; CHECK: ret |
; Like sincos1 with the output operands listed in the opposite order: element 0
; is the {st(1)} output and element 1 is the {st} output, to which %x is tied.
; Element 1 (the {st} output) is returned.
define float @sincos2(float %x) nounwind ssp {
entry:
  %both = tail call %complex asm "sincos", "={st(1)},={st},1,~{dirflag},~{fpsr},~{flags}"(float %x) nounwind
  %from.st0 = extractvalue %complex %both, 1
  ret float %from.st0
}
| 309 | |
| 310 | ; Clobber st(0) after it was live-out/dead from the previous asm. |
| 311 | ; CHECK: sincos3 |
| 312 | ; Load x, make a copy for the second asm. |
| 313 | ; CHECK: flds |
| 314 | ; CHECK: fld %st(0) |
| 315 | ; CHECK: sincos |
| 316 | ; Discard dead result in st(0), bring x to the top. |
| 317 | ; CHECK: fstp %st(0) |
| 318 | ; CHECK: fxch |
| 319 | ; x is now in st(0) for the second asm |
| 320 | ; CHECK: sincos |
| 321 | ; Discard both results. |
| 322 | ; CHECK: fstp |
| 323 | ; CHECK: fstp |
| 324 | ; CHECK: ret |
; Runs the two-output "sincos" asm twice on the same %x (tied to the {st}
; output both times). Only element 0 of the first result, i.e. its {st(1)}
; output, is returned; the second asm's results are never used.
define float @sincos3(float %x) nounwind ssp {
entry:
  %first = tail call %complex asm sideeffect "sincos", "={st(1)},={st},1,~{dirflag},~{fpsr},~{flags}"(float %x) nounwind
  %second = tail call %complex asm sideeffect "sincos", "={st(1)},={st},1,~{dirflag},~{fpsr},~{flags}"(float %x) nounwind
  %from.st1 = extractvalue %complex %first, 0
  ret float %from.st1
}
Jakob Stoklund Olesen | 4f0ace5 | 2011-08-08 17:15:43 +0000 | [diff] [blame] | 332 | |
| 333 | ; Pass the same value in two fixed stack slots. |
| 334 | ; CHECK: PR10602 |
| 335 | ; CHECK: flds LCPI |
| 336 | ; CHECK: fld %st(0) |
| 337 | ; CHECK: fcomi %st(1), %st(0) |
; PR10602: the same double constant is supplied twice, once in {st} and once in
; {st(1)}. The i32 result is whatever the asm pops into its "=r" output
; operand.
define i32 @PR10602() nounwind ssp {
entry:
  %popped = tail call i32 asm "fcomi $2, $1; pushf; pop $0", "=r,{st},{st(1)},~{dirflag},~{fpsr},~{flags}"(double 2.0, double 2.0) nounwind
  ret i32 %popped
}