Alex Bradbury | 8cbdd48 | 2018-01-15 17:54:52 +0000 | [diff] [blame] | 1 | // RUN: %clang_cc1 -triple riscv32 -emit-llvm %s -o - | FileCheck %s |
Mandeep Singh Grang | ac24bb5 | 2018-02-25 03:58:23 +0000 | [diff] [blame^] | 2 | // RUN: %clang_cc1 -triple riscv32 -emit-llvm -fforce-enable-int128 %s -o - \ |
| 3 | // RUN: | FileCheck %s -check-prefixes=CHECK,CHECK-FORCEINT128 |
Alex Bradbury | 8cbdd48 | 2018-01-15 17:54:52 +0000 | [diff] [blame] | 4 | |
| 5 | #include <stddef.h> |
| 6 | #include <stdint.h> |
| 7 | |
| 8 | // CHECK-LABEL: define void @f_void() |
| 9 | void f_void(void) {} |
| 10 | |
| 11 | // Scalar arguments and return values smaller than the word size are extended |
| 12 | // according to the sign of their type, up to 32 bits |
| 13 | |
| 14 | // CHECK-LABEL: define zeroext i1 @f_scalar_0(i1 zeroext %x) |
| 15 | _Bool f_scalar_0(_Bool x) { return x; } |
| 16 | |
| 17 | // CHECK-LABEL: define signext i8 @f_scalar_1(i8 signext %x) |
| 18 | int8_t f_scalar_1(int8_t x) { return x; } |
| 19 | |
| 20 | // CHECK-LABEL: define zeroext i8 @f_scalar_2(i8 zeroext %x) |
| 21 | uint8_t f_scalar_2(uint8_t x) { return x; } |
| 22 | |
| 23 | // CHECK-LABEL: define i32 @f_scalar_3(i32 %x) |
| 24 | int32_t f_scalar_3(int32_t x) { return x; } |
| 25 | |
| 26 | // CHECK-LABEL: define i64 @f_scalar_4(i64 %x) |
| 27 | int64_t f_scalar_4(int64_t x) { return x; } |
| 28 | |
Mandeep Singh Grang | ac24bb5 | 2018-02-25 03:58:23 +0000 | [diff] [blame^] | 29 | #ifdef __SIZEOF_INT128__ |
| 30 | // CHECK-FORCEINT128-LABEL: define i128 @f_scalar_5(i128 %x) |
| 31 | __int128_t f_scalar_5(__int128_t x) { return x; } |
| 32 | #endif |
| 33 | |
Alex Bradbury | 8cbdd48 | 2018-01-15 17:54:52 +0000 | [diff] [blame] | 34 | // CHECK-LABEL: define float @f_fp_scalar_1(float %x) |
| 35 | float f_fp_scalar_1(float x) { return x; } |
| 36 | |
| 37 | // CHECK-LABEL: define double @f_fp_scalar_2(double %x) |
| 38 | double f_fp_scalar_2(double x) { return x; } |
| 39 | |
| 40 | // Scalars larger than 2*xlen are passed/returned indirect. However, the |
| 41 | // RISC-V LLVM backend can handle this fine, so the function doesn't need to |
| 42 | // be modified. |
| 43 | |
| 44 | // CHECK-LABEL: define fp128 @f_fp_scalar_3(fp128 %x) |
| 45 | long double f_fp_scalar_3(long double x) { return x; } |
| 46 | |
| 47 | // Empty structs or unions are ignored. |
| 48 | |
| 49 | struct empty_s {}; |
| 50 | |
| 51 | // CHECK-LABEL: define void @f_agg_empty_struct() |
| 52 | struct empty_s f_agg_empty_struct(struct empty_s x) { |
| 53 | return x; |
| 54 | } |
| 55 | |
| 56 | union empty_u {}; |
| 57 | |
| 58 | // CHECK-LABEL: define void @f_agg_empty_union() |
| 59 | union empty_u f_agg_empty_union(union empty_u x) { |
| 60 | return x; |
| 61 | } |
| 62 | |
| 63 | // Aggregates <= 2*xlen may be passed in registers, so will be coerced to |
| 64 | // integer arguments. The rules for return are the same. |
| 65 | |
| 66 | struct tiny { |
| 67 | uint8_t a, b, c, d; |
| 68 | }; |
| 69 | |
| 70 | // CHECK-LABEL: define void @f_agg_tiny(i32 %x.coerce) |
| 71 | void f_agg_tiny(struct tiny x) { |
| 72 | x.a += x.b; |
| 73 | x.c += x.d; |
| 74 | } |
| 75 | |
| 76 | // CHECK-LABEL: define i32 @f_agg_tiny_ret() |
| 77 | struct tiny f_agg_tiny_ret() { |
| 78 | return (struct tiny){1, 2, 3, 4}; |
| 79 | } |
| 80 | |
| 81 | typedef uint8_t v4i8 __attribute__((vector_size(4))); |
| 82 | typedef int32_t v1i32 __attribute__((vector_size(4))); |
| 83 | |
| 84 | // CHECK-LABEL: define void @f_vec_tiny_v4i8(i32 %x.coerce) |
| 85 | void f_vec_tiny_v4i8(v4i8 x) { |
| 86 | x[0] = x[1]; |
| 87 | x[2] = x[3]; |
| 88 | } |
| 89 | |
| 90 | // CHECK-LABEL: define i32 @f_vec_tiny_v4i8_ret() |
| 91 | v4i8 f_vec_tiny_v4i8_ret() { |
| 92 | return (v4i8){1, 2, 3, 4}; |
| 93 | } |
| 94 | |
| 95 | // CHECK-LABEL: define void @f_vec_tiny_v1i32(i32 %x.coerce) |
| 96 | void f_vec_tiny_v1i32(v1i32 x) { |
| 97 | x[0] = 114; |
| 98 | } |
| 99 | |
| 100 | // CHECK-LABEL: define i32 @f_vec_tiny_v1i32_ret() |
| 101 | v1i32 f_vec_tiny_v1i32_ret() { |
| 102 | return (v1i32){1}; |
| 103 | } |
| 104 | |
| 105 | struct small { |
| 106 | int32_t a, *b; |
| 107 | }; |
| 108 | |
| 109 | // CHECK-LABEL: define void @f_agg_small([2 x i32] %x.coerce) |
| 110 | void f_agg_small(struct small x) { |
| 111 | x.a += *x.b; |
| 112 | x.b = &x.a; |
| 113 | } |
| 114 | |
| 115 | // CHECK-LABEL: define [2 x i32] @f_agg_small_ret() |
| 116 | struct small f_agg_small_ret() { |
| 117 | return (struct small){1, 0}; |
| 118 | } |
| 119 | |
| 120 | typedef uint8_t v8i8 __attribute__((vector_size(8))); |
| 121 | typedef int64_t v1i64 __attribute__((vector_size(8))); |
| 122 | |
| 123 | // CHECK-LABEL: define void @f_vec_small_v8i8(i64 %x.coerce) |
| 124 | void f_vec_small_v8i8(v8i8 x) { |
| 125 | x[0] = x[7]; |
| 126 | } |
| 127 | |
| 128 | // CHECK-LABEL: define i64 @f_vec_small_v8i8_ret() |
| 129 | v8i8 f_vec_small_v8i8_ret() { |
| 130 | return (v8i8){1, 2, 3, 4, 5, 6, 7, 8}; |
| 131 | } |
| 132 | |
| 133 | // CHECK-LABEL: define void @f_vec_small_v1i64(i64 %x.coerce) |
| 134 | void f_vec_small_v1i64(v1i64 x) { |
| 135 | x[0] = 114; |
| 136 | } |
| 137 | |
| 138 | // CHECK-LABEL: define i64 @f_vec_small_v1i64_ret() |
| 139 | v1i64 f_vec_small_v1i64_ret() { |
| 140 | return (v1i64){1}; |
| 141 | } |
| 142 | |
| 143 | // Aggregates of 2*xlen size and 2*xlen alignment should be coerced to a |
| 144 | // single 2*xlen-sized argument, to ensure that alignment can be maintained if |
| 145 | // passed on the stack. |
| 146 | |
| 147 | struct small_aligned { |
| 148 | int64_t a; |
| 149 | }; |
| 150 | |
| 151 | // CHECK-LABEL: define void @f_agg_small_aligned(i64 %x.coerce) |
| 152 | void f_agg_small_aligned(struct small_aligned x) { |
| 153 | x.a += x.a; |
| 154 | } |
| 155 | |
| 156 | // CHECK-LABEL: define i64 @f_agg_small_aligned_ret(i64 %x.coerce) |
| 157 | struct small_aligned f_agg_small_aligned_ret(struct small_aligned x) { |
| 158 | return (struct small_aligned){10}; |
| 159 | } |
| 160 | |
| 161 | // Aggregates greater > 2*xlen will be passed and returned indirectly |
| 162 | struct large { |
| 163 | int32_t a, b, c, d; |
| 164 | }; |
| 165 | |
| 166 | // CHECK-LABEL: define void @f_agg_large(%struct.large* %x) |
| 167 | void f_agg_large(struct large x) { |
| 168 | x.a = x.b + x.c + x.d; |
| 169 | } |
| 170 | |
| 171 | // The address where the struct should be written to will be the first |
| 172 | // argument |
| 173 | // CHECK-LABEL: define void @f_agg_large_ret(%struct.large* noalias sret %agg.result, i32 %i, i8 signext %j) |
| 174 | struct large f_agg_large_ret(int32_t i, int8_t j) { |
| 175 | return (struct large){1, 2, 3, 4}; |
| 176 | } |
| 177 | |
| 178 | typedef unsigned char v16i8 __attribute__((vector_size(16))); |
| 179 | |
| 180 | // CHECK-LABEL: define void @f_vec_large_v16i8(<16 x i8>*) |
| 181 | void f_vec_large_v16i8(v16i8 x) { |
| 182 | x[0] = x[7]; |
| 183 | } |
| 184 | |
| 185 | // CHECK-LABEL: define void @f_vec_large_v16i8_ret(<16 x i8>* noalias sret %agg.result) |
| 186 | v16i8 f_vec_large_v16i8_ret() { |
| 187 | return (v16i8){1, 2, 3, 4, 5, 6, 7, 8}; |
| 188 | } |
| 189 | |
| 190 | // Scalars passed on the stack should have signext/zeroext attributes (they |
| 191 | // are anyext). |
| 192 | |
| 193 | // CHECK-LABEL: define i32 @f_scalar_stack_1(i32 %a.coerce, [2 x i32] %b.coerce, i64 %c.coerce, %struct.large* %d, i8 zeroext %e, i8 signext %f, i8 %g, i8 %h) |
| 194 | int f_scalar_stack_1(struct tiny a, struct small b, struct small_aligned c, |
| 195 | struct large d, uint8_t e, int8_t f, uint8_t g, int8_t h) { |
| 196 | return g + h; |
| 197 | } |
| 198 | |
| 199 | // CHECK-LABEL: define i32 @f_scalar_stack_2(i32 %a, i64 %b, float %c, double %d, fp128 %e, i8 zeroext %f, i8 %g, i8 %h) |
| 200 | int f_scalar_stack_2(int32_t a, int64_t b, float c, double d, long double e, |
| 201 | uint8_t f, int8_t g, uint8_t h) { |
| 202 | return g + h; |
| 203 | } |
| 204 | |
| 205 | // Ensure that scalars passed on the stack are still determined correctly in |
| 206 | // the presence of large return values that consume a register due to the need |
| 207 | // to pass a pointer. |
| 208 | |
| 209 | // CHECK-LABEL: define void @f_scalar_stack_3(%struct.large* noalias sret %agg.result, i32 %a, i64 %b, double %c, fp128 %d, i8 zeroext %e, i8 %f, i8 %g) |
| 210 | struct large f_scalar_stack_3(int32_t a, int64_t b, double c, long double d, |
| 211 | uint8_t e, int8_t f, uint8_t g) { |
| 212 | return (struct large){a, e, f, g}; |
| 213 | } |
| 214 | |
| 215 | // CHECK-LABEL: define fp128 @f_scalar_stack_4(i32 %a, i64 %b, double %c, fp128 %d, i8 zeroext %e, i8 %f, i8 %g) |
| 216 | long double f_scalar_stack_4(int32_t a, int64_t b, double c, long double d, |
| 217 | uint8_t e, int8_t f, uint8_t g) { |
| 218 | return d; |
| 219 | } |
| 220 | |
| 221 | // Aggregates and >=XLen scalars passed on the stack should be lowered just as |
| 222 | // they would be if passed via registers. |
| 223 | |
| 224 | // CHECK-LABEL: define void @f_scalar_stack_5(double %a, i64 %b, double %c, i64 %d, i32 %e, i64 %f, float %g, double %h, fp128 %i) |
| 225 | void f_scalar_stack_5(double a, int64_t b, double c, int64_t d, int e, |
| 226 | int64_t f, float g, double h, long double i) {} |
| 227 | |
| 228 | // CHECK-LABEL: define void @f_agg_stack(double %a, i64 %b, double %c, i64 %d, i32 %e.coerce, [2 x i32] %f.coerce, i64 %g.coerce, %struct.large* %h) |
| 229 | void f_agg_stack(double a, int64_t b, double c, int64_t d, struct tiny e, |
| 230 | struct small f, struct small_aligned g, struct large h) {} |
| 231 | |
| 232 | // Ensure that ABI lowering happens as expected for vararg calls. For RV32 |
| 233 | // with the base integer calling convention there will be no observable |
| 234 | // differences in the lowered IR for a call with varargs vs without. |
| 235 | |
| 236 | int f_va_callee(int, ...); |
| 237 | |
| 238 | // CHECK-LABEL: define void @f_va_caller() |
| 239 | // CHECK: call i32 (i32, ...) @f_va_callee(i32 1, i32 2, i64 3, double 4.000000e+00, double 5.000000e+00, i32 {{%.*}}, [2 x i32] {{%.*}}, i64 {{%.*}}, %struct.large* {{%.*}}) |
| 240 | void f_va_caller() { |
| 241 | f_va_callee(1, 2, 3LL, 4.0f, 5.0, (struct tiny){6, 7, 8, 9}, |
| 242 | (struct small){10, NULL}, (struct small_aligned){11}, |
| 243 | (struct large){12, 13, 14, 15}); |
| 244 | } |
| 245 | |
| 246 | // CHECK-LABEL: define i32 @f_va_1(i8* %fmt, ...) {{.*}} { |
| 247 | // CHECK: [[FMT_ADDR:%.*]] = alloca i8*, align 4 |
| 248 | // CHECK: [[VA:%.*]] = alloca i8*, align 4 |
| 249 | // CHECK: [[V:%.*]] = alloca i32, align 4 |
| 250 | // CHECK: store i8* %fmt, i8** [[FMT_ADDR]], align 4 |
| 251 | // CHECK: [[VA1:%.*]] = bitcast i8** [[VA]] to i8* |
| 252 | // CHECK: call void @llvm.va_start(i8* [[VA1]]) |
| 253 | // CHECK: [[ARGP_CUR:%.*]] = load i8*, i8** [[VA]], align 4 |
| 254 | // CHECK: [[ARGP_NEXT:%.*]] = getelementptr inbounds i8, i8* [[ARGP_CUR]], i32 4 |
| 255 | // CHECK: store i8* [[ARGP_NEXT]], i8** [[VA]], align 4 |
| 256 | // CHECK: [[TMP0:%.*]] = bitcast i8* [[ARGP_CUR]] to i32* |
| 257 | // CHECK: [[TMP1:%.*]] = load i32, i32* [[TMP0]], align 4 |
| 258 | // CHECK: store i32 [[TMP1]], i32* [[V]], align 4 |
| 259 | // CHECK: [[VA2:%.*]] = bitcast i8** [[VA]] to i8* |
| 260 | // CHECK: call void @llvm.va_end(i8* [[VA2]]) |
| 261 | // CHECK: [[TMP2:%.*]] = load i32, i32* [[V]], align 4 |
| 262 | // CHECK: ret i32 [[TMP2]] |
| 263 | // CHECK: } |
| 264 | int f_va_1(char *fmt, ...) { |
| 265 | __builtin_va_list va; |
| 266 | |
| 267 | __builtin_va_start(va, fmt); |
| 268 | int v = __builtin_va_arg(va, int); |
| 269 | __builtin_va_end(va); |
| 270 | |
| 271 | return v; |
| 272 | } |
| 273 | |
| 274 | // An "aligned" register pair (where the first register is even-numbered) is |
| 275 | // used to pass varargs with 2x xlen alignment and 2x xlen size. Ensure the |
| 276 | // correct offsets are used. |
| 277 | |
| 278 | // CHECK-LABEL: @f_va_2( |
Alex Bradbury | 78b2c68 | 2018-01-15 20:45:15 +0000 | [diff] [blame] | 279 | // CHECK: [[FMT_ADDR:%.*]] = alloca i8*, align 4 |
Alex Bradbury | 8cbdd48 | 2018-01-15 17:54:52 +0000 | [diff] [blame] | 280 | // CHECK-NEXT: [[VA:%.*]] = alloca i8*, align 4 |
| 281 | // CHECK-NEXT: [[V:%.*]] = alloca double, align 8 |
| 282 | // CHECK-NEXT: store i8* [[FMT:%.*]], i8** [[FMT_ADDR]], align 4 |
| 283 | // CHECK-NEXT: [[VA1:%.*]] = bitcast i8** [[VA]] to i8* |
| 284 | // CHECK-NEXT: call void @llvm.va_start(i8* [[VA1]]) |
| 285 | // CHECK-NEXT: [[ARGP_CUR:%.*]] = load i8*, i8** [[VA]], align 4 |
| 286 | // CHECK-NEXT: [[TMP0:%.*]] = ptrtoint i8* [[ARGP_CUR]] to i32 |
| 287 | // CHECK-NEXT: [[TMP1:%.*]] = add i32 [[TMP0]], 7 |
| 288 | // CHECK-NEXT: [[TMP2:%.*]] = and i32 [[TMP1]], -8 |
| 289 | // CHECK-NEXT: [[ARGP_CUR_ALIGNED:%.*]] = inttoptr i32 [[TMP2]] to i8* |
| 290 | // CHECK-NEXT: [[ARGP_NEXT:%.*]] = getelementptr inbounds i8, i8* [[ARGP_CUR_ALIGNED]], i32 8 |
| 291 | // CHECK-NEXT: store i8* [[ARGP_NEXT]], i8** [[VA]], align 4 |
| 292 | // CHECK-NEXT: [[TMP3:%.*]] = bitcast i8* [[ARGP_CUR_ALIGNED]] to double* |
| 293 | // CHECK-NEXT: [[TMP4:%.*]] = load double, double* [[TMP3]], align 8 |
| 294 | // CHECK-NEXT: store double [[TMP4]], double* [[V]], align 8 |
| 295 | // CHECK-NEXT: [[VA2:%.*]] = bitcast i8** [[VA]] to i8* |
| 296 | // CHECK-NEXT: call void @llvm.va_end(i8* [[VA2]]) |
| 297 | // CHECK-NEXT: [[TMP5:%.*]] = load double, double* [[V]], align 8 |
| 298 | // CHECK-NEXT: ret double [[TMP5]] |
| 299 | double f_va_2(char *fmt, ...) { |
| 300 | __builtin_va_list va; |
| 301 | |
| 302 | __builtin_va_start(va, fmt); |
| 303 | double v = __builtin_va_arg(va, double); |
| 304 | __builtin_va_end(va); |
| 305 | |
| 306 | return v; |
| 307 | } |
| 308 | |
| 309 | // Two "aligned" register pairs. |
| 310 | |
| 311 | // CHECK-LABEL: @f_va_3( |
Alex Bradbury | 78b2c68 | 2018-01-15 20:45:15 +0000 | [diff] [blame] | 312 | // CHECK: [[FMT_ADDR:%.*]] = alloca i8*, align 4 |
Alex Bradbury | 8cbdd48 | 2018-01-15 17:54:52 +0000 | [diff] [blame] | 313 | // CHECK-NEXT: [[VA:%.*]] = alloca i8*, align 4 |
| 314 | // CHECK-NEXT: [[V:%.*]] = alloca double, align 8 |
| 315 | // CHECK-NEXT: [[W:%.*]] = alloca i32, align 4 |
| 316 | // CHECK-NEXT: [[X:%.*]] = alloca double, align 8 |
| 317 | // CHECK-NEXT: store i8* [[FMT:%.*]], i8** [[FMT_ADDR]], align 4 |
| 318 | // CHECK-NEXT: [[VA1:%.*]] = bitcast i8** [[VA]] to i8* |
| 319 | // CHECK-NEXT: call void @llvm.va_start(i8* [[VA1]]) |
| 320 | // CHECK-NEXT: [[ARGP_CUR:%.*]] = load i8*, i8** [[VA]], align 4 |
| 321 | // CHECK-NEXT: [[TMP0:%.*]] = ptrtoint i8* [[ARGP_CUR]] to i32 |
| 322 | // CHECK-NEXT: [[TMP1:%.*]] = add i32 [[TMP0]], 7 |
| 323 | // CHECK-NEXT: [[TMP2:%.*]] = and i32 [[TMP1]], -8 |
| 324 | // CHECK-NEXT: [[ARGP_CUR_ALIGNED:%.*]] = inttoptr i32 [[TMP2]] to i8* |
| 325 | // CHECK-NEXT: [[ARGP_NEXT:%.*]] = getelementptr inbounds i8, i8* [[ARGP_CUR_ALIGNED]], i32 8 |
| 326 | // CHECK-NEXT: store i8* [[ARGP_NEXT]], i8** [[VA]], align 4 |
| 327 | // CHECK-NEXT: [[TMP3:%.*]] = bitcast i8* [[ARGP_CUR_ALIGNED]] to double* |
| 328 | // CHECK-NEXT: [[TMP4:%.*]] = load double, double* [[TMP3]], align 8 |
| 329 | // CHECK-NEXT: store double [[TMP4]], double* [[V]], align 8 |
| 330 | // CHECK-NEXT: [[ARGP_CUR2:%.*]] = load i8*, i8** [[VA]], align 4 |
| 331 | // CHECK-NEXT: [[ARGP_NEXT3:%.*]] = getelementptr inbounds i8, i8* [[ARGP_CUR2]], i32 4 |
| 332 | // CHECK-NEXT: store i8* [[ARGP_NEXT3]], i8** [[VA]], align 4 |
| 333 | // CHECK-NEXT: [[TMP5:%.*]] = bitcast i8* [[ARGP_CUR2]] to i32* |
| 334 | // CHECK-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP5]], align 4 |
| 335 | // CHECK-NEXT: store i32 [[TMP6]], i32* [[W]], align 4 |
| 336 | // CHECK-NEXT: [[ARGP_CUR4:%.*]] = load i8*, i8** [[VA]], align 4 |
| 337 | // CHECK-NEXT: [[TMP7:%.*]] = ptrtoint i8* [[ARGP_CUR4]] to i32 |
| 338 | // CHECK-NEXT: [[TMP8:%.*]] = add i32 [[TMP7]], 7 |
| 339 | // CHECK-NEXT: [[TMP9:%.*]] = and i32 [[TMP8]], -8 |
| 340 | // CHECK-NEXT: [[ARGP_CUR4_ALIGNED:%.*]] = inttoptr i32 [[TMP9]] to i8* |
| 341 | // CHECK-NEXT: [[ARGP_NEXT5:%.*]] = getelementptr inbounds i8, i8* [[ARGP_CUR4_ALIGNED]], i32 8 |
| 342 | // CHECK-NEXT: store i8* [[ARGP_NEXT5]], i8** [[VA]], align 4 |
| 343 | // CHECK-NEXT: [[TMP10:%.*]] = bitcast i8* [[ARGP_CUR4_ALIGNED]] to double* |
| 344 | // CHECK-NEXT: [[TMP11:%.*]] = load double, double* [[TMP10]], align 8 |
| 345 | // CHECK-NEXT: store double [[TMP11]], double* [[X]], align 8 |
| 346 | // CHECK-NEXT: [[VA6:%.*]] = bitcast i8** [[VA]] to i8* |
| 347 | // CHECK-NEXT: call void @llvm.va_end(i8* [[VA6]]) |
| 348 | // CHECK-NEXT: [[TMP12:%.*]] = load double, double* [[V]], align 8 |
| 349 | // CHECK-NEXT: [[TMP13:%.*]] = load double, double* [[X]], align 8 |
| 350 | // CHECK-NEXT: [[ADD:%.*]] = fadd double [[TMP12]], [[TMP13]] |
| 351 | // CHECK-NEXT: ret double [[ADD]] |
| 352 | double f_va_3(char *fmt, ...) { |
| 353 | __builtin_va_list va; |
| 354 | |
| 355 | __builtin_va_start(va, fmt); |
| 356 | double v = __builtin_va_arg(va, double); |
| 357 | int w = __builtin_va_arg(va, int); |
| 358 | double x = __builtin_va_arg(va, double); |
| 359 | __builtin_va_end(va); |
| 360 | |
| 361 | return v + x; |
| 362 | } |
| 363 | |
| 364 | // CHECK-LABEL: define i32 @f_va_4(i8* %fmt, ...) {{.*}} { |
Alex Bradbury | 78b2c68 | 2018-01-15 20:45:15 +0000 | [diff] [blame] | 365 | // CHECK: [[FMT_ADDR:%.*]] = alloca i8*, align 4 |
Alex Bradbury | 8cbdd48 | 2018-01-15 17:54:52 +0000 | [diff] [blame] | 366 | // CHECK-NEXT: [[VA:%.*]] = alloca i8*, align 4 |
| 367 | // CHECK-NEXT: [[V:%.*]] = alloca i32, align 4 |
| 368 | // CHECK-NEXT: [[LD:%.*]] = alloca fp128, align 16 |
| 369 | // CHECK-NEXT: [[TS:%.*]] = alloca [[STRUCT_TINY:%.*]], align 1 |
| 370 | // CHECK-NEXT: [[SS:%.*]] = alloca [[STRUCT_SMALL:%.*]], align 4 |
| 371 | // CHECK-NEXT: [[LS:%.*]] = alloca [[STRUCT_LARGE:%.*]], align 4 |
| 372 | // CHECK-NEXT: [[RET:%.*]] = alloca i32, align 4 |
| 373 | // CHECK-NEXT: store i8* [[FMT:%.*]], i8** [[FMT_ADDR]], align 4 |
| 374 | // CHECK-NEXT: [[VA1:%.*]] = bitcast i8** [[VA]] to i8* |
| 375 | // CHECK-NEXT: call void @llvm.va_start(i8* [[VA1]]) |
| 376 | // CHECK-NEXT: [[ARGP_CUR:%.*]] = load i8*, i8** [[VA]], align 4 |
| 377 | // CHECK-NEXT: [[ARGP_NEXT:%.*]] = getelementptr inbounds i8, i8* [[ARGP_CUR]], i32 4 |
| 378 | // CHECK-NEXT: store i8* [[ARGP_NEXT]], i8** [[VA]], align 4 |
| 379 | // CHECK-NEXT: [[TMP0:%.*]] = bitcast i8* [[ARGP_CUR]] to i32* |
| 380 | // CHECK-NEXT: [[TMP1:%.*]] = load i32, i32* [[TMP0]], align 4 |
| 381 | // CHECK-NEXT: store i32 [[TMP1]], i32* [[V]], align 4 |
| 382 | // CHECK-NEXT: [[ARGP_CUR2:%.*]] = load i8*, i8** [[VA]], align 4 |
| 383 | // CHECK-NEXT: [[ARGP_NEXT3:%.*]] = getelementptr inbounds i8, i8* [[ARGP_CUR2]], i32 4 |
| 384 | // CHECK-NEXT: store i8* [[ARGP_NEXT3]], i8** [[VA]], align 4 |
| 385 | // CHECK-NEXT: [[TMP2:%.*]] = bitcast i8* [[ARGP_CUR2]] to fp128** |
| 386 | // CHECK-NEXT: [[TMP3:%.*]] = load fp128*, fp128** [[TMP2]], align 4 |
| 387 | // CHECK-NEXT: [[TMP4:%.*]] = load fp128, fp128* [[TMP3]], align 16 |
| 388 | // CHECK-NEXT: store fp128 [[TMP4]], fp128* [[LD]], align 16 |
| 389 | // CHECK-NEXT: [[ARGP_CUR4:%.*]] = load i8*, i8** [[VA]], align 4 |
| 390 | // CHECK-NEXT: [[ARGP_NEXT5:%.*]] = getelementptr inbounds i8, i8* [[ARGP_CUR4]], i32 4 |
| 391 | // CHECK-NEXT: store i8* [[ARGP_NEXT5]], i8** [[VA]], align 4 |
| 392 | // CHECK-NEXT: [[TMP5:%.*]] = bitcast i8* [[ARGP_CUR4]] to %struct.tiny* |
| 393 | // CHECK-NEXT: [[TMP6:%.*]] = bitcast %struct.tiny* [[TS]] to i8* |
| 394 | // CHECK-NEXT: [[TMP7:%.*]] = bitcast %struct.tiny* [[TMP5]] to i8* |
Daniel Neilson | c8bdc8d | 2018-01-28 17:27:45 +0000 | [diff] [blame] | 395 | // CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 [[TMP6]], i8* align 4 [[TMP7]], i32 4, i1 false) |
Alex Bradbury | 8cbdd48 | 2018-01-15 17:54:52 +0000 | [diff] [blame] | 396 | // CHECK-NEXT: [[ARGP_CUR6:%.*]] = load i8*, i8** [[VA]], align 4 |
| 397 | // CHECK-NEXT: [[ARGP_NEXT7:%.*]] = getelementptr inbounds i8, i8* [[ARGP_CUR6]], i32 8 |
| 398 | // CHECK-NEXT: store i8* [[ARGP_NEXT7]], i8** [[VA]], align 4 |
| 399 | // CHECK-NEXT: [[TMP8:%.*]] = bitcast i8* [[ARGP_CUR6]] to %struct.small* |
| 400 | // CHECK-NEXT: [[TMP9:%.*]] = bitcast %struct.small* [[SS]] to i8* |
| 401 | // CHECK-NEXT: [[TMP10:%.*]] = bitcast %struct.small* [[TMP8]] to i8* |
Daniel Neilson | 6e938ef | 2018-01-19 17:12:54 +0000 | [diff] [blame] | 402 | // CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 4 [[TMP9]], i8* align 4 [[TMP10]], i32 8, i1 false) |
Alex Bradbury | 8cbdd48 | 2018-01-15 17:54:52 +0000 | [diff] [blame] | 403 | // CHECK-NEXT: [[ARGP_CUR8:%.*]] = load i8*, i8** [[VA]], align 4 |
| 404 | // CHECK-NEXT: [[ARGP_NEXT9:%.*]] = getelementptr inbounds i8, i8* [[ARGP_CUR8]], i32 4 |
| 405 | // CHECK-NEXT: store i8* [[ARGP_NEXT9]], i8** [[VA]], align 4 |
| 406 | // CHECK-NEXT: [[TMP11:%.*]] = bitcast i8* [[ARGP_CUR8]] to %struct.large** |
| 407 | // CHECK-NEXT: [[TMP12:%.*]] = load %struct.large*, %struct.large** [[TMP11]], align 4 |
| 408 | // CHECK-NEXT: [[TMP13:%.*]] = bitcast %struct.large* [[LS]] to i8* |
| 409 | // CHECK-NEXT: [[TMP14:%.*]] = bitcast %struct.large* [[TMP12]] to i8* |
Daniel Neilson | 6e938ef | 2018-01-19 17:12:54 +0000 | [diff] [blame] | 410 | // CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 4 [[TMP13]], i8* align 4 [[TMP14]], i32 16, i1 false) |
Alex Bradbury | 8cbdd48 | 2018-01-15 17:54:52 +0000 | [diff] [blame] | 411 | // CHECK-NEXT: [[VA10:%.*]] = bitcast i8** [[VA]] to i8* |
| 412 | // CHECK-NEXT: call void @llvm.va_end(i8* [[VA10]]) |
| 413 | int f_va_4(char *fmt, ...) { |
| 414 | __builtin_va_list va; |
| 415 | |
| 416 | __builtin_va_start(va, fmt); |
| 417 | int v = __builtin_va_arg(va, int); |
| 418 | long double ld = __builtin_va_arg(va, long double); |
| 419 | struct tiny ts = __builtin_va_arg(va, struct tiny); |
| 420 | struct small ss = __builtin_va_arg(va, struct small); |
| 421 | struct large ls = __builtin_va_arg(va, struct large); |
| 422 | __builtin_va_end(va); |
| 423 | |
| 424 | int ret = (int)((long double)v + ld); |
| 425 | ret = ret + ts.a + ts.b + ts.c + ts.d; |
| 426 | ret = ret + ss.a + (int)ss.b; |
| 427 | ret = ret + ls.a + ls.b + ls.c + ls.d; |
| 428 | |
| 429 | return ret; |
| 430 | } |