// REQUIRES: arm-registered-target
// RUN: %clang_cc1 -triple thumbv7-apple-darwin9 \
// RUN:   -target-abi aapcs \
// RUN:   -target-cpu cortex-a8 \
// RUN:   -mfloat-abi hard \
// RUN:   -ffreestanding \
// RUN:   -emit-llvm -w -o - %s | FileCheck %s

// RUN: %clang_cc1 -triple armv7-unknown-nacl-gnueabi \
// RUN:  -target-cpu cortex-a8 \
// RUN:  -mfloat-abi hard \
// RUN:  -ffreestanding \
// RUN:  -emit-llvm -w -o - %s | FileCheck %s

// RUN: %clang_cc1 -triple arm64-apple-darwin9 -target-feature +neon \
// RUN:   -ffreestanding \
// RUN:   -emit-llvm -w -o - %s | FileCheck -check-prefix=CHECK64 %s

19#ifdef __arm64__
20#include <arm_neon.h>
21#else
22#include <arm_neon.h>
23#endif
24
// Aggregate whose members are all float: a two-element float array followed
// by two scalar floats, four floats in total.
struct homogeneous_struct {
  float f[2];
  float f3;
  float f4;
};
30// CHECK: define arm_aapcs_vfpcc %struct.homogeneous_struct @test_struct(%struct.homogeneous_struct %{{.*}})
31// CHECK64: define %struct.homogeneous_struct @test_struct(float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}})
32extern struct homogeneous_struct struct_callee(struct homogeneous_struct);
33struct homogeneous_struct test_struct(struct homogeneous_struct arg) {
34  return struct_callee(arg);
35}
36
37// CHECK: define arm_aapcs_vfpcc void @test_struct_variadic(%struct.homogeneous_struct* {{.*}}, ...)
38struct homogeneous_struct test_struct_variadic(struct homogeneous_struct arg, ...) {
39  return struct_callee(arg);
40}
41
// Aggregate whose only member is an array of four doubles.
struct nested_array {
  double d[4];
};
45// CHECK: define arm_aapcs_vfpcc void @test_array(%struct.nested_array %{{.*}})
46// CHECK64: define void @test_array(double %{{.*}}, double %{{.*}}, double %{{.*}}, double %{{.*}})
47extern void array_callee(struct nested_array);
48void test_array(struct nested_array arg) {
49  array_callee(arg);
50}
51
// Passes a complex double by value.
// The 32-bit runs expect a { double, double } parameter; the arm64 run
// expects two separate double parameters.
extern void complex_callee(__complex__ double);
// CHECK: define arm_aapcs_vfpcc void @test_complex({ double, double } %{{.*}})
// CHECK64: define void @test_complex(double %{{.*}}, double %{{.*}})
void test_complex(__complex__ double cd) {
  complex_callee(cd);
}

// Long double is the same as double on AAPCS, it should be homogeneous.
// The 32-bit runs expect the complex long double parameter to be lowered to
// { double, double }.
extern void complex_long_callee(__complex__ long double);
// CHECK: define arm_aapcs_vfpcc void @test_complex_long({ double, double } %{{.*}})
void test_complex_long(__complex__ long double cd) {
  // Forward to the long-double callee declared for this test, so the call
  // uses the same argument type as the parameter under test.
  complex_long_callee(cd);
}

// Structs with more than 4 elements of the base type are not treated
// as homogeneous aggregates.  Test that.

// Five floats in total: one scalar, a two-element array, then two scalars.
struct big_struct {
  float f1;
  float f[2];
  float f3;
  float f4;
};
75// CHECK: define arm_aapcs_vfpcc void @test_big({ [5 x i32] } %{{.*}})
76// CHECK64: define void @test_big(%struct.big_struct* %{{.*}})
77// CHECK64: call void @llvm.memcpy
78// CHECK64: call void @big_callee(%struct.big_struct*
79extern void big_callee(struct big_struct);
80void test_big(struct big_struct arg) {
81  big_callee(arg);
82}
83
// Make sure that aggregates with multiple base types are not treated as
// homogeneous aggregates.

// One float member followed by one int member.
struct heterogeneous_struct {
  float f1;
  int i2;
};
91// CHECK: define arm_aapcs_vfpcc void @test_hetero({ [2 x i32] } %{{.*}})
92// CHECK64: define void @test_hetero(i64 %{{.*}})
93extern void hetero_callee(struct heterogeneous_struct);
94void test_hetero(struct heterogeneous_struct arg) {
95  hetero_callee(arg);
96}
97
98// Neon multi-vector types are homogeneous aggregates.
99// CHECK: define arm_aapcs_vfpcc <16 x i8> @f0(%struct.int8x16x4_t %{{.*}})
100// CHECK64: define <16 x i8> @f0(<16 x i8> %{{.*}}, <16 x i8> %{{.*}}, <16 x i8> %{{.*}}, <16 x i8> %{{.*}})
101int8x16_t f0(int8x16x4_t v4) {
102  return vaddq_s8(v4.val[0], v4.val[3]);
103}
104
105// ...and it doesn't matter whether the vectors are exactly the same, as long
106// as they have the same size.
107
108struct neon_struct {
109  int8x8x2_t v12;
110  int32x2_t v3;
111  int16x4_t v4;
112};
113// CHECK: define arm_aapcs_vfpcc void @test_neon(%struct.neon_struct %{{.*}})
114// CHECK64: define void @test_neon(<8 x i8> %{{.*}}, <8 x i8> %{{.*}}, <2 x i32> %{{.*}}, <4 x i16> %{{.*}})
115extern void neon_callee(struct neon_struct);
116void test_neon(struct neon_struct arg) {
117  neon_callee(arg);
118}
119
// A struct holding a 32*32-byte char buffer, taken by value by an empty
// function. The 32-bit runs expect the argument to be passed byval with
// alignment 1.
// CHECK-LABEL: define arm_aapcs_vfpcc void @f33(%struct.s33* byval align 1 %s)
struct s33 { char buf[32*32]; };
void f33(struct s33 s) { }

// A long long followed by an int; used as the trailing struct argument in the
// VFP/GPR split tests.
typedef struct { long long x; int y; } struct_long_long_int;
// Nine doubles followed by int, long long, int. The 32-bit runs expect every
// parameter to keep its natural IR type (double, i32, i64, i32) with no extra
// parameters inserted.
// CHECK: define arm_aapcs_vfpcc void @test_vfp_stack_gpr_split_1(double %a, double %b, double %c, double %d, double %e, double %f, double %g, double %h, double %i, i32 %j, i64 %k, i32 %l)
void test_vfp_stack_gpr_split_1(double a, double b, double c, double d, double e, double f, double g, double h, double i, int j, long long k, int l) {}

128// CHECK: define arm_aapcs_vfpcc void @test_vfp_stack_gpr_split_2(double %a, double %b, double %c, double %d, double %e, double %f, double %g, double %h, double %i, i32 %j, [3 x i32], { [2 x i64] } %k.coerce)
129void test_vfp_stack_gpr_split_2(double a, double b, double c, double d, double e, double f, double g, double h, double i, int j, struct_long_long_int k) {}
130
131// CHECK: define arm_aapcs_vfpcc void @test_vfp_stack_gpr_split_3(%struct.struct_long_long_int* noalias sret %agg.result, double %a, double %b, double %c, double %d, double %e, double %f, double %g, double %h, double %i, [3 x i32], { [2 x i64] } %k.coerce)
132struct_long_long_int test_vfp_stack_gpr_split_3(double a, double b, double c, double d, double e, double f, double g, double h, double i, struct_long_long_int k) {}
133
// Struct with an int, a 4-bit int bit-field and another int. After nine
// doubles and two ints, the 32-bit runs expect an unnamed [2 x i32] parameter
// ahead of the struct, which is coerced to { [3 x i32] }.
typedef struct { int a; int b:4; int c; } struct_int_bitfield_int;
// CHECK: define arm_aapcs_vfpcc void @test_test_vfp_stack_gpr_split_bitfield(double %a, double %b, double %c, double %d, double %e, double %f, double %g, double %h, double %i, i32 %j, i32 %k, [2 x i32], { [3 x i32] } %l.coerce)
void test_test_vfp_stack_gpr_split_bitfield(double a, double b, double c, double d, double e, double f, double g, double h, double i, int j, int k, struct_int_bitfield_int l) {}

// Note: this struct requires internal padding
// (an int followed by a long long). After nine doubles and an int, the 32-bit
// runs expect an unnamed [3 x i32] parameter ahead of the struct, which is
// coerced to { [2 x i64] }.
typedef struct { int x; long long y; } struct_int_long_long;
// CHECK: define arm_aapcs_vfpcc void @test_vfp_stack_gpr_split_4(double %a, double %b, double %c, double %d, double %e, double %f, double %g, double %h, double %i, i32 %j, [3 x i32], { [2 x i64] } %k.coerce)
void test_vfp_stack_gpr_split_4(double a, double b, double c, double d, double e, double f, double g, double h, double i, int j, struct_int_long_long k) {}

// This very large struct (passed byval) uses up the GPRs, so no padding is needed
// The 32-bit runs expect the seventeen-int struct passed byval with alignment
// 4, then nine doubles, then the four-int struct coerced to { [4 x i32] }
// with no unnamed parameter in front of it.
typedef struct { int x[17]; } struct_seventeen_ints;
typedef struct { int x[4]; } struct_four_ints;
// CHECK: define arm_aapcs_vfpcc void @test_vfp_stack_gpr_split_5(%struct.struct_seventeen_ints* byval align 4 %a, double %b, double %c, double %d, double %e, double %f, double %g, double %h, double %i, double %j, { [4 x i32] } %k.coerce)
void test_vfp_stack_gpr_split_5(struct_seventeen_ints a, double b, double c, double d, double e, double f, double g, double h, double i, double j, struct_four_ints k) {}
