1; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2; RUN: llc -relocation-model=pic -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
3; RUN:   -verify-machineinstrs -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s \
4; RUN:   | FileCheck %s
5; RUN: llc -relocation-model=pic -mcpu=pwr9 -mtriple=powerpc64-unknown-unknown \
6; RUN:   -verify-machineinstrs -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s \
7; RUN:   | FileCheck -check-prefix=CHECK-BE %s
8; RUN: llc -relocation-model=pic -mcpu=pwr8 -mtriple=powerpc64le-unknown-unknown \
9; RUN:   -verify-machineinstrs -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s \
10; RUN:   | FileCheck %s -check-prefix=CHECK-P8
11
12; Testing homogeneous aggregates.
13
; Aggregate with nine fp128 members; testStruct_03 receives it byval.
14%struct.With9fp128params = type { fp128, fp128, fp128, fp128, fp128, fp128,
15                                  fp128, fp128, fp128 }
16
; Zero-initialised array of three fp128 values; testArray_02 returns element 2.
17@a1 = local_unnamed_addr global [3 x fp128] zeroinitializer, align 16
18
19; Function Attrs: norecurse nounwind readonly
; Returns element 2 of the fp128 array that %sa points to.
; Both pwr9 runs expect a single lxv from byte offset 32 into v2; the pwr8 run
; expects two doubleword loads (offsets 32 and 40) that end up in r3/r4.
20define fp128 @testArray_01(fp128* nocapture readonly %sa) {
21; CHECK-LABEL: testArray_01:
22; CHECK:       # %bb.0: # %entry
23; CHECK-NEXT:    lxv v2, 32(r3)
24; CHECK-NEXT:    blr
25;
26; CHECK-BE-LABEL: testArray_01:
27; CHECK-BE:       # %bb.0: # %entry
28; CHECK-BE-NEXT:    lxv v2, 32(r3)
29; CHECK-BE-NEXT:    blr
30;
31; CHECK-P8-LABEL: testArray_01:
32; CHECK-P8:       # %bb.0: # %entry
33; CHECK-P8-NEXT:    ld r5, 32(r3)
34; CHECK-P8-NEXT:    ld r4, 40(r3)
35; CHECK-P8-NEXT:    mr r3, r5
36; CHECK-P8-NEXT:    blr
37
38entry:
  ; Address of sa[2] (2 * 16 bytes past %sa).
39  %arrayidx = getelementptr inbounds fp128, fp128* %sa, i64 2
40  %0 = load fp128, fp128* %arrayidx, align 16
41  ret fp128 %0
42}
43
44; Function Attrs: norecurse nounwind readonly
; Returns element 2 of the global array @a1, addressed with a constant GEP.
; Every run expects an address to be loaded through the TOC-relative symbol
; .LC0 first; the value is then read from byte offset 32 (and 40 on pwr8).
45define fp128 @testArray_02() {
46; CHECK-LABEL: testArray_02:
47; CHECK:       # %bb.0: # %entry
48; CHECK-NEXT:    addis r3, r2, .LC0@toc@ha
49; CHECK-NEXT:    ld r3, .LC0@toc@l(r3)
50; CHECK-NEXT:    lxv v2, 32(r3)
51; CHECK-NEXT:    blr
52;
53; CHECK-BE-LABEL: testArray_02:
54; CHECK-BE:       # %bb.0: # %entry
55; CHECK-BE-NEXT:    addis r3, r2, .LC0@toc@ha
56; CHECK-BE-NEXT:    ld r3, .LC0@toc@l(r3)
57; CHECK-BE-NEXT:    lxv v2, 32(r3)
58; CHECK-BE-NEXT:    blr
59;
60; CHECK-P8-LABEL: testArray_02:
61; CHECK-P8:       # %bb.0: # %entry
62; CHECK-P8-NEXT:    addis r3, r2, .LC0@toc@ha
63; CHECK-P8-NEXT:    ld r4, .LC0@toc@l(r3)
64; CHECK-P8-NEXT:    ld r3, 32(r4)
65; CHECK-P8-NEXT:    ld r4, 40(r4)
66; CHECK-P8-NEXT:    blr
67
68entry:
  ; Load @a1[2] directly; the index is folded into the constant expression.
69  %0 = load fp128, fp128* getelementptr inbounds ([3 x fp128], [3 x fp128]* @a1,
70                                                  i64 0, i64 2), align 16
71  ret fp128 %0
72}
73
74; Function Attrs: norecurse nounwind readnone
; Returns its only argument (marked inreg and returned) unchanged.
; All three runs expect the function body to be a bare blr.
75define fp128 @testStruct_01(fp128 inreg returned %a.coerce) {
76; CHECK-LABEL: testStruct_01:
77; CHECK:       # %bb.0: # %entry
78; CHECK-NEXT:    blr
79;
80; CHECK-BE-LABEL: testStruct_01:
81; CHECK-BE:       # %bb.0: # %entry
82; CHECK-BE-NEXT:    blr
83;
84; CHECK-P8-LABEL: testStruct_01:
85; CHECK-P8:       # %bb.0: # %entry
86; CHECK-P8-NEXT:    blr
87
88entry:
89  ret fp128 %a.coerce
90}
91
92; Function Attrs: norecurse nounwind readnone
; Takes an [8 x fp128] by value and returns its last element (index 7).
; The pwr9 runs expect the element to arrive in v9 and be copied to v2; the
; pwr8 run expects it to be loaded from the stack at 144(r1)/152(r1).
93define fp128 @testStruct_02([8 x fp128] %a.coerce) {
94; CHECK-LABEL: testStruct_02:
95; CHECK:       # %bb.0: # %entry
96; CHECK-NEXT:    vmr v2, v9
97; CHECK-NEXT:    blr
98;
99; CHECK-BE-LABEL: testStruct_02:
100; CHECK-BE:       # %bb.0: # %entry
101; CHECK-BE-NEXT:    vmr v2, v9
102; CHECK-BE-NEXT:    blr
103;
104; CHECK-P8-LABEL: testStruct_02:
105; CHECK-P8:       # %bb.0: # %entry
106; CHECK-P8-NEXT:    ld r3, 144(r1)
107; CHECK-P8-NEXT:    ld r4, 152(r1)
108; CHECK-P8-NEXT:    blr
109
110entry:
111  %a.coerce.fca.7.extract = extractvalue [8 x fp128] %a.coerce, 7
112  ret fp128 %a.coerce.fca.7.extract
113}
114
115; Since we can only pass a max of 8 float128 values in VSX registers, ensure we
116; store to stack if passing more.
117; Function Attrs: norecurse nounwind readonly
; Receives a nine-member fp128 struct byval and returns the member at field
; index 6. Every run expects r3-r10 to be stored to the stack and the returned
; value to be read from memory (128(r1) little-endian, 144(r1) big-endian).
118define fp128 @testStruct_03(%struct.With9fp128params* byval(%struct.With9fp128params) nocapture readonly align 16 %a) {
119; CHECK-LABEL: testStruct_03:
120; CHECK:       # %bb.0: # %entry
121; CHECK-NEXT:    lxv v2, 128(r1)
122; CHECK-NEXT:    std r3, 32(r1)
123; CHECK-NEXT:    std r4, 40(r1)
124; CHECK-NEXT:    std r5, 48(r1)
125; CHECK-NEXT:    std r6, 56(r1)
126; CHECK-NEXT:    std r7, 64(r1)
127; CHECK-NEXT:    std r8, 72(r1)
128; CHECK-NEXT:    std r9, 80(r1)
129; CHECK-NEXT:    std r10, 88(r1)
130; CHECK-NEXT:    blr
131;
132; CHECK-BE-LABEL: testStruct_03:
133; CHECK-BE:       # %bb.0: # %entry
134; CHECK-BE-NEXT:    lxv v2, 144(r1)
135; CHECK-BE-NEXT:    std r3, 48(r1)
136; CHECK-BE-NEXT:    std r4, 56(r1)
137; CHECK-BE-NEXT:    std r5, 64(r1)
138; CHECK-BE-NEXT:    std r6, 72(r1)
139; CHECK-BE-NEXT:    std r7, 80(r1)
140; CHECK-BE-NEXT:    std r8, 88(r1)
141; CHECK-BE-NEXT:    std r9, 96(r1)
142; CHECK-BE-NEXT:    std r10, 104(r1)
143; CHECK-BE-NEXT:    blr
144;
145; CHECK-P8-LABEL: testStruct_03:
146; CHECK-P8:       # %bb.0: # %entry
147; CHECK-P8-NEXT:    ld r11, 128(r1)
148; CHECK-P8-NEXT:    ld r12, 136(r1)
149; CHECK-P8-NEXT:    std r3, 32(r1)
150; CHECK-P8-NEXT:    std r4, 40(r1)
151; CHECK-P8-NEXT:    std r5, 48(r1)
152; CHECK-P8-NEXT:    std r6, 56(r1)
153; CHECK-P8-NEXT:    mr r3, r11
154; CHECK-P8-NEXT:    mr r4, r12
155; CHECK-P8-NEXT:    std r7, 64(r1)
156; CHECK-P8-NEXT:    std r8, 72(r1)
157; CHECK-P8-NEXT:    std r9, 80(r1)
158; CHECK-P8-NEXT:    std r10, 88(r1)
159; CHECK-P8-NEXT:    blr
160
161entry:
  ; Field index 6 is the seventh member, 6 * 16 = 96 bytes into the struct.
162  %a7 = getelementptr inbounds %struct.With9fp128params,
163                               %struct.With9fp128params* %a, i64 0, i32 6
164  %0 = load fp128, fp128* %a7, align 16
165  ret fp128 %0
166}
167
168; Function Attrs: norecurse nounwind readnone
; Takes an [8 x fp128] by value and returns element 3.
; The pwr9 runs expect the element in v5; the pwr8 run expects it in r9/r10.
169define fp128 @testStruct_04([8 x fp128] %a.coerce) {
170; CHECK-LABEL: testStruct_04:
171; CHECK:       # %bb.0: # %entry
172; CHECK-NEXT:    vmr v2, v5
173; CHECK-NEXT:    blr
174;
175; CHECK-BE-LABEL: testStruct_04:
176; CHECK-BE:       # %bb.0: # %entry
177; CHECK-BE-NEXT:    vmr v2, v5
178; CHECK-BE-NEXT:    blr
179;
180; CHECK-P8-LABEL: testStruct_04:
181; CHECK-P8:       # %bb.0: # %entry
182; CHECK-P8-NEXT:    mr r4, r10
183; CHECK-P8-NEXT:    mr r3, r9
184; CHECK-P8-NEXT:    blr
185
186entry:
187  %a.coerce.fca.3.extract = extractvalue [8 x fp128] %a.coerce, 3
188  ret fp128 %a.coerce.fca.3.extract
189}
190
191; Function Attrs: norecurse nounwind readnone
; Takes a one-element fp128 array by value and returns that element.
; All three runs expect the function body to be a bare blr.
192define fp128 @testHUnion_01([1 x fp128] %a.coerce) {
193; CHECK-LABEL: testHUnion_01:
194; CHECK:       # %bb.0: # %entry
195; CHECK-NEXT:    blr
196;
197; CHECK-BE-LABEL: testHUnion_01:
198; CHECK-BE:       # %bb.0: # %entry
199; CHECK-BE-NEXT:    blr
200;
201; CHECK-P8-LABEL: testHUnion_01:
202; CHECK-P8:       # %bb.0: # %entry
203; CHECK-P8-NEXT:    blr
204
205entry:
206  %a.coerce.fca.0.extract = extractvalue [1 x fp128] %a.coerce, 0
207  ret fp128 %a.coerce.fca.0.extract
208}
209
210; Function Attrs: norecurse nounwind readnone
; Takes a [3 x fp128] by value and returns element 0.
; All three runs expect the function body to be a bare blr.
211define fp128 @testHUnion_02([3 x fp128] %a.coerce) {
212; CHECK-LABEL: testHUnion_02:
213; CHECK:       # %bb.0: # %entry
214; CHECK-NEXT:    blr
215;
216; CHECK-BE-LABEL: testHUnion_02:
217; CHECK-BE:       # %bb.0: # %entry
218; CHECK-BE-NEXT:    blr
219;
220; CHECK-P8-LABEL: testHUnion_02:
221; CHECK-P8:       # %bb.0: # %entry
222; CHECK-P8-NEXT:    blr
223
224entry:
225  %a.coerce.fca.0.extract = extractvalue [3 x fp128] %a.coerce, 0
226  ret fp128 %a.coerce.fca.0.extract
227}
228
229; Function Attrs: norecurse nounwind readnone
; Takes a [3 x fp128] by value and returns element 1.
; The pwr9 runs expect the element in v3; the pwr8 run expects it in r5/r6.
230define fp128 @testHUnion_03([3 x fp128] %a.coerce) {
231; CHECK-LABEL: testHUnion_03:
232; CHECK:       # %bb.0: # %entry
233; CHECK-NEXT:    vmr v2, v3
234; CHECK-NEXT:    blr
235;
236; CHECK-BE-LABEL: testHUnion_03:
237; CHECK-BE:       # %bb.0: # %entry
238; CHECK-BE-NEXT:    vmr v2, v3
239; CHECK-BE-NEXT:    blr
240;
241; CHECK-P8-LABEL: testHUnion_03:
242; CHECK-P8:       # %bb.0: # %entry
243; CHECK-P8-NEXT:    mr r4, r6
244; CHECK-P8-NEXT:    mr r3, r5
245; CHECK-P8-NEXT:    blr
246
247entry:
248  %a.coerce.fca.1.extract = extractvalue [3 x fp128] %a.coerce, 1
249  ret fp128 %a.coerce.fca.1.extract
250}
251
252; Function Attrs: norecurse nounwind readnone
; Takes a [3 x fp128] by value and returns element 2.
; The pwr9 runs expect the element in v4; the pwr8 run expects it in r7/r8.
253define fp128 @testHUnion_04([3 x fp128] %a.coerce) {
254; CHECK-LABEL: testHUnion_04:
255; CHECK:       # %bb.0: # %entry
256; CHECK-NEXT:    vmr v2, v4
257; CHECK-NEXT:    blr
258;
259; CHECK-BE-LABEL: testHUnion_04:
260; CHECK-BE:       # %bb.0: # %entry
261; CHECK-BE-NEXT:    vmr v2, v4
262; CHECK-BE-NEXT:    blr
263;
264; CHECK-P8-LABEL: testHUnion_04:
265; CHECK-P8:       # %bb.0: # %entry
266; CHECK-P8-NEXT:    mr r4, r8
267; CHECK-P8-NEXT:    mr r3, r7
268; CHECK-P8-NEXT:    blr
269
270entry:
271  %a.coerce.fca.2.extract = extractvalue [3 x fp128] %a.coerce, 2
272  ret fp128 %a.coerce.fca.2.extract
273}
274
275; Testing mixed member aggregates.
276
; MixedC nests an SA between scalar members; SA itself holds a double, an
; fp128 and a <4 x float>. testNestedAggregate reads the fp128 inside the
; nested SA.
277%struct.MixedC = type { i32, %struct.SA, float, [12 x i8] }
278%struct.SA = type { double, fp128, <4 x float> }
279
280; Function Attrs: norecurse nounwind readnone
; Takes a [3 x i128] by value and returns element 2 reinterpreted as fp128.
; The pwr9 runs expect the r7/r8 pair to be combined into v2 with mtvsrdd; the
; pwr8 run expects the pair to be copied to r3/r4.
281define fp128 @testMixedAggregate([3 x i128] %a.coerce) {
282; CHECK-LABEL: testMixedAggregate:
283; CHECK:       # %bb.0: # %entry
284; CHECK-NEXT:    mtvsrdd v2, r8, r7
285; CHECK-NEXT:    blr
286;
287; CHECK-BE-LABEL: testMixedAggregate:
288; CHECK-BE:       # %bb.0: # %entry
289; CHECK-BE-NEXT:    mtvsrdd v2, r8, r7
290; CHECK-BE-NEXT:    blr
291;
292; CHECK-P8-LABEL: testMixedAggregate:
293; CHECK-P8:       # %bb.0: # %entry
294; CHECK-P8-NEXT:    mr r4, r8
295; CHECK-P8-NEXT:    mr r3, r7
296; CHECK-P8-NEXT:    blr
297
298entry:
299  %a.coerce.fca.2.extract = extractvalue [3 x i128] %a.coerce, 2
  ; Same 128 bits, viewed as fp128 (no numeric conversion).
300  %0 = bitcast i128 %a.coerce.fca.2.extract to fp128
301  ret fp128 %0
302}
303
304; Function Attrs: norecurse nounwind readnone
; Takes a [4 x i128] by value and returns element 1 reinterpreted as fp128.
; The pwr9 runs expect the r5/r6 pair to be combined into v2 with mtvsrdd; the
; pwr8 run expects the pair to be copied to r3/r4.
305define fp128 @testMixedAggregate_02([4 x i128] %a.coerce) {
306; CHECK-LABEL: testMixedAggregate_02:
307; CHECK:       # %bb.0: # %entry
308; CHECK-NEXT:    mtvsrdd v2, r6, r5
309; CHECK-NEXT:    blr
310;
311; CHECK-BE-LABEL: testMixedAggregate_02:
312; CHECK-BE:       # %bb.0: # %entry
313; CHECK-BE-NEXT:    mtvsrdd v2, r6, r5
314; CHECK-BE-NEXT:    blr
315;
316; CHECK-P8-LABEL: testMixedAggregate_02:
317; CHECK-P8:       # %bb.0: # %entry
318; CHECK-P8-NEXT:    mr r4, r6
319; CHECK-P8-NEXT:    mr r3, r5
320; CHECK-P8-NEXT:    blr
321
322entry:
323  %a.coerce.fca.1.extract = extractvalue [4 x i128] %a.coerce, 1
  ; Same 128 bits, viewed as fp128 (no numeric conversion).
324  %0 = bitcast i128 %a.coerce.fca.1.extract to fp128
325  ret fp128 %0
326}
327
328; Function Attrs: norecurse nounwind readnone
; Takes a [4 x i128] by value and returns
;   (element 1 viewed as fp128 + sitofp(low 32 bits of element 0))
;     + sitofp(high 64 bits of element 3).
; The pwr9 runs expect the conversions and additions to be done inline with
; xscvsdqp/xsaddqp; the pwr8 run expects calls to __floatsikf, __floatdikf and
; __addkf3 instead.
; NOTE(review): the big-endian run takes the low word of element 0 from r4 and
; the high doubleword of element 3 from r9 (the opposite register of each pair
; compared with the little-endian run), yet expects the same
; "mtvsrdd v3, r6, r5" operand order for element 1. Confirm this is the
; intended big-endian codegen.
329define fp128 @testMixedAggregate_03([4 x i128] %sa.coerce) {
330; CHECK-LABEL: testMixedAggregate_03:
331; CHECK:       # %bb.0: # %entry
332; CHECK-NEXT:    mtvsrwa v2, r3
333; CHECK-NEXT:    mtvsrdd v3, r6, r5
334; CHECK-NEXT:    xscvsdqp v2, v2
335; CHECK-NEXT:    xsaddqp v2, v3, v2
336; CHECK-NEXT:    mtvsrd v3, r10
337; CHECK-NEXT:    xscvsdqp v3, v3
338; CHECK-NEXT:    xsaddqp v2, v2, v3
339; CHECK-NEXT:    blr
340;
341; CHECK-BE-LABEL: testMixedAggregate_03:
342; CHECK-BE:       # %bb.0: # %entry
343; CHECK-BE-NEXT:    mtvsrwa v2, r4
344; CHECK-BE-NEXT:    mtvsrdd v3, r6, r5
345; CHECK-BE-NEXT:    xscvsdqp v2, v2
346; CHECK-BE-NEXT:    xsaddqp v2, v3, v2
347; CHECK-BE-NEXT:    mtvsrd v3, r9
348; CHECK-BE-NEXT:    xscvsdqp v3, v3
349; CHECK-BE-NEXT:    xsaddqp v2, v2, v3
350; CHECK-BE-NEXT:    blr
351;
352; CHECK-P8-LABEL: testMixedAggregate_03:
353; CHECK-P8:       # %bb.0: # %entry
354; CHECK-P8-NEXT:    mflr r0
355; CHECK-P8-NEXT:    .cfi_def_cfa_offset 64
356; CHECK-P8-NEXT:    .cfi_offset lr, 16
357; CHECK-P8-NEXT:    .cfi_offset r28, -32
358; CHECK-P8-NEXT:    .cfi_offset r29, -24
359; CHECK-P8-NEXT:    .cfi_offset r30, -16
360; CHECK-P8-NEXT:    std r28, -32(r1) # 8-byte Folded Spill
361; CHECK-P8-NEXT:    std r29, -24(r1) # 8-byte Folded Spill
362; CHECK-P8-NEXT:    std r30, -16(r1) # 8-byte Folded Spill
363; CHECK-P8-NEXT:    std r0, 16(r1)
364; CHECK-P8-NEXT:    stdu r1, -64(r1)
365; CHECK-P8-NEXT:    extsw r3, r3
366; CHECK-P8-NEXT:    mr r30, r10
367; CHECK-P8-NEXT:    mr r29, r6
368; CHECK-P8-NEXT:    mr r28, r5
369; CHECK-P8-NEXT:    bl __floatsikf
370; CHECK-P8-NEXT:    nop
371; CHECK-P8-NEXT:    mr r5, r3
372; CHECK-P8-NEXT:    mr r6, r4
373; CHECK-P8-NEXT:    mr r3, r28
374; CHECK-P8-NEXT:    mr r4, r29
375; CHECK-P8-NEXT:    bl __addkf3
376; CHECK-P8-NEXT:    nop
377; CHECK-P8-NEXT:    mr r29, r3
378; CHECK-P8-NEXT:    mr r3, r30
379; CHECK-P8-NEXT:    mr r28, r4
380; CHECK-P8-NEXT:    bl __floatdikf
381; CHECK-P8-NEXT:    nop
382; CHECK-P8-NEXT:    mr r5, r3
383; CHECK-P8-NEXT:    mr r6, r4
384; CHECK-P8-NEXT:    mr r3, r29
385; CHECK-P8-NEXT:    mr r4, r28
386; CHECK-P8-NEXT:    bl __addkf3
387; CHECK-P8-NEXT:    nop
388; CHECK-P8-NEXT:    addi r1, r1, 64
389; CHECK-P8-NEXT:    ld r0, 16(r1)
390; CHECK-P8-NEXT:    ld r30, -16(r1) # 8-byte Folded Reload
391; CHECK-P8-NEXT:    ld r29, -24(r1) # 8-byte Folded Reload
392; CHECK-P8-NEXT:    ld r28, -32(r1) # 8-byte Folded Reload
393; CHECK-P8-NEXT:    mtlr r0
394; CHECK-P8-NEXT:    blr
395entry:
  ; Low 32 bits of element 0.
396  %sa.coerce.fca.0.extract = extractvalue [4 x i128] %sa.coerce, 0
397  %sa.sroa.0.0.extract.trunc = trunc i128 %sa.coerce.fca.0.extract to i32
398  %sa.coerce.fca.1.extract = extractvalue [4 x i128] %sa.coerce, 1
  ; High 64 bits of element 3 (shift right by 64, then truncate).
399  %sa.coerce.fca.3.extract = extractvalue [4 x i128] %sa.coerce, 3
400  %sa.sroa.6.48.extract.shift = lshr i128 %sa.coerce.fca.3.extract, 64
401  %sa.sroa.6.48.extract.trunc = trunc i128 %sa.sroa.6.48.extract.shift to i64
  ; Signed i32 -> fp128, added to element 1 viewed as fp128.
402  %conv = sitofp i32 %sa.sroa.0.0.extract.trunc to fp128
403  %0 = bitcast i128 %sa.coerce.fca.1.extract to fp128
404  %add = fadd fp128 %0, %conv
  ; Signed i64 -> fp128, added to the running sum.
405  %conv2 = sitofp i64 %sa.sroa.6.48.extract.trunc to fp128
406  %add3 = fadd fp128 %add, %conv2
407  ret fp128 %add3
408}
409
410
411; Function Attrs: norecurse nounwind readonly
; Receives a %struct.MixedC byval and returns the fp128 at field path [1][1],
; i.e. member 1 of the nested %struct.SA.
; Every run expects r3-r10 to be stored to the stack. The pwr9 runs then reload
; the value with lxv from the slot written from r7/r8; the pwr8 run copies
; r7/r8 to r3/r4.
412define fp128 @testNestedAggregate(%struct.MixedC* byval(%struct.MixedC) nocapture readonly align 16 %a) {
413; CHECK-LABEL: testNestedAggregate:
414; CHECK:       # %bb.0: # %entry
415; CHECK-NEXT:    std r8, 72(r1)
416; CHECK-NEXT:    std r7, 64(r1)
417; CHECK-NEXT:    lxv v2, 64(r1)
418; CHECK-NEXT:    std r3, 32(r1)
419; CHECK-NEXT:    std r4, 40(r1)
420; CHECK-NEXT:    std r5, 48(r1)
421; CHECK-NEXT:    std r6, 56(r1)
422; CHECK-NEXT:    std r9, 80(r1)
423; CHECK-NEXT:    std r10, 88(r1)
424; CHECK-NEXT:    blr
425;
426; CHECK-BE-LABEL: testNestedAggregate:
427; CHECK-BE:       # %bb.0: # %entry
428; CHECK-BE-NEXT:    std r8, 88(r1)
429; CHECK-BE-NEXT:    std r7, 80(r1)
430; CHECK-BE-NEXT:    lxv v2, 80(r1)
431; CHECK-BE-NEXT:    std r3, 48(r1)
432; CHECK-BE-NEXT:    std r4, 56(r1)
433; CHECK-BE-NEXT:    std r5, 64(r1)
434; CHECK-BE-NEXT:    std r6, 72(r1)
435; CHECK-BE-NEXT:    std r9, 96(r1)
436; CHECK-BE-NEXT:    std r10, 104(r1)
437; CHECK-BE-NEXT:    blr
438;
439; CHECK-P8-LABEL: testNestedAggregate:
440; CHECK-P8:       # %bb.0: # %entry
441; CHECK-P8-NEXT:    std r3, 32(r1)
442; CHECK-P8-NEXT:    std r4, 40(r1)
443; CHECK-P8-NEXT:    mr r3, r7
444; CHECK-P8-NEXT:    mr r4, r8
445; CHECK-P8-NEXT:    std r8, 72(r1)
446; CHECK-P8-NEXT:    std r7, 64(r1)
447; CHECK-P8-NEXT:    std r5, 48(r1)
448; CHECK-P8-NEXT:    std r6, 56(r1)
449; CHECK-P8-NEXT:    std r9, 80(r1)
450; CHECK-P8-NEXT:    std r10, 88(r1)
451; CHECK-P8-NEXT:    blr
452
453entry:
  ; MixedC member 1 is the nested SA; SA member 1 is its fp128.
454  %c = getelementptr inbounds %struct.MixedC, %struct.MixedC* %a, i64 0, i32 1, i32 1
455  %0 = load fp128, fp128* %c, align 16
456  ret fp128 %0
457}
458
459; Function Attrs: norecurse nounwind readnone
; Takes a one-element i128 array by value and returns that element
; reinterpreted as fp128.
; The pwr9 runs expect r3/r4 to be combined into v2 with mtvsrdd; the pwr8 run
; expects a bare blr.
460define fp128 @testUnion_01([1 x i128] %a.coerce) {
461; CHECK-LABEL: testUnion_01:
462; CHECK:       # %bb.0: # %entry
463; CHECK-NEXT:    mtvsrdd v2, r4, r3
464; CHECK-NEXT:    blr
465;
466; CHECK-BE-LABEL: testUnion_01:
467; CHECK-BE:       # %bb.0: # %entry
468; CHECK-BE-NEXT:    mtvsrdd v2, r4, r3
469; CHECK-BE-NEXT:    blr
470;
471; CHECK-P8-LABEL: testUnion_01:
472; CHECK-P8:       # %bb.0: # %entry
473; CHECK-P8-NEXT:    blr
474
475entry:
476  %a.coerce.fca.0.extract = extractvalue [1 x i128] %a.coerce, 0
  ; Same 128 bits, viewed as fp128 (no numeric conversion).
477  %0 = bitcast i128 %a.coerce.fca.0.extract to fp128
478  ret fp128 %0
479}
480
481; Function Attrs: norecurse nounwind readnone
; Takes a one-element i128 array by value and returns that element
; reinterpreted as fp128. The IR body and expectations are the same as for
; testUnion_01; only the function name differs.
482define fp128 @testUnion_02([1 x i128] %a.coerce) {
483; CHECK-LABEL: testUnion_02:
484; CHECK:       # %bb.0: # %entry
485; CHECK-NEXT:    mtvsrdd v2, r4, r3
486; CHECK-NEXT:    blr
487;
488; CHECK-BE-LABEL: testUnion_02:
489; CHECK-BE:       # %bb.0: # %entry
490; CHECK-BE-NEXT:    mtvsrdd v2, r4, r3
491; CHECK-BE-NEXT:    blr
492;
493; CHECK-P8-LABEL: testUnion_02:
494; CHECK-P8:       # %bb.0: # %entry
495; CHECK-P8-NEXT:    blr
496
497entry:
498  %a.coerce.fca.0.extract = extractvalue [1 x i128] %a.coerce, 0
  ; Same 128 bits, viewed as fp128 (no numeric conversion).
499  %0 = bitcast i128 %a.coerce.fca.0.extract to fp128
500  ret fp128 %0
501}
502
503; Function Attrs: norecurse nounwind readnone
; Takes a [4 x i128] by value and returns element 2 reinterpreted as fp128.
; The pwr9 runs expect the r7/r8 pair to be combined into v2 with mtvsrdd; the
; pwr8 run expects the pair to be copied to r3/r4.
504define fp128 @testUnion_03([4 x i128] %a.coerce) {
505; CHECK-LABEL: testUnion_03:
506; CHECK:       # %bb.0: # %entry
507; CHECK-NEXT:    mtvsrdd v2, r8, r7
508; CHECK-NEXT:    blr
509;
510; CHECK-BE-LABEL: testUnion_03:
511; CHECK-BE:       # %bb.0: # %entry
512; CHECK-BE-NEXT:    mtvsrdd v2, r8, r7
513; CHECK-BE-NEXT:    blr
514;
515; CHECK-P8-LABEL: testUnion_03:
516; CHECK-P8:       # %bb.0: # %entry
517; CHECK-P8-NEXT:    mr r4, r8
518; CHECK-P8-NEXT:    mr r3, r7
519; CHECK-P8-NEXT:    blr
520
521entry:
522  %a.coerce.fca.2.extract = extractvalue [4 x i128] %a.coerce, 2
  ; Same 128 bits, viewed as fp128 (no numeric conversion).
523  %0 = bitcast i128 %a.coerce.fca.2.extract to fp128
524  ret fp128 %0
525}
526
527; Function Attrs: nounwind
; Variadic function. Returns fp128 zero when %count < 1. Otherwise it starts
; the va_list, loads two fp128 values at byte offsets 0 and 16 from the current
; va_list pointer, stores the pointer advanced by 32 bytes back into %ap, and
; returns (first + 0) + second.
; Every run expects r4-r10 to be stored to the stack. The pwr9 runs expect the
; additions to be done with xsaddqp; the pwr8 run expects two __addkf3 calls.
528define fp128 @sum_float128(i32 signext %count, ...) {
529; CHECK-LABEL: sum_float128:
530; CHECK:       # %bb.0: # %entry
531; CHECK-NEXT:    std r4, 40(r1)
532; CHECK-NEXT:    addis r4, r2, .LCPI17_0@toc@ha
533; CHECK-NEXT:    cmpwi r3, 1
534; CHECK-NEXT:    std r5, 48(r1)
535; CHECK-NEXT:    addi r4, r4, .LCPI17_0@toc@l
536; CHECK-NEXT:    std r6, 56(r1)
537; CHECK-NEXT:    std r7, 64(r1)
538; CHECK-NEXT:    std r8, 72(r1)
539; CHECK-NEXT:    lxvx v2, 0, r4
540; CHECK-NEXT:    std r9, 80(r1)
541; CHECK-NEXT:    std r10, 88(r1)
542; CHECK-NEXT:    bltlr cr0
543; CHECK-NEXT:  # %bb.1: # %if.end
544; CHECK-NEXT:    addi r3, r1, 40
545; CHECK-NEXT:    addi r4, r1, 72
546; CHECK-NEXT:    lxvx v3, 0, r3
547; CHECK-NEXT:    std r4, -8(r1)
548; CHECK-NEXT:    xsaddqp v2, v3, v2
549; CHECK-NEXT:    lxv v3, 16(r3)
550; CHECK-NEXT:    xsaddqp v2, v2, v3
551; CHECK-NEXT:    blr
552;
553; CHECK-BE-LABEL: sum_float128:
554; CHECK-BE:       # %bb.0: # %entry
555; CHECK-BE-NEXT:    std r4, 56(r1)
556; CHECK-BE-NEXT:    addis r4, r2, .LCPI17_0@toc@ha
557; CHECK-BE-NEXT:    cmpwi r3, 1
558; CHECK-BE-NEXT:    std r5, 64(r1)
559; CHECK-BE-NEXT:    addi r4, r4, .LCPI17_0@toc@l
560; CHECK-BE-NEXT:    std r6, 72(r1)
561; CHECK-BE-NEXT:    std r7, 80(r1)
562; CHECK-BE-NEXT:    std r8, 88(r1)
563; CHECK-BE-NEXT:    lxvx v2, 0, r4
564; CHECK-BE-NEXT:    std r9, 96(r1)
565; CHECK-BE-NEXT:    std r10, 104(r1)
566; CHECK-BE-NEXT:    bltlr cr0
567; CHECK-BE-NEXT:  # %bb.1: # %if.end
568; CHECK-BE-NEXT:    addi r3, r1, 56
569; CHECK-BE-NEXT:    addi r4, r1, 88
570; CHECK-BE-NEXT:    lxvx v3, 0, r3
571; CHECK-BE-NEXT:    std r4, -8(r1)
572; CHECK-BE-NEXT:    xsaddqp v2, v3, v2
573; CHECK-BE-NEXT:    lxv v3, 16(r3)
574; CHECK-BE-NEXT:    xsaddqp v2, v2, v3
575; CHECK-BE-NEXT:    blr
576;
577; CHECK-P8-LABEL: sum_float128:
578; CHECK-P8:       # %bb.0: # %entry
579; CHECK-P8-NEXT:    mflr r0
580; CHECK-P8-NEXT:    std r0, 16(r1)
581; CHECK-P8-NEXT:    stdu r1, -48(r1)
582; CHECK-P8-NEXT:    .cfi_def_cfa_offset 48
583; CHECK-P8-NEXT:    .cfi_offset lr, 16
584; CHECK-P8-NEXT:    cmpwi r3, 1
585; CHECK-P8-NEXT:    std r4, 88(r1)
586; CHECK-P8-NEXT:    std r5, 96(r1)
587; CHECK-P8-NEXT:    std r6, 104(r1)
588; CHECK-P8-NEXT:    std r7, 112(r1)
589; CHECK-P8-NEXT:    std r8, 120(r1)
590; CHECK-P8-NEXT:    std r9, 128(r1)
591; CHECK-P8-NEXT:    std r10, 136(r1)
592; CHECK-P8-NEXT:    blt cr0, .LBB17_2
593; CHECK-P8-NEXT:  # %bb.1: # %if.end
594; CHECK-P8-NEXT:    ld r3, 88(r1)
595; CHECK-P8-NEXT:    ld r4, 96(r1)
596; CHECK-P8-NEXT:    li r5, 0
597; CHECK-P8-NEXT:    li r6, 0
598; CHECK-P8-NEXT:    bl __addkf3
599; CHECK-P8-NEXT:    nop
600; CHECK-P8-NEXT:    ld r5, 104(r1)
601; CHECK-P8-NEXT:    ld r6, 112(r1)
602; CHECK-P8-NEXT:    addi r7, r1, 120
603; CHECK-P8-NEXT:    std r7, 40(r1)
604; CHECK-P8-NEXT:    bl __addkf3
605; CHECK-P8-NEXT:    nop
606; CHECK-P8-NEXT:    b .LBB17_3
607; CHECK-P8-NEXT:  .LBB17_2:
608; CHECK-P8-NEXT:    li r3, 0
609; CHECK-P8-NEXT:    li r4, 0
610; CHECK-P8-NEXT:  .LBB17_3: # %cleanup
611; CHECK-P8-NEXT:    addi r1, r1, 48
612; CHECK-P8-NEXT:    ld r0, 16(r1)
613; CHECK-P8-NEXT:    mtlr r0
614; CHECK-P8-NEXT:    blr
615entry:
  ; %ap is the stack slot that holds the va_list pointer.
616  %ap = alloca i8*, align 8
617  %0 = bitcast i8** %ap to i8*
618  call void @llvm.lifetime.start.p0i8(i64 8, i8* nonnull %0) #2
  ; Skip the va_list work entirely when count < 1.
619  %cmp = icmp slt i32 %count, 1
620  br i1 %cmp, label %cleanup, label %if.end
621
622if.end:                                           ; preds = %entry
623  call void @llvm.va_start(i8* nonnull %0)
624  %argp.cur = load i8*, i8** %ap, align 8
  ; First variadic fp128 is at offset 0, the second at offset 16.
625  %argp.next = getelementptr inbounds i8, i8* %argp.cur, i64 16
626  %1 = bitcast i8* %argp.cur to fp128*
627  %2 = load fp128, fp128* %1, align 8
  ; The constant operand is the all-zero fp128 bit pattern.
628  %add = fadd fp128 %2, 0xL00000000000000000000000000000000
  ; Write back the va_list pointer advanced past both values (32 bytes).
629  %argp.next3 = getelementptr inbounds i8, i8* %argp.cur, i64 32
630  store i8* %argp.next3, i8** %ap, align 8
631  %3 = bitcast i8* %argp.next to fp128*
632  %4 = load fp128, fp128* %3, align 8
633  %add4 = fadd fp128 %add, %4
634  call void @llvm.va_end(i8* nonnull %0)
635  br label %cleanup
636
637cleanup:                                          ; preds = %entry, %if.end
  ; Sum from %if.end, or fp128 zero when the early exit from %entry was taken.
638  %retval.0 = phi fp128 [ %add4, %if.end ], [ 0xL00000000000000000000000000000000, %entry ]
639  call void @llvm.lifetime.end.p0i8(i64 8, i8* nonnull %0) #2
640  ret fp128 %retval.0
641}
642
; Intrinsics called by sum_float128.
; NOTE(review): attribute groups #1 and #2 are referenced here, but no
; "attributes #N = { ... }" definition is visible in this part of the file;
; confirm they are defined elsewhere or intentionally omitted.
643declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) #1
644declare void @llvm.va_start(i8*) #2
645declare void @llvm.va_end(i8*) #2
646declare void @llvm.lifetime.end.p0i8(i64, i8* nocapture) #1
647