1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2; RUN: opt < %s -basic-aa -slp-vectorizer -S -mcpu=corei7-avx | FileCheck %s
3
4target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
5target triple = "x86_64-unknown-linux-gnu"
6
7define void @test1(x86_mmx %a, x86_mmx %b, i64* %ptr) {
8; Ensure we can handle x86_mmx values which are primitive and can be bitcast
9; with integer types but can't be put into a vector.
10;
11; CHECK-LABEL: @test1(
12; CHECK-NEXT:  entry:
13; CHECK-NEXT:    [[A_CAST:%.*]] = bitcast x86_mmx [[A:%.*]] to i64
14; CHECK-NEXT:    [[B_CAST:%.*]] = bitcast x86_mmx [[B:%.*]] to i64
15; CHECK-NEXT:    [[A_AND:%.*]] = and i64 [[A_CAST]], 42
16; CHECK-NEXT:    [[B_AND:%.*]] = and i64 [[B_CAST]], 42
17; CHECK-NEXT:    [[GEP:%.*]] = getelementptr i64, i64* [[PTR:%.*]], i32 1
18; CHECK-NEXT:    store i64 [[A_AND]], i64* [[PTR]]
19; CHECK-NEXT:    store i64 [[B_AND]], i64* [[GEP]]
20; CHECK-NEXT:    ret void
21;
22entry:
23  %a.cast = bitcast x86_mmx %a to i64
24  %b.cast = bitcast x86_mmx %b to i64
25  %a.and = and i64 %a.cast, 42
26  %b.and = and i64 %b.cast, 42
27  %gep = getelementptr i64, i64* %ptr, i32 1
28  store i64 %a.and, i64* %ptr
29  store i64 %b.and, i64* %gep
30  ret void
31}
32
33define void @test2(x86_mmx %a, x86_mmx %b) {
34; Same as @test1 but using phi-input vectorization instead of store
35; vectorization.
36;
37; CHECK-LABEL: @test2(
38; CHECK-NEXT:  entry:
39; CHECK-NEXT:    br i1 undef, label [[IF_THEN:%.*]], label [[EXIT:%.*]]
40; CHECK:       if.then:
41; CHECK-NEXT:    [[A_CAST:%.*]] = bitcast x86_mmx [[A:%.*]] to i64
42; CHECK-NEXT:    [[B_CAST:%.*]] = bitcast x86_mmx [[B:%.*]] to i64
43; CHECK-NEXT:    [[A_AND:%.*]] = and i64 [[A_CAST]], 42
44; CHECK-NEXT:    [[B_AND:%.*]] = and i64 [[B_CAST]], 42
45; CHECK-NEXT:    br label [[EXIT]]
46; CHECK:       exit:
47; CHECK-NEXT:    [[A_PHI:%.*]] = phi i64 [ 0, [[ENTRY:%.*]] ], [ [[A_AND]], [[IF_THEN]] ]
48; CHECK-NEXT:    [[B_PHI:%.*]] = phi i64 [ 0, [[ENTRY]] ], [ [[B_AND]], [[IF_THEN]] ]
49; CHECK-NEXT:    tail call void @f(i64 [[A_PHI]], i64 [[B_PHI]])
50; CHECK-NEXT:    ret void
51;
52entry:
53  br i1 undef, label %if.then, label %exit
54
55if.then:
56  %a.cast = bitcast x86_mmx %a to i64
57  %b.cast = bitcast x86_mmx %b to i64
58  %a.and = and i64 %a.cast, 42
59  %b.and = and i64 %b.cast, 42
60  br label %exit
61
62exit:
63  %a.phi = phi i64 [ 0, %entry ], [ %a.and, %if.then ]
64  %b.phi = phi i64 [ 0, %entry ], [ %b.and, %if.then ]
65  tail call void @f(i64 %a.phi, i64 %b.phi)
66  ret void
67}
68
69define i8 @test3(i8 *%addr) {
70; Check that we do not vectorize types that are padded to a bigger ones.
71;
72; CHECK-LABEL: @test3(
73; CHECK-NEXT:  entry:
74; CHECK-NEXT:    [[A:%.*]] = bitcast i8* [[ADDR:%.*]] to i2*
75; CHECK-NEXT:    [[A0:%.*]] = getelementptr inbounds i2, i2* [[A]], i64 0
76; CHECK-NEXT:    [[A1:%.*]] = getelementptr inbounds i2, i2* [[A]], i64 1
77; CHECK-NEXT:    [[A2:%.*]] = getelementptr inbounds i2, i2* [[A]], i64 2
78; CHECK-NEXT:    [[A3:%.*]] = getelementptr inbounds i2, i2* [[A]], i64 3
79; CHECK-NEXT:    [[L0:%.*]] = load i2, i2* [[A0]], align 1
80; CHECK-NEXT:    [[L1:%.*]] = load i2, i2* [[A1]], align 1
81; CHECK-NEXT:    [[L2:%.*]] = load i2, i2* [[A2]], align 1
82; CHECK-NEXT:    [[L3:%.*]] = load i2, i2* [[A3]], align 1
83; CHECK-NEXT:    br label [[BB1:%.*]]
84; CHECK:       bb1:
85; CHECK-NEXT:    [[P0:%.*]] = phi i2 [ [[L0]], [[ENTRY:%.*]] ]
86; CHECK-NEXT:    [[P1:%.*]] = phi i2 [ [[L1]], [[ENTRY]] ]
87; CHECK-NEXT:    [[P2:%.*]] = phi i2 [ [[L2]], [[ENTRY]] ]
88; CHECK-NEXT:    [[P3:%.*]] = phi i2 [ [[L3]], [[ENTRY]] ]
89; CHECK-NEXT:    [[R:%.*]] = zext i2 [[P2]] to i8
90; CHECK-NEXT:    ret i8 [[R]]
91;
92entry:
93  %a = bitcast i8* %addr to i2*
94  %a0 = getelementptr inbounds i2, i2* %a, i64 0
95  %a1 = getelementptr inbounds i2, i2* %a, i64 1
96  %a2 = getelementptr inbounds i2, i2* %a, i64 2
97  %a3 = getelementptr inbounds i2, i2* %a, i64 3
98  %l0 = load i2, i2* %a0, align 1
99  %l1 = load i2, i2* %a1, align 1
100  %l2 = load i2, i2* %a2, align 1
101  %l3 = load i2, i2* %a3, align 1
102  br label %bb1
103bb1:                                              ; preds = %entry
104  %p0 = phi i2 [ %l0, %entry ]
105  %p1 = phi i2 [ %l1, %entry ]
106  %p2 = phi i2 [ %l2, %entry ]
107  %p3 = phi i2 [ %l3, %entry ]
108  %r  = zext i2 %p2 to i8
109  ret i8 %r
110}
111
112declare void @f(i64, i64)
113