1 //===- HexagonSplitDouble.cpp ---------------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #define DEBUG_TYPE "hsdr"
10 
11 #include "HexagonInstrInfo.h"
12 #include "HexagonRegisterInfo.h"
13 #include "HexagonSubtarget.h"
14 #include "llvm/ADT/BitVector.h"
15 #include "llvm/ADT/STLExtras.h"
16 #include "llvm/ADT/SmallVector.h"
17 #include "llvm/ADT/StringRef.h"
18 #include "llvm/CodeGen/MachineBasicBlock.h"
19 #include "llvm/CodeGen/MachineFunction.h"
20 #include "llvm/CodeGen/MachineFunctionPass.h"
21 #include "llvm/CodeGen/MachineInstr.h"
22 #include "llvm/CodeGen/MachineInstrBuilder.h"
23 #include "llvm/CodeGen/MachineLoopInfo.h"
24 #include "llvm/CodeGen/MachineMemOperand.h"
25 #include "llvm/CodeGen/MachineOperand.h"
26 #include "llvm/CodeGen/MachineRegisterInfo.h"
27 #include "llvm/CodeGen/TargetRegisterInfo.h"
28 #include "llvm/Config/llvm-config.h"
29 #include "llvm/IR/DebugLoc.h"
30 #include "llvm/Pass.h"
31 #include "llvm/Support/CommandLine.h"
32 #include "llvm/Support/Compiler.h"
33 #include "llvm/Support/Debug.h"
34 #include "llvm/Support/ErrorHandling.h"
35 #include "llvm/Support/raw_ostream.h"
36 #include <algorithm>
37 #include <cassert>
38 #include <cstdint>
39 #include <limits>
40 #include <map>
41 #include <set>
42 #include <utility>
43 #include <vector>
44 
45 using namespace llvm;
46 
47 namespace llvm {
48 
49   FunctionPass *createHexagonSplitDoubleRegs();
50   void initializeHexagonSplitDoubleRegsPass(PassRegistry&);
51 
52 } // end namespace llvm
53 
54 static cl::opt<int> MaxHSDR("max-hsdr", cl::Hidden, cl::init(-1),
55     cl::desc("Maximum number of split partitions"));
56 static cl::opt<bool> MemRefsFixed("hsdr-no-mem", cl::Hidden, cl::init(true),
57     cl::desc("Do not split loads or stores"));
58   static cl::opt<bool> SplitAll("hsdr-split-all", cl::Hidden, cl::init(false),
59       cl::desc("Split all partitions"));
60 
61 namespace {
62 
63   class HexagonSplitDoubleRegs : public MachineFunctionPass {
64   public:
65     static char ID;
66 
67     HexagonSplitDoubleRegs() : MachineFunctionPass(ID) {}
68 
69     StringRef getPassName() const override {
70       return "Hexagon Split Double Registers";
71     }
72 
73     void getAnalysisUsage(AnalysisUsage &AU) const override {
74       AU.addRequired<MachineLoopInfo>();
75       AU.addPreserved<MachineLoopInfo>();
76       MachineFunctionPass::getAnalysisUsage(AU);
77     }
78 
79     bool runOnMachineFunction(MachineFunction &MF) override;
80 
81   private:
82     static const TargetRegisterClass *const DoubleRC;
83 
84     const HexagonRegisterInfo *TRI = nullptr;
85     const HexagonInstrInfo *TII = nullptr;
86     const MachineLoopInfo *MLI;
87     MachineRegisterInfo *MRI;
88 
89     using USet = std::set<unsigned>;
90     using UUSetMap = std::map<unsigned, USet>;
91     using UUPair = std::pair<unsigned, unsigned>;
92     using UUPairMap = std::map<unsigned, UUPair>;
93     using LoopRegMap = std::map<const MachineLoop *, USet>;
94 
95     bool isInduction(unsigned Reg, LoopRegMap &IRM) const;
96     bool isVolatileInstr(const MachineInstr *MI) const;
97     bool isFixedInstr(const MachineInstr *MI) const;
98     void partitionRegisters(UUSetMap &P2Rs);
99     int32_t profit(const MachineInstr *MI) const;
100     int32_t profit(unsigned Reg) const;
101     bool isProfitable(const USet &Part, LoopRegMap &IRM) const;
102 
103     void collectIndRegsForLoop(const MachineLoop *L, USet &Rs);
104     void collectIndRegs(LoopRegMap &IRM);
105 
106     void createHalfInstr(unsigned Opc, MachineInstr *MI,
107         const UUPairMap &PairMap, unsigned SubR);
108     void splitMemRef(MachineInstr *MI, const UUPairMap &PairMap);
109     void splitImmediate(MachineInstr *MI, const UUPairMap &PairMap);
110     void splitCombine(MachineInstr *MI, const UUPairMap &PairMap);
111     void splitExt(MachineInstr *MI, const UUPairMap &PairMap);
112     void splitShift(MachineInstr *MI, const UUPairMap &PairMap);
113     void splitAslOr(MachineInstr *MI, const UUPairMap &PairMap);
114     bool splitInstr(MachineInstr *MI, const UUPairMap &PairMap);
115     void replaceSubregUses(MachineInstr *MI, const UUPairMap &PairMap);
116     void collapseRegPairs(MachineInstr *MI, const UUPairMap &PairMap);
117     bool splitPartition(const USet &Part);
118 
119     static int Counter;
120 
121     static void dump_partition(raw_ostream&, const USet&,
122        const TargetRegisterInfo&);
123   };
124 
125 } // end anonymous namespace
126 
127 char HexagonSplitDoubleRegs::ID;
128 int HexagonSplitDoubleRegs::Counter = 0;
129 const TargetRegisterClass *const HexagonSplitDoubleRegs::DoubleRC =
130     &Hexagon::DoubleRegsRegClass;
131 
132 INITIALIZE_PASS(HexagonSplitDoubleRegs, "hexagon-split-double",
133   "Hexagon Split Double Registers", false, false)
134 
135 #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
136 LLVM_DUMP_METHOD void HexagonSplitDoubleRegs::dump_partition(raw_ostream &os,
137       const USet &Part, const TargetRegisterInfo &TRI) {
138   dbgs() << '{';
139   for (auto I : Part)
140     dbgs() << ' ' << printReg(I, &TRI);
141   dbgs() << " }";
142 }
143 #endif
144 
145 bool HexagonSplitDoubleRegs::isInduction(unsigned Reg, LoopRegMap &IRM) const {
146   for (auto I : IRM) {
147     const USet &Rs = I.second;
148     if (Rs.find(Reg) != Rs.end())
149       return true;
150   }
151   return false;
152 }
153 
154 bool HexagonSplitDoubleRegs::isVolatileInstr(const MachineInstr *MI) const {
155   for (auto &MO : MI->memoperands())
156     if (MO->isVolatile() || MO->isAtomic())
157       return true;
158   return false;
159 }
160 
161 bool HexagonSplitDoubleRegs::isFixedInstr(const MachineInstr *MI) const {
162   if (MI->mayLoadOrStore())
163     if (MemRefsFixed || isVolatileInstr(MI))
164       return true;
165   if (MI->isDebugInstr())
166     return false;
167 
168   unsigned Opc = MI->getOpcode();
169   switch (Opc) {
170     default:
171       return true;
172 
173     case TargetOpcode::PHI:
174     case TargetOpcode::COPY:
175       break;
176 
177     case Hexagon::L2_loadrd_io:
178       // Not handling stack stores (only reg-based addresses).
179       if (MI->getOperand(1).isReg())
180         break;
181       return true;
182     case Hexagon::S2_storerd_io:
183       // Not handling stack stores (only reg-based addresses).
184       if (MI->getOperand(0).isReg())
185         break;
186       return true;
187     case Hexagon::L2_loadrd_pi:
188     case Hexagon::S2_storerd_pi:
189 
190     case Hexagon::A2_tfrpi:
191     case Hexagon::A2_combineii:
192     case Hexagon::A4_combineir:
193     case Hexagon::A4_combineii:
194     case Hexagon::A4_combineri:
195     case Hexagon::A2_combinew:
196     case Hexagon::CONST64:
197 
198     case Hexagon::A2_sxtw:
199 
200     case Hexagon::A2_andp:
201     case Hexagon::A2_orp:
202     case Hexagon::A2_xorp:
203     case Hexagon::S2_asl_i_p_or:
204     case Hexagon::S2_asl_i_p:
205     case Hexagon::S2_asr_i_p:
206     case Hexagon::S2_lsr_i_p:
207       break;
208   }
209 
210   for (auto &Op : MI->operands()) {
211     if (!Op.isReg())
212       continue;
213     Register R = Op.getReg();
214     if (!Register::isVirtualRegister(R))
215       return true;
216   }
217   return false;
218 }
219 
220 void HexagonSplitDoubleRegs::partitionRegisters(UUSetMap &P2Rs) {
221   using UUMap = std::map<unsigned, unsigned>;
222   using UVect = std::vector<unsigned>;
223 
224   unsigned NumRegs = MRI->getNumVirtRegs();
225   BitVector DoubleRegs(NumRegs);
226   for (unsigned i = 0; i < NumRegs; ++i) {
227     unsigned R = Register::index2VirtReg(i);
228     if (MRI->getRegClass(R) == DoubleRC)
229       DoubleRegs.set(i);
230   }
231 
232   BitVector FixedRegs(NumRegs);
233   for (int x = DoubleRegs.find_first(); x >= 0; x = DoubleRegs.find_next(x)) {
234     unsigned R = Register::index2VirtReg(x);
235     MachineInstr *DefI = MRI->getVRegDef(R);
236     // In some cases a register may exist, but never be defined or used.
237     // It should never appear anywhere, but mark it as "fixed", just to be
238     // safe.
239     if (!DefI || isFixedInstr(DefI))
240       FixedRegs.set(x);
241   }
242 
243   UUSetMap AssocMap;
244   for (int x = DoubleRegs.find_first(); x >= 0; x = DoubleRegs.find_next(x)) {
245     if (FixedRegs[x])
246       continue;
247     unsigned R = Register::index2VirtReg(x);
248     LLVM_DEBUG(dbgs() << printReg(R, TRI) << " ~~");
249     USet &Asc = AssocMap[R];
250     for (auto U = MRI->use_nodbg_begin(R), Z = MRI->use_nodbg_end();
251          U != Z; ++U) {
252       MachineOperand &Op = *U;
253       MachineInstr *UseI = Op.getParent();
254       if (isFixedInstr(UseI))
255         continue;
256       for (unsigned i = 0, n = UseI->getNumOperands(); i < n; ++i) {
257         MachineOperand &MO = UseI->getOperand(i);
258         // Skip non-registers or registers with subregisters.
259         if (&MO == &Op || !MO.isReg() || MO.getSubReg())
260           continue;
261         Register T = MO.getReg();
262         if (!Register::isVirtualRegister(T)) {
263           FixedRegs.set(x);
264           continue;
265         }
266         if (MRI->getRegClass(T) != DoubleRC)
267           continue;
268         unsigned u = Register::virtReg2Index(T);
269         if (FixedRegs[u])
270           continue;
271         LLVM_DEBUG(dbgs() << ' ' << printReg(T, TRI));
272         Asc.insert(T);
273         // Make it symmetric.
274         AssocMap[T].insert(R);
275       }
276     }
277     LLVM_DEBUG(dbgs() << '\n');
278   }
279 
280   UUMap R2P;
281   unsigned NextP = 1;
282   USet Visited;
283   for (int x = DoubleRegs.find_first(); x >= 0; x = DoubleRegs.find_next(x)) {
284     unsigned R = Register::index2VirtReg(x);
285     if (Visited.count(R))
286       continue;
287     // Create a new partition for R.
288     unsigned ThisP = FixedRegs[x] ? 0 : NextP++;
289     UVect WorkQ;
290     WorkQ.push_back(R);
291     for (unsigned i = 0; i < WorkQ.size(); ++i) {
292       unsigned T = WorkQ[i];
293       if (Visited.count(T))
294         continue;
295       R2P[T] = ThisP;
296       Visited.insert(T);
297       // Add all registers associated with T.
298       USet &Asc = AssocMap[T];
299       for (USet::iterator J = Asc.begin(), F = Asc.end(); J != F; ++J)
300         WorkQ.push_back(*J);
301     }
302   }
303 
304   for (auto I : R2P)
305     P2Rs[I.second].insert(I.first);
306 }
307 
/// Profit of materializing the 32-bit immediate \p Imm on its own: 10 when
/// all bits are zero or all bits are one, otherwise 0.
static inline int32_t profitImm(unsigned Imm) {
  const bool AllZerosOrAllOnes = (Imm == 0u) || (Imm == 0xFFFFFFFFu);
  return AllZerosOrAllOnes ? 10 : 0;
}
314 
315 int32_t HexagonSplitDoubleRegs::profit(const MachineInstr *MI) const {
316   unsigned ImmX = 0;
317   unsigned Opc = MI->getOpcode();
318   switch (Opc) {
319     case TargetOpcode::PHI:
320       for (const auto &Op : MI->operands())
321         if (!Op.getSubReg())
322           return 0;
323       return 10;
324     case TargetOpcode::COPY:
325       if (MI->getOperand(1).getSubReg() != 0)
326         return 10;
327       return 0;
328 
329     case Hexagon::L2_loadrd_io:
330     case Hexagon::S2_storerd_io:
331       return -1;
332     case Hexagon::L2_loadrd_pi:
333     case Hexagon::S2_storerd_pi:
334       return 2;
335 
336     case Hexagon::A2_tfrpi:
337     case Hexagon::CONST64: {
338       uint64_t D = MI->getOperand(1).getImm();
339       unsigned Lo = D & 0xFFFFFFFFULL;
340       unsigned Hi = D >> 32;
341       return profitImm(Lo) + profitImm(Hi);
342     }
343     case Hexagon::A2_combineii:
344     case Hexagon::A4_combineii: {
345       const MachineOperand &Op1 = MI->getOperand(1);
346       const MachineOperand &Op2 = MI->getOperand(2);
347       int32_t Prof1 = Op1.isImm() ? profitImm(Op1.getImm()) : 0;
348       int32_t Prof2 = Op2.isImm() ? profitImm(Op2.getImm()) : 0;
349       return Prof1 + Prof2;
350     }
351     case Hexagon::A4_combineri:
352       ImmX++;
353       // Fall through into A4_combineir.
354       LLVM_FALLTHROUGH;
355     case Hexagon::A4_combineir: {
356       ImmX++;
357       const MachineOperand &OpX = MI->getOperand(ImmX);
358       if (OpX.isImm()) {
359         int64_t V = OpX.getImm();
360         if (V == 0 || V == -1)
361           return 10;
362       }
363       // Fall through into A2_combinew.
364       LLVM_FALLTHROUGH;
365     }
366     case Hexagon::A2_combinew:
367       return 2;
368 
369     case Hexagon::A2_sxtw:
370       return 3;
371 
372     case Hexagon::A2_andp:
373     case Hexagon::A2_orp:
374     case Hexagon::A2_xorp: {
375       Register Rs = MI->getOperand(1).getReg();
376       Register Rt = MI->getOperand(2).getReg();
377       return profit(Rs) + profit(Rt);
378     }
379 
380     case Hexagon::S2_asl_i_p_or: {
381       unsigned S = MI->getOperand(3).getImm();
382       if (S == 0 || S == 32)
383         return 10;
384       return -1;
385     }
386     case Hexagon::S2_asl_i_p:
387     case Hexagon::S2_asr_i_p:
388     case Hexagon::S2_lsr_i_p:
389       unsigned S = MI->getOperand(2).getImm();
390       if (S == 0 || S == 32)
391         return 10;
392       if (S == 16)
393         return 5;
394       if (S == 48)
395         return 7;
396       return -10;
397   }
398 
399   return 0;
400 }
401 
402 int32_t HexagonSplitDoubleRegs::profit(unsigned Reg) const {
403   assert(Register::isVirtualRegister(Reg));
404 
405   const MachineInstr *DefI = MRI->getVRegDef(Reg);
406   switch (DefI->getOpcode()) {
407     case Hexagon::A2_tfrpi:
408     case Hexagon::CONST64:
409     case Hexagon::A2_combineii:
410     case Hexagon::A4_combineii:
411     case Hexagon::A4_combineri:
412     case Hexagon::A4_combineir:
413     case Hexagon::A2_combinew:
414       return profit(DefI);
415     default:
416       break;
417   }
418   return 0;
419 }
420 
421 bool HexagonSplitDoubleRegs::isProfitable(const USet &Part, LoopRegMap &IRM)
422       const {
423   unsigned FixedNum = 0, LoopPhiNum = 0;
424   int32_t TotalP = 0;
425 
426   for (unsigned DR : Part) {
427     MachineInstr *DefI = MRI->getVRegDef(DR);
428     int32_t P = profit(DefI);
429     if (P == std::numeric_limits<int>::min())
430       return false;
431     TotalP += P;
432     // Reduce the profitability of splitting induction registers.
433     if (isInduction(DR, IRM))
434       TotalP -= 30;
435 
436     for (auto U = MRI->use_nodbg_begin(DR), W = MRI->use_nodbg_end();
437          U != W; ++U) {
438       MachineInstr *UseI = U->getParent();
439       if (isFixedInstr(UseI)) {
440         FixedNum++;
441         // Calculate the cost of generating REG_SEQUENCE instructions.
442         for (auto &Op : UseI->operands()) {
443           if (Op.isReg() && Part.count(Op.getReg()))
444             if (Op.getSubReg())
445               TotalP -= 2;
446         }
447         continue;
448       }
449       // If a register from this partition is used in a fixed instruction,
450       // and there is also a register in this partition that is used in
451       // a loop phi node, then decrease the splitting profit as this can
452       // confuse the modulo scheduler.
453       if (UseI->isPHI()) {
454         const MachineBasicBlock *PB = UseI->getParent();
455         const MachineLoop *L = MLI->getLoopFor(PB);
456         if (L && L->getHeader() == PB)
457           LoopPhiNum++;
458       }
459       // Splittable instruction.
460       int32_t P = profit(UseI);
461       if (P == std::numeric_limits<int>::min())
462         return false;
463       TotalP += P;
464     }
465   }
466 
467   if (FixedNum > 0 && LoopPhiNum > 0)
468     TotalP -= 20*LoopPhiNum;
469 
470   LLVM_DEBUG(dbgs() << "Partition profit: " << TotalP << '\n');
471   if (SplitAll)
472     return true;
473   return TotalP > 0;
474 }
475 
476 void HexagonSplitDoubleRegs::collectIndRegsForLoop(const MachineLoop *L,
477       USet &Rs) {
478   const MachineBasicBlock *HB = L->getHeader();
479   const MachineBasicBlock *LB = L->getLoopLatch();
480   if (!HB || !LB)
481     return;
482 
483   // Examine the latch branch. Expect it to be a conditional branch to
484   // the header (either "br-cond header" or "br-cond exit; br header").
485   MachineBasicBlock *TB = nullptr, *FB = nullptr;
486   MachineBasicBlock *TmpLB = const_cast<MachineBasicBlock*>(LB);
487   SmallVector<MachineOperand,2> Cond;
488   bool BadLB = TII->analyzeBranch(*TmpLB, TB, FB, Cond, false);
489   // Only analyzable conditional branches. HII::analyzeBranch will put
490   // the branch opcode as the first element of Cond, and the predicate
491   // operand as the second.
492   if (BadLB || Cond.size() != 2)
493     return;
494   // Only simple jump-conditional (with or without negation).
495   if (!TII->PredOpcodeHasJMP_c(Cond[0].getImm()))
496     return;
497   // Must go to the header.
498   if (TB != HB && FB != HB)
499     return;
500   assert(Cond[1].isReg() && "Unexpected Cond vector from analyzeBranch");
501   // Expect a predicate register.
502   Register PR = Cond[1].getReg();
503   assert(MRI->getRegClass(PR) == &Hexagon::PredRegsRegClass);
504 
505   // Get the registers on which the loop controlling compare instruction
506   // depends.
507   unsigned CmpR1 = 0, CmpR2 = 0;
508   const MachineInstr *CmpI = MRI->getVRegDef(PR);
509   while (CmpI->getOpcode() == Hexagon::C2_not)
510     CmpI = MRI->getVRegDef(CmpI->getOperand(1).getReg());
511 
512   int Mask = 0, Val = 0;
513   bool OkCI = TII->analyzeCompare(*CmpI, CmpR1, CmpR2, Mask, Val);
514   if (!OkCI)
515     return;
516   // Eliminate non-double input registers.
517   if (CmpR1 && MRI->getRegClass(CmpR1) != DoubleRC)
518     CmpR1 = 0;
519   if (CmpR2 && MRI->getRegClass(CmpR2) != DoubleRC)
520     CmpR2 = 0;
521   if (!CmpR1 && !CmpR2)
522     return;
523 
524   // Now examine the top of the loop: the phi nodes that could poten-
525   // tially define loop induction registers. The registers defined by
526   // such a phi node would be used in a 64-bit add, which then would
527   // be used in the loop compare instruction.
528 
529   // Get the set of all double registers defined by phi nodes in the
530   // loop header.
531   using UVect = std::vector<unsigned>;
532 
533   UVect DP;
534   for (auto &MI : *HB) {
535     if (!MI.isPHI())
536       break;
537     const MachineOperand &MD = MI.getOperand(0);
538     Register R = MD.getReg();
539     if (MRI->getRegClass(R) == DoubleRC)
540       DP.push_back(R);
541   }
542   if (DP.empty())
543     return;
544 
545   auto NoIndOp = [this, CmpR1, CmpR2] (unsigned R) -> bool {
546     for (auto I = MRI->use_nodbg_begin(R), E = MRI->use_nodbg_end();
547          I != E; ++I) {
548       const MachineInstr *UseI = I->getParent();
549       if (UseI->getOpcode() != Hexagon::A2_addp)
550         continue;
551       // Get the output from the add. If it is one of the inputs to the
552       // loop-controlling compare instruction, then R is likely an induc-
553       // tion register.
554       Register T = UseI->getOperand(0).getReg();
555       if (T == CmpR1 || T == CmpR2)
556         return false;
557     }
558     return true;
559   };
560   UVect::iterator End = llvm::remove_if(DP, NoIndOp);
561   Rs.insert(DP.begin(), End);
562   Rs.insert(CmpR1);
563   Rs.insert(CmpR2);
564 
565   LLVM_DEBUG({
566     dbgs() << "For loop at " << printMBBReference(*HB) << " ind regs: ";
567     dump_partition(dbgs(), Rs, *TRI);
568     dbgs() << '\n';
569   });
570 }
571 
572 void HexagonSplitDoubleRegs::collectIndRegs(LoopRegMap &IRM) {
573   using LoopVector = std::vector<MachineLoop *>;
574 
575   LoopVector WorkQ;
576 
577   for (auto I : *MLI)
578     WorkQ.push_back(I);
579   for (unsigned i = 0; i < WorkQ.size(); ++i) {
580     for (auto I : *WorkQ[i])
581       WorkQ.push_back(I);
582   }
583 
584   USet Rs;
585   for (unsigned i = 0, n = WorkQ.size(); i < n; ++i) {
586     MachineLoop *L = WorkQ[i];
587     Rs.clear();
588     collectIndRegsForLoop(L, Rs);
589     if (!Rs.empty())
590       IRM.insert(std::make_pair(L, Rs));
591   }
592 }
593 
594 void HexagonSplitDoubleRegs::createHalfInstr(unsigned Opc, MachineInstr *MI,
595       const UUPairMap &PairMap, unsigned SubR) {
596   MachineBasicBlock &B = *MI->getParent();
597   DebugLoc DL = MI->getDebugLoc();
598   MachineInstr *NewI = BuildMI(B, MI, DL, TII->get(Opc));
599 
600   for (auto &Op : MI->operands()) {
601     if (!Op.isReg()) {
602       NewI->addOperand(Op);
603       continue;
604     }
605     // For register operands, set the subregister.
606     Register R = Op.getReg();
607     unsigned SR = Op.getSubReg();
608     bool isVirtReg = Register::isVirtualRegister(R);
609     bool isKill = Op.isKill();
610     if (isVirtReg && MRI->getRegClass(R) == DoubleRC) {
611       isKill = false;
612       UUPairMap::const_iterator F = PairMap.find(R);
613       if (F == PairMap.end()) {
614         SR = SubR;
615       } else {
616         const UUPair &P = F->second;
617         R = (SubR == Hexagon::isub_lo) ? P.first : P.second;
618         SR = 0;
619       }
620     }
621     auto CO = MachineOperand::CreateReg(R, Op.isDef(), Op.isImplicit(), isKill,
622           Op.isDead(), Op.isUndef(), Op.isEarlyClobber(), SR, Op.isDebug(),
623           Op.isInternalRead());
624     NewI->addOperand(CO);
625   }
626 }
627 
/// Replace the 64-bit load or store \p MI by two 32-bit accesses, emitted in
/// front of \p MI: the low word at the original offset and the high word at
/// offset + 4. For the post-increment forms the address update is emitted as
/// a separate A2_addi. The value register of \p MI must have an entry in
/// \p PairMap. \p MI itself is not erased here.
void HexagonSplitDoubleRegs::splitMemRef(MachineInstr *MI,
      const UUPairMap &PairMap) {
  bool Load = MI->mayLoad();
  unsigned OrigOpc = MI->getOpcode();
  bool PostInc = (OrigOpc == Hexagon::L2_loadrd_pi ||
                  OrigOpc == Hexagon::S2_storerd_pi);
  MachineInstr *LowI, *HighI;
  MachineBasicBlock &B = *MI->getParent();
  DebugLoc DL = MI->getDebugLoc();

  // Index of the base-address-register operand.
  unsigned AdrX = PostInc ? (Load ? 2 : 1)
                          : (Load ? 1 : 0);
  MachineOperand &AdrOp = MI->getOperand(AdrX);
  unsigned RSA = getRegState(AdrOp);
  // The value operand is the def for loads and the last operand for stores.
  MachineOperand &ValOp = Load ? MI->getOperand(0)
                               : (PostInc ? MI->getOperand(3)
                                          : MI->getOperand(2));
  UUPairMap::const_iterator F = PairMap.find(ValOp.getReg());
  assert(F != PairMap.end());

  if (Load) {
    const UUPair &P = F->second;
    // Post-increment accesses use the unmodified base address.
    int64_t Off = PostInc ? 0 : MI->getOperand(2).getImm();
    // The kill flag is dropped because the address is read again below.
    LowI = BuildMI(B, MI, DL, TII->get(Hexagon::L2_loadri_io), P.first)
             .addReg(AdrOp.getReg(), RSA & ~RegState::Kill, AdrOp.getSubReg())
             .addImm(Off);
    HighI = BuildMI(B, MI, DL, TII->get(Hexagon::L2_loadri_io), P.second)
              .addReg(AdrOp.getReg(), RSA & ~RegState::Kill, AdrOp.getSubReg())
              .addImm(Off+4);
  } else {
    const UUPair &P = F->second;
    // Post-increment accesses use the unmodified base address.
    int64_t Off = PostInc ? 0 : MI->getOperand(1).getImm();
    LowI = BuildMI(B, MI, DL, TII->get(Hexagon::S2_storeri_io))
             .addReg(AdrOp.getReg(), RSA & ~RegState::Kill, AdrOp.getSubReg())
             .addImm(Off)
             .addReg(P.first);
    HighI = BuildMI(B, MI, DL, TII->get(Hexagon::S2_storeri_io))
              .addReg(AdrOp.getReg(), RSA & ~RegState::Kill, AdrOp.getSubReg())
              .addImm(Off+4)
              .addReg(P.second);
  }

  if (PostInc) {
    // Create the increment of the address register.
    int64_t Inc = Load ? MI->getOperand(3).getImm()
                       : MI->getOperand(2).getImm();
    // Operand holding the updated address produced by the original access.
    MachineOperand &UpdOp = Load ? MI->getOperand(1) : MI->getOperand(0);
    const TargetRegisterClass *RC = MRI->getRegClass(UpdOp.getReg());
    Register NewR = MRI->createVirtualRegister(RC);
    assert(!UpdOp.getSubReg() && "Def operand with subreg");
    // This is the last read of the address, so the original flags
    // (including kill) are kept.
    BuildMI(B, MI, DL, TII->get(Hexagon::A2_addi), NewR)
      .addReg(AdrOp.getReg(), RSA)
      .addImm(Inc);
    // Redirect every reference to the old updated-address register.
    MRI->replaceRegWith(UpdOp.getReg(), NewR);
    // The original instruction will be deleted later.
  }

  // Generate a new pair of memory-operands.
  MachineFunction &MF = *B.getParent();
  for (auto &MO : MI->memoperands()) {
    const MachinePointerInfo &Ptr = MO->getPointerInfo();
    MachineMemOperand::Flags F = MO->getFlags();
    int A = MO->getAlignment();

    // NOTE(review): both halves reuse the same pointer info; the high half
    // does not appear to have its offset advanced by 4 -- confirm whether
    // that is intended.
    auto *Tmp1 = MF.getMachineMemOperand(Ptr, F, 4/*size*/, A);
    LowI->addMemOperand(MF, Tmp1);
    // The high word sits 4 bytes further, so its alignment is capped at 4.
    auto *Tmp2 = MF.getMachineMemOperand(Ptr, F, 4/*size*/, std::min(A, 4));
    HighI->addMemOperand(MF, Tmp2);
  }
}
699 
700 void HexagonSplitDoubleRegs::splitImmediate(MachineInstr *MI,
701       const UUPairMap &PairMap) {
702   MachineOperand &Op0 = MI->getOperand(0);
703   MachineOperand &Op1 = MI->getOperand(1);
704   assert(Op0.isReg() && Op1.isImm());
705   uint64_t V = Op1.getImm();
706 
707   MachineBasicBlock &B = *MI->getParent();
708   DebugLoc DL = MI->getDebugLoc();
709   UUPairMap::const_iterator F = PairMap.find(Op0.getReg());
710   assert(F != PairMap.end());
711   const UUPair &P = F->second;
712 
713   // The operand to A2_tfrsi can only have 32 significant bits. Immediate
714   // values in MachineOperand are stored as 64-bit integers, and so the
715   // value -1 may be represented either as 64-bit -1, or 4294967295. Both
716   // will have the 32 higher bits truncated in the end, but -1 will remain
717   // as -1, while the latter may appear to be a large unsigned value
718   // requiring a constant extender. The casting to int32_t will select the
719   // former representation. (The same reasoning applies to all 32-bit
720   // values.)
721   BuildMI(B, MI, DL, TII->get(Hexagon::A2_tfrsi), P.first)
722     .addImm(int32_t(V & 0xFFFFFFFFULL));
723   BuildMI(B, MI, DL, TII->get(Hexagon::A2_tfrsi), P.second)
724     .addImm(int32_t(V >> 32));
725 }
726 
727 void HexagonSplitDoubleRegs::splitCombine(MachineInstr *MI,
728       const UUPairMap &PairMap) {
729   MachineOperand &Op0 = MI->getOperand(0);
730   MachineOperand &Op1 = MI->getOperand(1);
731   MachineOperand &Op2 = MI->getOperand(2);
732   assert(Op0.isReg());
733 
734   MachineBasicBlock &B = *MI->getParent();
735   DebugLoc DL = MI->getDebugLoc();
736   UUPairMap::const_iterator F = PairMap.find(Op0.getReg());
737   assert(F != PairMap.end());
738   const UUPair &P = F->second;
739 
740   if (!Op1.isReg()) {
741     BuildMI(B, MI, DL, TII->get(Hexagon::A2_tfrsi), P.second)
742       .add(Op1);
743   } else {
744     BuildMI(B, MI, DL, TII->get(TargetOpcode::COPY), P.second)
745       .addReg(Op1.getReg(), getRegState(Op1), Op1.getSubReg());
746   }
747 
748   if (!Op2.isReg()) {
749     BuildMI(B, MI, DL, TII->get(Hexagon::A2_tfrsi), P.first)
750       .add(Op2);
751   } else {
752     BuildMI(B, MI, DL, TII->get(TargetOpcode::COPY), P.first)
753       .addReg(Op2.getReg(), getRegState(Op2), Op2.getSubReg());
754   }
755 }
756 
757 void HexagonSplitDoubleRegs::splitExt(MachineInstr *MI,
758       const UUPairMap &PairMap) {
759   MachineOperand &Op0 = MI->getOperand(0);
760   MachineOperand &Op1 = MI->getOperand(1);
761   assert(Op0.isReg() && Op1.isReg());
762 
763   MachineBasicBlock &B = *MI->getParent();
764   DebugLoc DL = MI->getDebugLoc();
765   UUPairMap::const_iterator F = PairMap.find(Op0.getReg());
766   assert(F != PairMap.end());
767   const UUPair &P = F->second;
768   unsigned RS = getRegState(Op1);
769 
770   BuildMI(B, MI, DL, TII->get(TargetOpcode::COPY), P.first)
771     .addReg(Op1.getReg(), RS & ~RegState::Kill, Op1.getSubReg());
772   BuildMI(B, MI, DL, TII->get(Hexagon::S2_asr_i_r), P.second)
773     .addReg(Op1.getReg(), RS, Op1.getSubReg())
774     .addImm(31);
775 }
776 
/// Replace the 64-bit shift-by-immediate \p MI (S2_asl_i_p, S2_asr_i_p or
/// S2_lsr_i_p) by 32-bit instructions emitted in front of it. The result is
/// written to the register pair that \p PairMap associates with the
/// destination. The expansion depends on the shift amount: 0, 1..31, 32, and
/// 33..63 are handled separately.
void HexagonSplitDoubleRegs::splitShift(MachineInstr *MI,
      const UUPairMap &PairMap) {
  using namespace Hexagon;

  MachineOperand &Op0 = MI->getOperand(0);
  MachineOperand &Op1 = MI->getOperand(1);
  MachineOperand &Op2 = MI->getOperand(2);
  assert(Op0.isReg() && Op1.isReg() && Op2.isImm());
  int64_t Sh64 = Op2.getImm();
  assert(Sh64 >= 0 && Sh64 < 64);
  unsigned S = Sh64;

  UUPairMap::const_iterator F = PairMap.find(Op0.getReg());
  assert(F != PairMap.end());
  const UUPair &P = F->second;
  Register LoR = P.first;
  Register HiR = P.second;

  // Classify the shift: direction, and whether a right shift is arithmetic.
  unsigned Opc = MI->getOpcode();
  bool Right = (Opc == S2_lsr_i_p || Opc == S2_asr_i_p);
  bool Left = !Right;
  bool Signed = (Opc == S2_asr_i_p);

  MachineBasicBlock &B = *MI->getParent();
  DebugLoc DL = MI->getDebugLoc();
  unsigned RS = getRegState(Op1);
  // The 32-bit shift opcode matching the 64-bit one.
  unsigned ShiftOpc = Left ? S2_asl_i_r
                           : (Signed ? S2_asr_i_r : S2_lsr_i_r);
  unsigned LoSR = isub_lo;
  unsigned HiSR = isub_hi;

  // In every branch below the source is read more than once; the kill flag
  // is stripped from all reads except the last one emitted.
  if (S == 0) {
    // No shift, subregister copy.
    BuildMI(B, MI, DL, TII->get(TargetOpcode::COPY), LoR)
      .addReg(Op1.getReg(), RS & ~RegState::Kill, LoSR);
    BuildMI(B, MI, DL, TII->get(TargetOpcode::COPY), HiR)
      .addReg(Op1.getReg(), RS, HiSR);
  } else if (S < 32) {
    const TargetRegisterClass *IntRC = &IntRegsRegClass;
    Register TmpR = MRI->createVirtualRegister(IntRC);
    // Expansion:
    // Shift left:    DR = shl R, #s
    //   LoR  = shl R.lo, #s
    //   TmpR = extractu R.lo, #s, #32-s
    //   HiR  = or (TmpR, asl(R.hi, #s))
    // Shift right:   DR = shr R, #s
    //   HiR  = shr R.hi, #s
    //   TmpR = shr R.lo, #s
    //   LoR  = insert TmpR, R.hi, #s, #32-s

    // Shift left:
    //   LoR  = shl R.lo, #s
    // Shift right:
    //   TmpR = shr R.lo, #s

    // Make a special case for A2_aslh and A2_asrh (they are predicable as
    // opposed to S2_asl_i_r/S2_asr_i_r).
    if (S == 16 && Left)
      BuildMI(B, MI, DL, TII->get(A2_aslh), LoR)
        .addReg(Op1.getReg(), RS & ~RegState::Kill, LoSR);
    else if (S == 16 && Signed)
      BuildMI(B, MI, DL, TII->get(A2_asrh), TmpR)
        .addReg(Op1.getReg(), RS & ~RegState::Kill, LoSR);
    else
      BuildMI(B, MI, DL, TII->get(ShiftOpc), (Left ? LoR : TmpR))
        .addReg(Op1.getReg(), RS & ~RegState::Kill, LoSR)
        .addImm(S);

    if (Left) {
      // TmpR = extractu R.lo, #s, #32-s
      BuildMI(B, MI, DL, TII->get(S2_extractu), TmpR)
        .addReg(Op1.getReg(), RS & ~RegState::Kill, LoSR)
        .addImm(S)
        .addImm(32-S);
      // HiR  = or (TmpR, asl(R.hi, #s))
      BuildMI(B, MI, DL, TII->get(S2_asl_i_r_or), HiR)
        .addReg(TmpR)
        .addReg(Op1.getReg(), RS, HiSR)
        .addImm(S);
    } else {
      // HiR  = shr R.hi, #s
      BuildMI(B, MI, DL, TII->get(ShiftOpc), HiR)
        .addReg(Op1.getReg(), RS & ~RegState::Kill, HiSR)
        .addImm(S);
      // LoR  = insert TmpR, R.hi, #s, #32-s
      BuildMI(B, MI, DL, TII->get(S2_insert), LoR)
        .addReg(TmpR)
        .addReg(Op1.getReg(), RS, HiSR)
        .addImm(S)
        .addImm(32-S);
    }
  } else if (S == 32) {
    // Shift by exactly one word: one half is a plain copy of the other
    // source half.
    BuildMI(B, MI, DL, TII->get(TargetOpcode::COPY), (Left ? HiR : LoR))
      .addReg(Op1.getReg(), RS & ~RegState::Kill, (Left ? LoSR : HiSR));
    // The remaining half is zero, or the replicated sign bit for an
    // arithmetic shift.
    if (!Signed)
      BuildMI(B, MI, DL, TII->get(A2_tfrsi), (Left ? LoR : HiR))
        .addImm(0);
    else  // Must be right shift.
      BuildMI(B, MI, DL, TII->get(S2_asr_i_r), HiR)
        .addReg(Op1.getReg(), RS, HiSR)
        .addImm(31);
  } else if (S < 64) {
    // Shift by more than one word: shift a single source half by S-32 into
    // the opposite result half.
    S -= 32;
    if (S == 16 && Left)
      BuildMI(B, MI, DL, TII->get(A2_aslh), HiR)
        .addReg(Op1.getReg(), RS & ~RegState::Kill, LoSR);
    else if (S == 16 && Signed)
      BuildMI(B, MI, DL, TII->get(A2_asrh), LoR)
        .addReg(Op1.getReg(), RS & ~RegState::Kill, HiSR);
    else
      BuildMI(B, MI, DL, TII->get(ShiftOpc), (Left ? HiR : LoR))
        .addReg(Op1.getReg(), RS & ~RegState::Kill, (Left ? LoSR : HiSR))
        .addImm(S);

    // Fill the other result half with the sign bits (arithmetic shift) or
    // with zero.
    if (Signed)
      BuildMI(B, MI, DL, TII->get(S2_asr_i_r), HiR)
        .addReg(Op1.getReg(), RS, HiSR)
        .addImm(31);
    else
      BuildMI(B, MI, DL, TII->get(A2_tfrsi), (Left ? LoR : HiR))
        .addImm(0);
  }
}
900 
901 void HexagonSplitDoubleRegs::splitAslOr(MachineInstr *MI,
902       const UUPairMap &PairMap) {
903   using namespace Hexagon;
904 
905   MachineOperand &Op0 = MI->getOperand(0);
906   MachineOperand &Op1 = MI->getOperand(1);
907   MachineOperand &Op2 = MI->getOperand(2);
908   MachineOperand &Op3 = MI->getOperand(3);
909   assert(Op0.isReg() && Op1.isReg() && Op2.isReg() && Op3.isImm());
910   int64_t Sh64 = Op3.getImm();
911   assert(Sh64 >= 0 && Sh64 < 64);
912   unsigned S = Sh64;
913 
914   UUPairMap::const_iterator F = PairMap.find(Op0.getReg());
915   assert(F != PairMap.end());
916   const UUPair &P = F->second;
917   unsigned LoR = P.first;
918   unsigned HiR = P.second;
919 
920   MachineBasicBlock &B = *MI->getParent();
921   DebugLoc DL = MI->getDebugLoc();
922   unsigned RS1 = getRegState(Op1);
923   unsigned RS2 = getRegState(Op2);
924   const TargetRegisterClass *IntRC = &IntRegsRegClass;
925 
926   unsigned LoSR = isub_lo;
927   unsigned HiSR = isub_hi;
928 
929   // Op0 = S2_asl_i_p_or Op1, Op2, Op3
930   // means:  Op0 = or (Op1, asl(Op2, Op3))
931 
932   // Expansion of
933   //   DR = or (R1, asl(R2, #s))
934   //
935   //   LoR  = or (R1.lo, asl(R2.lo, #s))
936   //   Tmp1 = extractu R2.lo, #s, #32-s
937   //   Tmp2 = or R1.hi, Tmp1
938   //   HiR  = or (Tmp2, asl(R2.hi, #s))
939 
940   if (S == 0) {
941     // DR  = or (R1, asl(R2, #0))
942     //    -> or (R1, R2)
943     // i.e. LoR = or R1.lo, R2.lo
944     //      HiR = or R1.hi, R2.hi
945     BuildMI(B, MI, DL, TII->get(A2_or), LoR)
946       .addReg(Op1.getReg(), RS1 & ~RegState::Kill, LoSR)
947       .addReg(Op2.getReg(), RS2 & ~RegState::Kill, LoSR);
948     BuildMI(B, MI, DL, TII->get(A2_or), HiR)
949       .addReg(Op1.getReg(), RS1, HiSR)
950       .addReg(Op2.getReg(), RS2, HiSR);
951   } else if (S < 32) {
952     BuildMI(B, MI, DL, TII->get(S2_asl_i_r_or), LoR)
953       .addReg(Op1.getReg(), RS1 & ~RegState::Kill, LoSR)
954       .addReg(Op2.getReg(), RS2 & ~RegState::Kill, LoSR)
955       .addImm(S);
956     Register TmpR1 = MRI->createVirtualRegister(IntRC);
957     BuildMI(B, MI, DL, TII->get(S2_extractu), TmpR1)
958       .addReg(Op2.getReg(), RS2 & ~RegState::Kill, LoSR)
959       .addImm(S)
960       .addImm(32-S);
961     Register TmpR2 = MRI->createVirtualRegister(IntRC);
962     BuildMI(B, MI, DL, TII->get(A2_or), TmpR2)
963       .addReg(Op1.getReg(), RS1, HiSR)
964       .addReg(TmpR1);
965     BuildMI(B, MI, DL, TII->get(S2_asl_i_r_or), HiR)
966       .addReg(TmpR2)
967       .addReg(Op2.getReg(), RS2, HiSR)
968       .addImm(S);
969   } else if (S == 32) {
970     // DR  = or (R1, asl(R2, #32))
971     //    -> or R1, R2.lo
972     // LoR = R1.lo
973     // HiR = or R1.hi, R2.lo
974     BuildMI(B, MI, DL, TII->get(TargetOpcode::COPY), LoR)
975       .addReg(Op1.getReg(), RS1 & ~RegState::Kill, LoSR);
976     BuildMI(B, MI, DL, TII->get(A2_or), HiR)
977       .addReg(Op1.getReg(), RS1, HiSR)
978       .addReg(Op2.getReg(), RS2, LoSR);
979   } else if (S < 64) {
980     // DR  = or (R1, asl(R2, #s))
981     //
982     // LoR = R1:lo
983     // HiR = or (R1:hi, asl(R2:lo, #s-32))
984     S -= 32;
985     BuildMI(B, MI, DL, TII->get(TargetOpcode::COPY), LoR)
986       .addReg(Op1.getReg(), RS1 & ~RegState::Kill, LoSR);
987     BuildMI(B, MI, DL, TII->get(S2_asl_i_r_or), HiR)
988       .addReg(Op1.getReg(), RS1, HiSR)
989       .addReg(Op2.getReg(), RS2, LoSR)
990       .addImm(S);
991   }
992 }
993 
994 bool HexagonSplitDoubleRegs::splitInstr(MachineInstr *MI,
995       const UUPairMap &PairMap) {
996   using namespace Hexagon;
997 
998   LLVM_DEBUG(dbgs() << "Splitting: " << *MI);
999   bool Split = false;
1000   unsigned Opc = MI->getOpcode();
1001 
1002   switch (Opc) {
1003     case TargetOpcode::PHI:
1004     case TargetOpcode::COPY: {
1005       Register DstR = MI->getOperand(0).getReg();
1006       if (MRI->getRegClass(DstR) == DoubleRC) {
1007         createHalfInstr(Opc, MI, PairMap, isub_lo);
1008         createHalfInstr(Opc, MI, PairMap, isub_hi);
1009         Split = true;
1010       }
1011       break;
1012     }
1013     case A2_andp:
1014       createHalfInstr(A2_and, MI, PairMap, isub_lo);
1015       createHalfInstr(A2_and, MI, PairMap, isub_hi);
1016       Split = true;
1017       break;
1018     case A2_orp:
1019       createHalfInstr(A2_or, MI, PairMap, isub_lo);
1020       createHalfInstr(A2_or, MI, PairMap, isub_hi);
1021       Split = true;
1022       break;
1023     case A2_xorp:
1024       createHalfInstr(A2_xor, MI, PairMap, isub_lo);
1025       createHalfInstr(A2_xor, MI, PairMap, isub_hi);
1026       Split = true;
1027       break;
1028 
1029     case L2_loadrd_io:
1030     case L2_loadrd_pi:
1031     case S2_storerd_io:
1032     case S2_storerd_pi:
1033       splitMemRef(MI, PairMap);
1034       Split = true;
1035       break;
1036 
1037     case A2_tfrpi:
1038     case CONST64:
1039       splitImmediate(MI, PairMap);
1040       Split = true;
1041       break;
1042 
1043     case A2_combineii:
1044     case A4_combineir:
1045     case A4_combineii:
1046     case A4_combineri:
1047     case A2_combinew:
1048       splitCombine(MI, PairMap);
1049       Split = true;
1050       break;
1051 
1052     case A2_sxtw:
1053       splitExt(MI, PairMap);
1054       Split = true;
1055       break;
1056 
1057     case S2_asl_i_p:
1058     case S2_asr_i_p:
1059     case S2_lsr_i_p:
1060       splitShift(MI, PairMap);
1061       Split = true;
1062       break;
1063 
1064     case S2_asl_i_p_or:
1065       splitAslOr(MI, PairMap);
1066       Split = true;
1067       break;
1068 
1069     default:
1070       llvm_unreachable("Instruction not splitable");
1071       return false;
1072   }
1073 
1074   return Split;
1075 }
1076 
1077 void HexagonSplitDoubleRegs::replaceSubregUses(MachineInstr *MI,
1078       const UUPairMap &PairMap) {
1079   for (auto &Op : MI->operands()) {
1080     if (!Op.isReg() || !Op.isUse() || !Op.getSubReg())
1081       continue;
1082     Register R = Op.getReg();
1083     UUPairMap::const_iterator F = PairMap.find(R);
1084     if (F == PairMap.end())
1085       continue;
1086     const UUPair &P = F->second;
1087     switch (Op.getSubReg()) {
1088       case Hexagon::isub_lo:
1089         Op.setReg(P.first);
1090         break;
1091       case Hexagon::isub_hi:
1092         Op.setReg(P.second);
1093         break;
1094     }
1095     Op.setSubReg(0);
1096   }
1097 }
1098 
1099 void HexagonSplitDoubleRegs::collapseRegPairs(MachineInstr *MI,
1100       const UUPairMap &PairMap) {
1101   MachineBasicBlock &B = *MI->getParent();
1102   DebugLoc DL = MI->getDebugLoc();
1103 
1104   for (auto &Op : MI->operands()) {
1105     if (!Op.isReg() || !Op.isUse())
1106       continue;
1107     Register R = Op.getReg();
1108     if (!Register::isVirtualRegister(R))
1109       continue;
1110     if (MRI->getRegClass(R) != DoubleRC || Op.getSubReg())
1111       continue;
1112     UUPairMap::const_iterator F = PairMap.find(R);
1113     if (F == PairMap.end())
1114       continue;
1115     const UUPair &Pr = F->second;
1116     Register NewDR = MRI->createVirtualRegister(DoubleRC);
1117     BuildMI(B, MI, DL, TII->get(TargetOpcode::REG_SEQUENCE), NewDR)
1118       .addReg(Pr.first)
1119       .addImm(Hexagon::isub_lo)
1120       .addReg(Pr.second)
1121       .addImm(Hexagon::isub_hi);
1122     Op.setReg(NewDR);
1123   }
1124 }
1125 
1126 bool HexagonSplitDoubleRegs::splitPartition(const USet &Part) {
1127   using MISet = std::set<MachineInstr *>;
1128 
1129   const TargetRegisterClass *IntRC = &Hexagon::IntRegsRegClass;
1130   bool Changed = false;
1131 
1132   LLVM_DEBUG(dbgs() << "Splitting partition: ";
1133              dump_partition(dbgs(), Part, *TRI); dbgs() << '\n');
1134 
1135   UUPairMap PairMap;
1136 
1137   MISet SplitIns;
1138   for (unsigned DR : Part) {
1139     MachineInstr *DefI = MRI->getVRegDef(DR);
1140     SplitIns.insert(DefI);
1141 
1142     // Collect all instructions, including fixed ones.  We won't split them,
1143     // but we need to visit them again to insert the REG_SEQUENCE instructions.
1144     for (auto U = MRI->use_nodbg_begin(DR), W = MRI->use_nodbg_end();
1145          U != W; ++U)
1146       SplitIns.insert(U->getParent());
1147 
1148     Register LoR = MRI->createVirtualRegister(IntRC);
1149     Register HiR = MRI->createVirtualRegister(IntRC);
1150     LLVM_DEBUG(dbgs() << "Created mapping: " << printReg(DR, TRI) << " -> "
1151                       << printReg(HiR, TRI) << ':' << printReg(LoR, TRI)
1152                       << '\n');
1153     PairMap.insert(std::make_pair(DR, UUPair(LoR, HiR)));
1154   }
1155 
1156   MISet Erase;
1157   for (auto MI : SplitIns) {
1158     if (isFixedInstr(MI)) {
1159       collapseRegPairs(MI, PairMap);
1160     } else {
1161       bool Done = splitInstr(MI, PairMap);
1162       if (Done)
1163         Erase.insert(MI);
1164       Changed |= Done;
1165     }
1166   }
1167 
1168   for (unsigned DR : Part) {
1169     // Before erasing "double" instructions, revisit all uses of the double
1170     // registers in this partition, and replace all uses of them with subre-
1171     // gisters, with the corresponding single registers.
1172     MISet Uses;
1173     for (auto U = MRI->use_nodbg_begin(DR), W = MRI->use_nodbg_end();
1174          U != W; ++U)
1175       Uses.insert(U->getParent());
1176     for (auto M : Uses)
1177       replaceSubregUses(M, PairMap);
1178   }
1179 
1180   for (auto MI : Erase) {
1181     MachineBasicBlock *B = MI->getParent();
1182     B->erase(MI);
1183   }
1184 
1185   return Changed;
1186 }
1187 
1188 bool HexagonSplitDoubleRegs::runOnMachineFunction(MachineFunction &MF) {
1189   if (skipFunction(MF.getFunction()))
1190     return false;
1191 
1192   LLVM_DEBUG(dbgs() << "Splitting double registers in function: "
1193                     << MF.getName() << '\n');
1194 
1195   auto &ST = MF.getSubtarget<HexagonSubtarget>();
1196   TRI = ST.getRegisterInfo();
1197   TII = ST.getInstrInfo();
1198   MRI = &MF.getRegInfo();
1199   MLI = &getAnalysis<MachineLoopInfo>();
1200 
1201   UUSetMap P2Rs;
1202   LoopRegMap IRM;
1203 
1204   collectIndRegs(IRM);
1205   partitionRegisters(P2Rs);
1206 
1207   LLVM_DEBUG({
1208     dbgs() << "Register partitioning: (partition #0 is fixed)\n";
1209     for (UUSetMap::iterator I = P2Rs.begin(), E = P2Rs.end(); I != E; ++I) {
1210       dbgs() << '#' << I->first << " -> ";
1211       dump_partition(dbgs(), I->second, *TRI);
1212       dbgs() << '\n';
1213     }
1214   });
1215 
1216   bool Changed = false;
1217   int Limit = MaxHSDR;
1218 
1219   for (UUSetMap::iterator I = P2Rs.begin(), E = P2Rs.end(); I != E; ++I) {
1220     if (I->first == 0)
1221       continue;
1222     if (Limit >= 0 && Counter >= Limit)
1223       break;
1224     USet &Part = I->second;
1225     LLVM_DEBUG(dbgs() << "Calculating profit for partition #" << I->first
1226                       << '\n');
1227     if (!isProfitable(Part, IRM))
1228       continue;
1229     Counter++;
1230     Changed |= splitPartition(Part);
1231   }
1232 
1233   return Changed;
1234 }
1235 
1236 FunctionPass *llvm::createHexagonSplitDoubleRegs() {
1237   return new HexagonSplitDoubleRegs();
1238 }
1239