/src/llvm-project/llvm/lib/Target/AArch64/AArch64CleanupLocalDynamicTLSPass.cpp
Line | Count | Source (jump to first uncovered line) |
1 | | //===-- AArch64CleanupLocalDynamicTLSPass.cpp ---------------------*- C++ -*-=// |
2 | | // |
3 | | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | | // See https://llvm.org/LICENSE.txt for license information. |
5 | | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | | // |
7 | | //===----------------------------------------------------------------------===// |
8 | | // |
9 | | // Local-dynamic access to thread-local variables proceeds in three stages. |
10 | | // |
11 | | // 1. The offset of this Module's thread-local area from TPIDR_EL0 is calculated |
12 | | // in much the same way as a general-dynamic TLS-descriptor access against |
13 | | // the special symbol _TLS_MODULE_BASE. |
14 | | // 2. The variable's offset from _TLS_MODULE_BASE_ is calculated using |
15 | | // instructions with "dtprel" modifiers. |
16 | | // 3. These two are added, together with TPIDR_EL0, to obtain the variable's |
17 | | // true address. |
18 | | // |
19 | | // This is only better than general-dynamic access to the variable if two or |
20 | | // more of the first stage TLS-descriptor calculations can be combined. This |
21 | | // pass looks through a function and performs such combinations. |
22 | | // |
23 | | //===----------------------------------------------------------------------===// |
24 | | #include "AArch64.h" |
25 | | #include "AArch64InstrInfo.h" |
26 | | #include "AArch64MachineFunctionInfo.h" |
27 | | #include "llvm/CodeGen/MachineDominators.h" |
28 | | #include "llvm/CodeGen/MachineFunction.h" |
29 | | #include "llvm/CodeGen/MachineFunctionPass.h" |
30 | | #include "llvm/CodeGen/MachineInstrBuilder.h" |
31 | | #include "llvm/CodeGen/MachineRegisterInfo.h" |
32 | | using namespace llvm; |
33 | | |
34 | 0 | #define TLSCLEANUP_PASS_NAME "AArch64 Local Dynamic TLS Access Clean-up" |
35 | | |
36 | | namespace { |
37 | | struct LDTLSCleanup : public MachineFunctionPass { |
38 | | static char ID; |
39 | 4.00k | LDTLSCleanup() : MachineFunctionPass(ID) { |
40 | 4.00k | initializeLDTLSCleanupPass(*PassRegistry::getPassRegistry()); |
41 | 4.00k | } |
42 | | |
43 | 34.0k | bool runOnMachineFunction(MachineFunction &MF) override { |
44 | 34.0k | if (skipFunction(MF.getFunction())) |
45 | 0 | return false; |
46 | | |
47 | 34.0k | AArch64FunctionInfo *AFI = MF.getInfo<AArch64FunctionInfo>(); |
48 | 34.0k | if (AFI->getNumLocalDynamicTLSAccesses() < 2) { |
49 | | // No point folding accesses if there isn't at least two. |
50 | 34.0k | return false; |
51 | 34.0k | } |
52 | | |
53 | 0 | MachineDominatorTree *DT = &getAnalysis<MachineDominatorTree>(); |
54 | 0 | return VisitNode(DT->getRootNode(), 0); |
55 | 34.0k | } |
56 | | |
57 | | // Visit the dominator subtree rooted at Node in pre-order. |
58 | | // If TLSBaseAddrReg is non-null, then use that to replace any |
59 | | // TLS_base_addr instructions. Otherwise, create the register |
60 | | // when the first such instruction is seen, and then use it |
61 | | // as we encounter more instructions. |
62 | 0 | bool VisitNode(MachineDomTreeNode *Node, unsigned TLSBaseAddrReg) { |
63 | 0 | MachineBasicBlock *BB = Node->getBlock(); |
64 | 0 | bool Changed = false; |
65 | | |
66 | | // Traverse the current block. |
67 | 0 | for (MachineBasicBlock::iterator I = BB->begin(), E = BB->end(); I != E; |
68 | 0 | ++I) { |
69 | 0 | switch (I->getOpcode()) { |
70 | 0 | case AArch64::TLSDESC_CALLSEQ: |
71 | | // Make sure it's a local dynamic access. |
72 | 0 | if (!I->getOperand(0).isSymbol() || |
73 | 0 | strcmp(I->getOperand(0).getSymbolName(), "_TLS_MODULE_BASE_")) |
74 | 0 | break; |
75 | | |
76 | 0 | if (TLSBaseAddrReg) |
77 | 0 | I = replaceTLSBaseAddrCall(*I, TLSBaseAddrReg); |
78 | 0 | else |
79 | 0 | I = setRegister(*I, &TLSBaseAddrReg); |
80 | 0 | Changed = true; |
81 | 0 | break; |
82 | 0 | default: |
83 | 0 | break; |
84 | 0 | } |
85 | 0 | } |
86 | | |
87 | | // Visit the children of this block in the dominator tree. |
88 | 0 | for (MachineDomTreeNode *N : *Node) { |
89 | 0 | Changed |= VisitNode(N, TLSBaseAddrReg); |
90 | 0 | } |
91 | |
|
92 | 0 | return Changed; |
93 | 0 | } |
94 | | |
95 | | // Replace the TLS_base_addr instruction I with a copy from |
96 | | // TLSBaseAddrReg, returning the new instruction. |
97 | | MachineInstr *replaceTLSBaseAddrCall(MachineInstr &I, |
98 | 0 | unsigned TLSBaseAddrReg) { |
99 | 0 | MachineFunction *MF = I.getParent()->getParent(); |
100 | 0 | const TargetInstrInfo *TII = MF->getSubtarget().getInstrInfo(); |
101 | | |
102 | | // Insert a Copy from TLSBaseAddrReg to x0, which is where the rest of the |
103 | | // code sequence assumes the address will be. |
104 | 0 | MachineInstr *Copy = BuildMI(*I.getParent(), I, I.getDebugLoc(), |
105 | 0 | TII->get(TargetOpcode::COPY), AArch64::X0) |
106 | 0 | .addReg(TLSBaseAddrReg); |
107 | | |
108 | | // Update the call site info. |
109 | 0 | if (I.shouldUpdateCallSiteInfo()) |
110 | 0 | I.getMF()->eraseCallSiteInfo(&I); |
111 | | |
112 | | // Erase the TLS_base_addr instruction. |
113 | 0 | I.eraseFromParent(); |
114 | |
|
115 | 0 | return Copy; |
116 | 0 | } |
117 | | |
118 | | // Create a virtual register in *TLSBaseAddrReg, and populate it by |
119 | | // inserting a copy instruction after I. Returns the new instruction. |
120 | 0 | MachineInstr *setRegister(MachineInstr &I, unsigned *TLSBaseAddrReg) { |
121 | 0 | MachineFunction *MF = I.getParent()->getParent(); |
122 | 0 | const TargetInstrInfo *TII = MF->getSubtarget().getInstrInfo(); |
123 | | |
124 | | // Create a virtual register for the TLS base address. |
125 | 0 | MachineRegisterInfo &RegInfo = MF->getRegInfo(); |
126 | 0 | *TLSBaseAddrReg = RegInfo.createVirtualRegister(&AArch64::GPR64RegClass); |
127 | | |
128 | | // Insert a copy from X0 to TLSBaseAddrReg for later. |
129 | 0 | MachineInstr *Copy = |
130 | 0 | BuildMI(*I.getParent(), ++I.getIterator(), I.getDebugLoc(), |
131 | 0 | TII->get(TargetOpcode::COPY), *TLSBaseAddrReg) |
132 | 0 | .addReg(AArch64::X0); |
133 | |
|
134 | 0 | return Copy; |
135 | 0 | } |
136 | | |
137 | 0 | StringRef getPassName() const override { return TLSCLEANUP_PASS_NAME; } |
138 | | |
139 | 4.00k | void getAnalysisUsage(AnalysisUsage &AU) const override { |
140 | 4.00k | AU.setPreservesCFG(); |
141 | 4.00k | AU.addRequired<MachineDominatorTree>(); |
142 | 4.00k | MachineFunctionPass::getAnalysisUsage(AU); |
143 | 4.00k | } |
144 | | }; |
145 | | } |
146 | | |
147 | | INITIALIZE_PASS(LDTLSCleanup, "aarch64-local-dynamic-tls-cleanup", |
148 | | TLSCLEANUP_PASS_NAME, false, false) |
149 | | |
150 | | char LDTLSCleanup::ID = 0; |
151 | 4.00k | FunctionPass *llvm::createAArch64CleanupLocalDynamicTLSPass() { |
152 | 4.00k | return new LDTLSCleanup(); |
153 | 4.00k | } |