1 /* 2 * Copyright (C) 2015 The Android Open Source Project 3 * 4 * Licensed under the Apache License, Version 2.0 (the "License"); 5 * you may not use this file except in compliance with the License. 6 * You may obtain a copy of the License at 7 * 8 * http://www.apache.org/licenses/LICENSE-2.0 9 * 10 * Unless required by applicable law or agreed to in writing, software 11 * distributed under the License is distributed on an "AS IS" BASIS, 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 * See the License for the specific language governing permissions and 14 * limitations under the License. 15 */ 16 17 #include "pc_relative_fixups_x86.h" 18 #include "code_generator_x86.h" 19 #include "intrinsics_x86.h" 20 21 namespace art { 22 namespace x86 { 23 24 /** 25 * Finds instructions that need the constant area base as an input. 26 */ 27 class PCRelativeHandlerVisitor : public HGraphVisitor { 28 public: 29 PCRelativeHandlerVisitor(HGraph* graph, CodeGenerator* codegen) 30 : HGraphVisitor(graph), 31 codegen_(down_cast<CodeGeneratorX86*>(codegen)), 32 base_(nullptr) {} 33 34 void MoveBaseIfNeeded() { 35 if (base_ != nullptr) { 36 // Bring the base closer to the first use (previously, it was in the 37 // entry block) and relieve some pressure on the register allocator 38 // while avoiding recalculation of the base in a loop. 39 base_->MoveBeforeFirstUserAndOutOfLoops(); 40 } 41 } 42 43 private: 44 void VisitAdd(HAdd* add) OVERRIDE { 45 BinaryFP(add); 46 } 47 48 void VisitSub(HSub* sub) OVERRIDE { 49 BinaryFP(sub); 50 } 51 52 void VisitMul(HMul* mul) OVERRIDE { 53 BinaryFP(mul); 54 } 55 56 void VisitDiv(HDiv* div) OVERRIDE { 57 BinaryFP(div); 58 } 59 60 void VisitCompare(HCompare* compare) OVERRIDE { 61 BinaryFP(compare); 62 } 63 64 void VisitReturn(HReturn* ret) OVERRIDE { 65 HConstant* value = ret->InputAt(0)->AsConstant(); 66 if ((value != nullptr && DataType::IsFloatingPointType(value->GetType()))) { 67 ReplaceInput(ret, value, 0, true); 68 } 69 } 70 71 void VisitInvokeStaticOrDirect(HInvokeStaticOrDirect* invoke) OVERRIDE { 72 HandleInvoke(invoke); 73 } 74 75 void VisitInvokeVirtual(HInvokeVirtual* invoke) OVERRIDE { 76 HandleInvoke(invoke); 77 } 78 79 void VisitInvokeInterface(HInvokeInterface* invoke) OVERRIDE { 80 HandleInvoke(invoke); 81 } 82 83 void VisitLoadClass(HLoadClass* load_class) OVERRIDE { 84 HLoadClass::LoadKind load_kind = load_class->GetLoadKind(); 85 if (load_kind == HLoadClass::LoadKind::kBootImageLinkTimePcRelative || 86 load_kind == HLoadClass::LoadKind::kBootImageClassTable || 87 load_kind == HLoadClass::LoadKind::kBssEntry) { 88 HX86ComputeBaseMethodAddress* method_address = GetPCRelativeBasePointer(load_class); 89 load_class->AddSpecialInput(method_address); 90 } 91 } 92 93 void VisitLoadString(HLoadString* load_string) OVERRIDE { 94 HLoadString::LoadKind load_kind = load_string->GetLoadKind(); 95 if (load_kind == HLoadString::LoadKind::kBootImageLinkTimePcRelative || 96 load_kind == HLoadString::LoadKind::kBootImageInternTable || 97 load_kind == HLoadString::LoadKind::kBssEntry) { 98 HX86ComputeBaseMethodAddress* method_address = GetPCRelativeBasePointer(load_string); 99 load_string->AddSpecialInput(method_address); 100 } 101 } 102 103 void BinaryFP(HBinaryOperation* bin) { 104 HConstant* rhs = bin->InputAt(1)->AsConstant(); 105 if (rhs != nullptr && DataType::IsFloatingPointType(rhs->GetType())) { 106 ReplaceInput(bin, rhs, 1, false); 107 } 108 } 109 110 void VisitEqual(HEqual* cond) OVERRIDE { 111 BinaryFP(cond); 112 } 113 114 void VisitNotEqual(HNotEqual* cond) OVERRIDE { 115 BinaryFP(cond); 116 } 117 118 void VisitLessThan(HLessThan* cond) OVERRIDE { 119 BinaryFP(cond); 120 } 121 122 void VisitLessThanOrEqual(HLessThanOrEqual* cond) OVERRIDE { 123 BinaryFP(cond); 124 } 125 126 void VisitGreaterThan(HGreaterThan* cond) OVERRIDE { 127 BinaryFP(cond); 128 } 129 130 void VisitGreaterThanOrEqual(HGreaterThanOrEqual* cond) OVERRIDE { 131 BinaryFP(cond); 132 } 133 134 void VisitNeg(HNeg* neg) OVERRIDE { 135 if (DataType::IsFloatingPointType(neg->GetType())) { 136 // We need to replace the HNeg with a HX86FPNeg in order to address the constant area. 137 HX86ComputeBaseMethodAddress* method_address = GetPCRelativeBasePointer(neg); 138 HGraph* graph = GetGraph(); 139 HBasicBlock* block = neg->GetBlock(); 140 HX86FPNeg* x86_fp_neg = new (graph->GetAllocator()) HX86FPNeg( 141 neg->GetType(), 142 neg->InputAt(0), 143 method_address, 144 neg->GetDexPc()); 145 block->ReplaceAndRemoveInstructionWith(neg, x86_fp_neg); 146 } 147 } 148 149 void VisitPackedSwitch(HPackedSwitch* switch_insn) OVERRIDE { 150 if (switch_insn->GetNumEntries() <= 151 InstructionCodeGeneratorX86::kPackedSwitchJumpTableThreshold) { 152 return; 153 } 154 // We need to replace the HPackedSwitch with a HX86PackedSwitch in order to 155 // address the constant area. 156 HX86ComputeBaseMethodAddress* method_address = GetPCRelativeBasePointer(switch_insn); 157 HGraph* graph = GetGraph(); 158 HBasicBlock* block = switch_insn->GetBlock(); 159 HX86PackedSwitch* x86_switch = new (graph->GetAllocator()) HX86PackedSwitch( 160 switch_insn->GetStartValue(), 161 switch_insn->GetNumEntries(), 162 switch_insn->InputAt(0), 163 method_address, 164 switch_insn->GetDexPc()); 165 block->ReplaceAndRemoveInstructionWith(switch_insn, x86_switch); 166 } 167 168 HX86ComputeBaseMethodAddress* GetPCRelativeBasePointer(HInstruction* cursor) { 169 bool has_irreducible_loops = GetGraph()->HasIrreducibleLoops(); 170 if (!has_irreducible_loops) { 171 // Ensure we only initialize the pointer once. 172 if (base_ != nullptr) { 173 return base_; 174 } 175 } 176 // Insert the base at the start of the entry block, move it to a better 177 // position later in MoveBaseIfNeeded(). 178 HX86ComputeBaseMethodAddress* method_address = 179 new (GetGraph()->GetAllocator()) HX86ComputeBaseMethodAddress(); 180 if (has_irreducible_loops) { 181 cursor->GetBlock()->InsertInstructionBefore(method_address, cursor); 182 } else { 183 HBasicBlock* entry_block = GetGraph()->GetEntryBlock(); 184 entry_block->InsertInstructionBefore(method_address, entry_block->GetFirstInstruction()); 185 base_ = method_address; 186 } 187 return method_address; 188 } 189 190 void ReplaceInput(HInstruction* insn, HConstant* value, int input_index, bool materialize) { 191 HX86ComputeBaseMethodAddress* method_address = GetPCRelativeBasePointer(insn); 192 HX86LoadFromConstantTable* load_constant = 193 new (GetGraph()->GetAllocator()) HX86LoadFromConstantTable(method_address, value); 194 if (!materialize) { 195 load_constant->MarkEmittedAtUseSite(); 196 } 197 insn->GetBlock()->InsertInstructionBefore(load_constant, insn); 198 insn->ReplaceInput(load_constant, input_index); 199 } 200 201 void HandleInvoke(HInvoke* invoke) { 202 // If this is an invoke-static/-direct with PC-relative dex cache array 203 // addressing, we need the PC-relative address base. 204 HInvokeStaticOrDirect* invoke_static_or_direct = invoke->AsInvokeStaticOrDirect(); 205 // We can't add a pointer to the constant area if we already have a current 206 // method pointer. This may arise when sharpening doesn't remove the current 207 // method pointer from the invoke. 208 if (invoke_static_or_direct != nullptr && 209 invoke_static_or_direct->HasCurrentMethodInput()) { 210 DCHECK(!invoke_static_or_direct->HasPcRelativeMethodLoadKind()); 211 return; 212 } 213 214 bool base_added = false; 215 if (invoke_static_or_direct != nullptr && 216 invoke_static_or_direct->HasPcRelativeMethodLoadKind() && 217 !IsCallFreeIntrinsic<IntrinsicLocationsBuilderX86>(invoke, codegen_)) { 218 HX86ComputeBaseMethodAddress* method_address = GetPCRelativeBasePointer(invoke); 219 // Add the extra parameter. 220 invoke_static_or_direct->AddSpecialInput(method_address); 221 base_added = true; 222 } 223 224 // Ensure that we can load FP arguments from the constant area. 225 HInputsRef inputs = invoke->GetInputs(); 226 for (size_t i = 0; i < inputs.size(); i++) { 227 HConstant* input = inputs[i]->AsConstant(); 228 if (input != nullptr && DataType::IsFloatingPointType(input->GetType())) { 229 ReplaceInput(invoke, input, i, true); 230 } 231 } 232 233 // These intrinsics need the constant area. 234 switch (invoke->GetIntrinsic()) { 235 case Intrinsics::kMathAbsDouble: 236 case Intrinsics::kMathAbsFloat: 237 case Intrinsics::kMathMaxDoubleDouble: 238 case Intrinsics::kMathMaxFloatFloat: 239 case Intrinsics::kMathMinDoubleDouble: 240 case Intrinsics::kMathMinFloatFloat: 241 case Intrinsics::kMathRoundFloat: 242 if (!base_added) { 243 DCHECK(invoke_static_or_direct != nullptr); 244 DCHECK(!invoke_static_or_direct->HasCurrentMethodInput()); 245 HX86ComputeBaseMethodAddress* method_address = GetPCRelativeBasePointer(invoke); 246 invoke_static_or_direct->AddSpecialInput(method_address); 247 } 248 break; 249 default: 250 break; 251 } 252 } 253 254 CodeGeneratorX86* codegen_; 255 256 // The generated HX86ComputeBaseMethodAddress in the entry block needed as an 257 // input to the HX86LoadFromConstantTable instructions. Only set for 258 // graphs with reducible loops. 259 HX86ComputeBaseMethodAddress* base_; 260 }; 261 262 void PcRelativeFixups::Run() { 263 PCRelativeHandlerVisitor visitor(graph_, codegen_); 264 visitor.VisitInsertionOrder(); 265 visitor.MoveBaseIfNeeded(); 266 } 267 268 } // namespace x86 269 } // namespace art 270