Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 1 | //===-- Latency.cpp ---------------------------------------------*- C++ -*-===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | |
| 10 | #include "Latency.h" |
Clement Courbet | 0e69e2d | 2018-05-17 10:52:18 +0000 | [diff] [blame] | 11 | |
| 12 | #include "Assembler.h" |
| 13 | #include "BenchmarkRunner.h" |
| 14 | #include "MCInstrDescView.h" |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 15 | #include "PerfHelper.h" |
Clement Courbet | 0e69e2d | 2018-05-17 10:52:18 +0000 | [diff] [blame] | 16 | #include "llvm/ADT/STLExtras.h" |
| 17 | #include "llvm/MC/MCInst.h" |
| 18 | #include "llvm/MC/MCInstBuilder.h" |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 19 | |
| 20 | namespace exegesis { |
| 21 | |
Clement Courbet | 0e69e2d | 2018-05-17 10:52:18 +0000 | [diff] [blame] | 22 | static bool HasUnknownOperand(const llvm::MCOperandInfo &OpInfo) { |
| 23 | return OpInfo.OperandType == llvm::MCOI::OPERAND_UNKNOWN; |
| 24 | } |
| 25 | |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 26 | // FIXME: Handle memory, see PR36905. |
Clement Courbet | 0e69e2d | 2018-05-17 10:52:18 +0000 | [diff] [blame] | 27 | static bool HasMemoryOperand(const llvm::MCOperandInfo &OpInfo) { |
| 28 | return OpInfo.OperandType == llvm::MCOI::OPERAND_MEMORY; |
| 29 | } |
| 30 | |
| 31 | static bool IsInfeasible(const Instruction &Instruction, std::string &Error) { |
| 32 | const auto &MCInstrDesc = Instruction.Description; |
| 33 | if (MCInstrDesc.isPseudo()) { |
| 34 | Error = "is pseudo"; |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 35 | return true; |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 36 | } |
Clement Courbet | 0e69e2d | 2018-05-17 10:52:18 +0000 | [diff] [blame] | 37 | if (llvm::any_of(MCInstrDesc.operands(), HasUnknownOperand)) { |
| 38 | Error = "has unknown operands"; |
| 39 | return true; |
| 40 | } |
| 41 | if (llvm::any_of(MCInstrDesc.operands(), HasMemoryOperand)) { |
| 42 | Error = "has memory operands"; |
| 43 | return true; |
| 44 | } |
| 45 | return false; |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 46 | } |
| 47 | |
| 48 | static llvm::Error makeError(llvm::Twine Msg) { |
| 49 | return llvm::make_error<llvm::StringError>(Msg, |
| 50 | llvm::inconvertibleErrorCode()); |
| 51 | } |
| 52 | |
// The destructor is defined out of line here and uses the compiler-generated
// implementation.
LatencyBenchmarkRunner::~LatencyBenchmarkRunner() = default;
| 54 | |
Clement Courbet | 62b34fa | 2018-06-06 09:42:36 +0000 | [diff] [blame] | 55 | InstructionBenchmark::ModeE LatencyBenchmarkRunner::getMode() const { |
| 56 | return InstructionBenchmark::Latency; |
Clement Courbet | 2cb97b9 | 2018-06-04 11:43:40 +0000 | [diff] [blame] | 57 | } |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 58 | |
Guillaume Chatelet | 7b852cd | 2018-06-07 08:11:54 +0000 | [diff] [blame^] | 59 | llvm::Expected<BenchmarkConfiguration> |
| 60 | LatencyBenchmarkRunner::createConfiguration(RegisterAliasingTrackerCache &RATC, |
| 61 | unsigned Opcode, |
| 62 | llvm::raw_ostream &Info) const { |
| 63 | BenchmarkConfiguration Configuration; |
| 64 | std::vector<llvm::MCInst> &Snippet = Configuration.Snippet; |
Clement Courbet | 0e69e2d | 2018-05-17 10:52:18 +0000 | [diff] [blame] | 65 | const llvm::MCInstrDesc &MCInstrDesc = MCInstrInfo.get(Opcode); |
| 66 | const Instruction ThisInstruction(MCInstrDesc, RATC); |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 67 | |
Clement Courbet | 0e69e2d | 2018-05-17 10:52:18 +0000 | [diff] [blame] | 68 | std::string Error; |
| 69 | if (IsInfeasible(ThisInstruction, Error)) |
| 70 | return makeError(llvm::Twine("Infeasible : ").concat(Error)); |
| 71 | |
| 72 | const AliasingConfigurations SelfAliasing(ThisInstruction, ThisInstruction); |
| 73 | if (!SelfAliasing.empty()) { |
| 74 | if (!SelfAliasing.hasImplicitAliasing()) { |
| 75 | Info << "explicit self cycles, selecting one aliasing configuration.\n"; |
| 76 | setRandomAliasing(SelfAliasing); |
| 77 | } else { |
| 78 | Info << "implicit Self cycles, picking random values.\n"; |
| 79 | } |
| 80 | Snippet.push_back(randomizeUnsetVariablesAndBuild(ThisInstruction)); |
Guillaume Chatelet | 7b852cd | 2018-06-07 08:11:54 +0000 | [diff] [blame^] | 81 | return Configuration; |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 82 | } |
| 83 | |
Clement Courbet | 0e69e2d | 2018-05-17 10:52:18 +0000 | [diff] [blame] | 84 | // Let's try to create a dependency through another opcode. |
| 85 | std::vector<unsigned> Opcodes; |
| 86 | Opcodes.resize(MCInstrInfo.getNumOpcodes()); |
| 87 | std::iota(Opcodes.begin(), Opcodes.end(), 0U); |
| 88 | std::shuffle(Opcodes.begin(), Opcodes.end(), randomGenerator()); |
| 89 | for (const unsigned OtherOpcode : Opcodes) { |
| 90 | clearVariableAssignments(ThisInstruction); |
| 91 | if (OtherOpcode == Opcode) |
| 92 | continue; |
| 93 | const Instruction OtherInstruction(MCInstrInfo.get(OtherOpcode), RATC); |
| 94 | if (IsInfeasible(OtherInstruction, Error)) |
| 95 | continue; |
| 96 | const AliasingConfigurations Forward(ThisInstruction, OtherInstruction); |
| 97 | const AliasingConfigurations Back(OtherInstruction, ThisInstruction); |
| 98 | if (Forward.empty() || Back.empty()) |
| 99 | continue; |
| 100 | setRandomAliasing(Forward); |
| 101 | setRandomAliasing(Back); |
| 102 | Info << "creating cycle through " << MCInstrInfo.getName(OtherOpcode) |
| 103 | << ".\n"; |
| 104 | Snippet.push_back(randomizeUnsetVariablesAndBuild(ThisInstruction)); |
| 105 | Snippet.push_back(randomizeUnsetVariablesAndBuild(OtherInstruction)); |
Guillaume Chatelet | 7b852cd | 2018-06-07 08:11:54 +0000 | [diff] [blame^] | 106 | return Configuration; |
Clement Courbet | 0e69e2d | 2018-05-17 10:52:18 +0000 | [diff] [blame] | 107 | } |
| 108 | |
| 109 | return makeError( |
| 110 | "Infeasible : Didn't find any scheme to make the instruction serial\n"); |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 111 | } |
| 112 | |
| 113 | std::vector<BenchmarkMeasure> |
Clement Courbet | 0e69e2d | 2018-05-17 10:52:18 +0000 | [diff] [blame] | 114 | LatencyBenchmarkRunner::runMeasurements(const ExecutableFunction &Function, |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 115 | const unsigned NumRepetitions) const { |
| 116 | // Cycle measurements include some overhead from the kernel. Repeat the |
| 117 | // measure several times and take the minimum value. |
| 118 | constexpr const int NumMeasurements = 30; |
| 119 | int64_t MinLatency = std::numeric_limits<int64_t>::max(); |
Clement Courbet | b449379 | 2018-04-10 08:16:37 +0000 | [diff] [blame] | 120 | const char *CounterName = State.getSubtargetInfo() |
| 121 | .getSchedModel() |
| 122 | .getExtraProcessorInfo() |
| 123 | .PfmCounters.CycleCounter; |
| 124 | if (!CounterName) |
| 125 | llvm::report_fatal_error("sched model does not define a cycle counter"); |
| 126 | const pfm::PerfEvent CyclesPerfEvent(CounterName); |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 127 | if (!CyclesPerfEvent.valid()) |
Clement Courbet | b449379 | 2018-04-10 08:16:37 +0000 | [diff] [blame] | 128 | llvm::report_fatal_error("invalid perf event"); |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 129 | for (size_t I = 0; I < NumMeasurements; ++I) { |
| 130 | pfm::Counter Counter(CyclesPerfEvent); |
| 131 | Counter.start(); |
| 132 | Function(); |
| 133 | Counter.stop(); |
| 134 | const int64_t Value = Counter.read(); |
| 135 | if (Value < MinLatency) |
| 136 | MinLatency = Value; |
| 137 | } |
Clement Courbet | 3f20fee | 2018-04-04 12:01:38 +0000 | [diff] [blame] | 138 | return {{"latency", static_cast<double>(MinLatency) / NumRepetitions, ""}}; |
Clement Courbet | ac74acd | 2018-04-04 11:37:06 +0000 | [diff] [blame] | 139 | } |
| 140 | |
| 141 | } // namespace exegesis |