Skip to content

Commit 41c8af3

Browse files
committed
[MCSched] Bind PFM Counters to the CPUs instead of the SchedModel.
Summary: The pfm counters are now in the ExegesisTarget rather than the MCSchedModel (PR39165). This also compresses the pfm counter tables (PR37068). Reviewers: RKSimon, gchatelet Subscribers: mgrang, llvm-commits Differential Revision: https://reviews.llvm.org/D52932 llvm-svn: 345243
1 parent 128fcff commit 41c8af3

25 files changed

+477
-247
lines changed

llvm/docs/CommandGuide/llvm-exegesis.rst

+4
Original file line numberDiff line numberDiff line change
@@ -224,6 +224,10 @@ OPTIONS
224224

225225
If set, ignore instructions that do not have a sched class (class idx = 0).
226226

227+
.. option:: -mcpu=<cpu name>
228+
229+
If set, measure the cpu characteristics using the counters for this CPU. This
230+
is useful when creating new sched models (the host CPU is unknown to LLVM).
227231

228232
EXIT STATUS
229233
-----------

llvm/docs/CommandGuide/tblgen.rst

+4
Original file line numberDiff line numberDiff line change
@@ -130,6 +130,10 @@ OPTIONS
130130

131131
Generate enhanced disassembly info.
132132

133+
.. option:: -gen-exegesis
134+
135+
Generate llvm-exegesis tables.
136+
133137
.. option:: -version
134138

135139
Show the version number of this program.

llvm/include/llvm/MC/MCSchedule.h

-16
Original file line numberDiff line numberDiff line change
@@ -183,22 +183,6 @@ struct MCExtraProcessorInfo {
183183
unsigned NumRegisterFiles;
184184
const MCRegisterCostEntry *RegisterCostTable;
185185
unsigned NumRegisterCostEntries;
186-
187-
struct PfmCountersInfo {
188-
// An optional name of a performance counter that can be used to measure
189-
// cycles.
190-
const char *CycleCounter;
191-
192-
// An optional name of a performance counter that can be used to measure
193-
// uops.
194-
const char *UopsCounter;
195-
196-
// For each MCProcResourceDesc defined by the processor, an optional list of
197-
// names of performance counters that can be used to measure the resource
198-
// utilization.
199-
const char **IssueCounters;
200-
};
201-
PfmCountersInfo PfmCounters;
202186
};
203187

204188
/// Machine model for scheduling, bundling, and heuristics.

llvm/include/llvm/Target/Target.td

+5
Original file line numberDiff line numberDiff line change
@@ -1555,3 +1555,8 @@ include "llvm/Target/GlobalISel/Target.td"
15551555
// Pull in the common support for the Global ISel DAG-based selector generation.
15561556
//
15571557
include "llvm/Target/GlobalISel/SelectionDAGCompat.td"
1558+
1559+
//===----------------------------------------------------------------------===//
1560+
// Pull in the common support for Pfm Counters generation.
1561+
//
1562+
include "llvm/Target/TargetPfmCounters.td"
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,46 @@
1+
//===- TargetPfmCounters.td - Target Pfm Counters -*- tablegen ----------*-===//
2+
//
3+
// The LLVM Compiler Infrastructure
4+
//
5+
// This file is distributed under the University of Illinois Open Source
6+
// License. See LICENSE.TXT for details.
7+
//
8+
//===----------------------------------------------------------------------===//
9+
//
10+
// This file defines the target-independent interfaces for performance counters.
11+
12+
// Definition of a hardware counters from libpfm identifiers.
13+
class PfmCounter<string counter> {
14+
// The name of the counter that measures events.
15+
// The name can be "some_counter + some_other_counter", in which case the
16+
// measured value is the sum of events on these counters.
17+
string Counter = counter;
18+
}
19+
20+
// Issue counters can be tied to a ProcResource
21+
class PfmIssueCounter<string resource_name, string counter>
22+
: PfmCounter<counter> {
23+
// The name of the ProcResource on which uops are issued. This is used by
24+
// llvm-exegesis to compare measurements with values in the SchedModels.
25+
// If the CPU has a sched model, this should correspond to the name of a
26+
// ProcResource.
27+
string ResourceName = resource_name;
28+
}
29+
30+
def NoPfmCounter : PfmCounter <""> {}
31+
32+
// Set of PfmCounters for measuring sched model characteristics.
33+
class ProcPfmCounters {
34+
// Processors can define how to measure cycles by defining a CycleCounter.
35+
PfmCounter CycleCounter = NoPfmCounter;
36+
// Processors can define how to measure uops by defining a UopsCounter.
37+
PfmCounter UopsCounter = NoPfmCounter;
38+
// Processors can define how to measure issued uops by defining IssueCounters.
39+
list<PfmIssueCounter> IssueCounters = [];
40+
}
41+
42+
// A binding of a set of counters to a CPU.
43+
class PfmCountersBinding<string cpu_name, ProcPfmCounters counters> {
44+
string CpuName = cpu_name;
45+
ProcPfmCounters Counters = counters;
46+
}

llvm/include/llvm/Target/TargetSchedule.td

-28
Original file line numberDiff line numberDiff line change
@@ -557,31 +557,3 @@ class RetireControlUnit<int bufferSize, int retirePerCycle> {
557557
int MaxRetirePerCycle = retirePerCycle;
558558
SchedMachineModel SchedModel = ?;
559559
}
560-
561-
// Allow the definition of hardware counters.
562-
class PfmCounter {
563-
SchedMachineModel SchedModel = ?;
564-
}
565-
566-
// Each processor can define how to measure cycles by defining a
567-
// PfmCycleCounter.
568-
class PfmCycleCounter<string counter> : PfmCounter {
569-
string Counter = counter;
570-
}
571-
572-
// Each ProcResourceUnits can define how to measure issued uops by defining
573-
// a PfmIssueCounter.
574-
class PfmIssueCounter<ProcResourceUnits resource, list<string> counters>
575-
: PfmCounter{
576-
// The resource units on which uops are issued.
577-
ProcResourceUnits Resource = resource;
578-
// The list of counters that measure issue events.
579-
list<string> Counters = counters;
580-
}
581-
582-
// Each processor can define how to measure NumMicroOps by defining a
583-
// PfmUopsCounter.
584-
class PfmUopsCounter<string counter> : PfmCounter {
585-
string Counter = counter;
586-
}
587-

llvm/lib/Target/X86/CMakeLists.txt

+1
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,7 @@ tablegen(LLVM X86GenInstrInfo.inc -gen-instr-info)
1313
tablegen(LLVM X86GenRegisterBank.inc -gen-register-bank)
1414
tablegen(LLVM X86GenRegisterInfo.inc -gen-register-info)
1515
tablegen(LLVM X86GenSubtargetInfo.inc -gen-subtarget)
16+
tablegen(LLVM X86GenExegesis.inc -gen-exegesis)
1617

1718
if (X86_GEN_FOLD_TABLES)
1819
tablegen(LLVM X86GenFoldTables.inc -gen-x86-fold-tables)

llvm/lib/Target/X86/X86PfmCounters.td

+78-59
Original file line numberDiff line numberDiff line change
@@ -11,73 +11,92 @@
1111
//
1212
//===----------------------------------------------------------------------===//
1313

14-
let SchedModel = SandyBridgeModel in {
15-
def SBCycleCounter : PfmCycleCounter<"unhalted_core_cycles">;
16-
def SBPort0Counter : PfmIssueCounter<SBPort0, ["uops_dispatched_port:port_0"]>;
17-
def SBPort1Counter : PfmIssueCounter<SBPort1, ["uops_dispatched_port:port_1"]>;
18-
def SBPort23Counter : PfmIssueCounter<SBPort23,
19-
["uops_dispatched_port:port_2",
20-
"uops_dispatched_port:port_3"]>;
21-
def SBPort4Counter : PfmIssueCounter<SBPort4, ["uops_dispatched_port:port_4"]>;
22-
def SBPort5Counter : PfmIssueCounter<SBPort5, ["uops_dispatched_port:port_5"]>;
23-
def SBUopsCounter : PfmUopsCounter<"uops_issued:any">;
14+
def UnhaltedCoreCyclesPfmCounter : PfmCounter<"unhalted_core_cycles">;
15+
def UopsIssuedPfmCounter : PfmCounter<"uops_issued:any">;
16+
17+
def SandyBridgePfmCounters : ProcPfmCounters {
18+
let CycleCounter = UnhaltedCoreCyclesPfmCounter;
19+
let UopsCounter = UopsIssuedPfmCounter;
20+
let IssueCounters = [
21+
PfmIssueCounter<"SBPort0", "uops_dispatched_port:port_0">,
22+
PfmIssueCounter<"SBPort1", "uops_dispatched_port:port_1">,
23+
PfmIssueCounter<"SBPort23", "uops_dispatched_port:port_2 + uops_dispatched_port:port_3">,
24+
PfmIssueCounter<"SBPort4", "uops_dispatched_port:port_4">,
25+
PfmIssueCounter<"SBPort5", "uops_dispatched_port:port_5">
26+
];
2427
}
28+
def : PfmCountersBinding<"sandybridge", SandyBridgePfmCounters>;
2529

26-
let SchedModel = HaswellModel in {
27-
def HWCycleCounter : PfmCycleCounter<"unhalted_core_cycles">;
28-
def HWPort0Counter : PfmIssueCounter<HWPort0, ["uops_dispatched_port:port_0"]>;
29-
def HWPort1Counter : PfmIssueCounter<HWPort1, ["uops_dispatched_port:port_1"]>;
30-
def HWPort2Counter : PfmIssueCounter<HWPort2, ["uops_dispatched_port:port_2"]>;
31-
def HWPort3Counter : PfmIssueCounter<HWPort3, ["uops_dispatched_port:port_3"]>;
32-
def HWPort4Counter : PfmIssueCounter<HWPort4, ["uops_dispatched_port:port_4"]>;
33-
def HWPort5Counter : PfmIssueCounter<HWPort5, ["uops_dispatched_port:port_5"]>;
34-
def HWPort6Counter : PfmIssueCounter<HWPort6, ["uops_dispatched_port:port_6"]>;
35-
def HWPort7Counter : PfmIssueCounter<HWPort7, ["uops_dispatched_port:port_7"]>;
36-
def HWUopsCounter : PfmUopsCounter<"uops_issued:any">;
30+
def HaswellPfmCounters : ProcPfmCounters {
31+
let CycleCounter = UnhaltedCoreCyclesPfmCounter;
32+
let UopsCounter = UopsIssuedPfmCounter;
33+
let IssueCounters = [
34+
PfmIssueCounter<"HWPort0", "uops_dispatched_port:port_0">,
35+
PfmIssueCounter<"HWPort1", "uops_dispatched_port:port_1">,
36+
PfmIssueCounter<"HWPort2", "uops_dispatched_port:port_2">,
37+
PfmIssueCounter<"HWPort3", "uops_dispatched_port:port_3">,
38+
PfmIssueCounter<"HWPort4", "uops_dispatched_port:port_4">,
39+
PfmIssueCounter<"HWPort5", "uops_dispatched_port:port_5">,
40+
PfmIssueCounter<"HWPort6", "uops_dispatched_port:port_6">,
41+
PfmIssueCounter<"HWPort7", "uops_dispatched_port:port_7">
42+
];
3743
}
44+
def : PfmCountersBinding<"haswell", HaswellPfmCounters>;
3845

39-
let SchedModel = BroadwellModel in {
40-
def BWCycleCounter : PfmCycleCounter<"unhalted_core_cycles">;
41-
def BWPort0Counter : PfmIssueCounter<BWPort0, ["uops_executed_port:port_0"]>;
42-
def BWPort1Counter : PfmIssueCounter<BWPort1, ["uops_executed_port:port_1"]>;
43-
def BWPort2Counter : PfmIssueCounter<BWPort2, ["uops_executed_port:port_2"]>;
44-
def BWPort3Counter : PfmIssueCounter<BWPort3, ["uops_executed_port:port_3"]>;
45-
def BWPort4Counter : PfmIssueCounter<BWPort4, ["uops_executed_port:port_4"]>;
46-
def BWPort5Counter : PfmIssueCounter<BWPort5, ["uops_executed_port:port_5"]>;
47-
def BWPort6Counter : PfmIssueCounter<BWPort6, ["uops_executed_port:port_6"]>;
48-
def BWPort7Counter : PfmIssueCounter<BWPort7, ["uops_executed_port:port_7"]>;
49-
def BWUopsCounter : PfmUopsCounter<"uops_issued:any">;
46+
def BroadwellPfmCounters : ProcPfmCounters {
47+
let CycleCounter = UnhaltedCoreCyclesPfmCounter;
48+
let UopsCounter = UopsIssuedPfmCounter;
49+
let IssueCounters = [
50+
PfmIssueCounter<"BWPort0", "uops_executed_port:port_0">,
51+
PfmIssueCounter<"BWPort1", "uops_executed_port:port_1">,
52+
PfmIssueCounter<"BWPort2", "uops_executed_port:port_2">,
53+
PfmIssueCounter<"BWPort3", "uops_executed_port:port_3">,
54+
PfmIssueCounter<"BWPort4", "uops_executed_port:port_4">,
55+
PfmIssueCounter<"BWPort5", "uops_executed_port:port_5">,
56+
PfmIssueCounter<"BWPort6", "uops_executed_port:port_6">,
57+
PfmIssueCounter<"BWPort7", "uops_executed_port:port_7">
58+
];
5059
}
60+
def : PfmCountersBinding<"broadwell", BroadwellPfmCounters>;
5161

52-
let SchedModel = SkylakeClientModel in {
53-
def SKLCycleCounter : PfmCycleCounter<"unhalted_core_cycles">;
54-
def SKLPort0Counter : PfmIssueCounter<SKLPort0, ["uops_dispatched_port:port_0"]>;
55-
def SKLPort1Counter : PfmIssueCounter<SKLPort1, ["uops_dispatched_port:port_1"]>;
56-
def SKLPort2Counter : PfmIssueCounter<SKLPort2, ["uops_dispatched_port:port_2"]>;
57-
def SKLPort3Counter : PfmIssueCounter<SKLPort3, ["uops_dispatched_port:port_3"]>;
58-
def SKLPort4Counter : PfmIssueCounter<SKLPort4, ["uops_dispatched_port:port_4"]>;
59-
def SKLPort5Counter : PfmIssueCounter<SKLPort5, ["uops_dispatched_port:port_5"]>;
60-
def SKLPort6Counter : PfmIssueCounter<SKLPort6, ["uops_dispatched_port:port_6"]>;
61-
def SKLPort7Counter : PfmIssueCounter<SKLPort7, ["uops_dispatched_port:port_7"]>;
62-
def SKLUopsCounter : PfmUopsCounter<"uops_issued:any">;
62+
def SkylakeClientPfmCounters : ProcPfmCounters {
63+
let CycleCounter = UnhaltedCoreCyclesPfmCounter;
64+
let UopsCounter = UopsIssuedPfmCounter;
65+
let IssueCounters = [
66+
PfmIssueCounter<"SKLPort0", "uops_dispatched_port:port_0">,
67+
PfmIssueCounter<"SKLPort1", "uops_dispatched_port:port_1">,
68+
PfmIssueCounter<"SKLPort2", "uops_dispatched_port:port_2">,
69+
PfmIssueCounter<"SKLPort3", "uops_dispatched_port:port_3">,
70+
PfmIssueCounter<"SKLPort4", "uops_dispatched_port:port_4">,
71+
PfmIssueCounter<"SKLPort5", "uops_dispatched_port:port_5">,
72+
PfmIssueCounter<"SKLPort6", "uops_dispatched_port:port_6">,
73+
PfmIssueCounter<"SKLPort7", "uops_dispatched_port:port_7">
74+
];
6375
}
76+
def : PfmCountersBinding<"skylake", SkylakeClientPfmCounters>;
6477

65-
let SchedModel = SkylakeServerModel in {
66-
def SKXCycleCounter : PfmCycleCounter<"unhalted_core_cycles">;
67-
def SKXPort0Counter : PfmIssueCounter<SKXPort0, ["uops_dispatched_port:port_0"]>;
68-
def SKXPort1Counter : PfmIssueCounter<SKXPort1, ["uops_dispatched_port:port_1"]>;
69-
def SKXPort2Counter : PfmIssueCounter<SKXPort2, ["uops_dispatched_port:port_2"]>;
70-
def SKXPort3Counter : PfmIssueCounter<SKXPort3, ["uops_dispatched_port:port_3"]>;
71-
def SKXPort4Counter : PfmIssueCounter<SKXPort4, ["uops_dispatched_port:port_4"]>;
72-
def SKXPort5Counter : PfmIssueCounter<SKXPort5, ["uops_dispatched_port:port_5"]>;
73-
def SKXPort6Counter : PfmIssueCounter<SKXPort6, ["uops_dispatched_port:port_6"]>;
74-
def SKXPort7Counter : PfmIssueCounter<SKXPort7, ["uops_dispatched_port:port_7"]>;
75-
def SKXUopsCounter : PfmUopsCounter<"uops_issued:any">;
78+
def SkylakeServerPfmCounters : ProcPfmCounters {
79+
let CycleCounter = UnhaltedCoreCyclesPfmCounter;
80+
let UopsCounter = UopsIssuedPfmCounter;
81+
let IssueCounters = [
82+
PfmIssueCounter<"SKXPort0", "uops_dispatched_port:port_0">,
83+
PfmIssueCounter<"SKXPort1", "uops_dispatched_port:port_1">,
84+
PfmIssueCounter<"SKXPort2", "uops_dispatched_port:port_2">,
85+
PfmIssueCounter<"SKXPort3", "uops_dispatched_port:port_3">,
86+
PfmIssueCounter<"SKXPort4", "uops_dispatched_port:port_4">,
87+
PfmIssueCounter<"SKXPort5", "uops_dispatched_port:port_5">,
88+
PfmIssueCounter<"SKXPort6", "uops_dispatched_port:port_6">,
89+
PfmIssueCounter<"SKXPort7", "uops_dispatched_port:port_7">
90+
];
7691
}
92+
def : PfmCountersBinding<"skylake-avx512", SkylakeServerPfmCounters>;
7793

78-
let SchedModel = BtVer2Model in {
79-
def JCycleCounter : PfmCycleCounter<"cpu_clk_unhalted">;
80-
def JUopsCounter : PfmUopsCounter<"retired_uops">;
81-
def JFPU0Counter : PfmIssueCounter<JFPU0, ["dispatched_fpu:pipe0"]>;
82-
def JFPU1Counter : PfmIssueCounter<JFPU1, ["dispatched_fpu:pipe1"]>;
94+
def BtVer2PfmCounters : ProcPfmCounters {
95+
let CycleCounter = PfmCounter<"cpu_clk_unhalted">;
96+
let UopsCounter = PfmCounter<"retired_uops">;
97+
let IssueCounters = [
98+
PfmIssueCounter<"JFPU0", "dispatched_fpu:pipe0">,
99+
PfmIssueCounter<"JFPU1", "dispatched_fpu:pipe1">
100+
];
83101
}
102+
def : PfmCountersBinding<"btver2", BtVer2PfmCounters>;

llvm/tools/llvm-exegesis/lib/AArch64/Target.cpp

+4
Original file line numberDiff line numberDiff line change
@@ -53,6 +53,10 @@ static llvm::MCInst loadImmediate(unsigned Reg, unsigned RegBitWidth,
5353
} // namespace
5454

5555
class ExegesisAArch64Target : public ExegesisTarget {
56+
public:
57+
ExegesisAArch64Target() : ExegesisTarget({}) {}
58+
59+
private:
5660
std::vector<llvm::MCInst> setRegTo(const llvm::MCSubtargetInfo &STI,
5761
unsigned Reg,
5862
const llvm::APInt &Value) const override {

llvm/tools/llvm-exegesis/lib/Latency.cpp

+3-6
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,8 @@
1212
#include "Assembler.h"
1313
#include "BenchmarkRunner.h"
1414
#include "MCInstrDescView.h"
15+
#include "PerfHelper.h"
16+
#include "Target.h"
1517
#include "llvm/ADT/STLExtras.h"
1618
#include "llvm/MC/MCInst.h"
1719
#include "llvm/MC/MCInstBuilder.h"
@@ -165,12 +167,7 @@ LatencySnippetGenerator::generateCodeTemplates(const Instruction &Instr) const {
165167
}
166168

167169
const char *LatencyBenchmarkRunner::getCounterName() const {
168-
if (!State.getSubtargetInfo().getSchedModel().hasExtraProcessorInfo())
169-
llvm::report_fatal_error("sched model is missing extra processor info!");
170-
const char *CounterName = State.getSubtargetInfo()
171-
.getSchedModel()
172-
.getExtraProcessorInfo()
173-
.PfmCounters.CycleCounter;
170+
const char *CounterName = State.getPfmCounters().CycleCounter;
174171
if (!CounterName)
175172
llvm::report_fatal_error("sched model does not define a cycle counter");
176173
return CounterName;

llvm/tools/llvm-exegesis/lib/LlvmState.cpp

+5-2
Original file line numberDiff line numberDiff line change
@@ -36,14 +36,17 @@ LLVMState::LLVMState(const std::string &Triple, const std::string &CpuName) {
3636
llvm::errs() << "no exegesis target for " << Triple << ", using default\n";
3737
TheExegesisTarget = &ExegesisTarget::getDefault();
3838
}
39+
PfmCounters = &TheExegesisTarget->getPfmCounters(CpuName);
40+
3941
RATC.reset(new RegisterAliasingTrackerCache(
4042
getRegInfo(), getFunctionReservedRegs(getTargetMachine())));
4143
IC.reset(new InstructionsCache(getInstrInfo(), getRATC()));
4244
}
4345

44-
LLVMState::LLVMState()
46+
LLVMState::LLVMState(const std::string &CpuName)
4547
: LLVMState(llvm::sys::getProcessTriple(),
46-
llvm::sys::getHostCPUName().str()) {}
48+
CpuName.empty() ? llvm::sys::getHostCPUName().str() : CpuName) {
49+
}
4750

4851
std::unique_ptr<llvm::LLVMTargetMachine>
4952
LLVMState::createTargetMachine() const {

llvm/tools/llvm-exegesis/lib/LlvmState.h

+7-1
Original file line numberDiff line numberDiff line change
@@ -30,12 +30,14 @@ namespace llvm {
3030
namespace exegesis {
3131

3232
class ExegesisTarget;
33+
class PfmCountersInfo;
3334

3435
// An object to initialize LLVM and prepare objects needed to run the
3536
// measurements.
3637
class LLVMState {
3738
public:
38-
LLVMState();
39+
// Uses the host triple. If CpuName is empty, uses the host CPU.
40+
LLVMState(const std::string &CpuName);
3941

4042
LLVMState(const std::string &Triple,
4143
const std::string &CpuName); // For tests.
@@ -57,14 +59,18 @@ class LLVMState {
5759
const llvm::MCSubtargetInfo &getSubtargetInfo() const {
5860
return *TargetMachine->getMCSubtargetInfo();
5961
}
62+
6063
const RegisterAliasingTrackerCache &getRATC() const { return *RATC; }
6164
const InstructionsCache &getIC() const { return *IC; }
6265

66+
const PfmCountersInfo &getPfmCounters() const { return *PfmCounters; }
67+
6368
private:
6469
const ExegesisTarget *TheExegesisTarget;
6570
std::unique_ptr<const llvm::TargetMachine> TargetMachine;
6671
std::unique_ptr<const RegisterAliasingTrackerCache> RATC;
6772
std::unique_ptr<const InstructionsCache> IC;
73+
const PfmCountersInfo *PfmCounters;
6874
};
6975

7076
} // namespace exegesis

0 commit comments

Comments
 (0)