Skip to content

Commit d9b511d

Browse files
committed
[CSSPGO] Set PseudoProbeInserter as a default pass.
Currenlty PseudoProbeInserter is a pass conditioned on a target switch. It works well with a single clang invocation. It doesn't work so well when the backend is called separately (i.e, through the linker or llc), where user has always to pass -pseudo-probe-for-profiling explictly. I'm making the pass a default pass that requires no command line arg to trigger, but will be actually run depending on whether the CU comes with `llvm.pseudo_probe_desc` metadata. Reviewed By: wenlei Differential Revision: https://reviews.llvm.org/D110209
1 parent 173dd89 commit d9b511d

19 files changed

+26
-38
lines changed

clang/lib/CodeGen/BackendUtil.cpp

-1
Original file line numberDiff line numberDiff line change
@@ -576,7 +576,6 @@ static bool initTargetOptions(DiagnosticsEngine &Diags,
576576
Options.ForceDwarfFrameSection = CodeGenOpts.ForceDwarfFrameSection;
577577
Options.EmitCallSiteInfo = CodeGenOpts.EmitCallSiteInfo;
578578
Options.EnableAIXExtendedAltivecABI = CodeGenOpts.EnableAIXExtendedAltivecABI;
579-
Options.PseudoProbeForProfiling = CodeGenOpts.PseudoProbeForProfiling;
580579
Options.ValueTrackingVariableLocations =
581580
CodeGenOpts.ValueTrackingVariableLocations;
582581
Options.XRayOmitFunctionIndex = CodeGenOpts.XRayOmitFunctionIndex;

lld/ELF/Config.h

-1
Original file line numberDiff line numberDiff line change
@@ -183,7 +183,6 @@ struct Configuration {
183183
bool ltoDebugPassManager;
184184
bool ltoEmitAsm;
185185
bool ltoNewPassManager;
186-
bool ltoPseudoProbeForProfiling;
187186
bool ltoUniqueBasicBlockSectionNames;
188187
bool ltoWholeProgramVisibility;
189188
bool mergeArmExidx;

lld/ELF/Driver.cpp

-2
Original file line numberDiff line numberDiff line change
@@ -1084,8 +1084,6 @@ static void readConfigs(opt::InputArgList &args) {
10841084
config->ltoo = args::getInteger(args, OPT_lto_O, 2);
10851085
config->ltoObjPath = args.getLastArgValue(OPT_lto_obj_path_eq);
10861086
config->ltoPartitions = args::getInteger(args, OPT_lto_partitions, 1);
1087-
config->ltoPseudoProbeForProfiling =
1088-
args.hasArg(OPT_lto_pseudo_probe_for_profiling);
10891087
config->ltoSampleProfile = args.getLastArgValue(OPT_lto_sample_profile);
10901088
config->ltoBasicBlockSections =
10911089
args.getLastArgValue(OPT_lto_basic_block_sections);

lld/ELF/LTO.cpp

-1
Original file line numberDiff line numberDiff line change
@@ -112,7 +112,6 @@ static lto::Config createConfig() {
112112
}
113113
}
114114

115-
c.Options.PseudoProbeForProfiling = config->ltoPseudoProbeForProfiling;
116115
c.Options.UniqueBasicBlockSectionNames =
117116
config->ltoUniqueBasicBlockSectionNames;
118117

lld/ELF/Options.td

-4
Original file line numberDiff line numberDiff line change
@@ -574,8 +574,6 @@ def lto_sample_profile: JJ<"lto-sample-profile=">,
574574
defm lto_whole_program_visibility: BB<"lto-whole-program-visibility",
575575
"Asserts that the LTO link has whole program visibility",
576576
"Asserts that the LTO link does not have whole program visibility">;
577-
def lto_pseudo_probe_for_profiling: F<"lto-pseudo-probe-for-profiling">,
578-
HelpText<"Emit pseudo probes for sample profiling">;
579577
def disable_verify: F<"disable-verify">;
580578
defm mllvm: Eq<"mllvm", "Additional arguments to forward to LLVM's option processing">;
581579
def opt_remarks_filename: Separate<["--"], "opt-remarks-filename">,
@@ -651,8 +649,6 @@ def: F<"plugin-opt=opt-remarks-with-hotness">,
651649
def: J<"plugin-opt=opt-remarks-hotness-threshold=">,
652650
Alias<opt_remarks_hotness_threshold>,
653651
HelpText<"Alias for --opt-remarks-hotness-threshold">;
654-
def: J<"plugin-opt=pseudo-probe-for-profiling">,
655-
Alias<lto_pseudo_probe_for_profiling>, HelpText<"Alias for --lto-pseudo-probe-for-profiling">;
656652
def: J<"plugin-opt=sample-profile=">,
657653
Alias<lto_sample_profile>, HelpText<"Alias for --lto-sample-profile">;
658654
def: F<"plugin-opt=save-temps">, Alias<save_temps>, HelpText<"Alias for --save-temps">;

lld/test/ELF/lto/pseudo-probe-lto.ll

+1-2
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,6 @@
11
; REQUIRES: x86
22
; RUN: opt < %s -passes=pseudo-probe -function-sections -o %t.o
3-
; RUN: ld.lld %t.o -shared --lto-pseudo-probe-for-profiling --lto-emit-asm -o - | FileCheck %s
4-
; RUN: ld.lld %t.o -shared -plugin-opt=pseudo-probe-for-profiling --lto-emit-asm -o - | FileCheck %s
3+
; RUN: ld.lld %t.o -shared --lto-emit-asm -o - | FileCheck %s
54

65
target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
76
target triple = "x86_64-scei-ps4"

llvm/include/llvm/CodeGen/CommandFlags.h

-2
Original file line numberDiff line numberDiff line change
@@ -129,8 +129,6 @@ bool getEnableMachineFunctionSplitter();
129129

130130
bool getEnableDebugEntryValues();
131131

132-
bool getPseudoProbeForProfiling();
133-
134132
bool getValueTrackingVariableLocations();
135133

136134
bool getForceDwarfFrameSection();

llvm/include/llvm/Target/TargetOptions.h

+1-4
Original file line numberDiff line numberDiff line change
@@ -140,7 +140,7 @@ namespace llvm {
140140
EnableMachineFunctionSplitter(false), SupportsDefaultOutlining(false),
141141
EmitAddrsig(false), EmitCallSiteInfo(false),
142142
SupportsDebugEntryValues(false), EnableDebugEntryValues(false),
143-
PseudoProbeForProfiling(false), ValueTrackingVariableLocations(false),
143+
ValueTrackingVariableLocations(false),
144144
ForceDwarfFrameSection(false), XRayOmitFunctionIndex(false),
145145
DebugStrictDwarf(false),
146146
FPDenormalMode(DenormalMode::IEEE, DenormalMode::IEEE) {}
@@ -321,9 +321,6 @@ namespace llvm {
321321
/// production.
322322
bool ShouldEmitDebugEntryValues() const;
323323

324-
/// Emit pseudo probes into the binary for sample profiling
325-
unsigned PseudoProbeForProfiling : 1;
326-
327324
// When set to true, use experimental new debug variable location tracking,
328325
// which seeks to follow the values of variables rather than their location,
329326
// post isel.

llvm/lib/CodeGen/CommandFlags.cpp

-7
Original file line numberDiff line numberDiff line change
@@ -90,7 +90,6 @@ CGOPT(bool, EnableAddrsig)
9090
CGOPT(bool, EmitCallSiteInfo)
9191
CGOPT(bool, EnableMachineFunctionSplitter)
9292
CGOPT(bool, EnableDebugEntryValues)
93-
CGOPT(bool, PseudoProbeForProfiling)
9493
CGOPT(bool, ValueTrackingVariableLocations)
9594
CGOPT(bool, ForceDwarfFrameSection)
9695
CGOPT(bool, XRayOmitFunctionIndex)
@@ -434,11 +433,6 @@ codegen::RegisterCodeGenFlags::RegisterCodeGenFlags() {
434433
cl::init(false));
435434
CGBINDOPT(EnableDebugEntryValues);
436435

437-
static cl::opt<bool> PseudoProbeForProfiling(
438-
"pseudo-probe-for-profiling", cl::desc("Emit pseudo probes for AutoFDO"),
439-
cl::init(false));
440-
CGBINDOPT(PseudoProbeForProfiling);
441-
442436
static cl::opt<bool> ValueTrackingVariableLocations(
443437
"experimental-debug-variable-locations",
444438
cl::desc("Use experimental new value-tracking variable locations"),
@@ -540,7 +534,6 @@ codegen::InitTargetOptionsFromCodeGenFlags(const Triple &TheTriple) {
540534
Options.EmitAddrsig = getEnableAddrsig();
541535
Options.EmitCallSiteInfo = getEmitCallSiteInfo();
542536
Options.EnableDebugEntryValues = getEnableDebugEntryValues();
543-
Options.PseudoProbeForProfiling = getPseudoProbeForProfiling();
544537
Options.ValueTrackingVariableLocations = getValueTrackingVariableLocations();
545538
Options.ForceDwarfFrameSection = getForceDwarfFrameSection();
546539
Options.XRayOmitFunctionIndex = getXRayOmitFunctionIndex();

llvm/lib/CodeGen/PseudoProbeInserter.cpp

+9
Original file line numberDiff line numberDiff line change
@@ -44,7 +44,14 @@ class PseudoProbeInserter : public MachineFunctionPass {
4444
MachineFunctionPass::getAnalysisUsage(AU);
4545
}
4646

47+
bool doInitialization(Module &M) override {
48+
ShouldRun = M.getNamedMetadata(PseudoProbeDescMetadataName);
49+
return false;
50+
}
51+
4752
bool runOnMachineFunction(MachineFunction &MF) override {
53+
if (!ShouldRun)
54+
return false;
4855
const TargetInstrInfo *TII = MF.getSubtarget().getInstrInfo();
4956
bool Changed = false;
5057
for (MachineBasicBlock &MBB : MF) {
@@ -129,6 +136,8 @@ class PseudoProbeInserter : public MachineFunctionPass {
129136
Name = SP->getName();
130137
return Function::getGUID(Name);
131138
}
139+
140+
bool ShouldRun = false;
132141
};
133142
} // namespace
134143

llvm/lib/CodeGen/TargetPassConfig.cpp

-4
Original file line numberDiff line numberDiff line change
@@ -1276,10 +1276,6 @@ void TargetPassConfig::addMachinePasses() {
12761276
// Add passes that directly emit MI after all other MI passes.
12771277
addPreEmitPass2();
12781278

1279-
// Insert pseudo probe annotation for callsite profiling
1280-
if (TM->Options.PseudoProbeForProfiling)
1281-
addPass(createPseudoProbeInserter());
1282-
12831279
AddingMachinePasses = false;
12841280
}
12851281

llvm/lib/Target/X86/X86TargetMachine.cpp

+3
Original file line numberDiff line numberDiff line change
@@ -585,6 +585,9 @@ void X86PassConfig::addPreEmitPass2() {
585585
addPass(createEHContGuardCatchretPass());
586586
}
587587
addPass(createX86LoadValueInjectionRetHardeningPass());
588+
589+
// Insert pseudo probe annotation for callsite profiling
590+
addPass(createPseudoProbeInserter());
588591
}
589592

590593
bool X86PassConfig::addPostFastRegAllocRewrite() {

llvm/test/CodeGen/X86/O0-pipeline.ll

+2-1
Original file line numberDiff line numberDiff line change
@@ -72,7 +72,8 @@
7272
; CHECK-NEXT: X86 Speculative Execution Side Effect Suppression
7373
; CHECK-NEXT: X86 Indirect Thunks
7474
; CHECK-NEXT: Check CFA info and insert CFI instructions if needed
75-
; CHECK-NEXT: X86 Load Value Injection (LVI) Ret-Hardening
75+
; CHECK-NEXT: X86 Load Value Injection (LVI) Ret-Hardening
76+
; CHECK-NEXT: Pseudo Probe Inserter
7677
; CHECK-NEXT: Lazy Machine Block Frequency Analysis
7778
; CHECK-NEXT: Machine Optimization Remark Emitter
7879
; CHECK-NEXT: X86 Assembly Printer

llvm/test/CodeGen/X86/opt-pipeline.ll

+1
Original file line numberDiff line numberDiff line change
@@ -200,6 +200,7 @@
200200
; CHECK-NEXT: X86 Indirect Thunks
201201
; CHECK-NEXT: Check CFA info and insert CFI instructions if needed
202202
; CHECK-NEXT: X86 Load Value Injection (LVI) Ret-Hardening
203+
; CHECK-NEXT: Pseudo Probe Inserter
203204
; CHECK-NEXT: Lazy Machine Block Frequency Analysis
204205
; CHECK-NEXT: Machine Optimization Remark Emitter
205206
; CHECK-NEXT: X86 Assembly Printer

llvm/test/Transforms/SampleProfile/pseudo-probe-dangle.ll

+2-2
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,9 @@
11
; REQUIRES: x86_64-linux
22
; RUN: opt < %s -passes='pseudo-probe,jump-threading' -S -o %t
33
; RUN: FileCheck %s < %t --check-prefix=JT
4-
; RUN: llc -pseudo-probe-for-profiling -function-sections <%t -filetype=asm | FileCheck %s --check-prefix=ASM
4+
; RUN: llc -function-sections <%t -filetype=asm | FileCheck %s --check-prefix=ASM
55
; RUN: opt < %s -passes='pseudo-probe' -S -o %t1
6-
; RUN: llc -pseudo-probe-for-profiling -stop-after=tailduplication <%t1 | FileCheck %s --check-prefix=MIR-tail
6+
; RUN: llc -stop-after=tailduplication <%t1 | FileCheck %s --check-prefix=MIR-tail
77
; RUN: opt < %s -passes='pseudo-probe,simplifycfg' -S | FileCheck %s --check-prefix=SC
88

99
declare i32 @f1()

llvm/test/Transforms/SampleProfile/pseudo-probe-emit-inline.ll

+2-2
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,9 @@
11
; REQUIRES: x86_64-linux
22
; RUN: opt < %s -passes='pseudo-probe,cgscc(inline)' -function-sections -mtriple=x86_64-unknown-linux-gnu -S -o %t
33
; RUN: FileCheck %s < %t --check-prefix=CHECK-IL
4-
; RUN: llc -pseudo-probe-for-profiling -function-sections <%t -filetype=asm -o %t1
4+
; RUN: llc -function-sections <%t -filetype=asm -o %t1
55
; RUN: FileCheck %s < %t1 --check-prefix=CHECK-ASM
6-
; RUN: llc -pseudo-probe-for-profiling -function-sections <%t -filetype=obj -o %t2
6+
; RUN: llc -function-sections <%t -filetype=obj -o %t2
77
; RUN: llvm-objdump --section-headers %t2 | FileCheck %s --check-prefix=CHECK-OBJ
88
; RUN: llvm-mc -filetype=asm <%t1 -o %t3
99
; RUN: FileCheck %s < %t3 --check-prefix=CHECK-ASM

llvm/test/Transforms/SampleProfile/pseudo-probe-emit.ll

+3-3
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,10 @@
11
; REQUIRES: x86_64-linux
22
; RUN: opt < %s -passes=pseudo-probe -function-sections -S -o %t
33
; RUN: FileCheck %s < %t --check-prefix=CHECK-IL
4-
; RUN: llc %t -pseudo-probe-for-profiling -stop-after=pseudo-probe-inserter -o - | FileCheck %s --check-prefix=CHECK-MIR
5-
; RUN: llc %t -pseudo-probe-for-profiling -function-sections -filetype=asm -o %t1
4+
; RUN: llc %t -stop-after=pseudo-probe-inserter -o - | FileCheck %s --check-prefix=CHECK-MIR
5+
; RUN: llc %t -function-sections -filetype=asm -o %t1
66
; RUN: FileCheck %s < %t1 --check-prefix=CHECK-ASM
7-
; RUN: llc %t -pseudo-probe-for-profiling -function-sections -filetype=obj -o %t2
7+
; RUN: llc %t -function-sections -filetype=obj -o %t2
88
; RUN: llvm-objdump --section-headers %t2 | FileCheck %s --check-prefix=CHECK-OBJ
99
; RUN: llvm-mc %t1 -filetype=obj -o %t3
1010
; RUN: llvm-objdump --section-headers %t3 | FileCheck %s --check-prefix=CHECK-OBJ

llvm/test/Transforms/SampleProfile/pseudo-probe-instsched.ll

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
; REQUIRES: x86_64-linux
2-
; RUN: llc < %s -mcpu=generic -mtriple=x86_64-- -pseudo-probe-for-profiling -O3 | FileCheck %s
2+
; RUN: llc < %s -mcpu=generic -mtriple=x86_64-- -O3 | FileCheck %s
33

44
define float @foo(float %x) #0 {
55
%tmp1 = fmul float %x, 3.000000e+00

llvm/test/tools/llvm-profgen/truncated-pseudoprobe.test

+1-1
Original file line numberDiff line numberDiff line change
@@ -20,5 +20,5 @@
2020
; CHECK-NEXT: !Attributes: 1
2121

2222
; truncated-pseudoprobe.perfbin is from the following compile commands:
23-
; llc -pseudo-probe-for-profiling truncated-pseudoprobe.ll -filetype=obj -o truncated-pseudoprobe.o
23+
; llc truncated-pseudoprobe.ll -filetype=obj -o truncated-pseudoprobe.o
2424
; clang truncated-pseudoprobe.o -o truncated-pseudoprobe.perfbin

0 commit comments

Comments
 (0)