-
Notifications
You must be signed in to change notification settings - Fork 12.4k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[PGO] Add ability to mark cold functions as optsize/minsize/optnone
The performance of cold functions shouldn't matter too much, so if we care about binary size, add an option to mark cold functions as optsize/minsize to reduce binary size, or as optnone to reduce compile times [1]. The Clang patch will follow in a future patch. Initial version: https://reviews.llvm.org/D149800. [1] https://discourse.llvm.org/t/rfc-new-feature-proposal-de-optimizing-cold-functions-using-pgo-info/56388
- Loading branch information
Showing
13 changed files
with
253 additions
and
19 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
28 changes: 28 additions & 0 deletions
28
llvm/include/llvm/Transforms/Instrumentation/MarkColdFunctions.h
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,28 @@ | ||
//===- MarkColdFunctions.h - ------------------------------------*- C++ -*-===// | ||
// | ||
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | ||
// See https://llvm.org/LICENSE.txt for license information. | ||
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | ||
// | ||
//===----------------------------------------------------------------------===// | ||
|
||
#ifndef LLVM_TRANSFORMS_INSTRUMENTATION_MARKCOLDFUNCTIONS_H | ||
#define LLVM_TRANSFORMS_INSTRUMENTATION_MARKCOLDFUNCTIONS_H | ||
|
||
#include "llvm/IR/PassManager.h" | ||
#include "llvm/Support/PGOOptions.h" | ||
|
||
namespace llvm { | ||
|
||
/// Module pass that tags functions the profile reports as cold with the
/// attribute selected by a PGOOptions::ColdFuncAttr value
/// (optsize, minsize, or optnone).
struct MarkColdFunctionsPass : public PassInfoMixin<MarkColdFunctionsPass> {
  /// \param Kind which attribute to place on cold functions; stored as-is and
  /// consulted by run().
  MarkColdFunctionsPass(PGOOptions::ColdFuncAttr Kind) : ColdType{Kind} {}

  /// Entry point invoked by the module pass manager.
  PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM);

private:
  /// Attribute kind chosen at construction time.
  PGOOptions::ColdFuncAttr ColdType;
};
|
||
} // namespace llvm | ||
|
||
#endif // LLVM_TRANSFORMS_INSTRUMENTATION_MARKCOLDFUNCTIONS_H |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,65 @@ | ||
//===----------------------------------------------------------------------===// | ||
// | ||
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | ||
// See https://llvm.org/LICENSE.txt for license information. | ||
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | ||
// | ||
//===----------------------------------------------------------------------===// | ||
|
||
#include "llvm/Transforms/Instrumentation/MarkColdFunctions.h" | ||
#include "llvm/Analysis/BlockFrequencyInfo.h" | ||
#include "llvm/Analysis/ProfileSummaryInfo.h" | ||
#include "llvm/IR/PassManager.h" | ||
|
||
using namespace llvm; | ||
|
||
PreservedAnalyses MarkColdFunctionsPass::run(Module &M, | ||
ModuleAnalysisManager &AM) { | ||
if (ColdType == PGOOptions::ColdFuncAttr::None) | ||
return PreservedAnalyses::all(); | ||
ProfileSummaryInfo &PSI = AM.getResult<ProfileSummaryAnalysis>(M); | ||
if (!PSI.hasProfileSummary()) | ||
return PreservedAnalyses::all(); | ||
FunctionAnalysisManager &FAM = | ||
AM.getResult<FunctionAnalysisManagerModuleProxy>(M).getManager(); | ||
bool MadeChange = false; | ||
for (Function &F : M) { | ||
if (F.isDeclaration()) | ||
continue; | ||
BlockFrequencyInfo &BFI = FAM.getResult<BlockFrequencyAnalysis>(F); | ||
if (!PSI.isFunctionColdInCallGraph(&F, BFI)) | ||
continue; | ||
// Add optsize/minsize/optnone if requested. | ||
switch (ColdType) { | ||
case PGOOptions::ColdFuncAttr::None: | ||
assert(false); | ||
break; | ||
case PGOOptions::ColdFuncAttr::OptSize: | ||
if (!F.hasFnAttribute(Attribute::OptimizeNone) && | ||
!F.hasFnAttribute(Attribute::OptimizeForSize) && | ||
!F.hasFnAttribute(Attribute::MinSize)) { | ||
F.addFnAttr(Attribute::OptimizeForSize); | ||
MadeChange = true; | ||
} | ||
break; | ||
case PGOOptions::ColdFuncAttr::MinSize: | ||
// Change optsize to minsize. | ||
if (!F.hasFnAttribute(Attribute::OptimizeNone) && | ||
!F.hasFnAttribute(Attribute::MinSize)) { | ||
F.removeFnAttr(Attribute::OptimizeForSize); | ||
F.addFnAttr(Attribute::MinSize); | ||
MadeChange = true; | ||
} | ||
break; | ||
case PGOOptions::ColdFuncAttr::OptNone: | ||
// Strip optsize/minsize. | ||
F.removeFnAttr(Attribute::OptimizeForSize); | ||
F.removeFnAttr(Attribute::MinSize); | ||
F.addFnAttr(Attribute::OptimizeNone); | ||
F.addFnAttr(Attribute::NoInline); | ||
MadeChange = true; | ||
break; | ||
} | ||
} | ||
return MadeChange ? PreservedAnalyses::none() : PreservedAnalyses::all(); | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,97 @@ | ||
; RUN: opt < %s -passes=mark-cold-functions -pgo-kind=pgo-instr-use-pipeline -S -pgo-cold-func-attr=none | FileCheck %s --check-prefixes=NONE,CHECK | ||
; RUN: opt < %s -passes=mark-cold-functions -pgo-kind=pgo-instr-use-pipeline -S -pgo-cold-func-attr=optsize | FileCheck %s --check-prefixes=OPTSIZE,CHECK | ||
; RUN: opt < %s -passes=mark-cold-functions -pgo-kind=pgo-instr-use-pipeline -S -pgo-cold-func-attr=minsize | FileCheck %s --check-prefixes=MINSIZE,CHECK | ||
; RUN: opt < %s -passes=mark-cold-functions -pgo-kind=pgo-instr-use-pipeline -S -pgo-cold-func-attr=optnone | FileCheck %s --check-prefixes=OPTNONE,CHECK | ||
|
||
; Should be no changes without profile data | ||
; RUN: opt < %s -passes=mark-cold-functions -S -pgo-cold-func-attr=minsize | FileCheck %s --check-prefixes=NONE,CHECK | ||
|
||
; NONE-NOT: Function Attrs: | ||
; OPTSIZE: Function Attrs: optsize{{$}} | ||
; MINSIZE: Function Attrs: minsize{{$}} | ||
; OPTNONE: Function Attrs: noinline optnone{{$}} | ||
; CHECK: define void @cold() | ||
|
||
; NONE: Function Attrs: optsize{{$}} | ||
; OPTSIZE: Function Attrs: optsize{{$}} | ||
; MINSIZE: Function Attrs: minsize{{$}} | ||
; OPTNONE: Function Attrs: noinline optnone{{$}} | ||
; CHECK-NEXT: define void @cold1() | ||
|
||
; NONE: Function Attrs: minsize{{$}} | ||
; OPTSIZE: Function Attrs: minsize{{$}} | ||
; MINSIZE: Function Attrs: minsize{{$}} | ||
; OPTNONE: Function Attrs: noinline optnone{{$}} | ||
; CHECK-NEXT: define void @cold2() | ||
|
||
; CHECK: Function Attrs: noinline optnone{{$}} | ||
; CHECK-NEXT: define void @cold3() | ||
|
||
; CHECK-NOT: Function Attrs: {{.*}}optsize | ||
; CHECK-NOT: Function Attrs: {{.*}}minsize | ||
; CHECK-NOT: Function Attrs: {{.*}}optnone | ||
|
||
@s = global i32 0 | ||
|
||
; Test input with entry count 10 (!27) and no function attributes. | ||
define void @cold() !prof !27 { | ||
store i32 1, ptr @s, align 4 | ||
ret void | ||
} | ||
|
||
; Test input with entry count 10 (!27) that already carries optsize. | ||
define void @cold1() optsize !prof !27 { | ||
store i32 1, ptr @s, align 4 | ||
ret void | ||
} | ||
|
||
; Test input with entry count 10 (!27) that already carries minsize. | ||
define void @cold2() minsize !prof !27 { | ||
store i32 1, ptr @s, align 4 | ||
ret void | ||
} | ||
|
||
; Test input with entry count 10 (!27) that already carries noinline and optnone. | ||
define void @cold3() noinline optnone !prof !27 { | ||
store i32 1, ptr @s, align 4 | ||
ret void | ||
} | ||
|
||
; Test input with entry count 9000 (!28), matching MaxFunctionCount in the summary; the checks above expect it to gain no optsize/minsize/optnone. | ||
define void @hot() !prof !28 { | ||
%l = load i32, ptr @s, align 4 | ||
%add = add nsw i32 %l, 4 | ||
store i32 %add, ptr @s, align 4 | ||
ret void | ||
} | ||
|
||
attributes #0 = { optsize } | ||
attributes #1 = { minsize } | ||
attributes #2 = { noinline optnone } | ||
|
||
!llvm.module.flags = !{!0} | ||
|
||
!0 = !{i32 1, !"ProfileSummary", !1} | ||
!1 = !{!2, !3, !4, !5, !6, !7, !8, !9} | ||
!2 = !{!"ProfileFormat", !"InstrProf"} | ||
!3 = !{!"TotalCount", i64 9040} | ||
!4 = !{!"MaxCount", i64 9000} | ||
!5 = !{!"MaxInternalCount", i64 0} | ||
!6 = !{!"MaxFunctionCount", i64 9000} | ||
!7 = !{!"NumCounts", i64 5} | ||
!8 = !{!"NumFunctions", i64 5} | ||
!9 = !{!"DetailedSummary", !10} | ||
!10 = !{!11, !12, !13, !14, !15, !16, !17, !18, !19, !20, !21, !22, !23, !24, !25, !26} | ||
!11 = !{i32 10000, i64 9000, i32 1} | ||
!12 = !{i32 100000, i64 9000, i32 1} | ||
!13 = !{i32 200000, i64 9000, i32 1} | ||
!14 = !{i32 300000, i64 9000, i32 1} | ||
!15 = !{i32 400000, i64 9000, i32 1} | ||
!16 = !{i32 500000, i64 9000, i32 1} | ||
!17 = !{i32 600000, i64 9000, i32 1} | ||
!18 = !{i32 700000, i64 9000, i32 1} | ||
!19 = !{i32 800000, i64 9000, i32 1} | ||
!20 = !{i32 900000, i64 9000, i32 1} | ||
!21 = !{i32 950000, i64 9000, i32 1} | ||
!22 = !{i32 990000, i64 9000, i32 1} | ||
!23 = !{i32 999000, i64 10, i32 5} | ||
!24 = !{i32 999900, i64 10, i32 5} | ||
!25 = !{i32 999990, i64 10, i32 5} | ||
!26 = !{i32 999999, i64 10, i32 5} | ||
!27 = !{!"function_entry_count", i64 10} | ||
!28 = !{!"function_entry_count", i64 9000} |
Oops, something went wrong.