LLVM-技巧-提示和最佳实践-全-

第一章

TranslationUnitDecl 0x560f3929f5a8 <<invalid sloc>> <invalid sloc>
|…
`-FunctionDecl 0x560f392e1350 <./test.c:2:1, col:30> col:5 foo 'int (int)'

  |-ParmVarDecl 0x560f392e1280 <col:9, col:13> col:13 used c 'int'
  `-CompoundStmt 0x560f392e14c8 <col:16, col:30>
    `-ReturnStmt 0x560f392e14b8 <col:17, col:28>
      `-BinaryOperator 0x560f392e1498 <col:24, col:28> 'int' '+'
        |-ImplicitCastExpr 0x560f392e1480 <col:24> 'int' <LValueToRValue>
        | `-DeclRefExpr 0x560f392e1440 <col:24> 'int' lvalue ParmVar 0x560f392e1280 'c' 'int'
        `-IntegerLiteral 0x560f392e1460 <col:28> 'int' 1

$ clang -fplugin=/path/to/MyPlugin.so … foo.cpp

$ git clone https://github.com/llvm/llvm-project

$ git clone -b release/10.x https://github.com/llvm/llvm-project

$ mkdir .my_build
$ cd .my_build

$ cmake ../llvm
$ make all

$ sudo apt install ninja-build

$ cmake -G "Ninja" ../llvm

$ ninja all

$ ninja -j8 all

$ cmake -G "Ninja" -DLLVM_USE_LINKER=gold ../llvm

$ cmake -G "Ninja" -DLLVM_USE_LINKER=lld ../llvm

$ cmake -DCMAKE_BUILD_TYPE=RelWithDebInfo …

$ cmake -DLLVM_TARGETS_TO_BUILD="X86" …

$ cmake -DLLVM_TARGETS_TO_BUILD="X86;AArch64;AMDGPU" …

$ cmake -DBUILD_SHARED_LIBS=ON …

# CMake cache variable names are case-sensitive: it must be CMAKE_BUILD_TYPE.
$ cmake -DCMAKE_BUILD_TYPE=Debug -DLLVM_USE_SPLIT_DWARF=ON …

$ cmake -DLLVM_OPTIMIZED_TABLEGEN=ON -DCMAKE_BUILD_TYPE=Debug …

$ env CC=`which clang` CXX=`which clang++` \
  cmake -DLLVM_USE_NEWPM=ON …

get.py, simply put your version into the system's PATH. If you are wondering what other GN versions are available, you might want to check out the instructions for installing depot_tools at https://dev.chromium.org/developers/how-tos/install-depot-tools.

out/x64.release is the name of the build folder. Usually, GN users will name the build folder in <architecture>.<build type>.<other features> format.

$ cd out/x64.release
$ ninja <build target>

$ ninja -C out/x64.release <build target>

$ ./gn.py args out/x64.release

# Inside args.gn
is_debug = true
llvm_targets_to_build = ["X86", "AArch64"]

$ ./gn.py args --list out/x64.release

# In an in-tree CMakeLists.txt file…
add_library(MyLLVMPass SHARED
  MyPass.cpp) # Do NOT do this to add a new LLVM library

# In a CMakeLists.txt
add_llvm_component_library(LLVMFancyOpt
  FancyOpt.cpp)

add_llvm_component_library(LLVMFancyOpt
  FancyOpt.cpp
  LINK_COMPONENTS
  Analysis ScalarOpts)

set(LLVM_LINK_COMPONENTS
    Analysis ScalarOpts)
add_llvm_component_library(LLVMFancyOpt
   FancyOpt.cpp)

llvm_map_components_to_libnames(output_lib_names
  <list of component names>)

add_llvm_component_library(LLVMFancyOpt
  FancyOpt.cpp
  LINK_LIBS
  ${BOOST_LIBRARY})

add_llvm_component_library(LLVMFancyOpt
  FancyOpt.cpp
  DEPENDS
  intrinsics_gen)

/FancyOpt
  |___ FancyOpt.cpp
  |___ AggressiveFancyOpt.cpp
  |___ CMakeLists.txt

# In /FancyOpt/CMakeLists.txt
add_llvm_component_library(LLVMFancyOpt
  FancyOpt.cpp)
add_llvm_component_library(LLVMAggressiveFancyOpt
  AggressiveFancyOpt.cpp)

/FancyOpt
  |___ FancyOpt.cpp
  |___ CMakeLists.txt
  |___ /AggressiveFancyOpt
       |___ AggressiveFancyOpt.cpp
       |___ CMakeLists.txt

add_llvm_component_library(LLVMFancyOpt
  FancyOpt.cpp)
add_subdirectory(AggressiveFancyOpt)

add_llvm_component_library(LLVMAggressiveFancyOpt
  AggressiveFancyOpt.cpp)

add_llvm_tool(myLittleTool
  MyLittleTool.cpp)

add_llvm_pass_plugin(MyPass
   HelloWorldPass.cpp)

project(MagicCLITool)
set(SOURCE_FILES
    main.cpp)
add_executable(magic-cli
  ${SOURCE_FILES})

project(MagicCLITool)
find_package trick work, you need to supply the LLVM_DIR CMake variable while invoking the CMake command for this project:

find_package(LLVM REQUIRED CONFIG)
…
list(APPEND CMAKE_MODULE_PATH ${LLVM_CMAKE_DIR})
include(AddLLVM)

find_package(LLVM REQUIRED CONFIG)
…
include(AddLLVM)
set(LLVM_LINK_COMPONENTS
  Support
  Analysis)
add_llvm_executable(magic-cli
  main.cpp)

find_package(LLVM REQUIRED CONFIG)
…
include(AddLLVM)
add_llvm_library(MyMagicLibrary
  lib.cpp
  LINK_COMPONENTS
  Support Analysis)

find_package(LLVM REQUIRED CONFIG)
…
include(AddLLVM)
add_llvm_pass_plugin(MyMagicPass
  ThePass.cpp)

find_package(LLVM REQUIRED CONFIG)
…
add_definitions(${LLVM_DEFINITIONS})
if(NOT ${LLVM_ENABLE_RTTI})
  # For non-MSVC compilers
  set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fno-rtti")
endif()
add_llvm_xxx(source.cpp)

$ ninja check-llvm-support

$ git clone https://github.com/llvm/llvm-test-suite

$ mkdir .O3_build
$ cd .O3_build
$ cmake -G Ninja -DCMAKE_C_COMPILER=<desired Clang binary path> -C ../cmake/caches/O3.cmake ../

$ ninja all

; RUN: opt < %s -instcombine -S -o - | FileCheck %s
target triple = "x86_64-unknown-linux"
define i32 @foo(i32 %c) {
entry:
  ; CHECK: [[RET:%.+]] = add nsw i32 %c, 3
  ; CHECK: ret i32 [[RET]]
  %add1 = add nsw i32 %c, 1
  %add2 = add nsw i32 %add1, 2
  ret i32 %add2
}

const foo = (a, b) => {
  let c = a + b;
  console.log(`This is ${c}`); 
}

const foo = (a,b) => {let c = a + b; console.log(`This is ${c}`);}

/JSMinifier
  |__ CMakeLists.txt
  |__ /src
      |__ js-minifier.cpp
  |__ /test
      |__ test.js
      |__ CMakeLists.txt
  |__ /build

$ cd build
$ llvm-lit -sv .
-- Testing: 1 tests, 1 workers --
PASS: JSMinifier Test :: test.js (1 of 1)
Testing Time: 0.03s
  Expected Passes    : 1

// FileCheck reads its CHECK directives from this same file, so the file is
// passed to it as %s in addition to being the minifier's input.
// RUN: %jsm %s -o - | FileCheck %s
// CHECK: const foo = (a,b) =>
// CHECK-SAME: {let c = a + b; console.log(`This is ${c}`);}
const foo = (a, b) => {
  let c = a + b;
  console.log(`This is ${c}`); 
}

$ pip install --user lit

#!/usr/bin/env python
from lit.main import main
if __name__ == '__main__':
    main()

import lit.formats
config.name = 'JSMinifier Test'
config.test_format = config variable here is a Python object that will be populated later when this script is loaded into LIT's runtime. It's basically a registry with predefined fields that carry configuration values, along with custom fields that can be added by lit.*.py scripts at any time.The `config.test_format` field suggests that LIT will run every test inside a shell environment (in the `ShTest` format), while the `config.suffixes` field suggests that only files with `.js` in their filename suffix will be treated as test cases (that is, all the JavaScript files).

…
config.suffixes = ['.js']
config.test_source_root = os.path.dirname(__file__)
config.test_exec_root = os.path.join(config.test_source_root, it's simply pointing to /JSMinifier/test. On the other hand, config.test_exec_root, which is the working directory, is pointing to a place whose parent folder is the value of a custom configuration field, my_obj_root. While it will be introduced later, simply put, it points to the build folder path. In other words, config.test_exec_root will eventually have a value of /JSMinifier/build/test.

…
config.test_exec_root = os.path.join(config.my_obj_root, 'test')
config.config.substitutions field, which makes LIT replace every %jsm occurrence in the test files with the /JSMinifier/build/js-minifier value. This wraps up all the content in lit.cfg.py.

import os
config.my_src_root = r'@CMAKE_SOURCE_DIR@'
config.my_obj_root = r'@CMAKE_BINARY_DIR@'

…
lit_config.@ being resolved and copied into the build folder. From there, it will *call back* the lit.cfg.py script we saw in the earlier steps. This will be explained later in this section.

configure_file function will replace all the @-clamped string occurrences in the input file (lit.site.cfg.py.in, in this case) with their CMake variable counterparts in the current CMake context. For example, let's say there is a file called `demo.txt.in` that contains the following content:

Now, let's use `configure_file` in `CMakeLists.txt`:

Here, the aforementioned replacement will kick in and generate an output file, `demo.txt`, that contains the following content:

import os
config.my_src_root = r'/absolute/path/to/JSMinifier'
config.my_obj_root = r'/absolute/path/to/JSMinifier/build'
# Hand control back to the main LIT configuration script in the source tree.
lit_config.load_config(
    config, os.path.join(config.my_src_root, 'test/lit.cfg.py'))

$ ninja check-llvm-support

const onLoginPOST = (req, resp) => {
  if(req.name == 'admin')
    resp.send('OK');
  else
    resp.sendError(403);
}
myReset.post('/console', onLoginPOST);

const t = "nikfmnsdzaO";
const aaa = (a, b) => {
  if(a.z[0] == t[9] && a.z[1] == t[7] &&…)
    b.f0(t[10] + t[2].toUpperCase());
  else
    b.f1(0x193);
}
G.f4(YYY, aaa);

const square = x => x * x;
const cube = x => x * x * x;
const my_func1 = (input1, input2, input3) => {
  // TODO: Check if the arrow and curly brace are in the second line
  // TODO: Check if local variable and parameter names are obfuscated
  let intermediate = square(input3);
  let output = input1 + intermediate - input2;
  return output;
}
const my_func2 = (factor1, factor2) => {
  // TODO: Check if local variable and parameter names are obfuscated
  let term2 = cube(factor1);
  // TODO: Check if literal numbers are obfuscated
  return my_func1(94,
                  term2, factor2);
}
console.log(my_func2(1,2));

// CHECK: my_func1 = ({{[a-z]+0}}, {{[a-z]+1}}, {{[a-z]+2}})
const my_func1 = (input1, input2, input3) => {
…

// CHECK: my_func1 = ([[A0:[a-z]+0]], [[A1:[a-z]+1]], [[A2:[a-z]+2]])
const my_func1 = (input1, input2, input3) => {
  // CHECK: square(A0 ~ A2 using the [[…]] syntax, in which the binding variable name and the pattern are divided by a colon: [[<binding variable>:<pattern>]]. On the reference sites of the binding variable, the same [[…]] syntax is used, but without the pattern part.NoteA binding variable can have multiple definition sites. Its reference sites will read the last defined value. 

// CHECK: my_func1 = ([[A0:[a-z]+0]], [[A1:[a-z]+1]], [[A2:[a-z]+2]])
const my_func1 = (input1, input2, input3) => {
  // CHECK directive, CHECK-NEXT will not only check if the pattern exists but also ensure that the pattern is in the line that follows the line matched by the previous directive.

// CHECK: my_func1 = ([[A0:[a-z]+0]], [[A1:[a-z]+1]], [[A2:[a-z]+2]])
const my_func1 = (input1, input2, input3) => {
  // CHECK: let [[IM:[a-zA-Z]+]] = square([[A2]]);
  let intermediate = square(input3);
  // CHECK: let [[OUT:[a-zA-Z]+]] =
  // CHECK-SAME directive was used to match the succeeding pattern in the exact same line. The rationale behind this is that FileCheck expected different CHECK directives to be matched in different *lines*. So, let's say part of the snippet was written like this:

It will *only* match code that spread across two lines or more, as shown here:

It will throw an error otherwise. This directive is especially useful if you wish to avoid writing a super long line of checking statements, thus making the testing scripts more concise and readable.

…
// CHECK: return my_func1(
// CHECK-NOT: 94 
return my_func1(94,
                term2, factor2);
…
// CHECK: return my_func1
// CHECK-NOT: 94,
// CHECK-SAME: {{0x5[eE]}}
return my_func1(94,
                term2, factor2);

// CHECK-DAG: 123
// CHECK-DAG: 456

123
456

456
123

// CHECK-DAG: 123
// CHECK-DAG: 456
// CHECK: 789
// CHECK-DAG: abc
// CHECK-DAG: def

456
123
789
def
abc

456
789
123
def
abc

…
// FileCheck provides a way to multiplex different *check suites* into a single file, where each suite can define how it runs and separates the checks from other suites. 

// --check-prefix command-line option. Here, the FileCheck command invocation will look like this:

…
// CHECK-SHUFFLE-DAG: const square =
// CHECK-SHUFFLE-DAG: const cube =
// CHECK-SHUFFLE-DAG: const my_func1 =
// CHECK-SHUFFLE-DAG: const my_func2 =
// CHECK-SHUFFLE: console.log
console.log(my_func2(1,2));

# Running the default check suite
$ js-obfuscator test.js | FileCheck test.js
# Running check suite for the function shuffling option
$ js-obfuscator --shuffle-funcs test.js | \
  FileCheck --check-prefix=CHECK-SHUFFLE test.js

GeoDistance
  |___ helper.cpp
  |___ main.cpp
  |___ sample_input.txt
  |___ Makefile

# Flags passed to both the compile and the link step.
FLAGS := -DSMALL_INPUT -ffast-math
EXE := geo-distance
OBJS := helper.o main.o
# Compile one object file per C++ source (recipe lines must start with a tab).
%.o: %.cpp
	$(CXX) $(FLAGS) -c $^
# Link all object files: $^ expands to every prerequisite, whereas $< would
# pass only the first one (helper.o) to the linker.
$(EXE): $(OBJS)
	$(CXX) $(FLAGS) $^ -o $@

$ geo-distance ./sample_input.txt

$ geo-distance ./sample_input.txt
94.873467

# Inside MultiSource/Applications/CMakeLists.txt
…
add_subdirectory(GeoDistance)

# Inside MultiSource/Applications/GeoDistance/CMakeLists.txt
# (Unfinished)
llvm_multisource(geo-distance)
llvm_test_data(geo-distance sample_input.txt)

# Inside MultiSource/Applications/GeoDistance/CMakeLists.txt
# (Continue)
list(APPEND CPPFLAGS -DSMALL_INPUT)
list(APPEND CFLAGS -ffast-math)
llvm_multisource(geo-distance)
llvm_test_data(geo-distance sample_input.txt)

# Inside MultiSource/Applications/GeoDistance/CMakeLists.txt
# (Continue)
…
set(RUN_OPTIONS sample_input.txt)
set(FP_TOLERANCE 0.001)
llvm_multisource(geo-distance)
…

94.873
exit 0

$ ninja llvm-tblgen

class Person {
  string Name = "John Smith";
  int Age;
}

def john_smith : Person;

def john_smith : Person {
  let Age = 87;
}

def john_smith : Person {
  let Age = 87;
  string Job = "Teacher";
}

class Weight<int kilogram> {
  int Gram = !mul(kilogram, 1000);
}

class AutoPart<int quantity> {…}
def car1_fuel_tank : AutoPart<1>;
def car1_engine : AutoPart<1>;
def car1_wheels : AutoPart<4>;
…
def car2_fuel_tank : AutoPart<1>;
def car2_engine : AutoPart<1>;
def car2_wheels : AutoPart<4>;
…

class AutoPart<int quantity> {…}
multiclass Car<int quantity> {
  def _fuel_tank : AutoPart<quantity>;
  def _engine : AutoPart<quantity>;
  def _wheels : AutoPart<!mul(quantity, 4)>;
  …
}

defm car1 : Car<1>;
defm car2 : Car<1>;

(operator operand1, operand2,…, operandN)

class Variable {…}
class Operator {…}
class Expression<dag expr> {…}
// define variables
def x : Variable;
def y : Variable;
def z : Variable;
// define operators
def mul : Operator;
def plus : Operator;
// define expression
def tmp1 : Expression<(mul x, 2)>;
def tmp2 : Expression<(mul 8, z)>;
def result : Expression<(plus tmp1, tmp2, y)>;

…
def tmp1 : Expression<(mul:$op x, 2)>;
def tmp2 : Expression<(mul:$op 8, z)>;
def result : Expression<(plus tmp1:$term1, tmp2:$term2, y:$term3)>;

class Unit {
  string Text;
  bit Imperial;
}

def gram_unit : Unit {
  let Imperial = false;
  let Text = "g";
}
def tbsp_unit : Unit {
  let Imperial = true;
  let Text = "tbsp";
}

class Unit<bit imperial, string text> {
  string Text = text;
  bit Imperial = imperial;
}
def gram_unit : Unit<false, "g">;
def tbsp_unit : Unit<true, "tbsp">;

class NplusQuarter<class is simply just integrating its fields.

class NplusQuarter<num_quarter variable. By writing num_quarter{1…0}, this gives you a bits value that is equal to the 0th and first bit of num_quarter. There are some other variants of this technique. For example, it can slice a non-continuous range of bits, as follows:

Or, it can extract bits in reversed ordering, as follows:

Note: You might wonder why the code needs to extract the smallest 2 bits *explicitly* even though it has declared that `num_quarter` has a width of 2 bits (the `bits<2>` type). It turns out that, for some reason, TableGen will not stop anyone from assigning values greater than `3` to `num_quarter`, like this: `def x : NplusQuarter<1,999>`.

// In Ingredients.td…
include "Kitchen.td"

class IngredientBase<Unit unit> {
  IngredientBase, with parameters to specify the quantity needed by a recipe, and the unit used to measure this ingredient. Take milk, for example, as shown in the following code snippet:

def ingredient_milk : Milk<1,2>; // Need 1.5 cup of milk

defm syntax to create multiclass records, as follows:

After using `defm`, three records will actually be created: `egg_ingredient_whole`, `egg_ingredient_yolk`, and `egg_ingredient_white`, inheriting from `WholeEgg`, `EggYolk`, and `EggWhite`, respectively. 

class Step<Action field carries the baking instructions and information about the ingredients used. Here is an example:

…
def step_mixing : Step<(mix milk, flour), …>;
def step_mixing2 : Step<Step records will form a DAG, in which a vertex will either be a step or an ingredient record.We're also annotating our `dag` operator and operand with tags, as follows:

def step_prep : Step<(heat:$action, $oil, and $temp in the string with the textual representation of those records, generating a string such as *heat the peanut oil until it reaches 300 F*.

=======Ingredients=======
1\. oil 500 ml
2\. flour 300 g
3\. milk 1.25 cup
4\. whole egg 1
5\. yeast 1.50 tsp
6\. butter 3.50 tbsp
7\. sugar 2.0 tbsp
8\. salt 0.50 tsp
9\. vanilla extract 1.0 tsp
=======Instructions=======
1\. use deep fryer to heat oil until 160 C
2\. use mixer to mix flour, milk, whole egg, yeast, butter, sugar, salt, and vanilla extract. stir in low speed.
3\. use mixer to mix outcome from (step 2). stir in medium speed.
4\. use bowl to ferment outcome from (step 3).
5\. use rolling pin to flatten outcome from (step 4).
6\. use cutter to cut outcome from (step 5).
7\. use deep fryer to fry outcome from (step 1) and outcome from (step 6).

// Holds a reference to a RecordKeeper and declares a single run() entry
// point that takes an output stream.
class SampleEmitter {
  // Bound to the RecordKeeper handed to the constructor.
  RecordKeeper &Records;
public:
  SampleEmitter(RecordKeeper &RK) : Records(RK) {}
  // Declared only; the definition is not part of this snippet.
  void run(raw_ostream &OS);
};

$ cd llvm
$ cp lib/TableGen/TableGenBackendSkeleton.cpp \
     utils/TableGen/RecipePrinter.cpp

// In RecipePrinter::run method…
std::vector<Record*> Steps = Records.getAllDerivedDefinitions("Step");

// Writes the string stored in the "Text" field of UnitRecord to OS.
void RecipePrinter::printUnit(raw_ostream& OS, Record* UnitRecord) {
  OS << UnitRecord->getValueAsString("Text");
}

const auto* SIDef = cast<const DefInit>(StepOrIngredient);

Record* SIRecord = SIDef->getDef();
if (SIRecord->isSubClassOf("Step")) {
  // This Record is a baking step!
} else if (SIRecord->isSubClassOf("IngredientBase")){
  // This Record is an ingredient!
} 

def step_prep : Step<(heat:$action fry_oil:$oil, oil_temp:$temp)> {
  let CustomFormat = "$action $oil until $temp";
}

DagInit* DAG = StepRecord->getValueAsDag("Action");

// Visit every operand of the DAG by index. `arg_size` is a member function,
// and the induction variable needs a declaration.
for (unsigned i = 0; i < DAG->arg_size(); ++i) {
  Init* Arg = DAG->getArg(i);
}

// Visit the tag (the `$name` part) attached to every operand of the DAG.
// `arg_size` is a member function, and the induction variable needs a
// declaration.
for (unsigned i = 0; i < DAG->arg_size(); ++i) {
  StringRef ArgTok = DAG->getArgNameStr(i);
}

$ llvm-tblgen -gen-instr-info /path/to/X86.td -o GenX86InstrInfo.inc

…
void EmitX86FoldTables(RecordKeeper &RK, raw_ostream &OS);
void EmitRecipe(RecordKeeper &RK, raw_ostream &OS);
void EmitRegisterBank(RecordKeeper &RK, raw_ostream &OS);
…

enum Action Type {
…
  GenRecipe,
…
}
…
cl::opt<ActionType> Action(
    cl::desc("Action to perform:"),
    cl::values(
        …
        clEnumValN(GenRecipe, "gen-recipe",
                   "Print delicious recipes"),
        …
    ));

// Dispatches to the backend selected by the `Action` command-line option,
// passing it the parsed records and the output stream.
bool LLVMTableGenMain(raw_ostream &OS, RecordKeeper &Records) {
  switch (Action) {
  …
  case GenRecipe:
    EmitRecipe(Records, OS);
    break;
  }
  // A non-void function must not fall off its end. TableGen's main callback
  // returns true on error, so false is returned once the backend has run.
  return false;
}

add_tablegen(llvm-tblgen LLVM
  …
  RecipePrinter.cpp
  …)

-o option.) The preceding command will print out a (mostly) normal donut recipe, just like this:

$ cmake -G Ninja -DLLVM_ENABLE_PROJECTS="clang;clang-tools-extra" …

$ ninja clang

$ ninja check-clang

$ clang++ -### -std=c++11 -Wall ./hello_world.cpp -o hello_world

"/path/to/clang" "-cc1" "-triple" "x86_64-apple-macosx11.0.0" "-Wdeprecated-objc-isa-usage" "-Werror=deprecated-objc-isa-usage" "-Werror=implicit-function-declaration" "-emit-obj" "-mrelax-all" "-disable-free" "-disable-llvm-verifier" … "-fno-strict-return" "-masm-verbose" "-munwind-tables" "-target-sdk-version=11.0" … "-resource-dir" "/Library/Developer/CommandLineTools/usr/lib/clang/12.0.0" "-isysroot" "/Library/Developer/CommandLineTools/SDKs/MacOSX.sdk" "-I/usr/local/include" "-stdlib=libc++" … "-Wall" "-Wno-reorder-init-list" "-Wno-implicit-int-float-conversion" "-Wno-c99-designator" … "-std=c++11" "-fdeprecated-macro" "-fdebug-compilation-dir" "/Users/Rem" "-ferror-limit" "19" "-fmessage-length" "87" "-stack-protector" "1" "-fstack-check" "-mdarwin-stkchk-strong-link" … "-fexceptions" … "-fdiagnostics-show-option" "-fcolor-diagnostics" "-o" "/path/to/temp/hello_world-dEadBeEf.o" "-x" "c++" "hello_world.cpp"…

$ clang -Xclang -ast-dump -fsyntax-only foo.c

int foo(int c) { return c + 1; }

TranslationUnitDecl 0x560f3929f5a8 <<invalid sloc>> <invalid sloc>
|…
`-FunctionDecl 0x560f392e1350 <./test.c:2:1, col:30> col:5 foo 'int (int)'
  |-ParmVarDecl 0x560f392e1280 <col:9, col:13> col:13 used c 'int'
  `-CompoundStmt 0x560f392e14c8 <col:16, col:30>
    `-ReturnStmt 0x560f392e14b8 <col:17, col:28>
      `-BinaryOperator 0x560f392e1498 <col:24, col:28> 'int' '+'
        |-ImplicitCastExpr 0x560f392e1480 <col:24> 'int' <LValueToRValue>
        | `-DeclRefExpr 0x560f392e1440 <col:24> 'int' lvalue ParmVar 0x560f392e1280 'c' 'int'
        `-IntegerLiteral 0x560f392e1460 <col:28> 'int' 1

$ clang -fplugin=/path/to/MyPlugin.so … foo.cpp

int main(int argc, char** argv) {
  CommonOptionsParser OptionsParser(argc, argv,…);
  ClangTool Tool(OptionsParser.getCompilations(), {"foo.cpp"});
  return Tool.run(newFrontendActionFactory<MyCustomAction>().         get());
}

// In foo.cpp…
struct Location {
  float Lat, Lng;
};
float foo(Location *loc) {
  auto Lat = loc->Lat + 1.0;
  return Lat;
}

$ clang-refactor --selection="foo.cpp:1:1-10:2" \
                 --old-qualified-name="Location::Lat" \
                 --new-qualified-name="Location::Latitude" \
                 foo.cpp

// In foo.cpp…
struct Location {
  float Latitude, Lng;
};
float foo(Location *loc) {
  auto Lat = loc->Latitude + 1.0;
  return Lat;
}

$ ninja clang

#define HELLO 4
int foo(int x) {
  return x + HELLO;
}

$ clang -E foo.c

…
int foo(int x) {
  return x + 4;
}

void foo(SourceManager &SM, SourceLocation SLoc) {
  auto Line = SM.getSpellingLineNumber(SLoc),
       Column = SM.getSpellingColumnNumber(SLoc);
  …
}

SourceLocation NewSLoc = SM.createExpansionLoc(
  SpellingLoc,    // The original macro spelling location
  ExpansionStart, // Start of the location where macro is expanded
  ExpansionEnd,   // End of the location where macro is expanded
  Len             // Length of the content you want to expand
);

// Lexes one token from PP into a local Token and returns it by value.
Token GetNextToken(Preprocessor &PP) {
  Token Tok;
  PP.Lex(Tok);
  return Tok;
}

$ clang -fsyntax-only -Xclang -dump-tokens foo.cc

namespace foo {
  class MyClass {};
}
foo::MyClass Obj;

namespace 'namespace'    [StartOfLine]  Loc=<foo.cc:1:1>
identifier 'foo'         [LeadingSpace] Loc=<foo.cc:1:11>
l_brace '{'      [LeadingSpace] Loc=<foo.cc:1:15>
class 'class'    [StartOfLine] [LeadingSpace]   Loc=<foo.cc:2:3>
identifier 'MyClass'     [LeadingSpace] Loc=<foo.cc:2:9>
l_brace '{'      [LeadingSpace] Loc=<foo.cc:2:17>
r_brace '}'             Loc=<foo.cc:2:18>
semi ';'                Loc=<foo.cc:2:19>
r_brace '}'      [StartOfLine]  Loc=<foo.cc:3:1>
identifier 'foo'         [StartOfLine]  Loc=<foo.cc:5:1>
coloncolon '::'         Loc=<foo.cc:5:4>
identifier 'MyClass'            Loc=<foo.cc:5:6>
identifier 'Obj'         [LeadingSpace] Loc=<foo.cc:5:14>
semi ';'                Loc=<foo.cc:5:17>
eof ''          Loc=<foo.cc:5:18>

int* foo(int N) {
  return ::new int[N]; // Equivalent to 'new int[N]'
}

bool IsReturn(Token Tok) {
  return Tok.getKind() == tok::kw_return;
}

bool IsReturn(Token Tok) {
  return Tok.is(tok::kw_return);
}

IdentifierInfo *II = Tok.getIdentifierInfo();

void foo(int auto) {}

$ clang++ -std=c++03 standard into -std=c++11 or a later standard. The error message in the latter case will say that auto, a language keyword since C++11, can't be used there. To give the frontend an easier time judging whether a given token is a keyword in any case, the IdentifierInfo object attached to keyword tokens is designed to answer whether an identifier is a keyword under a certain language standard (or language feature), using the IdentifierInfo::isKeyword(…) function, for example, whereby you pass a LangOptions class object (a class carrying information such as the language standard and features currently being used) as the argument to that function.

#define FOO(X) (X + 1)
return FOO(3); // Equivalent to "return (3 + 1);"
#define FOO(X) (X - 100)
return FOO(3); // Now this is equivalent to "return (3 - 100);"
#undef FOO
return FOO(3); // "FOO(3)" here will not be expanded by the preprocessor

void printMacroBody(IdentifierInfo *MacroII, Preprocessor &PP) {
  MacroDefinition Def = PP.getMacroDefinition(MacroII);
  MacroInfo *Info = Def.getMacroInfo();
  …
}

void printMacroBody(IdentifierInfo *MacroII, Preprocessor &PP) {
  …
  MacroInfo *Info = Def.getMacroInfo();
  for(Token Tok : Info->tokens()) {
    std::cout << Tok.getName() << "\n";
  }
}

#define PRINT(val) \
  printf("%d\n", val * 2)
void main() {
  PRINT(1 + 3);
}

void main() {
  printf("%d\n", 1 + 3 * 2);
}

#define PRINT(val) \
  printf("%d\n", (val) * 2)

void main() {
  printf("%d\n", (1 + 3) * 2);
}

#pragma macro_arg_guard val
#define PRINT(val) \
  printf("%d\n", val * 94 + (val) * 87);
void main() {
  PRINT(1 + 3);
}

$ clang … foo.c
[WARNING] In foo.c:3:18: macro argument 'val' is not enclosed by parenthesis

MacroGuard
  |___ CMakeLists.txt
  |___ MacroGuardPragma.cpp
  |___ MacroGuardValidator.h
  |___ MacroGuardValidator.cpp

# In MacroGuard/CMakeLists.txt
…
# (after importing LLVM's CMake directives)
find_package(Clang REQUIRED CONFIG)
include_directories(${CLANG_INCLUDE_DIRS})

set(_SOURCE_FILES
    MacroGuardPragma.cpp
    MacroGuardValidator.cpp
    )
add_llvm_library(MacroGuardPlugin MODULE
                 ${_SOURCE_FILES}
                 PLUGIN_TOOL clang)

Windows platforms, since PLUGIN_TOOL is also used for specifying this plugin loader executable's name.

$ clang … -fplugin=/path/to/MacroGuardPlugin.so foo.c

struct MacroGuardHandler : public PragmaHandler {
  MacroGuardHandler() : PragmaHandler("macro_arg_guard"){}
  void HandlePragma(Preprocessor &PP, PragmaIntroducer                     Introducer, Token &PragmaTok) override;
};

#pragma macro_arg_guard val
                       ^--Stop at here

// Lexes the tokens that follow the pragma name, up to the end of the
// directive, and records each identifier in ArgsToEnclosed.
void MacroGuardHandler::HandlePragma(Preprocessor &PP,…) {
  Token Tok;
  PP.Lex(Tok);
  while (Tok.isNot(tok::eod)) {
    // Punctuation and literal tokens carry no IdentifierInfo. Recording a
    // null pointer would later match every such token in a macro body and
    // be dereferenced when the warning is printed, so skip them.
    if (const IdentifierInfo *II = Tok.getIdentifierInfo())
      ArgsToEnclosed.push_back(II);
    PP.Lex(Tok);
  }
}

SmallVector<const IdentifierInfo*, 2> ArgsToEnclosed;
struct MacroGuardHandler: public PragmaHandler {
  …
};

struct MacroGuardHandler : public PragmaHandler {
  bool IsValidatorRegistered;
  MacroGuardHandler() : PragmaHandler("macro_arg_guard"),
                        IsValidatorRegistered(false) {}
  …
};
void MacroGuardHandler::HandlePragma(Preprocessor &PP,…) {
  …
  // Install the validator only once, however many pragmas are encountered.
  if (!IsValidatorRegistered) {
    auto Validator = std::make_unique<MacroGuardValidator>(…);
    // Preprocessor::addPPCallbacks takes ownership of the callback object.
    PP.addPPCallbacks(std::move(Validator));
    IsValidatorRegistered = true;
  }
}

struct MacroGuardHandler : public PragmaHandler {
  …
};
// Registers the handler with the pragma-handler plugin registry under the
// name "macro_arg_guard", with a one-line description.
static PragmaHandlerRegistry::Add<MacroGuardHandler>
  X("macro_arg_guard", "Verify if designated macro args are enclosed");

// In MacroGuardValidator.h
extern SmallVector<const IdentifierInfo*, 2> ArgsToEnclosed;
class MacroGuardValidator : public PPCallbacks {
  SourceManager &SM;
public:
  explicit MacroGuardValidator(SourceManager &SM) : SM(SM) {}
  void MacroDefined(const Token &MacroNameToke,
                    const MacroDirective *MD) override;
};
// In MacroGuardValidator.cpp
void MacroGuardValidator::MacroDefined(const Token &MacroNameTok, const MacroDirective *MD) {
}

void MacroGuardValidator::MacroDefined(const Token &MacroNameTok, const MacroDirective *MD) {
  const MacroInfo *MI = MD->getMacroInfo();
  // For each argument to be checked…
  for (const IdentifierInfo *ArgII : ArgsToEnclosed) {
    // Scanning the macro body
    for (auto TokIdx = 0U, TokSize = MI->getNumTokens();
         TokIdx < TokSize; ++TokIdx) {
      …
    }
  }
}

// For each guarded argument, walk the macro body looking for its uses.
for (const IdentifierInfo *ArgII : ArgsToEnclosed) {
  for (auto TokIdx = 0U, TokSize = MI->getNumTokens();
       TokIdx < TokSize; ++TokIdx) {
    Token CurTok = *(MI->tokens_begin() + TokIdx);
    // Tokens that are not the argument under inspection are of no interest.
    if (CurTok.getIdentifierInfo() != ArgII)
      continue;
    // Only an interior token has a neighbor on both sides.
    if (TokIdx > 0 && TokIdx < TokSize - 1) {
      auto PrevTok = *(MI->tokens_begin() + TokIdx - 1),
           NextTok = *(MI->tokens_begin() + TokIdx + 1);
      // Properly wrapped as "(arg)": nothing to report.
      if (PrevTok.is(tok::l_paren) && NextTok.is(tok::r_paren))
        continue;
    }
    …
  }
}

for (const IdentifierInfo *ArgII : ArgsToEnclosed) {
  for (auto TokIdx = 0U, TokSize = MI->getNumTokens();
       TokIdx < TokSize; ++TokIdx) {
    …
    if (CurTok.getIdentifierInfo() == ArgII) {
      if (TokIdx > 0 && TokIdx < TokSize - 1) {
        …
        if (PrevTok.is(tok::l_paren) && NextTok.is            (tok::r_paren))
          continue;
      }
      SourceLocation TokLoc = CurTok.getLocation();
      errs() << "[WARNING] In " << TokLoc.printToString(SM) << ": ";
      errs() << "macro argument '" << ArgII->getName()
             << "' is not enclosed by parenthesis\n";
    }  
  }
}

./simple_warn.c:2:7: warning: unused variable 'y'…
  int y = x + 1;
      ^
1 warning generated.

$ ninja clang

$ clang -Xclang -ast-dump foo.c

int foo(int c) { return c + 1; }

TranslationUnitDecl 0x560f3929f5a8 <<invalid sloc>> <invalid sloc>
|…
`-FunctionDecl 0x560f392e1350 <foo.c:2:1, col:30> col:5 foo 'int (int)'
  |-ParmVarDecl 0x560f392e1280 <col:9, col:13> col:13 used c 'int'
  `-CompoundStmt 0x560f392e14c8 <col:16, col:30>
    `-ReturnStmt 0x560f392e14b8 <col:17, col:28>
      `-BinaryOperator 0x560f392e1498 <col:24, col:28> 'int' '+'
        |-ImplicitCastExpr 0x560f392e1480 <col:24> 'int' <LValueToRValue>
        | `-DeclRefExpr 0x560f392e1440 <col:24> 'int' lvalue ParmVar 0x560f392e1280 'c' 'int'
        `-IntegerLiteral 0x560f392e1460 <col:28> 'int' 1

// If `T` is representing 'int'…
QualType toConstVolatileTy(Type *T) {
  // The qualifier bits are enumerators of clang::Qualifiers (plural) and are
  // OR-ed together into a single mask.
  return QualType(T, Qualifiers::Const | Qualifiers::Volatile);
} // Then the returned QualType represents `volatile const int`

// `FD` has the type of `const FunctionDecl&`
const auto* Body = dyn_cast<CompoundStmt>(FD.getBody());
for(const auto* S : Body->body()) {
  if(const auto* L = dyn_cast<WhileStmt>(S)) {
    if(const auto* Cond = dyn_cast<CXXBoolLiteralExpr>      (L->getCond()))
      if(Cond->getValue()) {
        // The exit condition is `true`!!
      }
  }
}

// Matches a function whose body directly contains a `while (true)` loop.
functionDecl(compoundStmt(hasAnySubstatement(
  whileStmt(
    hasCondition(cxxBoolLiteral(equals(true)))))));

using namespace ast_matchers;
…
MatchFinder Finder;
// Add AST matching patterns to `MatchFinder`
// (the registration method is `addMatcher`)
Finder.addMatcher(traverse(TK_AsIs, pattern1), Callback1);
Finder.addMatcher(traverse(TK_AsIs, pattern2), Callback2);
…
// Match a given AST. `Tree` has the type of `ASTContext&`
// If there is a match in either of the above patterns,
// functions in Callback1 or Callback2 will be invoked
// accordingly
Finder.matchAST(Tree);
// …Or match a specific AST node. `FD` has the type of
// `FunctionDecl&`
Finder.match(FD, Tree);

struct B {
  B(int);
};
B foo() { return 87; }

FunctionDecl
`-CompoundStmt
  `-ReturnStmt
    `-ExprWithCleanups
      `-CXXConstructExpr
        `-MaterializeTemporaryExpr
          `-ImplicitCastExpr
            `-ImplicitCastExpr
              `-CXXConstructExpr
                `-IntegerLiteral 'int' 87

FunctionDecl
`-CompoundStmt
  `-ReturnStmt
    `-IntegerLiteral 'int' 87

struct MyMatchCallback : public MatchFinder::MatchCallback {
  void run(const MatchFinder::MatchResult &Result) override {
    // Reach here if there is a match on the corresponding pattern
    // Handling "bound" result from `Result`, if there is any
  }
};

forStmt(hasBody(…));

forStmt(hasBody(…),
        hasCondition(…));

forStmt(
  hasCondition(
    expr().bind("exit_condition")));

…
// Invoked on a match; looks up the node bound under the name
// "exit_condition".
void run(const MatchFinder::MatchResult &Result) override {
  const auto& Nodes = Result.Nodes;
  const Expr* CondExpr = Nodes.getNodeAs<Expr>("exit_condition");
  // Use `CondExpr`…
}

auto PatExitCondition = binaryOperator(
                           hasOperatorName("<"),
                           hasRHS(integerLiteral()
                           .bind("trip_count")));
auto Pattern = functionDecl(
                 compountStmt(hasAnySubstatement(
              forStmt(hasCondition(PatExitCondition)))));
MatchFinder Finder;
auto* Callback = new MyMatchCallback();
Finder.addMatcher(traverse(TK_IgnoreUnlessSpelledInSource,
                           Pattern), Callback);

void run(const MatchFinder::MatchResult &Result) override {
  // Fetch the literal tagged "trip_count" and dump it only if one was bound.
  if (const auto *Literal =
          Result.Nodes.getNodeAs<IntegerLiteral>("trip_count"))
    Literal->dump(); // print to llvm::errs()
}

int foo(int c) { // return-based case: each branch only returns a value
  if (c > 10) {
    return c + 100;
  } else {
    return 94;
  }
}
// Assignment-based case: each branch only assigns to the same variable `a`.
void bar(int x) {
  int a;
  if (x > 10) {
    a = 87;
  } else {
    a = x - 100;
  }
}

// Ternary form of the return-based example: a single expression selects
// the returned value.
int foo(int c) {
  return c > 10 ? c + 100 : 94;
}
// Ternary form of the assignment-based example: a single assignment whose
// right-hand side selects the value.
void bar(int x) {
  int a;
  a = x > 10 ? 87 : x - 100;
}

$ clang …(flags to run the plugin) ./test.c
./test.c:2:3: warning: this if statement can be converted to ternary operator:
  if (c > 10) {
  ^
./test.c:3:12: note: with true expression being this:
    return c + 100;
           ^
./test.c:5:12: note: with false expression being this:
    return 94;
           ^
./test.c:11:3: warning: this if statement can be converted to ternary operator:
  if (x > 10) {
  ^
./test.c:12:9: note: with true expression being this:
    a = 87;
        ^
./test.c:14:9: note: with false expression being this:
    a = x - 100;
        ^
2 warnings generated.

"use of undeclared identifier %0"

def err_undeclared_var_use : Error<"use of undeclared identifier %0">;

// `Ctx` has the type of `ASTContext&`
DiagnosticsEngine& Diag = Ctx.getDiagnostics();

Diag.Report(diag::err_undeclared_var_use);

`err_undeclared_var_use` takes one placeholder argument – namely, the identifier name – which is supplied by chaining `<<` operators onto the `Report` function call:

"you cannot put %1 into %0"

Diag.Report(diag::err_invalid_placement)
             << "boiling oil" << "water";

"you exceed the daily %select directive consists of curly braces in which different message options are separated by |. Outside the curly braces, a number – 0, in the preceding code – indicates which supplement data is used to select the option within the braces. The following is an example of this:

Diag.Report(diag::warn_exceed_limit) << 0;

// `SLoc` has the type of `SourceLocation`
Diag.Report(SLoc:

auto MyDiagID = Diag.MyDiagID, that has a message template of Today's weather is %0 at its note diagnostic level. You can use this diagnostic ID just like any other ID:

/// Frontend plugin action for the ternary-converter example.
struct TernaryConverterAction : public PluginASTAction {
  /// Overrides the base-class hook that supplies the ASTConsumer for a
  /// compilation; receives the compiler instance and the input file name.
  std::unique_ptr<ASTConsumer>
    CreateASTConsumer(CompilerInstance &CI,
                      StringRef InFile) override;
};

struct TernaryConverterAction : public PluginASTAction {
  …
  ActionType getActionType() override { return ParseArgs member function, on the other hand, handles (frontend) command-line options specific to this plugin. In other words, you can create custom command-line flags for your plugin. In our case, we are going to create two flags: -no-detect-return and -no-detect-assignment. This allows us to decide whether we wish to detect potential ternary conversions regarding return statements or assignment statements, respectively:

using namespace ast_matchers;
struct TernaryConverterAction : public PluginASTAction {
  …
private:
  std::unique_ptr<MatchFinder> unique_ptr type member variables: one for holding MatchFinder and two MatchCallback ones for return-based and assignment-based patterns.Why Use unique_ptr?The rationale behind using `unique_ptr` to store those three objects – or storing those objects *persistently* – is because the `ASTConsumer` instance we created at the end of `CreateASTConsumer` (`ASTFinder->newASTConsumer()`) keeps references to those three objects. Thus, we need a way to keep them alive during the lifetime of the frontend.In addition to that, we registered the pattern for traversal with MatchFinder by using `MatchFinder::addMatcher`, the `traverse` function, and `MatchCallback` instances. If you're not familiar with these APIs, feel free to check out the *ASTMatcher* section.Now, we only need to compose the matching patterns and implement some callbacks to print out warning messages if there is a match – as the `TODO` comments suggested in the preceding snippet.

FunctionDecl 
  |_CompoundStmt
    |_(Other AST nodes we don't care)
    |_IfStmt
      |_(true branch: contains only one return/assign statement)
      |_(false branch: contains only one return/assign statement)

functionDecl(
  compoundStmt(hasAnySubstatement
    IfStmt(
      hasThen(/*CompoundStmt, you should always use quantifier directives such as hasAnySubstatement to match its body statements.We are going to use the previous `TODO` comments to customize for either return-based or assignment-based situations. Let's use subpattern variables to replace those `TODO` comments and put the preceding code into another function:

StatementMatcher buildReturnMatcher() {
  return compoundStmt(statementCountIs directive to match the code blocks with only one statement. Also, we specified that we don't want an empty return via hasReturnValue(…). The argument for hasReturnValue is necessary since the latter takes at least one argument, but since we don't care what type of node it is, we are using expr() as some sort of wildcard pattern. For assignment-based patterns, things get a little bit complicated: we don't just want to match a single assignment statement (modeled by the `BinaryOperator` class) in both branches – the LHS of each of those assignments needs to be a `DeclRefExpr` expression, and both must point to the same `Decl` instance. Unfortunately, we are not able to express all these predicates using ASTMatcher's DSL. What we can do, however, is push off some of those checks into `MatchCallback` later, and only use DSL directives to check the *shape* of our desired patterns:

StatementMatcher buildAssignmentMatcher() {
  return compoundStmt(statementCountIs(1),
                      hasAnySubstatement(
                        binaryOperator(
                          hasOperatorName("="),
                          hasLHS(DeclRefExpr is bound to the same name, meaning that the AST node that occurred later will overwrite the previously bound node. So, eventually, we won't get DeclRefExpr nodes from both branches as we previously planned. Therefore, let's use different tags for the `DeclRefExpr` nodes matched in each branch: `dest.true` for the true branch and `dest.false` for the false branch. Let's tweak the preceding code to reflect this strategy:

void
MatchAssignmentCallback::run(const MatchResult &Result) override {
  const auto& Nodes = Result.Nodes;
  // Check if destination of both assignments are the   // same
  const auto *DestTrue =
             Nodes.getNodeAs<DeclRefExpr>("dest.true"),
             *DestFalse = 
             Nodes.getNodeAs<DeclRefExpr>("dest.false");
  if (DestTrue->getDecl() == DestFalse->getDecl()) {
    // Can be converted into ternary operator!
  }
}

StatementMatcher
buildIfStmtMatcher(StatementMatcher truePattern,
                   StatementMatcher falsePattern) {
  return functionDecl(
    compoundStmt(hasAnySubstatement
      IfStmt(
        hasThen(truePattern)
        hasElse(falsePattern)).IfStmt since we want to tell our users where the potential places that can be converted into ternary operators are:

void
MatchAssignmentCallback::run(const MatchResult &Result) override {
  …
  auto& Diag = Result.Context->getDiagnostics();
  auto DiagWarnMain = Diag.getCustomDiagID(
    DiagnosticsEngine::Warning,
    "this if statement can be converted to ternary      operator:");
  auto DiagNoteTrueExpr = Diag.getCustomDiagID(
    DiagnosticsEngine::Note,
    "with true expression being this:");
  auto DiagNoteFalseExpr = Diag.getCustomDiagID(
    DiagnosticsEngine::Note,
    "with false expression being this:");
  …
}

void
MatchAssignmentCallback::run(const MatchResult &Result) override {
  …
  if (DestTrue && DestFalse) {
      if (DestTrue->getDecl() == DestFalse->getDecl()) {
        // Can be converted to ternary!
        const auto* If = Nodes.getNodeAs<IfStmt>        ("if_stmt");
        Diag.Report(If->getBeginLoc(), DiagWarnMain);
        const auto* TrueValExpr = 
                    Nodes.getNodeAs<Expr>("val.true");
        const auto* FalseValExpr = 
                    Nodes.getNodeAs<Expr>("val.false");
        Diag.Report(TrueValExpr->getBeginLoc(), 
                    DiagNoteTrueExpr);
        Diag.Report(FalseValExpr->getBeginLoc(), 
                    DiagNoteFalseExpr);
      }
    }
}

std::unique_ptr<ASTConsumer>
TernaryConverterAction::CreateASTConsumer(CompilerInstance &CI, StringRef InFile) {
  …
  // Return matcher
  if (!NoReturn) {
  ReturnMatchCB = std::make_unique<MatchReturnCallback>();
    ASTFinder->addMatcher(
      traverse(TK_IgnoreUnlessSpelledInSource,                          
               buildIfStmtMatcher(
                 buildReturnMatcher(".true"),                                                 
                 buildReturnMatcher(".false"))),
      ReturnMatchCB.get()
    );
  }
  // Assignment matcher
  if (!NoAssignment) {
    AssignMatchCB = std::make_     unique<MatchAssignmentCallback>();
    ASTFinder->addMatcher(
      traverse(TK_IgnoreUnlessSpelledInSource,
               buildIfStmtMatcher(
                 buildAssignmentMatcher(".true"),
                 buildAssignmentMatcher(".false"))),
      AssignMatchCB.get()
    );
  }
  return std::move(ASTFinder->newASTConsumer());
}

-no-detect-return and -no-detect-assignment in this project, please add the command-line options highlighted here:

$ ninja clang

$ clang++ -### -std=c++11 -Wall hello_world.cpp -o hello_world
"/path/to/clang" "-cc1" "-triple" "x86_64-apple-macosx11.0.0" "-Wdeprecated-objc-isa-usage" "-Werror=deprecated-objc-isa-usage" "-Werror=implicit-function-declaration" "-emit-obj" "-mrelax-all" "-disable-free" "-disable-llvm-verifier" … "-fno-strict-return" "-masm-verbose" "-munwind-tables" "-target-sdk-version=11.0" … "-resource-dir" "/Library/Developer/CommandLineTools/usr/lib/clang/12.0.0" "-isysroot" "/Library/Developer/CommandLineTools/SDKs/MacOSX.sdk" "-I/usr/local/include" "-stdlib=libc++" … "-Wall" "-Wno-reorder-init-list" "-Wno-implicit-int-float-conversion" "-Wno-c99-designator" … "-std=c++11" "-fdeprecated-macro" "-fdebug-compilation-dir" "/Users/Rem" "-ferror-limit" "19" "-fmessage-length" "87" "-stack-protector" "1" "-fstack-check" "-mdarwin-stkchk-strong-link" … "-fexceptions" … "-fdiagnostics-show-option" "-fcolor-diagnostics" "-o" "/path/to/temp/hello_world-dEadBeEf.o" "-x" "c++" "hello_world.cpp"…

$ sudo apt install openssl

$ clang hello_world.c -o hello_world

#ifndef SIMPLE_LOG_H
#define SIMPLE_LOG_H
#include <iostream>
#include <string>

// Shared implementation: writes `<tag><message>` to stdout, then ends the
// line and flushes.
namespace simple_log_detail {
inline void emit(const char *Tag, const std::string &Msg) {
  std::cout << Tag << Msg << std::endl;
}
} // end namespace simple_log_detail

// Each printer below exists only when its SLG_ENABLE_* macro is defined.
#ifdef SLG_ENABLE_DEBUG
inline void print_debug(const std::string &M) {
  simple_log_detail::emit("[DEBUG] ", M);
}
#endif
#ifdef SLG_ENABLE_ERROR
inline void print_error(const std::string &M) {
  simple_log_detail::emit("[ERROR] ", M);
}
#endif
#ifdef SLG_ENABLE_INFO
inline void print_info(const std::string &M) {
  simple_log_detail::emit("[INFO] ", M);
}
#endif
#endif

int main() { // note: this file includes no header itself
  print_info("Hello world!!"); // print_info is not declared in this file
  return 0;
}

$ clang++ -fuse-simple-log test.cc -o test
$ ./test
[INFO] Hello world!!
$

$ clang++ -fuse-simple-log -fno-use-info-simple-log test.cc -o test
test.cc:2:3: error: use of undeclared identifier 'print_info'
  print_info("Hello world!!");
  ^
1 error generated
$

$ clang++ -fuse-simple-log=/home/user/advanced_log.h test.cc -o test
[01/28/2021 20:51 PST][INFO] Hello world!!
$

// `-g`: a plain flag (no value) that belongs to the `g_Group` option group.
def g_Flag : Flag<["-"], "g">, Group<g_Group>,
  HelpText<"Generate source-level debug information">;

// `-std=<value>` / `--std=<value>`: the value is written directly after the
// `std=` prefix (for example `-std=c++11`).
def std_EQ : Joined<["-", "--"], "std=">, Flags<[CC1Option]>, …;

// `-fuse-simple-log`: plain flag form, without a header path.
def fuse_simple_log : Flag<["-"], "fuse-simple-log">,
                  Group<f_Group>, Flags<[NoXarchOption]>;

// Per-level switches. The driver code refers to the generated records as
// `OPT_fuse_<level>_simple_log` and `OPT_fno_use_<level>_simple_log`.
defm use_error_simple_log : BooleanFFlag<"use-error-simple-log">, Group<f_Group>, Flags<[NoXarchOption]>;

defm use_debug_simple_log : BooleanFFlag<"use-debug-simple-log">, Group<f_Group>, Flags<[NoXarchOption]>;
defm use_info_simple_log : BooleanFFlag<"use-info-simple-log">, Group<f_Group>, Flags<[NoXarchOption]>;

// Two spellings that carry a custom header path as a joined value:
// `-fsimple-log-path=<path>` and `-fuse-simple-log=<path>`.
def fsimple_log_path_EQ : Joined<["-"], "fsimple-log-path=">, Group<f_Group>, Flags<[NoXarchOption]>;
def fuse_simple_log_EQ : Joined<["-"], "fuse-simple-log=">, Group<f_Group>, Flags<[NoXarchOption]>;

-include frontend flag, as its name suggests, *implicitly* includes the designated file in the compiling source code.Using the same logic, if `-fuse-simple-log=/other/file.h` or `-fuse-simple-log -fsimple-log-path=/other/file.h` are given, they will be translated into the following:

-D flag implicitly defines a macro variable for the compiling source code. However, if only `-fuse-simple-log` is given, the flag will implicitly include all the log printing functions. In other words, `-fuse-simple-log` will not only be translated into the `-include` flag, as introduced in the previous bullet point, but also the following flags:

-fuse-simple-log -fno-use-error-simple-log

-include "simple_log.h" -D SLG_ENABLE_DEBUG -D SLG_ENABLE_INFO

-fuse-info-simple-log -fsimple-log-path="my_log.h"

-include "my_log.h" -D SLG_ENABLE_INFO

/// Records which simple-log levels are enabled. All levels start disabled.
struct SimpleLogOpts {
  // Whether a certain log level is enabled. The declaration order matters:
  // All() relies on it for aggregate initialization.
  bool Error = false;
  bool Info = false;
  bool Debug = false;

  /// Returns an instance with every log level enabled.
  static SimpleLogOpts All() {
    return {true, true, true};
  }

  /// True if any of the log levels is enabled. Explicit, so it still works
  /// in conditions such as `if (SLG)` but can no longer slip into arithmetic
  /// or implicit conversions to integral types.
  explicit operator bool() const {
    return Error || Info || Debug;
  }
};
// The object we are going to work on later
SimpleLogOpts SLG;

// `SLG` converts to true when any log level is enabled.
if (SLG) {
  // At least one log level is enabled!
}

// First version: only the plain -fuse-simple-log flag enables every level.
if (Args.hasArg(options::OPT_fuse_simple_log)) {
  SLG = SimpleLogOpts::All();
}

// Extended version: the joined -fuse-simple-log=<path> form counts as well.
if (Args.hasArg(options::OPT_fuse_simple_log,
                options::OPT_fuse_simple_log_EQ)) {
  SLG = SimpleLogOpts::All();
}

// Per-level override for the error level; the current value of SLG.Error is
// passed as the last argument.
SLG.Error = Args.hasFlag(options::OPT_fuse_error_simple_log, options::OPT_fno_use_error_simple_log, SLG.Error);

// Start emitting the implicit include once any level is enabled.
if (SLG) {
  CmdArgs.push_back("-include");
  …
}

// Implicitly include the log header once any log level is enabled.
if (SLG) {
  CmdArgs.push_back("-include");
  // Use the path given through -fuse-simple-log=<path> or
  // -fsimple-log-path=<path> when one is present; otherwise fall back to the
  // default header name.
  if (Arg *A = Args.getLastArg(options::OPT_fuse_simple_log_EQ,
                               options::OPT_fsimple_log_path_EQ))
    CmdArgs.push_back(A->getValue());
  else
    CmdArgs.push_back("simple_log.h");
  …
}

if (SLG) {
  …
  // Define the macro that guards print_error in the log header.
  if (SLG.Error) {
    CmdArgs.push_back("-D");
    CmdArgs.push_back("SLG_ENABLE_ERROR");
  }
  …
}

$ clang++ -### -fuse-simple-log -c test.cc

"-include" "simple_log.h" "-D" "SLG_ENABLE_ERROR" "-D" "SLG_ENABLE_INFO" "-D" "SLG_ENABLE_DEBUG"

$ clang++ -### -fuse-simple-log=my_log.h -fno-use-error-simple-log -c test.cc

"-include" "my_log.h" "-D" "SLG_ENABLE_INFO" "-D" "SLG_ENABLE_DEBUG"

$ clang++ -### -fuse-info-simple-log -fsimple-log-path=my_log.h -c test.cc

"-include" "my_log.h" "-D" "SLG_ENABLE_INFO"

$ clang++ -fplugin=MyPlugin.so \
          -Xclang -plugin -Xclang ternary-converter \
          -fsyntax-only test.cc

# Error: `ternary-converter` will not be recognized
$ clang++ -fplugin=MyPlugin.so \
          -Xclang -plugin ternary-converter \
          -fsyntax-only test.cc

// `-foo`, marked with NoDriverOption.
// NOTE(review): presumably this keeps the driver from accepting the flag —
// confirm against the option definitions.
def foo : Flag<["-"], "foo">, Flags<[NoDriverOption]>;

$ ls
main.cc simple_log.h
$ clang++ -fuse-simple-log -fsyntax-only main.cc
$ # OK

$ ls .
# No simple_log.h in current folder
main.cc
$ clang++ -fuse-simple-log=/path/to/simple_log.h -fsyntax-only main.cc
$ # OK

$ ls .
# No simple_log.h in current folder
main.cc
$ ls ~/my_include
simple_log.h
$ clang++ -zipline -fuse-simple-log -fsyntax-only main.cc
$ # OK

$ clang -zipline -c test.c
$ file test.o
test.o: ASCII text # Not (binary) object file anymore
$ cat test.o
CS50ZXh0CgkuZmlsZQkidGVzdC5jYyIKCS 5nbG9ibAlfWjNmb29pCgkucDJhbGln
bgk0LCAweDkwCgkudHlwZQlfWjNmb29p LEBmdW5jdGlvbgpfWjNmb29pOgoJLmNm
… # Base64 encoded contents
$

$ clang -zipline test.c -o test.zip
$ file test.zip
test.zip: Zip archive, at least v2.0 to extract
$

$ clang -zipline -fuse-ld=tar test.c -o test.tar.gz
$ file test.tar.gz
test.tar.gz: gzip compressed data, from Unix, original size…
$

// zipline toolchain: driver flag spelled `-zipline` or `--zipline`.
def zipline : Flag<["-", "--"], "zipline">,
              Flags<[NoXarchOption]>; 

namespace clang {
namespace driver {
namespace toolchains {
struct LLVM_LIBRARY_VISIBILITY ZiplineToolChain 
  : public Generic_ELF {
  ZiplineToolChain(const Driver &D, const llvm::Triple    &Triple, const llvm::opt::ArgList &Args)
    : Generic_ELF(D, Triple, Args) {}
  ~ZiplineToolChain() override {}
  // Disable the integrated assembler
  bool IsIntegratedAssemblerDefault() const override
    { return false; }
  bool useIntegratedAs() const override { return false; }
  void
  AddClangSystemIncludeArgs(const llvm::opt::ArgList    &DriverArgs, llvm::opt::ArgStringList &CC1Args) 
    const override;
protected:
  Tool *buildAssembler() const override;
  Tool *buildLinker() const override;
};
} // end namespace toolchains
} // end namespace driver
} // end namespace clang

void ZiplineToolChain::AddClangSystemIncludeArgs(
                       const ArgList &DriverArgs,
                       ArgStringList &CC1Args) const {
  using namespace llvm;
  SmallString<16> CustomIncludePath;
  sys::fs::expand_tilde("~/my_include",                         CustomIncludePath);
  addSystemInclude(DriverArgs,
                   CC1Args, CustomIncludePath.c_str());
}

// Excerpt of the driver's toolchain selection; elided parts are marked `…`.
const ToolChain
&Driver::getToolChain(const ArgList &Args,
                      const llvm::Triple &Target) const {
  …
  switch (Target.getOS()) {
  case llvm::Triple::Linux:
  …
    // Select the zipline toolchain when the -zipline flag is present.
    else if (Args.hasArg(options::OPT_zipline))
     TC = std::make_unique<toolchains::ZiplineToolChain>     (*this, Target, Args);
  …
    break;
  case …
  case …
  }
}

namespace clang {
namespace driver {
namespace tools {
namespace zipline {
struct LLVM_LIBRARY_VISIBILITY Assembler : public Tool {
  Assembler(const ToolChain &TC)
    : Tool("zipeline::toBase64", "toBase64", TC) {}
  bool hasIntegratedCPP() const override { return false; }
  void ConstructJob(Compilation &C, const JobAction &JA,
                    const InputInfo &Output,
                    const InputInfoList &Inputs,
                    const llvm::opt::ArgList &TCArgs,
                    const char *LinkingOutput) const                     override;
};
} // end namespace zipline
} // end namespace tools
namespace toolchains {
struct LLVM_LIBRARY_VISIBILITY ZiplineToolChain … {
…
};
} // end namespace toolchains
} // end namespace driver
} // end namespace clang

void
tools::zipline::Assembler::ConstructJob(Compilation &C,
                            const JobAction &JA,
                            const InputInfo &Output,
                            const InputInfoList &Inputs,
                            const ArgList &Args,
                            const char *LinkingOutput)                            const {
                            ArgStringList CmdArgs;
                            const InputInfo &II =                             Inputs[0];
  std::string Exec =
    Args.MakeArgString(getToolChain().     GetProgramPath("openssl"));
  // opeenssl base64 arguments
  CmdArgs.push_back("base64");
  CmdArgs.push_back("-in");
  CmdArgs.push_back(II.getFilename());
  CmdArgs.push_back("-out");
  CmdArgs.push_back(Output.getFilename());

  C.addCommand(
    std::make_unique<Command>(
           JA, *this, ResponseFileSupport::None(),
           Args.MakeArgString(Exec), CmdArgs,
           Inputs, Output));
}

$ openssl base64 -in <input file> -out <output file>

/// Creates the zipline assembler tool for this toolchain.
// NOTE(review): the raw pointer is presumably owned by the caller in the
// ToolChain base class — confirm.
Tool *ZiplineToolChain::buildAssembler() const {
  return new tools::zipline::Assembler(*this);
}

namespace zipline {
struct LLVM_LIBRARY_VISIBILITY Assembler : public Tool {
…
};
struct LLVM_LIBRARY_VISIBILITY Linker : public Tool {
  Linker(const ToolChain &TC)
    : Tool("zipeline::zipper", "zipper", TC) {}
  bool hasIntegratedCPP() const override { return false; }
  bool isLinkJob() const override { return true; }
  void ConstructJob(Compilation &C, const JobAction &JA,
                    const InputInfo &Output,
                    const InputInfoList &Inputs,
                    const llvm::opt::ArgList &TCArgs,
                    const char *LinkingOutput) const                     override;
private:
  void buildZipArgs(const JobAction&, const InputInfo&,
                    const InputInfoList&,
                    const llvm::opt::ArgList&, 
                    llvm::opt::ArgStringList&) const;
  void buildTarArgs(const JobAction&,
                    const InputInfo&,                     const InputInfoList&,
                    const llvm::opt::ArgList&, 
                    llvm::opt::ArgStringList&) const;
};
} // end namespace zipline

void
tools::zipline::Linker::ConstructJob(Compilation &C,
                        const JobAction &JA,
                        const InputInfo &Output,
                        const InputInfoList &Inputs,
                        const ArgList &Args,
                        const char *LinkingOutput) const {
  ArgStringList CmdArgs;
  std::string Compressor = "zip";
  if (Arg *A = Args.getLastArg(options::OPT_fuse_ld_EQ))
    Compressor = A->getValue();
  std::string Exec = Args.MakeArgString(
      getToolChain().GetProgramPath(Compressor.c_str()));
  if (Compressor == "zip")
    buildZipArgs(JA, Output, Inputs, Args, CmdArgs);
  if (Compressor == "tar" || Compressor == "gzip")
    buildTarArgs(JA, Output, Inputs, Args, CmdArgs);
  else
    llvm_unreachable("Unsupported compressor name");
  C.addCommand(
    std::make_unique<Command>(
      JA, *this, ResponseFileSupport::None(), 
      Args.MakeArgString(Exec),
      CmdArgs, Inputs, Output));
}

$ zip <output zip file> <input file 1> <input file 2>…

void
tools::zipline::Linker::buildZipArgs(const JobAction &JA,
                             const InputInfo &Output,
                             const InputInfoList &Inputs,
                             const ArgList &Args,
                             ArgStringList &CmdArgs)                             const {
  // output file
  CmdArgs.push_back(Output.getFilename());
  // input files
  AddLinkerInputs(getToolChain(), Inputs, Args, CmdArgs, JA);
}

$ tar -czf <output tar.gz file> <input file 1> <input file 2>…

void
tools::zipline::Linker::buildTarArgs(const JobAction &JA,
                             const InputInfo &Output,
                             const InputInfoList &Inputs,
                             const ArgList &Args,
                             ArgStringList &CmdArgs)                              const {
  // arguments and output file
  CmdArgs.push_back("-czf");
  CmdArgs.push_back(Output.getFilename());
  // input files
  AddLinkerInputs(getToolChain(), Inputs, Args, CmdArgs,    JA);
}

/// Creates the zipline linker tool for this toolchain.
// NOTE(review): the raw pointer is presumably owned by the caller in the
// ToolChain base class — confirm.
Tool *ZiplineToolChain::buildLinker() const {
  return new tools::zipline::Linker(*this);
}

$ clang -### -zipline -c test.c

$ clang -### -zipline -c test.c
"/path/to/clang" "-cc1" …
"/usr/bin/openssl" "base64" "-in" "/tmp/test_ae4f5b.s" "-out" "test.o"
$

$ clang -### -zipline test.c -o test.zip
"/path/to/clang" "-cc1" …
"/usr/bin/openssl" "base64" "-in" "/tmp/test_ae4f5b.s" "-out" "/tmp/test_ae4f5b.o"
"/usr/bin/zip" "test.zip" "/tmp/test_ae4f5b.o"
$

$ ninja opt

// Both pointers are `restrict`-qualified: the caller promises that `x` and
// `y` do not refer to the same object.
int foo(int* restrict x, int* restrict y) {
  *x = *y + 1; // read through y, store through x
  return *y;   // read through y again, after the store
}

…
// Programmers will NEVER write the following code: the same address is
// passed for both parameters of foo.
int main() {
  int V = 1;
  return foo(&V, &V);
}

foo:                                    
     mov   eax, dword ptr [rsi]
     add   eax, 1
     mov   dword ptr [rdi], eax
     mov   eax, dword ptr [rsi]
     ret

foo:                                    
     mov   eax, dword ptr [rsi]
     lea   ecx, [rax + 1]
     mov   dword ptr [rdi], ecx
     ret

define i32 @foo(i32* noalias %0, i32* noalias %1) {
  %3 = load i32, i32* %1
  %4 = add i32 %3, 1
  store i32 %4, i32* %0
  ret i32 %3
}

define i32 @foo(i32* %0, i32* %1) {
  %3 = load i32, i32* %1
  %4 = add i32 %3, 1
  store i32 %4, i32* %0
  %5 = load i32, i32* %1
  ret i32 %5
}

$ opt --load-pass-plugin=StrictOpt.so \
      --passes="function(strict-opt)" \
      -S -o - test.ll

$ opt -O3 --enable-new-pm \
      --load-pass-plugin=StrictOpt.so \
      -S -o - test.ll

#include "llvm/IR/PassManager.h"
struct StrictOpt : public Function IR unit. The run method is the primary entry point for this Pass, which we are going to fill in later. It takes two arguments: a Function class that we will work on and a FunctionAnalysisManager class that can give you analysis data. It returns a PreservedAnalyses instance, which tells PassManager (and AnalysisManager) what analysis data was *invalidated* by this Pass.If you have prior experience in writing LLVM Pass for the *legacy* PassManager, you might find several differences between the legacy Pass and the new Pass:a) The Pass class no longer derives from one of the `FunctionPass`, `ModulePass`, or `LoopPass`. Instead, the Passes running on different IR units are all deriving from `PassInfoMixin<YOUR_PASS>`. In fact, deriving from `PassInfoMixin` is *not* even a requirement for a functional Pass anymore – we will leave this as an exercise for you.b) Instead of *overriding* methods, such as `runOnFunction` or `runOnModule`, you will define a normal class member method, `run` (be aware that `run` does *not* have an `override` keyword that follows), which operates on the desired IR unit.Overall, the new Pass has a cleaner interface compared to the legacy one. This difference also allows the new PassManager to have less overhead runtime.

#include "StrictOpt.h"
using namespace llvm;
/// Entry point of the pass for one function. This version does nothing yet
/// and reports every analysis as preserved.
PreservedAnalyses StrictOpt::run(Function &F,
                          FunctionAnalysisManager &FAM) {
  return PreservedAnalyses::all(); // Just a placeholder
}

// Inside StrictOpt::run…
bool Modified = false;
for (auto &Arg : F.args() method of the Function class will return a range of Argument instances representing all of the formal parameters. We check each of their types to make sure there isn't an existing noalias attribute (which is represented by the Attribute::NoAlias enum). If everything looks good, we use addAttr to attach noalias. Here, the `Modified` flag records whether any of the arguments were modified in this function. We will use this flag shortly.

#include "llvm/Analysis/AliasAnalysis.h"
…
// Inside StrictOpt::run…
auto PA = PreservedAnalyses instance, PA, which represents *all analyses*. Then, if the Function class we are working on here has been modified, we *discard* the AAManager analysis via the abandon method. AAManager represents the noalias attribute we are discussing here has strong relations with this analysis since they're working on a nearly identical problem. Therefore, if any new noalias attribute was generated, all the cached alias analysis data would be outdated. This is why we invalidate it using abandon.Note that you can always return a `PreservedAnalyses::none()` instance, which tells AnalysisManager to mark *every* analysis as outdated if you are not sure what analyses have been affected. This comes at a cost, of course, since AnalysisManager then needs to spend extra effort to recalculate the analyses that might contain expensive computations.

extern "C" ::llvm::PassPluginLibraryInfo instance, which contains various piecesLLVM_PLUGIN_API_VERSION) and the Pass name (StrictOpt). One of its most important fields is a lambda function that takes a single PassBuilder& argument. In that particular function, we are going to insert our StrictOpt into a proper position within the Pass pipeline.`PassBuilder`, as its name suggests, is an entity LLVM that is used to build the Pass pipeline. In addition to its primary job, which involves configuring the pipeline according to the optimization level, it also allows developers to insert Passes into some of the places in the pipeline. Furthermore, to increase its flexibility, `PassBuilder` allows you to specify a *textual* description of the pipeline you want to run by using the `--passes` argument on `opt`, as we have seen previously. For instance, the following command will run `InstCombine`, `PromoteMemToReg`, and `SROA` (`opt` will run our Pass if `strict-opt` appears in the `--passes` argument, as follows:

…
[](PassBuilder &PB) {
  using PipelineElement = typename PassBuilder::PipelineElement;
  PB.registerPipelineParsingCallback method takes another lambda callback as the argument. This callback is invoked whenever PassBuilder encounters an unrecognized Pass name while parsing the textual pipeline representation. Therefore, in our implementation, we simply insert our StrictOpt pass into the pipeline via FunctionPassManager::addPass when the unrecognized Pass name, that is, the Name parameter, is strict-opt.

$ opt -O2 --enable-new-pm \
      --enable-new-pm flag in the preceding command forced opt to use the new PassManager since it's still using the legacy one by default. We haven't used this flag before because --passes implicitly enables the new PassManager under the hood.)To do this, instead of using `PassBuilder::registerPipelineParsingCallback` to register a custom (pipeline) parser callback, we are going to use `registerPipelineStartEPCallback` to handle this. Here is the alternative version of the code snippet from the previous step:

// Sample input for HaltAnalyzer: my_halt() is called at the top of the
// `x < 43` branch, ahead of the nested if/else.
int foo(int x, int y) {
  if (x < 43) {
    my_halt(); // the call site the analyzer looks for
    if (y > 45)
      return x + 1;
    else {
      bar();
      return x;
    }
  } else {
    return y; // this branch does not pass through my_halt()
  }
}

$ opt --enable-new-pm --load-pass-plugin ./HaltAnalyzer.so \
      --disable-output ./test.ll
[WARNING] Unreachable BB: label %if.else
[WARNING] Unreachable BB: label %if.then2
$

class HaltAnalyzer : public PassInfoMixin<HaltAnalyzer> {
  static constexpr const char* HaltFuncName = "my_halt";
  // All the call sites to "my_halt"
  SmallVector<Instruction*, 2> run method that we saw in the previous section, we are creating an additional method, findHaltCalls, which will collect all of the Instruction calls to my_halt in the current function and store them inside the Calls vector.

void HaltAnalyzer::findHaltCalls(Function &F) {
  Calls.clear();
  for (auto &I : llvm::instructions to iterate through every Instruction call in the current function and check them one by one. If the Instruction call is a CallInst – representing a typical function call site – and the callee name is my_halt, we will push it into the Calls vector for later use.Function name manglingBe aware that when a line of C++ code is compiled into LLVM IR or native code, the name of any symbol – including the function name – will be different from what you saw in the original source code. For example, a simple function that has the name of *foo* and takes no argument might have *_Z3foov* as its name in LLVM IR. We call such a transformation in C++ **name mangling**. Different platforms also adopt different name mangling schemes. For example, in Visual Studio, the same function name becomes *?foo@@YAHH@Z* in LLVM IR.

#include "llvm/IR/Dominators.h"
…
PreservedAnalyses
HaltAnalyzer::run(Function &F, FunctionAnalysisManager type argument to retrieve specific analysis data (in this case, DominatorTree) for a specific Function class.Although, so far, we have (kind of) used the words *analysis* and *analysis data* interchangeably, in a real LLVM implementation, they are actually two different entities. Take the DT that we are using here as an example:a) `Function`. In other words, it is the one that *performs* the analysis.b) `DominatorTreeAnalysis`. This is just static data that will be cached by AnalysisManager until it is invalidated.Furthermore, LLVM asks every analysis to clarify its affiliated result type via the `Result` member type. For example, `DominatorTreeAnalysis::Result` is equal to `DominatorTree`.To make this even more formal, to associate the analysis data of an analysis class, `T`, with a `Function` variable, `F`, we can use the following snippet:

PreservedAnalyses
HaltAnalyzer::run(Function &F, FunctionAnalysisManager &FAM) {
  …
  SmallVector<BasicBlock*, 4> DomBBs;
  for (auto *I : Calls) {
    auto *BB = I->getParent();
    DomBBs.clear();
    DT.DominatorTree::getDescendants method, we can retrieve all of the basic blocks dominated by a my_halt call site. Note that the results from getDescendants will also contain the block you put into the query (in this case, the block containing the my_halt call sites), so we need to exclude it before printing the basic block name using the BasicBlock::printAsOperand method.With the ending of the returning `PreservedAnalyses::all()`, which tells AnalysisManager that this Pass does not invalidate any analysis since we don't modify the IR at all, we will wrap up the `HaltAnalyzer::run` method here.

extern "C" ::llvm::PassPluginLibraryInfo LLVM_ATTRIBUTE_WEAK
llvmGetPassPluginInfo() {
  return {
    LLVM_PLUGIN_API_VERSION, "HaltAnalyzer", "v0.1",
    [](PassBuilder &PB) {
      using OptimizationLevel
        = typename PassBuilder::OptimizationLevel;
      PB.StrictOpt in the previous section, we are using registerOptimizerLastEPCallback to insert HaltAnalyzer *after* all of the other optimization Passes. The rationale behind this is that some optimizations might move basic blocks around, so prompting warnings too early might not be very useful. Nevertheless, we are still leveraging ModuletoFunctionPassAdaptor to wrap around our Pass; this is because registerOptimizerLastEPCallback only provides ModulePassManager for us to add our Pass, which is a function Pass.

/* Returns x multiplied by 4.
 * The copy into the local `y` is redundant; it is kept so the unoptimized
 * IR contains a stack slot for `y` that later passes can be seen removing. */
int bar(int x) {
  int y = x;
  return y * 4;
}
/* Returns y + y * 2.
 * The parameter is named `y` so that this source agrees with the IR listing
 * for @foo shown with the bisect output, which uses %y / %y.addr. */
int foo(int y) {
  return y + y * 2;
}

$ clang -O0 -Xclang -disable-O0-optnone -emit-llvm -S test.c

$ opt -O2 --disable-output --debug-pass-manager test.ll
Starting llvm::Module pass manager run.
…
Running pass: Annotation2MetadataPass on ./test.ll
Running pass: ForceFunctionAttrsPass on ./test.ll
…
Starting llvm::Function pass manager run.
Running pass: SimplifyCFGPass on bar
Running pass: SROA on bar
Running analysis: DominatorTreeAnalysis on bar
Running pass: EarlyCSEPass on bar
…
Finished llvm::Function pass manager run.
…
Starting llvm::Function pass manager run.
Running pass: SimplifyCFGPass on foo
…
Finished llvm::Function pass manager run.
Invalidating analysis: VerifierAnalysis on ./test.ll
…
$

$ opt -O2 --disable-output --print-changed ./test.ll
*** IR Dump At Start: ***
...
define dso_local i32 @bar(i32 %x) #0 {
entry:
  %x.addr = alloca i32, align 4
  %y = alloca i32, align 4
  …
  %1 = load i32, i32* %y, align 4
  %mul = mul nsw i32 %1, 4
  ret i32 %mul
}
...
*** IR Dump After VerifierPass (module) omitted because no change ***
…
...
*** IR Dump After SROA *** (function: bar)
; Function Attrs: noinline nounwind uwtable
define dso_local i32 @bar(i32 %x) #0 {
entry:
  %mul = mul nsw i32 %x, 4
  ret i32 %mul
}
...
$

$ opt -O2 --disable-output \
          --print-changed --filter-print-funcs=foo ./test.ll

$ opt -O2 --disable-output \
          --print-changed \
          --filter-passes=SROA,InstCombinePass ./test.ll

$ opt -O2 --opt-bisect-limit=5 -S -o - test.ll
BISECT: running pass (1) Annotation2MetadataPass on module (./test.ll)
BISECT: running pass (2) ForceFunctionAttrsPass on module (./test.ll)
BISECT: running pass (3) InferFunctionAttrsPass on module (./test.ll)
BISECT: running pass (4) SimplifyCFGPass on function (bar)
BISECT: running pass (5) SROA on function (bar)
BISECT: NOT running pass (6) EarlyCSEPass on function (bar)
BISECT: NOT running pass (7) LowerExpectIntrinsicPass on function (bar)
BISECT: NOT running pass (8) SimplifyCFGPass on function (foo)
BISECT: NOT running pass (9) SROA on function (foo)
BISECT: NOT running pass (10) EarlyCSEPass on function (foo)
...
define dso_local i32 @bar(i32 %x) #0 {
entry:
  %mul = mul nsw i32 %x, 4
  ret i32 %mul
}
define dso_local i32 @foo(i32 %y) #0 {
entry:
  %y.addr = alloca i32, align 4
  store i32 %y, i32* %y.addr, align 4
  %0 = load i32, i32* %y.addr, align 4
  %1 = load i32, i32* %y.addr, align 4
  %mul = mul nsw i32 %1, 2
  %add = add nsw i32 %0, %mul
  ret i32 %add
}
$

$ ninja opt clang

$ sudo apt install graphviz

/* Returns a - b when a is positive, and a + b otherwise.
 * The subtraction must use the ASCII '-' character; a typographic dash is
 * not a valid operator. */
int foo(int a, int b) {
  return a > 0 ? a - b : a + b;
}

$ clang -emit-llvm -S foo.c

<result> = <operator / op-code> <type>, [operand1, operand2, …]

%12 = load i32, i32* %3

// `BB` has the type of `BasicBlock&`
for (Instruction &I : BB) {
  // Work on `I`
}

// `F` has the type of `Function&`
for (BasicBlock &BB : F) {
  for (Instruction &I : BB) {
    // Work on `I`
  }
}

#include "llvm/IR/InstIterator.h"
…
// `F` has the type of `Function&`
for (Instruction &I : instructions(F)) {
  // Work on `I`
}

for (Instruction &I : instructions(F)) {
  // `getOpcode()` yields an opcode enumerator such as `Instruction::Add`
  // or `Instruction::Ret`. Instruction *class* names (`BinaryOperator`,
  // `ReturnInst`) are not opcodes and cannot be used as case labels.
  switch (I.getOpcode()) {
  case Instruction::Add:
  case Instruction::Sub:
    // this instruction is a binary operator like `add` or `sub`
    break;
  case Instruction::Ret:
    // this is a return instruction
    break;
  …
  }
}

#include "llvm/IR/InstVisitor.h"
/// Visitor with one callback per instruction kind of interest.
/// `InstVisitor` is a CRTP base that calls the `visit*` members on the
/// derived object, so those members have to be accessible from the base
/// class, hence the `public:` section.
class MyInstVisitor : public InstVisitor<MyInstVisitor> {
public:
  /// Called for every binary operator instruction that is visited.
  void visitBinaryOperator(BinaryOperator &BOp) {
    // Work on binary operator instruction
    …
  }
  /// Called for every return instruction that is visited.
  void visitReturnInst(ReturnInst &RI) {
    // Work on return instruction
    …
  }
};

// `F` has the type of `Function&`
MyInstVisitor Visitor;
Visitor.visit(F);

$ opt -dot-cfg -disable-output foo.ll

$ dot -Tpng foo.cfg.dot > foo.cfg.png

#include "llvm/ADT/PostOrderIterator.h"
#include "llvm/IR/CFG.h"
// `F` has the type of `Function*`
for (BasicBlock *BB : post_order(F)) {
  BB->printAsOperand(errs());
  errs() << "\n";
}

label %12
label %9
label %5
label %7
label %3
label %10
label %1

// `F` has the type of `Function*`
BasicBlock &EntryBB = F->getEntryBlock();
for (BasicBlock *BB : post_order(&EntryBB)) {
  BB->printAsOperand(errs());
  errs() << "\n";
}

#include "llvm/ADT/DepthFirstIterator.h"
#include "llvm/IR/CFG.h"
// `F` has the type of `Function*`
for (BasicBlock *BB : depth_first(F)) {
  BB->printAsOperand(errs());
  errs() << "\n";
}

label %1
label %3
label %5
label %9
label %12
label %7
label %10

label %1
label %3
label %10
label %5
label %7
label %12
label %9

#include "llvm/ADT/SCCIterator.h"
#include "llvm/IR/CFG.h"
// `F` has the type of `Function*`
// `F` is already a `Function*`, so it is handed to `scc_begin` directly;
// taking its address would produce a `Function**`.
for (auto SCCI = scc_begin(F); !SCCI.isAtEnd(); ++SCCI) {
  // Each step of the iterator yields the basic blocks of one SCC.
  const std::vector<BasicBlock*> &SCC = *SCCI;
  for (auto *BB : SCC) {
    BB->printAsOperand(errs());
    errs() << "\n";
  }
  // Separator between two SCCs in the printed output.
  errs() << "====\n";
}

label %6
====
label %4
label %2
====
label %1
====

#include "llvm/Analysis/CallGraph.h"
/// Module pass that builds a call graph for the module and prints the name
/// of every function that has a node in it.
struct SimpleIPO : public PassInfoMixin<SimpleIPO> {
  PreservedAnalyses run(Module &M, ModuleAnalysisManager &MAM) {
    CallGraph CG(M);
    for (auto &Node : CG) {
      // Print function name; the key may be null, so it is checked first.
      if (Node.first)
        errs() << Node.first->getName() << "\n";
    }
    // Nothing in the IR is modified, so every analysis stays valid.
    return PreservedAnalyses::all();
  }
};

/// Generic distance helper: for a type `T` that supports subtraction, the
/// distance is simply `PointA - PointB`.
template <typename T>
struct Distance {
  /// Operands are taken by const reference so that lvalues as well as
  /// temporaries and literals (e.g. `compute(94, 87)`) are accepted.
  /// @return the result of `PointA - PointB`.
  static T compute(const T &PointA, const T &PointB) {
    return PointA - PointB;
  }
};

Distance<int>::compute(94, 87); // Success
…
struct SimplePoint {
  float X, Y;
};
SimplePoint A, B;
Distance<SimplePoint>::compute(A, B); // Compilation Error

// After the original declaration of struct Distance…
template<>
struct Distance<SimplePoint> {
  SimplePoint compute(SimplePoint &A, SimplePoint &B) {
    return std::sqrt(std::pow(A.X – B.X, 2),…);
  }
};
…
SimplePoint A, B;
Distance<SimplePoint>::compute(A, B); // Success

template<>
struct GraphTraits<Function*> {…}

template<>
struct GraphTraits<Function*> {
  typedef pointer_iterator<Function::iterator> nodes_iterator;
  static node_iterator nodes_begin(Function *F) {
    return nodes_iterator(F->begin());
  }
  …
};

template<>
struct GraphTraits<CallGraph*> {
  typedef mapped_iterator<CallGraph::iterator, 
  decltype(&CGGetValuePtr)> nodes_iterator;
  static node_iterator nodes_begin(CallGraph *CG) {
    return nodes_iterator(CG->begin(), &CGGetValuePtr);
  }
};

template<class GraphTy,
         typename GT = GraphTraits<GraphTy>>
  auto find_tail(GraphTy G) {
  for(auto NI = GT::nodes_begin(G); NI != GT::nodes_end(G);    ++NI) {
    // A node in this graph
    auto Node = *NI;
    // Child iterator for this particular node
    auto ChildIt = GT::child_begin(Node);
    auto ChildItEnd = GT::child_end(Node);
    if (ChildIt == ChildItEnd)
      // No child nodes
      return Node;
  }
  …
}

// `F` has the type of `Function*`
BasicBlock *TailBB = find_tail(F);
// `CG` has the type of `CallGraph*`
CallGraphNode *TailCGN = find_tail(CG);

// the following code is NOT in SSA form
x = 94;
x = 87; // `x` is assigned the second time, not SSA!

x = 94;
y = x + 4; // first time `x` is used
z = x + 2; // second time `x` is used

x = 94;
x = x * y; // `x` is assigned more than once, not SSA!
x = x + 5;

x0 = 94;
x1 = x0 * y;
x2 = x1 + 5;

// let's say `I` represents an instruction `x = a + b`
Instruction *I = …;
Value *V = I; // `V` effectively represents the value `x`

Instruction *BinI = BinaryOperator::Create(Instruction::Add,…);
Instruction *RetI = ReturnInst::Create(…, BinI, …);

x = a + b;
return x;

// `Usr` has the type of `User*`
for (Value *V : Usr->operand_values()) {
  // Working with `V`
}

void vulnerable() {
  v = get_password();
  …
  bar(v); // WARNING: sensitive information leak to `bar`!
}

User *find_leakage(CallInst *GetPWDCall) {
  // Scan everything that uses the value produced by `GetPWDCall` and
  // return the first user that is itself a call instruction.
  for (User *Consumer : GetPWDCall->users()) {
    if (!isa<CallInst>(Consumer))
      continue;
    return Consumer;
  }
  …
}

// `V` has the type of `Value*`
for (User *Usr : V->users()) {
  // Working with `Usr`
}

class Parent {…};
class Child1 : public Parent {…};
class Child2 : public Parent {…};
// Demonstrates a checked downcast with the standard `dynamic_cast`.
// NOTE(review): this requires `Parent` to be a polymorphic type; its body is
// elided here, so confirm it declares at least one virtual function.
void foo() {
  Parent *P = new Child1();
  Child1 *C = dynamic_cast<Child1*>(P); // OK
  Child2 *O = dynamic_cast<Child2*>(P); // Fails at runtime: `P` does not point to a `Child2`, so `O` is null
}

// `I` has the type of `Instruction*`
if (isa<BinaryOperator>(I)) {
  // `I` can be casted to `BinaryOperator*`
}

// `I` has the type of `Instruction*`
if (isa<BinaryOperator>(I)) {
  BinaryOperator *BinOp = cast<BinaryOperator>(I);
}

// `I` has the type of `Instruction*`
if (BinaryOperator *BinOp = dyn_cast<BinaryOperator>(I)) {
  // Work with `BinOp`
}

Instruction *BinI = BinaryOperator::Create(…);
Instruction *RetI = ReturnInst::Create(…, BinI, …);

Instruction *BinOp will be placed before the one represented by BeforeI. This method, however, can't be ported across different instruction classes. Not every instruction class has factory methods that provide this feature and even if they do provide them, the API might not be the same.

// `BB` has the type of `BasicBlock*`
IRBuilder instance, we need to designate an *insertion point* as one of the constructor arguments. This insertion point argument can be a BasicBlock, which means we want to insert a new instruction at the end of BasicBlock; it can also be an Instruction instance, which means that new instructions are going to be inserted *before* that specific Instruction. You are encouraged to use `IRBuilder` over other mechanisms if possible whenever you need to create and insert new instructions in sequential order.

void replacePow2Mul(BinaryOperator &Mul) {
  // Find the operand that is a power-of-2 integer constant:
  // index 0 when the first operand is a ConstantInt, index 1 otherwise.
  int ConstIdx = 1;
  if (isa<ConstantInt>(Mul.getOperand(0)))
    ConstIdx = 0;
  ConstantInt *ShiftAmount = getLog2(Mul.getOperand(ConstIdx));
}

void replacePow2Mul(BinaryOperator &Mul) {
  …
  // The operand to be shifted sits at the index opposite to `ConstIdx`
  const unsigned OtherIdx = ConstIdx ? 0 : 1;
  Value *Base = Mul.getOperand(OtherIdx);
  // Build the left-shift with a builder positioned at `Mul`
  IRBuilder<> Builder(&Mul);
  auto *Shl = Builder.CreateShl(Base, ShiftAmount);
}

void replacePow2Mul(BinaryOperator &Mul) {
  …
  // Using `replaceAllUsesWith` to update users of `Mul`
  Mul.Mul are using Shl instead. Thus, we can safely remove Mul from the program.

// `BB` has the type of `BasicBlock&`
// Replaces each qualifying multiplication as soon as it is found.
// NOTE(review): if `replacePow2Mul` inserts into or erases from `BB`, doing
// so while `BB` is being iterated is hazardous -- confirm before relying on
// this form.
for (Instruction &I : BB) {
  if (auto *BinOp = dyn_cast<BinaryOperator>(&I)) {
    if (isMulWithPowerOf2(BinOp))
      // `replacePow2Mul` takes a `BinaryOperator&`, so dereference the pointer.
      replacePow2Mul(*BinOp);
  }
}

// `BB` has the type of `BasicBlock&`
// Candidates are collected first and rewritten afterwards, so the block is
// not modified while it is being iterated.
std::vector<BinaryOperator*> Worklist;
// Only perform the feasibility check
for (auto &I : BB) {
  if (auto *BinOp = dyn_cast<BinaryOperator>(&I)) {
    if (isMulWithPowerOf2(BinOp)) Worklist.push_back(BinOp);
  }
}
// Replace the target instructions at once
for (auto *BinOp : Worklist) {
  // `replacePow2Mul` takes a `BinaryOperator&`, so dereference the pointer.
  replacePow2Mul(*BinOp);
}

#include "llvm/Analysis/LoopInfo.h"
…
// Function pass entry point that obtains loop information for `F` from the
// analysis manager and walks the loops it exposes.
PreservedAnalyses run(Function &F, FunctionAnalysisManager &FAM) {
  LoopInfo &LI = FAM.getResult<LoopAnalysis>(F);
  // `LI` is the loop information computed for `F`.
  // NOTE(review): iterating `LI` directly appears to visit only the
  // outermost loops; nested loops would be reached through each `Loop`
  // -- confirm against the LoopInfo documentation.
  for (Loop *LP : LI) {
    // Working with one of the loops, `LP`
  }
  …
}

for (int i = 0; i < 87; ++i){…}

// `N` is not a constant
for (int i = 0; i < N; ++i){…}

if (i < N) {
  do {
    …
    ++i;
  } while(i < N);
}

PreservedAnalyses run(<IR unit class> &Unit,
                      <IR unit>AnalysisManager &AM);

PreservedAnalyses run(Loop &LP, LoopAnalysisManager &LAM,
                      LoopStandardAnalysisResults &LAR,
                      LPMUpdater &U);

PreservedAnalyses run(Loop &LP, LoopAnalysisManager &LAM,
                      LoopStandardAnalysisResults &LAR,
                      LPMUpdater &U) {
  …
  LoopNest &LN = LAM.getResult<LoopNestAnalysis>(LP, LAR);
  …
}

// `LP` has the type of `Loop&`
for (Loop *SubLP : LP) {
  // `SubLP` is one of the sub-loops at the next layer
}

#include "llvm/Analysis/LoopInfo.h"
#include "llvm/ADT/DepthFirstIterator.h"
…
// `RootL` has the type of `Loop*`
for (GraphTraits, we can have more flexibility when it comes to traversing a loop tree.

// Perfect loops
for(int i=…) {
  for(int j=…){…}
}
// Non-perfect loops
for(int x=…) {
  foo call site is the gap between the upper and lower loops. Perfect loops are preferable in many loop optimizations. For example, it's easier to *unroll* perfectly nested loops – ideally, we only need to duplicate the body of the innermost loop.

$ ninja opt

/// Scans every instruction of `F` looking for integer multiplications.
PreservedAnalyses
SimpleMulOpt::run(Function &F, FunctionAnalysisManager &FAM) {
  for (auto &I : instructions(F)) {
    // A declaration used as an `if` condition cannot be combined with `&&`,
    // so the cast and the opcode test are performed as two separate steps.
    auto *BinOp = dyn_cast<BinaryOperator>(&I);
    if (!BinOp || BinOp->getOpcode() != Instruction::Mul)
      continue;
    auto *LHS = BinOp->getOperand(0),
         *RHS = BinOp->getOperand(1);
    // `BinOp` is a multiplication, `LHS` and `RHS` are its
    // operands, now trying to optimize this instruction…
    …
  }
  …
}

// (extracted from the previous snippet)
…
auto *LHS = BinOp->getOperand(0),
     *RHS = BinOp->getOperand(1);
errs() << "Found a multiplication with operands ";
LHS->printAsOperand(errs());
errs() << " and ";
RHS->printAsOperand(errs());
…

#include "llvm/Support/Debug.h"
#define DEBUG_TYPE "simple-mul-opt"
…
auto *LHS = BinOp->getOperand(0),
     *RHS = BinOp->getOperand(1);
LLVM_DEBUG(dbgs() << "Found a multiplication with operands ");
LLVM_DEBUG(LHS->printAsOperand(dbgs()));
LLVM_DEBUG(dbgs() << " and ");
LLVM_DEBUG(RHS->printAsOperand(dbgs()));
…

$ opt -O3 -debug -load-pass-plugin=… …

$ opt -O3 -debug-only=simple-mul-opt -load-pass-plugin=… …

$ opt -O3 -debug-only=sroa,simple-mul-opt -load-pass-plugin=… …

…
#define DEBUG_TYPE "simple-mul-opt"
auto *LHS = BinOp->getOperand(0),
     *RHS = BinOp->getOperand(1);
LLVM_DEBUG(dbgs() << "Found a multiplication instruction");
DEBUG_WITH_TYPE("simple-mul-opt-lhs",
               LHS->printAsOperand(dbgs() << "LHS operand: "));
DEBUG_WITH_TYPE("simple-mul-opt-rhs",
               RHS->printAsOperand(dbgs() << "RHS operand: "));
…

#define DEBUG_TYPE "simple-mul-opt"
/// Counts the multiplications found in `F` in a local counter and reports
/// the total through the debug stream.
PreservedAnalyses
SimpleMulOpt::run(Function &F, FunctionAnalysisManager &FAM) {
  unsigned NumMul = 0;
  for (auto &I : instructions(F)) {
    // A declaration used as an `if` condition cannot be combined with `&&`,
    // so the cast and the opcode test are performed as two separate steps.
    auto *BinOp = dyn_cast<BinaryOperator>(&I);
    if (!BinOp || BinOp->getOpcode() != Instruction::Mul)
      continue;
    ++NumMul;
    …
  }
  LLVM_DEBUG(dbgs() << "Number of multiplication: " << NumMul);
  …
}

#include "llvm/ADT/Statistic.h"
#define DEBUG_TYPE "simple-mul-opt"
STATISTIC(NumMul, "Number of multiplications processed");
/// Counts the multiplications found in `F` by incrementing `NumMul`, which
/// is declared outside this function.
PreservedAnalyses
SimpleMulOpt::run(Function &F, FunctionAnalysisManager &FAM) {
  for (auto &I : instructions(F)) {
    // A declaration used as an `if` condition cannot be combined with `&&`,
    // so the cast and the opcode test are performed as two separate steps.
    auto *BinOp = dyn_cast<BinaryOperator>(&I);
    if (!BinOp || BinOp->getOpcode() != Instruction::Mul)
      continue;
    ++NumMul;
    …
  }
  …
}

$ opt -stats --load-pass-plugin=… …
===-------------------------------===
      … Statistics Collected …
===-------------------------------===
87 simple-mul-opt - Number of multiplications processed
$

$ opt -stats --load-pass-plugin=… --passes="sroa,simple-mul-opt" …
===-------------------------------===
      … Statistics Collected …
===-------------------------------===
94  simple-mul-opt - Number of multiplications processed
87  simple-mul-opt - Number of none-power-of-two constant operands
100 sroa           - Number of alloca partition uses rewritten
34  sroa           - Number of instructions deleted
…
$

$ opt -stats -stats-json --load-pass-plugin=… …
{
        "simple-mul-opt.NumMul": 87
}
$

$ opt -stats -stats-json -info-output-file=my_stats.json …
$ cat my_stats.json
{
        "simple-mul-opt.NumMul": 87
}
$

/* Adds 2 to every third element of `a` below index N and returns the value
 * of a[5] as last read; a[5] is re-read on every iteration. */
int foo(int *a, int N) {
  int x = a[5];
  int i = 0;
  while (i < N) {
    a[i] += 2;
    /* reload inside the loop, after the store above */
    x = a[5];
    i += 3;
  }
  return x;
}

/* Adds 2 to every third element of `a` below index N, then returns a[5],
 * which is read once after the loop. */
int foo(int *a, int N) {
  int i = 0;
  while (i < N) {
    a[i] += 2;
    i += 3;
  }
  return a[5];
}

$ opt -licm input.ll --pass-remarks-output=licm_remarks.yaml …
$ cat licm_remarks.yaml
…
--- !Missed
Pass:            licm
Name:            LoadWithLoopInvariantAddressInvalidated
Function:        foo
Args:
  - String:          failed to move load with loop-invariant address because the loop may invalidate its value
...
$

…
// Looks for multiplications whose right-hand operand is a power-of-two
// integer constant. Only the RHS is examined here.
for (auto &I : instructions(F)) {
  if (auto *BinOp = dyn_cast<BinaryOperator>(&I))
    if (BinOp->getOpcode() == Instruction::Mul) {
      auto *LHS = BinOp->getOperand(0),
           *RHS = BinOp->getOperand(1);
      // Has no constant integer operand. The test has to be for
      // `ConstantInt` specifically: other kinds of `Constant` would make an
      // unchecked `cast<ConstantInt>` fail.
      auto *ConstRHS = dyn_cast<ConstantInt>(RHS);
      if (!ConstRHS) continue;
      const APInt &Const = ConstRHS->getValue();
      // Constant operand is not power of two
      if (!Const.isPowerOf2()) continue;
      …
    }
}

#include "llvm/Analysis/OptimizationRemarkEmitter.h"
PreservedAnalyses
SimpleMulOpt::run(Function &F, FunctionAnalysisManager &FAM) {
  OptimizationRemarkEmitter &ORE
    = FAM.getResult<OptimizationRemarkEmitterAnalysis>(F);
  …
}

#include "OptimizationRemarkEmitter::emit method takes a lambda function as the argument. This lambda function will be invoked to emit an optimization remark object if the optimization remark feature is turned on (via the –pass-remarks-output command-line option we've seen previously, for example).

; Test input with two multiplications: one by a non-power-of-two constant,
; and one whose power-of-two constant is the *first* (LHS) operand.
define i32 @bar(i32 %0) {
  %2 = mul nsw i32 %0, 3
  ; A value cannot be an operand of its own definition, so this consumes %2.
  %3 = mul nsw i32 8, %2
  ; `ret` needs the type of the returned value.
  ret i32 %3
}

$ opt --load-pass-plugin=… --passes="simple-mul-opt" \
      SimpleMulOpt bailed out because it couldn't find a constant operand on one of the (multiplication) instructions. The Args section shows a detailed reason for this.With this information, we realize that `SimpleMulOpt` is unable to optimize a multiplication whose *first* operand (LHS operand) is a power-of-two constant, albeit a proper optimization opportunity. Thus, we can now fix the implementation of `SimpleMulOpt` to check if *either* of the operands is constant, as follows:

You have now learned how to emit optimization remarks in an LLVM Pass and how to use the generated report to discover potential optimization opportunities.

/* Adds 2 to every third element of `a` below index N, then returns a[5]. */
int foo(int *a, int N) {
  if (N > 0) {
    /* at least one iteration is guaranteed here, so test at the bottom */
    int i = 0;
    do {
      a[i] += 2;
      i += 3;
    } while (i < N);
  }
  return a[5];
}

$ clang -O3 -foptimization-record-file is the command-line option used to generate an optimization remark file with the given filename.

$ opt-viewer.py --source-dir=$PWD \
--target-dir=licm_remark licm.remark.yaml

#include "llvm/Support/Timer.h"
…
Timer T("MyTimer", "A simple timer");
T.startTimer();
// Do some time-consuming works…
T.stopTimer();

Timer T(…);
…
TimeRecord TR = T.getTotalTime();
TR.print(TR, errs());

===---------------------------------------------------------===
                     Miscellaneous Ungrouped Timers
===---------------------------------------------------------===
   ---User Time---   --User+System--   ---Wall Time---  --- Name ---
   0.0002 (100.0%)   0.0002 (100.0%)   0.0002 (100.0%)  A simple timer
   0.0002 (100.0%)   0.0002 (100.0%)   0.0002 (100.0%)  Total
   0.0002 (100.0%)   0.0002 (100.0%)   0.0002 (100.0%)

TimerGroup TG("MyTimerGroup", "My collection of timers");
Timer T("MyTimer", "A simple timer", TG);
T.startTimer();
// Do some time-consuming works…
T.stopTimer();
Timer T2("MyTimer2", "Yet another simple timer", TG);
T2.startTimer();
// Do some time-consuming works…
T2.stopTimer();
TG.print(errs());

===---------------------------------------------------------===
                    My collection of timers
===---------------------------------------------------------===
  Total Execution Time: 0.0004 seconds (0.0004 wall clock)
   ---User Time---   --User+System--   ---Wall Time---  --- Name ---
   0.0002 ( 62.8%)   0.0002 ( 62.8%)   0.0002 ( 62.8%)  A simple timer
   0.0001 ( 37.2%)   0.0001 ( 37.2%)   0.0001 ( 37.2%)  Yet another simple timer
   0.0004 (100.0%)   0.0004 (100.0%)   0.0004 (100.0%)  Total

TimerGroup TG("MyTimerGroup", "My collection of timers");
{
  Timer T("MyTimer", "A simple timer", TG);
  TimeRegion TR(T);
  // Do some time-consuming works…
}
{
  Timer T("MyTimer2", "Yet another simple timer", TG);
  TimeRegion TR(T);
  // Do some time-consuming works…
}
TG.print(errs());

TimeTraceScope OuterTimeScope("TheOuterScope");
for (int i = 0; i < 50; ++i) {
  {
    TimeTraceScope InnerTimeScope("TheInnerScope");
    foo();
  }
  bar();
}

$ opt --passes="…" -time-trace -time-trace-file=my_trace.json …

$ clang -O3 -ftime-trace -c foo.c

#include "llvm/Support/Error.h"
#include <system_error>
// In the header file…
/// Custom error type reporting that a file could not be found.
/// The template argument of `ErrorInfo` must be this very class (CRTP).
struct FileNotFoundError : public ErrorInfo<FileNotFoundError> {
  /// Name of the missing file.
  /// NOTE(review): this is a non-owning `StringRef`; the caller presumably
  /// keeps the underlying string alive for as long as the error exists --
  /// confirm.
  StringRef FileName;
  explicit FileNotFoundError(StringRef Name) : FileName(Name) {}
  /// Identity tag referenced by the `ErrorInfo` machinery; defined in the
  /// CPP file.
  static char ID;
  /// Maps this error onto the matching standard error code. `std::errc` is
  /// an error *condition* enum, so it is converted explicitly.
  std::error_code convertToErrorCode() const override {
    return std::make_error_code(std::errc::no_such_file_or_directory);
  }
  /// Writes a human-readable message to `OS`.
  void log(raw_ostream &OS) const override {
    OS << FileName << ": No such file";
  }
};
// In the CPP file…
char FileNotFoundError::ID = 0;

Error NoSuchFileErr = make_error<FileNotFoundError>("foo.txt");

Program aborted due to an unhandled Error:
foo.txt: No such file

/// Opens `FileName` and reads it, returning a success value or a
/// `FileNotFoundError` when the file cannot be opened.
Error readFile(StringRef FileName) {
  // Bail out first when the file cannot be opened.
  if (!openFile(FileName))
    return make_error<FileNotFoundError>(FileName);
  // Success
  // Read the file content…
  return ErrorSuccess();
}

Error E = readFile(…);
if (E) {
  // TODO: Handle the error
} else {
  // Success!
}

Error E = readFile(…);
if (E) {
  // The handler is a lambda; its parameter type states which error type it
  // handles.
  Error UnhandledErr = handleErrors(
    std::move(E),
    [&](const FileNotFoundError &NotFound) {
      NotFound.log(errs() << "Error occurred: ");
      errs() << "\n";
    });
  …
}

/// Opens `FileName` and reads it. Returns `FileNotFoundError` when the file
/// cannot be opened, `FileEmptyError` when the buffer read is empty, and a
/// success value otherwise.
Error readFile(StringRef FileName) {
  // Bail out first when the file cannot be opened.
  if (!openFile(FileName))
    return make_error<FileNotFoundError>(FileName);
  // Success
  …
  if (Buffer.empty())
    return make_error<FileEmptyError>();
  return ErrorSuccess();
}

Error E = readFile(…);
if (E) {
  // First pass: handle one error type; anything else comes back as
  // `UnhandledErr`.
  Error UnhandledErr = handleErrors(
    std::move(E),
    [&](const FileNotFoundError &NotFound) {…});
  // Second pass: feed the leftover error to a handler for another type.
  UnhandledErr = handleErrors(
    std::move(UnhandledErr),
    [&](const FileEmptyError &IsEmpty) {…});
  …
}

Error E = readFile(…);
if (E) {
  // Several handlers can be passed in a single call; each lambda's
  // parameter type states which error type it handles.
  Error UnhandledErr = handleErrors(
    std::move(E),
    [&](const FileNotFoundError &NotFound) {…},
    [&](const FileEmptyError &IsEmpty) {…});
  …
}

Error E = readFile(…);
if (E) {
  switch (E) {
  case FileNotFoundError: …
  case FileEmptyError: …
  default:
    // generate the UnhandledError
  }
}

if (E) {
  Error UnhandledErr = handleErrors(
    std::move(E),
    & {…},
    & {…});
  UnhandledErr still contains an error, the cantFail function will abort the program execution and print an error message.

if (E) {
  handleAllErrors will still abort the program execution, just like what we have seen previously.

#include "llvm/Support/JSON.h"
 using namespace llvm;
…
// `InputStr` has the type of `StringRef`
Expected<json::Value> JsonOrErr = json::parse(InputStr);
if (JsonOrErr) {
  // Success!
  json::Value &Json = *JsonOrErr;
  …
} else {
  // Something goes wrong…
  Error Err = JsonOrErr.takeError();
  // Start to handle `Err`…
}

if (JsonOrErr) {
  // Success!
  …
} else {
  // Something goes wrong…
  if (JsonOrErr.errorIsA<FileNotFoundError>()) {
    …
  }
}

/// Opens `FileName` and returns its content, or a `FileNotFoundError` when
/// the file cannot be opened.
Expected<std::string> readFile(StringRef FileName) {
  // Failure path first.
  if (!openFile(FileName))
    return make_error<FileNotFoundError>(FileName);
  std::string Content;
  // Reading the file…
  return Content;
}

#include "llvm/Support/MemoryBuffer.h"
…
ErrorOr<std::unique_ptr<MemoryBuffer>> ErrOrBuffer
  = MemoryBuffer::getFile("foo.txt");
if (ErrOrBuffer) {
  // Success!
  std::unique_ptr<MemoryBuffer> &MB = *ErrOrBuffer;
} else {
  // Something goes wrong…
  std::error_code EC = ErrOrBuffer.getError();
  …
}

#include <system_error>
/// Opens `FileName` and returns its content, or the standard
/// "no such file or directory" error when the file cannot be opened.
ErrorOr<std::string> readFile(StringRef FileName) {
  // Failure path first.
  if (!openFile(FileName))
    return std::errc::no_such_file_or_directory;
  std::string Content;
  // Reading the file…
  return Content;
}

//Semicolon-separated list of projects to build…
LLVM_ENABLE_PROJECTS:STRING="clang;compiler-rt"

$ ninja clang compiler-rt opt llvm-profdata

/* Demo program with a deliberate stack buffer overflow: it stores every
 * command-line argument, converted to an integer, into a three-element
 * array and prints the stored values back. */
int main(int argc, char **argv) {
  int buffer[3];
  /* argc is not checked against the array size, so passing more than three
   * arguments writes past the end of `buffer`. */
  for (int i = 1; i < argc; ++i)
    buffer[i-1] = atoi(argv[i]);
  /* The read-back loop has the same missing bound. */
  for (int i = 1; i < argc; ++i)
    printf("%d ", buffer[i-1]);
  printf("\n");
  return 0;
}

$ clang -Wall buffer_overflow.c -o buffer_overflow
$ # No error or warning

$ ./buffer_overflow 1 2 3
1 2 3
$ ./buffer_overflow 1 2 3 4
Segmentation fault (core dumped)
$

$ clang -fsanitize=address buffer_overflow.c -o san_buffer_overflow

$ ./san_buffer_overflow 1 2 3
1 2 3
$ ./san_buffer_overflow 1 2 3 4
=================================================================
==137791==ERROR: AddressSanitizer: stack-buffer-overflow on address 0x7ffea06bccac at pc 0x0000004f96df bp 0x7ffea06bcc70…
WRITE of size 4 at 0x7ffea06bccac thread T0
…
  This frame has 1 object(s):
    [32, 44) 'buffer' <== Memory access at offset 44 overflows this variable
…
==137791==ABORTING
$

/* Walks indices S, S+ST, ... below E and copies a[i + 1] into a[i]. */
void foo(int S, int E, int ST, int *a) {
  int i = S;
  while (i < E) {
    a[i] = a[i + 1];
    i += ST;
  }
}
/* Driver for the loop-counter sanitizer demo.
 * Usage: <program> <start> <end> <step>
 * Returns 1 when fewer than three arguments are supplied, 0 otherwise. */
int main(int argc, char **argv) {
  /* argv[1..3] are read below, so all three must be present. */
  if (argc < 4)
    return 1;
  int start = atoi(argv[1]),
      end = atoi(argv[2]),
      step = atoi(argv[3]);
  /* Zero-initialized so that foo() never reads indeterminate values. */
  int a[100] = {0};
  /* NOTE(review): foo() reads a[i + 1], so any run that reaches i == 99
   * (e.g. end == 100) reads one element past `a`, and a non-positive step
   * never terminates. Left as is because the documented sample runs depend
   * on these arguments -- confirm whether the array should be enlarged. */
  foo(start, end, step, a);
  return 0;
}

$ clang -O1 -fsanitize=loop-counter test_lpcsan.c -o test_lpcsan

$ ./test_lpcsan 0 100 1
==143813==INFO: Found a loop with trip count 100
$ ./test_lpcsan 0 50 2
==143814==INFO: Found a loop with trip count 25
$

struct LoopCounterSanitizer
  : public PassInfoMixin<LoopCounterSanitizer> {
  PreservedAnalyses run(Loop&, LoopAnalysisManager&,
                        LoopStandardAnalysisResults&, 
                        LPMUpdater&);
private:
  // Sanitizer functions
  LPCSetStartFn and LPCAtEndFn memory variables – they will store the Function instances that collect loop trip counts (FunctionCallee is a thin wrapper around Function that provides additional function signature information).

PreservedAnalyses
LoopCounterSanitizer::run(Loop &LP, LoopAnalysisManager &LAM, LoopStandardAnalysisResults &LSR, LPMUpdater &U) {
  initializeSanitizerFuncs method in the preceding code will populate LPCSetStartFn and LPCAtEndFn. Before we go into the details of initializeSanitizerFuncs, let's talk more about LPCSetStartFn and LPCAtEndFn.

void foo(int S, int E, int ST) {
  for (int i = S; i < E; i += ST) {
    …
  }
}

void foo(int S, int E, int ST) {
  for (int i = S; i < E; i += ST) {
    lpc_set_start and lpc_at_end in the preceding code are Function instances that are stored in LPCSetStartFn and LPCAtEndFn, respectively. Here is one of the possible (pseudo) implementations of these two functions:

void LoopCounterSanitizer::initializeSanitizerFuncs(Loop &LP) {
  Module &M = *LP.getHeader()->getModule();
  auto &Ctx = M.getContext();
  Type *VoidTy = Type::__lpcsan_set_loop_start and __lpcsan_at_loop_end, from the module and storing their Function instances in LPCSetStartFn and LPCAtEndFn, respectively.The `Module::getOrInsertFunction` method either grabs the `Function` instance of the given function name from the module or creates one if it doesn't exist. If it's a newly created instance, it has an empty function body; in other words, it only has a function *declaration*.It is also worth noting that the second argument of `Module::getOrInsertFunction` is the return type of the `Function` inquiry. The rest (the arguments for `getOrInsertFunction`) represent the argument types of that `Function`.With `LPCSetStartFn` and `LPCAtEndFn` set up, let's see how we can insert them into the right place in IR.

PreservedAnalyses
LoopCounterSanitizer::run(Loop &LP, LoopAnalysisManager &LAM, LoopStandardAnalysisResults &LSR, LPMUpdater &U) {
  initializeSanitizerFuncs(LP);
  Loop::getBounds from the preceding code returned an Optional<LoopBounds> instance. The Optional<T> class is a useful container that either stores an instance of the T type or is *empty*. You can think of it as a replacement for the T* to represent a computation result where a null pointer means an empty value. However, this has the risk of dereferencing a null pointer if the programmer forgets to check the pointer first. The Optional<T> class doesn't have this problem.With a `LoopBounds` instance, we can retrieve the induction variable's range and store it in the `StartVal`, `EndVal`, and `StepVal` variables.

BasicBlock *ExitBlock = LP.__lpcsan_at_loop_end at the beginning of the *exit block*. This is because we can always expect the end value and the step value of the induction variable being defined before we leave the loop.These are all the implementation details for the `LoopCounterSanitizer` pass.

/* For each index from S up to (but excluding) E, in steps of ST, overwrites
 * the element with its right-hand neighbour. */
void foo(int S, int E, int ST, int *a) {
  for (int idx = S; idx < E; idx += ST)
    a[idx] = *(a + idx + 1);
}

define void @foo(i32 %S, i32 %E, i32 %ST, i32* %a) {
  %cmp9 = icmp slt i32 %S, %E
  br i1 %cmp9, label %for.body.preheader, label %for.cond.cleanup
for.body.preheader:  
  %0 = sext i32 %S to i64
  %1 = sext i32 %ST to i64
  %2 = sext i32 %E to i64
  br label %for.body
…
for.body:                                         
  %indvars.iv = phi i64 [ %0, %for.body.preheader ], [   %indvars.iv.next, %for.body ]
  …
  %indvars.iv.next = add i64 %indvars.iv, %1
  %cmp = icmp slt i64 %indvars.iv.next, %2
  br i1 %cmp, label %for.body, label %for.cond.cleanup
}

$ opt -S --passes="loop(lpcsan)" input.ll -o -

declare void @__lpcsan_set_loop_start(i32)
declare void @__lpcsan_at_loop_end(i32, i32)
define void @foo(i32 %S, i32 %E, i32* %a) {
  %cmp8 = icmp slt i32 %S, %E
  br i1 %cmp8, label %for.body.preheader, label %for.cond.cleanup
for.body.preheader: 
  %0 = sext i32 %S to i64
  %wide.trip.count = sext i32 %E to i64
  br label %for.body
for.cond.cleanup.loopexit:                        
  %1 = trunc i64 %wide.trip.count to i32
  call void @__lpcsan_at_loop_end(i32 %1, i32 1)
  br label %for.cond.cleanup
for.body:
  …
  %3 = trunc i64 %0 to i32
  call void @__lpcsan_set_loop_start(i32 %3)
  br i1 %exitcond.not, label %for.cond.cleanup.loopexit, label    %for.body
}

typedef int v4si __attribute__((__vector_size__(16)));
v4si v1 = (v4si){1, 2, 3, 4};
v4si v2 = (v4si){5, 6, 7, 8};
v4si v3 = v1 + v2; // = {6, 8, 10, 12}

#include "sanitizer_common/sanitizer_common.h"
#include "sanitizer_common/sanitizer_internal_defs.h"
using namespace __sanitizer;
extern "C" SANITIZER_INTERFACE_ATTRIBUTE
void s32 – available under the __sanitizer namespace – for a signed 32-bit integer rather than the normal int. The rationale behind this is that we might need to build Compiler-RT libraries for different hardware architectures or platforms, and the width of int might not be 32 bits on some of them. Second, although we are using C++ to implement our instrumentation functions, we need to expose them as C functions because C functions have a more stable ABI. Therefore, please make sure to add `extern "C"` to functions you want to export. The `SANITIZER_INTERFACE_ATTRIBUTE` macro also ensures that the function will be exposed at the library interface correctly, so please add this as well.

static CurLoopStart is a global variable that memorizes the *initial* induction variable value of the current loop. This is updated by __lpcsan_set_loop_start. Recall that when a loop is complete, `__lpcsan_at_loop_end` will be invoked. When that happens, we use the value stored in `CurLoopStart` and the `end` and `step` arguments to calculate the exact trip count of the current loop, before printing the result.

…
set(LPCSAN_RTL_SOURCES
    lpcsan.cpp)
CMakeLists.txt. Here are some highlights: i. Compiler-RT creates its own set of CMake macros/functions. Here, we are using two of them, `add_compiler_rt_component` and `add_compiler_rt_runtime`, to create a pseudo build target for the entire LPCSan and the real library build target, respectively. ii. Different from a conventional build target, if a sanitizer wants to use supporting/utility libraries in Compiler-RT – for example, `RTSanitizerCommon` in the preceding code – we usually link against their *object files* rather than their library files. More specifically, we can use the `$<TARGET_OBJECTS:…>` directive to import supporting/utility components as one of the input sources. iii. A sanitizer library can support multiple architectures and platforms. In Compiler-RT, we are enumerating all the supported architectures and creating a sanitizer library for each of them. Again, the preceding snippet is just a small part of our build script. Please refer to our sample code folder for the complete `CMakeLists.txt` file.

$ ninja lpcsan

…
// Shadow Call Stack
SANITIZER("shadow-call-stack", ShadowCallStack)
// Loop Counter Sanitizer
LoopCounter, to the SanitizerKind class. It turns out that the driver will parse the `-fsanitize` command-line option and *automatically* translate `loop-counter` into `SanitizerKind::LoopCounter` based on the information we provided in `Sanitizers.def`.

bool needsLsanRt() const {…}
bool needsLpcsanRt() const {
  return Sanitizers.has(SanitizerKind::LoopCounter);
}

…
// Queue the "lsan" runtime when SanArgs reports it is needed and runtime
// linking is enabled.
if (SanArgs.needsLsanRt() && SanArgs.linkRuntimes())
  StaticRuntimes.push_back("lsan");
// Same rule for our sanitizer: queue "lpcsan" under the same two conditions.
if (SanArgs.needsLpcsanRt() && SanArgs.linkRuntimes())
  StaticRuntimes.push_back("lpcsan");
…

// Start from the mask returned by ToolChain::getSupportedSanitizers().
SanitizerMask Res = ToolChain::getSupportedSanitizers();
…
// Add the LoopCounter bit to that mask.
Res |= SanitizerKind::LoopCounter;
…

…
// `PB` has the type of `CodeGen, is a place where the Clang and LLVM libraries meet. Therefore, we will see several LLVM APIs appear in this place. There are primarily two tasks for this CodeGen component: a. Converting the Clang AST into its equivalent LLVM IR `module` b. Constructing an LLVM pass pipeline to optimize the IR and generate machine code. The previous snippet was trying to customize the second task – that is, customizing the LLVM Pass pipeline. The specific function – `addSanitizers` – we are modifying here is responsible for putting sanitizer passes into the pass pipeline. To have a better understanding of this code, let's focus on two of its components: i. `PassBuilder`: This class provides predefined pass pipeline configurations for each optimization level – that is, the O0 ~ O3 notations (as well as Os and Oz for size optimization) we are familiar with. In addition to these predefined layouts, developers are free to customize the pipeline by leveraging the extension points (EPs). `PassBuilder` supports several EPs, such as at the *beginning* of the pipeline, at the *end* of the pipeline, or at the end of the vectorization process, to name a few. An example of using EP can be found in the preceding code, where we used the `PassBuilder::registerOptimizerLastEPCallback` method and a lambda function to customize the EP located at the *end* of the Pass pipeline. The lambda function has two arguments: `ModulePassManager` – which represents the pass pipeline – and the current optimization level. Developers can use `ModulePassManager::addPass` to insert arbitrary LLVM passes into this EP. ii. `ModulePassManager`: This class represents a Pass pipeline – or, more specifically, the pipeline for `Module`. There are, of course, other PassManager classes for different IR units, such as `FunctionPassManager` for `Function`.
In the preceding code, we were trying to use the `ModulePassManager` instance to insert our `LoopCounterSanitizer` pass whenever `SanitizerKind::LoopCounter` was one of the sanitizers that had been designated by the user. Since `LoopCounterSanitizer` is a loop pass rather than a module pass, we need to add some *adaptors* between the pass and PassManager. The `createFunctionToLoopPassAdaptor` and `createModuleToFunctionPassAdaptor` functions we were using here created a special instance that adapts a pass to a PassManager of a different IR unit. This is all the program logic that supports our LPCSan in the Clang compilation pipeline.

…
set(COMPILER_RT_RUNTIMES effectively imports our LPCSan Compiler-RT libraries into the build.

$ clang -O1 -fsanitize=loop-counter input.c -o input

// Calls bar() when N is greater than 100 and zoo() otherwise.
void foo(int N) {
  if (N > 100) {
    bar();
  } else {
    zoo();
  }
}

// Prints "Hello <x * 3>" whenever get_random() returns a value above 5.
// Marked noinline so the function is not inlined into its callers.
__attribute__((noinline))
void foo(int x) {
  const int roll = get_random();
  if (roll > 5) {
    printf("Hello %d\n", x * 3);
  }
}
int main(int argc, char **argv) {
  for (int i = 0; i < argc + 10; ++i) {
    foo(i);
  }
  return 0;
}

$ clang -O1 -fprofile-generate option enables instrumentation-based PGO. The path that we added after this flag is the directory where profiling data will be stored.

$ ./pgo `seq 1 3`
Hello 0
Hello 6
…
Hello 36
Hello 39
$

$ ls pgo_prof.dir
default_10799426541722168222_0.profraw

$ llvm-profdata llvm-profdata is a powerful tool for inspecting, converting, and merging profiling data files. We will look at it in more detail later. In the preceding command, we are merging and converting all the data files under pgo_prof.dir into a *single* *.profdata file.

$ clang -O1 -fprofile-use=pgo_prof.profdata pgo.cpp \
        -emit-llvm -S -o pgo.after.ll

define void @foo(i32 %x) !prof !71 {
entry:
  %call = call i32 @get_random()
  %cmp = icmp sgt i32 %call, 5
  br i1 %cmp, label %if.then, label %if.end, !prof !72
if.then:                                          
  %mul = mul nsw i32 %x, 3
  …
}

!71 = !{!"function_entry_count", i64 110}
!72 = !{!"branch_weights", i32 57, i32 54}

$ llvm-profdata show --all-functions --counts pgo_prof.profdata
…
  foo:
    Hash: 0x0ae15a44542b0f02
    Counters: 2
    Block counts: [54, 57]
  main:
    Hash: 0x0209aa3e1d398548
    Counters: 2
    Block counts: [110, 1]
…
Instrumentation level: IR  entry_first = 0
Functions shown: 9
Total functions: 9
Maximum function count: …
Maximum internal block count: …

$ llvm-profdata merge --text pgo_prof.profdata -o pgo_prof.proftext
$ cat pgo_prof.proftext
# IR level Instrumentation Flag
:ir
…
foo
# Func Hash:
784007059655560962
# Num Counters:
2
# Counter Values:
54
57
…

$ llvm-profdata merge --binary pgo_prof.proftext -o pgo_prof.profdata

void foo(int x) {
  if (x > 10)
    puts("hello");
  else
    puts("world");
}

define void @foo(i32 %0) {
  …
  %4 = icmp sgt i32 %3, 10
  %5 or %7. Now, let's generate the IR with instrumentation-based PGO enabled with the following command:

$ clang -fprofile-use=combined_prof.profdata \
        foo.c -o optimized_foo

$ opt -pgo-test-profile-file=pgo_prof.profdata \
      --passes="pgo-instr-use,my-pass…" pgo.ll …

// `BB` has the type of `BasicBlock&`
// Look up the `MD_prof` metadata attached to the block's terminator.
Instruction *Term = BB.getTerminator();
MDNode *BrWeightMD = Term->getMetadata(LLVMContext::MD_prof);

// `BrWeightMD` is null when the terminator carries no `!prof` metadata, so
// check it before dereferencing. A `branch_weights` node looks like
// !{!"branch_weights", i32 <true>, i32 <false>}: operand 0 is the name
// string and the weights follow it.
if (BrWeightMD && BrWeightMD->getNumOperands() > 2) {
  // `MDNode::getOperand` hands back a `const MDOperand &`, not an `MDNode *`.
  // Taken counts for true branch
  const MDOperand &TrueBranchMD = BrWeightMD->getOperand(1);
  // Taken counts for false branch
  const MDOperand &FalseBranchMD = BrWeightMD->getOperand(2);
}

// `BrWeightMD` is null when the terminator carries no `!prof` metadata, so
// check it before dereferencing.
if (BrWeightMD && BrWeightMD->getNumOperands() > 2) {
  // `MDNode::getOperand` hands back a `const MDOperand &`, not an `MDNode *`.
  // Taken counts for true branch
  const MDOperand &TrueBranchMD = BrWeightMD->getOperand(1);
  // `dyn_extract` yields null when the operand does not wrap a ConstantInt,
  // so check `NumTrueBrTaken` before using it.
  ConstantInt *NumTrueBrTaken
    = mdconst::dyn_extract<ConstantInt>(TrueBranchMD);
  …
}

// `F` has the type of `Function&`
// Read the function's entry count and unwrap it to a plain integer.
// NOTE(review): the return type of `getEntryCount` differs between LLVM
// releases, and a function without profile data may have no valid count —
// confirm against the LLVM version in use before calling `getCount()`.
Function::ProfileCount EntryCount = F.getEntryCount();
uint64_t EntryCountVal = EntryCount.getCount();

#include "llvm/Analysis/BranchProbabilityInfo.h"
// Function-pass entry point that queries branch probabilities.
// Fetches the BranchProbabilityAnalysis result for `F` and reads the
// probability of the edge from the entry block to its first successor.
PreservedAnalyses run(Function &F, FunctionAnalysisManager &FAM) {
  BranchProbabilityInfo &BPI
    = FAM.getResult<BranchProbabilityAnalysis>(F);
  // `getEntryBlock` returns a reference, so take its address.
  BasicBlock *Entry = &F.getEntryBlock();
  // Use an unsigned literal: a bare `0` is also a null pointer constant and
  // would be ambiguous with the overload taking a destination block pointer.
  BranchProbability BP
    = BPI.getEdgeProbability(Entry, /*IndexInSuccessors=*/0u);
  …
}

#include "llvm/Analysis/BlockFrequencyInfo.h"
// Function-pass entry point that queries block frequencies.
// Fetches the BlockFrequencyAnalysis result for `F` and reads the frequency
// of every basic block in the function.
PreservedAnalyses run(Function &F, FunctionAnalysisManager &FAM) {
  BlockFrequencyInfo &BFI
    = FAM.getResult<BlockFrequencyAnalysis>(F);
  // Iterating a Function yields `BasicBlock&`, while `getBlockFreq` takes a
  // pointer, so pass the address of each block.
  for (BasicBlock &BB : F) {
    BlockFrequency BF = BFI.getBlockFreq(&BB);
  }
  …
}

// `BB` has the type of `BasicBlock*`
// `Entry` has the type of `BasicBlock*` and represents entry // block
BlockFrequency BBFreq = BFI.getBlockFreq(BB),
               EntryFreq = BFI.getBlockFreq(Entry);
auto FreqInPercent
  = (BBFreq.getFrequency() / EntryFreq.getFrequency()) * 100;

#include "llvm/Analysis/ProfileSummaryInfo.h"
// Module-pass entry point that fetches the ProfileSummaryAnalysis result
// for `M` from the module analysis manager.
PreservedAnalyses run(Module &M, ModuleAnalysisManager &MAM) {
  auto &PSI = MAM.getResult<ProfileSummaryAnalysis>(M);
  …
}

#pragma that allows you to define a JavaScript function below it.

./simple_warn.c:2:7: warning: unused variable 'y'…
  int y = x + 1;
      ^
1 warning generated.

Tool*
MyCompiler – which is a class derived from Tool, if we are trying to compile the code for a certain hardware architecture. Providing an alternative compiler instance is useful when your target platform (for example, the `CUSTOM_HARDWARE` in the preceding snippet) or input file is not supported by Clang, but you still want to use the *same* `clang` command-line interface for all the build jobs. For example, suppose you are trying to cross-compile the same projects to *multiple* different architectures, but some of them are not supported by Clang yet. Therefore, you can create a custom Clang toolchain and redirect the compilation job to an external compiler (for example, `gcc`) when the `clang` command-line tool is asked to build the project for those architectures.

void
MyAssembler::ConstructJob(Compilation &C,
                          const JobAction &JA,
                          const InputInfo &Output,
                          const InputInfoList &Inputs,
                          const ArgList &Args,
                          const char *LinkingOutput)                           const {
  if (Arg *A = Args.getLastArg(options::OPT_Wl_COMMA)) {
    // `A` contains linker-specific flags
    …
  }
  …
}

struct MyPass {
  static StringRef name() { return "MyPass"; }
  PreservedAnalyses run(Function&, FunctionAnalysisManager&);
};

龙哥盟

掠夺·扩张·投机·博弈

LLVM 技巧、提示和最佳实践（全）

前言

本书面向的对象

本书涵盖的内容

要充分利用本书

下载示例代码文件

下载彩色图像

使用的约定

联系我们

评论

第一部分：构建系统和 LLVM 特定工具

第一章：构建 LLVM 时节省资源

技术要求

通过更好的工具减少构建资源

用 Ninja 替换 GNU Make

避免使用 BFD 链接器

调整 CMake 参数

选择正确的构建类型

避免构建所有目标

构建为共享库

分离调试信息

构建优化版本的llvm-tblgen

使用新的 PassManager 和 Clang

使用 GN 以获得更快的周转时间

摘要

进一步阅读

第二章：探索 LLVM 的构建系统功能

技术要求

探索 LLVM 重要 CMake 指令的词汇表

使用 CMake 函数添加新库

每个文件夹添加一个构建目标

使用 CMake 函数添加可执行文件和工具

使用 CMake 函数添加 Pass 插件

理解树外项目的 CMake 集成

摘要

第三章：使用 LLVM LIT 进行测试

技术要求

在树外项目中使用 LIT

为我们的示例项目做准备

编写 LIT 配置

LIT 内部机制

学习有用的 FileCheck 技巧

准备我们的示例项目

编写 FileCheck 指令

探索 TestSuite 框架

为我们的示例项目做准备

将代码导入到 llvm-test-suite

摘要

进一步阅读

第四章：TableGen 开发

技术要求

TableGen 语法介绍

布局和记录

Bang 操作符

多类

DAG 数据类型

在 TableGen 中编写甜甜圈配方

通过 TableGen 后端打印配方

TableGen 的高级工作流程

编写 TableGen 后端

项目设置

获取所有烘焙步骤

检索字段值

类型转换

处理 DAG 值

集成 RecipePrinter TableGen 后端

摘要

进一步阅读

第二部分：前端开发

第五章：探索 Clang 的架构

技术要求

学习 Clang 的子系统及其作用

驱动程序

词法分析和预处理器

解析器和 Sema

AST

CodeGen

构建优化版本的`llvm-tblgen`

`FrontendAction` 类