llvm-project/llvm/unittests/IR/StructuralHashTest.cpp
Kyungwoo Lee 0dd9fdcf83
[StructuralHash] Support Differences (#112638)
This computes a structural hash while allowing for selective ignoring of
certain operands based on a custom function that is provided. Instead of
a single hash value, it now returns FunctionHashInfo which includes a
hash value, an instruction mapping, and a map to track the operand
location and its corresponding hash value that is ignored.

Depends on https://github.com/llvm/llvm-project/pull/112621.
This is a patch for
https://discourse.llvm.org/t/rfc-global-function-merging/82608.
2024-10-26 20:02:05 -07:00

304 lines
13 KiB
C++

//===- llvm/unittest/IR/StructuralHashTest.cpp ----------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
#include "llvm/IR/StructuralHash.h"
#include "llvm/AsmParser/Parser.h"
#include "llvm/IR/Module.h"
#include "llvm/Support/SourceMgr.h"
#include "gmock/gmock-matchers.h"
#include "gtest/gtest.h"
#include <memory>
using namespace llvm;
namespace {
using testing::Contains;
using testing::Key;
using testing::Pair;
using testing::SizeIs;
std::unique_ptr<Module> parseIR(LLVMContext &Context, const char *IR) {
SMDiagnostic Err;
std::unique_ptr<Module> M = parseAssemblyString(IR, Err, Context);
if (!M)
Err.print("StructuralHashTest", errs());
return M;
}
TEST(StructuralHashTest, Empty) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "");
std::unique_ptr<Module> M2 = parseIR(Ctx, "");
EXPECT_EQ(StructuralHash(*M1), StructuralHash(*M2));
}
TEST(StructuralHashTest, Basic) {
LLVMContext Ctx;
std::unique_ptr<Module> M0 = parseIR(Ctx, "");
std::unique_ptr<Module> M1 = parseIR(Ctx, "define void @f() { ret void }");
std::unique_ptr<Module> M2 = parseIR(Ctx, "define void @f() { ret void }");
std::unique_ptr<Module> M3 = parseIR(Ctx, "@g = global i32 2");
std::unique_ptr<Module> M4 = parseIR(Ctx, "@g = global i32 2");
EXPECT_NE(StructuralHash(*M0), StructuralHash(*M1));
EXPECT_NE(StructuralHash(*M0), StructuralHash(*M3));
EXPECT_NE(StructuralHash(*M1), StructuralHash(*M3));
EXPECT_EQ(StructuralHash(*M1), StructuralHash(*M2));
EXPECT_EQ(StructuralHash(*M3), StructuralHash(*M4));
}
TEST(StructuralHashTest, BasicFunction) {
LLVMContext Ctx;
std::unique_ptr<Module> M = parseIR(Ctx, "define void @f() {\n"
" ret void\n"
"}\n"
"define void @g() {\n"
" ret void\n"
"}\n"
"define i32 @h(i32 %i) {\n"
" ret i32 %i\n"
"}\n");
EXPECT_EQ(StructuralHash(*M->getFunction("f")),
StructuralHash(*M->getFunction("g")));
EXPECT_NE(StructuralHash(*M->getFunction("f")),
StructuralHash(*M->getFunction("h")));
}
TEST(StructuralHashTest, Declaration) {
LLVMContext Ctx;
std::unique_ptr<Module> M0 = parseIR(Ctx, "");
std::unique_ptr<Module> M1 = parseIR(Ctx, "declare void @f()");
std::unique_ptr<Module> M2 = parseIR(Ctx, "@g = external global i32");
EXPECT_EQ(StructuralHash(*M0), StructuralHash(*M1));
EXPECT_EQ(StructuralHash(*M0), StructuralHash(*M2));
}
TEST(StructuralHashTest, GlobalType) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "@g = global i32 1");
std::unique_ptr<Module> M2 = parseIR(Ctx, "@g = global float 1.0");
EXPECT_NE(StructuralHash(*M1), StructuralHash(*M2));
}
TEST(StructuralHashTest, Function) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "define void @f() { ret void }");
std::unique_ptr<Module> M2 = parseIR(Ctx, "define void @f(i32) { ret void }");
EXPECT_NE(StructuralHash(*M1), StructuralHash(*M2));
}
TEST(StructuralHashTest, FunctionRetType) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "define void @f() { ret void }");
std::unique_ptr<Module> M2 = parseIR(Ctx, "define i32 @f() { ret i32 0 }");
EXPECT_EQ(StructuralHash(*M1), StructuralHash(*M2));
EXPECT_NE(StructuralHash(*M1, true), StructuralHash(*M2, true));
}
TEST(StructuralHashTest, InstructionOpCode) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "define void @f(ptr %p) {\n"
" %a = load i32, ptr %p\n"
" ret void\n"
"}\n");
std::unique_ptr<Module> M2 =
parseIR(Ctx, "define void @f(ptr %p) {\n"
" %a = getelementptr i8, ptr %p, i32 1\n"
" ret void\n"
"}\n");
EXPECT_NE(StructuralHash(*M1), StructuralHash(*M2));
}
TEST(StructuralHashTest, InstructionSubType) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "define void @f(ptr %p) {\n"
" %a = load i32, ptr %p\n"
" ret void\n"
"}\n");
std::unique_ptr<Module> M2 = parseIR(Ctx, "define void @f(ptr %p) {\n"
" %a = load i64, ptr %p\n"
" ret void\n"
"}\n");
EXPECT_EQ(StructuralHash(*M1), StructuralHash(*M2));
EXPECT_NE(StructuralHash(*M1, true), StructuralHash(*M2, true));
}
TEST(StructuralHashTest, InstructionType) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "define void @f(ptr %p) {\n"
" %1 = load i32, ptr %p\n"
" ret void\n"
"}\n");
std::unique_ptr<Module> M2 = parseIR(Ctx, "define void @f(ptr %p) {\n"
" %1 = load float, ptr %p\n"
" ret void\n"
"}\n");
EXPECT_EQ(StructuralHash(*M1), StructuralHash(*M2));
EXPECT_NE(StructuralHash(*M1, true), StructuralHash(*M2, true));
}
TEST(StructuralHashTest, IgnoredMetadata) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "@a = global i32 1\n");
// clang-format off
std::unique_ptr<Module> M2 = parseIR(
Ctx, R"(
@a = global i32 1
@llvm.embedded.object = private constant [4 x i8] c"BC\C0\00", section ".llvm.lto", align 1, !exclude !0
@llvm.compiler.used = appending global [1 x ptr] [ptr @llvm.embedded.object], section "llvm.metadata"
!llvm.embedded.objects = !{!1}
!0 = !{}
!1 = !{ptr @llvm.embedded.object, !".llvm.lto"}
)");
// clang-format on
EXPECT_EQ(StructuralHash(*M1), StructuralHash(*M2));
}
TEST(StructuralHashTest, ComparisonInstructionPredicate) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "define i1 @f(i64 %a, i64 %b) {\n"
" %1 = icmp eq i64 %a, %b\n"
" ret i1 %1\n"
"}\n");
std::unique_ptr<Module> M2 = parseIR(Ctx, "define i1 @f(i64 %a, i64 %b) {\n"
" %1 = icmp ne i64 %a, %b\n"
" ret i1 %1\n"
"}\n");
EXPECT_EQ(StructuralHash(*M1), StructuralHash(*M2));
EXPECT_NE(StructuralHash(*M1, true), StructuralHash(*M2, true));
}
TEST(StructuralHashTest, IntrinsicInstruction) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 =
parseIR(Ctx, "define float @f(float %a) {\n"
" %b = call float @llvm.sin.f32(float %a)\n"
" ret float %b\n"
"}\n"
"declare float @llvm.sin.f32(float)\n");
std::unique_ptr<Module> M2 =
parseIR(Ctx, "define float @f(float %a) {\n"
" %b = call float @llvm.cos.f32(float %a)\n"
" ret float %b\n"
"}\n"
"declare float @llvm.cos.f32(float)\n");
EXPECT_EQ(StructuralHash(*M1), StructuralHash(*M2));
EXPECT_NE(StructuralHash(*M1, true), StructuralHash(*M2, true));
}
TEST(StructuralHashTest, CallInstruction) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "define i64 @f(i64 %a) {\n"
" %b = call i64 @f1(i64 %a)\n"
" ret i64 %b\n"
"}\n"
"declare i64 @f1(i64)");
std::unique_ptr<Module> M2 = parseIR(Ctx, "define i64 @f(i64 %a) {\n"
" %b = call i64 @f2(i64 %a)\n"
" ret i64 %b\n"
"}\n"
"declare i64 @f2(i64)");
EXPECT_EQ(StructuralHash(*M1), StructuralHash(*M2));
EXPECT_NE(StructuralHash(*M1, true), StructuralHash(*M2, true));
}
TEST(StructuralHashTest, ConstantInteger) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "define i64 @f1() {\n"
" ret i64 1\n"
"}\n");
std::unique_ptr<Module> M2 = parseIR(Ctx, "define i64 @f2() {\n"
" ret i64 2\n"
"}\n");
EXPECT_EQ(StructuralHash(*M1), StructuralHash(*M2));
EXPECT_NE(StructuralHash(*M1, true), StructuralHash(*M2, true));
}
TEST(StructuralHashTest, BigConstantInteger) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "define i128 @f1() {\n"
" ret i128 18446744073709551616\n"
"}\n");
std::unique_ptr<Module> M2 = parseIR(Ctx, "define i128 @f2() {\n"
" ret i128 18446744073709551617\n"
"}\n");
EXPECT_EQ(StructuralHash(*M1), StructuralHash(*M2));
EXPECT_NE(StructuralHash(*M1, true), StructuralHash(*M2, true));
}
TEST(StructuralHashTest, ArgumentNumber) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "define i64 @f1(i64 %a, i64 %b) {\n"
" ret i64 %a\n"
"}\n");
std::unique_ptr<Module> M2 = parseIR(Ctx, "define i64 @f2(i64 %a, i64 %b) {\n"
" ret i64 %b\n"
"}\n");
EXPECT_EQ(StructuralHash(*M1), StructuralHash(*M2));
EXPECT_NE(StructuralHash(*M1, true), StructuralHash(*M2, true));
}
TEST(StructuralHashTest, Differences) {
LLVMContext Ctx;
std::unique_ptr<Module> M1 = parseIR(Ctx, "define i64 @f(i64 %a) {\n"
" %c = add i64 %a, 1\n"
" %b = call i64 @f1(i64 %c)\n"
" ret i64 %b\n"
"}\n"
"declare i64 @f1(i64)");
auto *F1 = M1->getFunction("f");
std::unique_ptr<Module> M2 = parseIR(Ctx, "define i64 @g(i64 %a) {\n"
" %c = add i64 %a, 1\n"
" %b = call i64 @f2(i64 %c)\n"
" ret i64 %b\n"
"}\n"
"declare i64 @f2(i64)");
auto *F2 = M2->getFunction("g");
// They are originally different when not ignoring any operand.
EXPECT_NE(StructuralHash(*F1, true), StructuralHash(*F2, true));
EXPECT_NE(StructuralHashWithDifferences(*F1, nullptr).FunctionHash,
StructuralHashWithDifferences(*F2, nullptr).FunctionHash);
// When we ignore the call target f1 vs f2, they have the same hash.
auto IgnoreOp = [&](const Instruction *I, unsigned OpndIdx) {
return I->getOpcode() == Instruction::Call && OpndIdx == 1;
};
auto FuncHashInfo1 = StructuralHashWithDifferences(*F1, IgnoreOp);
auto FuncHashInfo2 = StructuralHashWithDifferences(*F2, IgnoreOp);
EXPECT_EQ(FuncHashInfo1.FunctionHash, FuncHashInfo2.FunctionHash);
// There are total 3 instructions.
EXPECT_THAT(*FuncHashInfo1.IndexInstruction, SizeIs(3));
EXPECT_THAT(*FuncHashInfo2.IndexInstruction, SizeIs(3));
// The only 1 operand (the call target) has been ignored.
EXPECT_THAT(*FuncHashInfo1.IndexOperandHashMap, SizeIs(1u));
EXPECT_THAT(*FuncHashInfo2.IndexOperandHashMap, SizeIs(1u));
// The index pair of instruction and operand (1, 1) is a key in the map.
ASSERT_THAT(*FuncHashInfo1.IndexOperandHashMap, Contains(Key(Pair(1, 1))));
ASSERT_THAT(*FuncHashInfo2.IndexOperandHashMap, Contains(Key(Pair(1, 1))));
// The indexed instruciton must be the call instruction as shown in the
// IgnoreOp above.
EXPECT_EQ(FuncHashInfo1.IndexInstruction->lookup(1)->getOpcode(),
Instruction::Call);
EXPECT_EQ(FuncHashInfo2.IndexInstruction->lookup(1)->getOpcode(),
Instruction::Call);
// The ignored operand hashes (for f1 vs. f2) are different.
EXPECT_NE(FuncHashInfo1.IndexOperandHashMap->lookup({1, 1}),
FuncHashInfo2.IndexOperandHashMap->lookup({1, 1}));
}
} // end anonymous namespace