llvm-project/mlir/lib/IR/Verifier.cpp

520 lines
18 KiB
C++
Raw Normal View History

//===- Verifier.cpp - MLIR Verifier Implementation ------------------------===//
//
// Copyright 2019 The MLIR Authors.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
//
// This file implements the verify() methods on the various IR types, performing
// (potentially expensive) checks on the holistic structure of the code. This
// can be used for detecting bugs in compiler transformations and hand written
// .mlir files.
//
// The checks in this file are only for things that can occur as part of IR
// transformations: e.g. violation of dominance information, malformed operation
// attributes, etc. MLIR supports transformations moving IR through locally
// invalid states (e.g. unlinking an instruction from an instruction before
// re-inserting it in a new place), but each transformation must complete with
// the IR in a valid form.
//
// This should not check for things that are always wrong by construction (e.g.
// affine maps or other immutable structures that are incorrect), because those
// are not mutable and can be checked at time of construction.
//
//===----------------------------------------------------------------------===//
#include "mlir/IR/Attributes.h"
#include "mlir/IR/CFGFunction.h"
#include "mlir/IR/MLFunction.h"
#include "mlir/IR/Module.h"
#include "mlir/IR/OperationSet.h"
#include "mlir/IR/Statements.h"
#include "mlir/IR/StmtVisitor.h"
#include "llvm/ADT/ScopedHashTable.h"
#include "llvm/ADT/Twine.h"
#include "llvm/Support/PrettyStackTrace.h"
#include "llvm/Support/raw_ostream.h"
using namespace mlir;
namespace {
/// Base class for the verifiers in this file. It is a pervasive truth that
/// this file treats "true" as an error that needs to be recovered from, and
/// "false" as success.
///
class Verifier {
public:
template <typename T>
static void failure(const Twine &message, const T &value, raw_ostream &os) {
// Print the error message and flush the stream in case printing the value
// causes a crash.
os << "MLIR verification failure: " + message + "\n";
os.flush();
value.print(os);
}
template <typename T>
bool failure(const Twine &message, const T &value) {
// If the caller isn't trying to collect failure information, just print
// the result and abort.
if (!errorResult) {
failure(message, value, llvm::errs());
abort();
}
// Otherwise, emit the error into the string and return true.
llvm::raw_string_ostream os(*errorResult);
failure(message, value, os);
os.flush();
return true;
}
bool opFailure(const Twine &message, const Operation &value) {
value.emitError(message);
return true;
}
bool verifyOperation(const Operation &op);
bool verifyAttribute(Attribute *attr, const Operation &op);
protected:
explicit Verifier(std::string *errorResult, const Function &fn)
: errorResult(errorResult), fn(fn),
operationSet(OperationSet::get(fn.getContext())) {}
private:
/// If the verifier is returning errors back to a client, this is the error to
/// fill in.
std::string *errorResult;
/// The function being checked.
const Function &fn;
/// The operation set installed in the current MLIR context.
OperationSet &operationSet;
};
} // end anonymous namespace
// Check that function attributes are all well formed.
bool Verifier::verifyAttribute(Attribute *attr, const Operation &op) {
if (!attr->isOrContainsFunction())
return false;
// If we have a function attribute, check that it is non-null and in the
// same module as the operation that refers to it.
if (auto *fnAttr = dyn_cast<FunctionAttr>(attr)) {
if (!fnAttr->getValue())
return opFailure("attribute refers to deallocated function!", op);
if (fnAttr->getValue()->getModule() != fn.getModule())
return opFailure("attribute refers to function '" +
Twine(fnAttr->getValue()->getName()) +
"' defined in another module!",
op);
return false;
}
// Otherwise, we must have an array attribute, remap the elements.
for (auto *elt : cast<ArrayAttr>(attr)->getValue()) {
if (verifyAttribute(elt, op))
return true;
}
return false;
}
/// Check the invariants of the specified operation instruction or statement.
bool Verifier::verifyOperation(const Operation &op) {
if (op.getOperationFunction() != &fn)
return opFailure("operation in the wrong function", op);
// TODO: Check that operands are non-nil and structurally ok.
// Verify all attributes are ok. We need to check Function attributes, since
// they are actually mutable (the function they refer to can be deleted), and
// we have to check array attributes that can refer to them.
for (auto attr : op.getAttrs()) {
if (verifyAttribute(attr.second, op))
return true;
}
// If we can get operation info for this, check the custom hook.
if (auto *opInfo = op.getAbstractOperation()) {
if (auto *errorMessage = opInfo->verifyInvariants(&op))
return opFailure(Twine("'") + op.getName().str() + "' op " + errorMessage,
op);
}
return false;
}
//===----------------------------------------------------------------------===//
// CFG Functions
//===----------------------------------------------------------------------===//
namespace {
struct CFGFuncVerifier : public Verifier {
const CFGFunction &fn;
CFGFuncVerifier(const CFGFunction &fn, std::string *errorResult)
: Verifier(errorResult, fn), fn(fn) {}
bool verify();
bool verifyBlock(const BasicBlock &block);
bool verifyTerminator(const TerminatorInst &term);
bool verifyReturn(const ReturnInst &inst);
bool verifyBranch(const BranchInst &inst);
bool verifyCondBranch(const CondBranchInst &inst);
// Given a list of "operands" and "arguments" that are the same length, verify
// that the types of operands pointwise match argument types. The iterator
// types must expose the "getType()" function when dereferenced twice; that
// is, the iterator's value_type must be equivalent to SSAValue*.
template <typename OperandIteratorTy, typename ArgumentIteratorTy>
bool verifyOperandsMatchArguments(OperandIteratorTy opBegin,
OperandIteratorTy opEnd,
ArgumentIteratorTy argBegin,
const Instruction &instContext);
};
} // end anonymous namespace
bool CFGFuncVerifier::verify() {
llvm::PrettyStackTraceFormat fmt("MLIR Verifier: cfgfunc @%s",
fn.getName().c_str());
// TODO: Lots to be done here, including verifying dominance information when
// we have uses and defs.
// TODO: Verify the first block has no predecessors.
if (fn.empty())
return failure("cfgfunc must have at least one basic block", fn);
// Verify that the argument list of the function and the arg list of the first
// block line up.
auto *firstBB = &fn.front();
auto fnInputTypes = fn.getType()->getInputs();
if (fnInputTypes.size() != firstBB->getNumArguments())
return failure("first block of cfgfunc must have " +
Twine(fnInputTypes.size()) +
" arguments to match function signature",
fn);
for (unsigned i = 0, e = firstBB->getNumArguments(); i != e; ++i)
if (fnInputTypes[i] != firstBB->getArgument(i)->getType())
return failure(
"type of argument #" + Twine(i) +
" must match corresponding argument in function signature",
fn);
for (auto &block : fn) {
if (verifyBlock(block))
return true;
}
return false;
}
bool CFGFuncVerifier::verifyBlock(const BasicBlock &block) {
if (!block.getTerminator())
return failure("basic block with no terminator", block);
if (verifyTerminator(*block.getTerminator()))
return true;
for (auto *arg : block.getArguments()) {
if (arg->getOwner() != &block)
return failure("basic block argument not owned by block", block);
}
for (auto &inst : block) {
if (verifyOperation(inst))
return true;
}
return false;
}
bool CFGFuncVerifier::verifyTerminator(const TerminatorInst &term) {
if (term.getFunction() != &fn)
return failure("terminator in the wrong function", term);
// TODO: Check that operands are structurally ok.
// TODO: Check that successors are in the right function.
if (auto *ret = dyn_cast<ReturnInst>(&term))
return verifyReturn(*ret);
if (auto *br = dyn_cast<BranchInst>(&term))
return verifyBranch(*br);
if (auto *br = dyn_cast<CondBranchInst>(&term))
return verifyCondBranch(*br);
return false;
}
bool CFGFuncVerifier::verifyReturn(const ReturnInst &inst) {
// Verify that the return operands match the results of the function.
auto results = fn.getType()->getResults();
if (inst.getNumOperands() != results.size())
return failure("return has " + Twine(inst.getNumOperands()) +
" operands, but enclosing function returns " +
Twine(results.size()),
inst);
for (unsigned i = 0, e = results.size(); i != e; ++i)
if (inst.getOperand(i)->getType() != results[i])
return failure("type of return operand " + Twine(i) +
" doesn't match function result type",
inst);
return false;
}
bool CFGFuncVerifier::verifyBranch(const BranchInst &inst) {
// Verify that the number of operands lines up with the number of BB arguments
// in the successor.
auto dest = inst.getDest();
if (inst.getNumOperands() != dest->getNumArguments())
return failure("branch has " + Twine(inst.getNumOperands()) +
" operands, but target block has " +
Twine(dest->getNumArguments()),
inst);
for (unsigned i = 0, e = inst.getNumOperands(); i != e; ++i)
if (inst.getOperand(i)->getType() != dest->getArgument(i)->getType())
return failure("type of branch operand " + Twine(i) +
" doesn't match target bb argument type",
inst);
return false;
}
template <typename OperandIteratorTy, typename ArgumentIteratorTy>
bool CFGFuncVerifier::verifyOperandsMatchArguments(
OperandIteratorTy opBegin, OperandIteratorTy opEnd,
ArgumentIteratorTy argBegin, const Instruction &instContext) {
OperandIteratorTy opIt = opBegin;
ArgumentIteratorTy argIt = argBegin;
for (; opIt != opEnd; ++opIt, ++argIt) {
if ((*opIt)->getType() != (*argIt)->getType())
return failure("type of operand " + Twine(std::distance(opBegin, opIt)) +
" doesn't match argument type",
instContext);
}
return false;
}
bool CFGFuncVerifier::verifyCondBranch(const CondBranchInst &inst) {
// Verify that the number of operands lines up with the number of BB arguments
// in the true successor.
auto trueDest = inst.getTrueDest();
if (inst.getNumTrueOperands() != trueDest->getNumArguments())
return failure("branch has " + Twine(inst.getNumTrueOperands()) +
" true operands, but true target block has " +
Twine(trueDest->getNumArguments()),
inst);
if (verifyOperandsMatchArguments(inst.true_operand_begin(),
inst.true_operand_end(),
trueDest->args_begin(), inst))
return true;
// And the false successor.
auto falseDest = inst.getFalseDest();
if (inst.getNumFalseOperands() != falseDest->getNumArguments())
return failure("branch has " + Twine(inst.getNumFalseOperands()) +
" false operands, but false target block has " +
Twine(falseDest->getNumArguments()),
inst);
if (verifyOperandsMatchArguments(inst.false_operand_begin(),
inst.false_operand_end(),
falseDest->args_begin(), inst))
return true;
if (inst.getCondition()->getType() != Type::getInteger(1, fn.getContext()))
return failure("type of condition is not boolean (i1)", inst);
return false;
}
//===----------------------------------------------------------------------===//
// ML Functions
//===----------------------------------------------------------------------===//
namespace {
struct MLFuncVerifier : public Verifier, public StmtWalker<MLFuncVerifier> {
const MLFunction &fn;
bool hadError = false;
MLFuncVerifier(const MLFunction &fn, std::string *errorResult)
: Verifier(errorResult, fn), fn(fn) {}
void visitOperationStmt(OperationStmt *opStmt) {
hadError |= verifyOperation(*opStmt);
}
bool verify() {
llvm::PrettyStackTraceFormat fmt("MLIR Verifier: mlfunc @%s",
fn.getName().c_str());
// Check basic structural properties.
walk(const_cast<MLFunction *>(&fn));
if (hadError)
return true;
// TODO: check that operation is not a return statement unless it's
// the last one in the function.
// TODO: check that loop bounds and if conditions are properly formed.
if (verifyReturn())
return true;
return verifyDominance();
}
/// Walk all of the code in this MLFunc and verify that the operands of any
/// operations are properly dominated by their definitions.
bool verifyDominance();
/// Verify that function has a return statement that matches its signature.
bool verifyReturn();
};
} // end anonymous namespace
/// Walk all of the code in this MLFunc and verify that the operands of any
/// operations are properly dominated by their definitions.
bool MLFuncVerifier::verifyDominance() {
using HashTable = llvm::ScopedHashTable<const SSAValue *, bool>;
HashTable liveValues;
HashTable::ScopeTy topScope(liveValues);
// All of the arguments to the function are live for the whole function.
for (auto *arg : fn.getArguments())
liveValues.insert(arg, true);
// This recursive function walks the statement list pushing scopes onto the
// stack as it goes, and popping them to remove them from the table.
std::function<bool(const StmtBlock &block)> walkBlock;
walkBlock = [&](const StmtBlock &block) -> bool {
HashTable::ScopeTy blockScope(liveValues);
// The induction variable of a for statement is live within its body.
if (auto *forStmt = dyn_cast<ForStmt>(&block))
liveValues.insert(forStmt, true);
for (auto &stmt : block) {
// Verify that each of the operands are live.
unsigned operandNo = 0;
for (auto *opValue : stmt.getOperands()) {
if (!liveValues.count(opValue)) {
stmt.emitError("operand #" + Twine(operandNo) +
" does not dominate this use");
if (auto *useStmt = opValue->getDefiningStmt())
useStmt->emitNote("operand defined here");
return true;
}
++operandNo;
}
if (auto *opStmt = dyn_cast<OperationStmt>(&stmt)) {
// Operations define values, add them to the hash table.
for (auto *result : opStmt->getResults())
liveValues.insert(result, true);
continue;
}
// If this is an if or for, recursively walk the block they contain.
if (auto *ifStmt = dyn_cast<IfStmt>(&stmt)) {
if (walkBlock(*ifStmt->getThen()))
return true;
if (auto *elseClause = ifStmt->getElse())
if (walkBlock(*elseClause))
return true;
}
if (auto *forStmt = dyn_cast<ForStmt>(&stmt))
if (walkBlock(*forStmt))
return true;
}
return false;
};
// Check the whole function out.
return walkBlock(fn);
}
bool MLFuncVerifier::verifyReturn() {
// TODO: fold return verification in the pass that verifies all statements.
const char missingReturnMsg[] = "ML function must end with return statement";
if (fn.getStatements().empty())
return failure(missingReturnMsg, fn);
const auto &stmt = fn.getStatements().back();
if (const auto *op = dyn_cast<OperationStmt>(&stmt)) {
if (!op->isReturn())
return failure(missingReturnMsg, fn);
// The operand number and types must match the function signature.
// TODO: move this verification in ReturnOp::verify() if printing
// of the error messages below can be made to work there.
const auto &results = fn.getType()->getResults();
if (op->getNumOperands() != results.size())
return failure("return has " + Twine(op->getNumOperands()) +
" operands, but enclosing function returns " +
Twine(results.size()),
*op);
for (unsigned i = 0, e = results.size(); i != e; ++i)
if (op->getOperand(i)->getType() != results[i])
return failure("type of return operand " + Twine(i) +
" doesn't match function result type",
*op);
return false;
}
return failure(missingReturnMsg, fn);
}
//===----------------------------------------------------------------------===//
// Entrypoints
//===----------------------------------------------------------------------===//
/// Perform (potentially expensive) checks of invariants, used to detect
/// compiler bugs. On error, this fills in the string and return true,
/// or aborts if the string was not provided.
bool Function::verify(std::string *errorResult) const {
switch (getKind()) {
case Kind::ExtFunc:
// No body, nothing can be wrong here.
return false;
case Kind::CFGFunc:
return CFGFuncVerifier(*cast<CFGFunction>(this), errorResult).verify();
case Kind::MLFunc:
return MLFuncVerifier(*cast<MLFunction>(this), errorResult).verify();
}
}
/// Perform (potentially expensive) checks of invariants, used to detect
/// compiler bugs. On error, this fills in the string and return true,
/// or aborts if the string was not provided.
bool Module::verify(std::string *errorResult) const {
/// Check that each function is correct.
for (auto &fn : *this) {
if (fn.verify(errorResult))
return true;
}
// Make sure the error string is empty on success.
if (errorResult)
errorResult->clear();
return false;
}