mirror of
https://github.com/llvm/llvm-project.git
synced 2025-05-14 12:06:07 +00:00

OpenCL runtime tracks the invoke function emitted for any block expression. Due to restrictions on blocks in OpenCL (v2.0 s6.12.5), it is always possible to know the block invoke function when emitting call of block expression or __enqueue_kernel builtin functions. Since __enqueu_kernel already has an argument for the invoke function, it is redundant to have invoke function member in the llvm block literal structure. This patch removes invoke function from the llvm block literal structure. It also removes the bitcast of block invoke function to the generic block literal type which is useless for OpenCL. This will save some space for the kernel argument, and also eliminate some store instructions. Differential Revision: https://reviews.llvm.org/D43783 llvm-svn: 326937
100 lines
3.2 KiB
C++
100 lines
3.2 KiB
C++
//===----- CGOpenCLRuntime.h - Interface to OpenCL Runtimes -----*- C++ -*-===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This provides an abstract class for OpenCL code generation. Concrete
|
|
// subclasses of this implement code generation for specific OpenCL
|
|
// runtime libraries.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef LLVM_CLANG_LIB_CODEGEN_CGOPENCLRUNTIME_H
|
|
#define LLVM_CLANG_LIB_CODEGEN_CGOPENCLRUNTIME_H
|
|
|
|
#include "clang/AST/Type.h"
|
|
#include "llvm/ADT/DenseMap.h"
|
|
#include "llvm/IR/Type.h"
|
|
#include "llvm/IR/Value.h"
|
|
|
|
namespace clang {
|
|
|
|
class BlockExpr;
|
|
class Expr;
|
|
class VarDecl;
|
|
|
|
namespace CodeGen {
|
|
|
|
class CodeGenFunction;
|
|
class CodeGenModule;
|
|
|
|
class CGOpenCLRuntime {
|
|
protected:
|
|
CodeGenModule &CGM;
|
|
llvm::Type *PipeTy;
|
|
llvm::PointerType *SamplerTy;
|
|
|
|
/// Structure for enqueued block information.
|
|
struct EnqueuedBlockInfo {
|
|
llvm::Function *InvokeFunc; /// Block invoke function.
|
|
llvm::Function *Kernel; /// Enqueued block kernel.
|
|
llvm::Value *BlockArg; /// The first argument to enqueued block kernel.
|
|
};
|
|
/// Maps block expression to block information.
|
|
llvm::DenseMap<const Expr *, EnqueuedBlockInfo> EnqueuedBlockMap;
|
|
|
|
public:
|
|
CGOpenCLRuntime(CodeGenModule &CGM) : CGM(CGM), PipeTy(nullptr),
|
|
SamplerTy(nullptr) {}
|
|
virtual ~CGOpenCLRuntime();
|
|
|
|
/// Emit the IR required for a work-group-local variable declaration, and add
|
|
/// an entry to CGF's LocalDeclMap for D. The base class does this using
|
|
/// CodeGenFunction::EmitStaticVarDecl to emit an internal global for D.
|
|
virtual void EmitWorkGroupLocalVarDecl(CodeGenFunction &CGF,
|
|
const VarDecl &D);
|
|
|
|
virtual llvm::Type *convertOpenCLSpecificType(const Type *T);
|
|
|
|
virtual llvm::Type *getPipeType(const PipeType *T);
|
|
|
|
llvm::PointerType *getSamplerType(const Type *T);
|
|
|
|
// \brief Returnes a value which indicates the size in bytes of the pipe
|
|
// element.
|
|
virtual llvm::Value *getPipeElemSize(const Expr *PipeArg);
|
|
|
|
// \brief Returnes a value which indicates the alignment in bytes of the pipe
|
|
// element.
|
|
virtual llvm::Value *getPipeElemAlign(const Expr *PipeArg);
|
|
|
|
/// \return __generic void* type.
|
|
llvm::PointerType *getGenericVoidPointerType();
|
|
|
|
/// \return enqueued block information for enqueued block.
|
|
EnqueuedBlockInfo emitOpenCLEnqueuedBlock(CodeGenFunction &CGF,
|
|
const Expr *E);
|
|
|
|
/// \brief Record invoke function and block literal emitted during normal
|
|
/// codegen for a block expression. The information is used by
|
|
/// emitOpenCLEnqueuedBlock to emit wrapper kernel.
|
|
///
|
|
/// \param InvokeF invoke function emitted for the block expression.
|
|
/// \param Block block literal emitted for the block expression.
|
|
void recordBlockInfo(const BlockExpr *E, llvm::Function *InvokeF,
|
|
llvm::Value *Block);
|
|
|
|
/// \return LLVM block invoke function emitted for an expression derived from
|
|
/// the block expression.
|
|
llvm::Function *getInvokeFunction(const Expr *E);
|
|
};
|
|
|
|
}
|
|
}
|
|
|
|
#endif
|