//===-- R600KernelParameters.cpp - TODO: Add brief description -------===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // TODO: Add full description // //===----------------------------------------------------------------------===// #include #include "R600KernelParameters.h" #include "R600OpenCLUtils.h" #include "llvm/Constants.h" #include "llvm/Intrinsics.h" #include "llvm/Support/IRBuilder.h" #include "llvm/Support/TypeBuilder.h" // #include "llvm/CodeGen/Function.h" namespace AMDILAS { enum AddressSpaces { PRIVATE_ADDRESS = 0, // Address space for private memory. GLOBAL_ADDRESS = 1, // Address space for global memory (RAT0, VTX0). CONSTANT_ADDRESS = 2, // Address space for constant memory. LOCAL_ADDRESS = 3, // Address space for local memory. REGION_ADDRESS = 4, // Address space for region memory. ADDRESS_NONE = 5, // Address space for unknown memory. PARAM_D_ADDRESS = 6, // Address space for direct addressible parameter memory (CONST0) PARAM_I_ADDRESS = 7, // Address space for indirect addressible parameter memory (VTX1) LAST_ADDRESS = 8 }; } #include #include using namespace llvm; using namespace std; #define CONSTANT_CACHE_SIZE_DW 127 class R600KernelParameters : public llvm::FunctionPass { const llvm::TargetData * TD; LLVMContext* Context; Module *mod; struct param { param() : val(NULL), ptr_val(NULL), offset_in_dw(0), size_in_dw(0), indirect(false), specialID(0) {} llvm::Value* val; llvm::Value* ptr_val; int offset_in_dw; int size_in_dw; bool indirect; string specialType; int specialID; int end() { return offset_in_dw + size_in_dw; } /* The first 9 dwords are reserved for the grid sizes. */ int get_rat_offset() { return 9 + offset_in_dw; } }; std::vector params; int getLastSpecialID(const string& TypeName); int getListSize(); void AddParam(llvm::Argument* arg); int calculateArgumentSize(llvm::Argument* arg); void RunAna(llvm::Function* fun); void Replace(llvm::Function* fun); bool isIndirect(Value* val, set& visited); void Propagate(llvm::Function* fun); void Propagate(llvm::Value* v, const llvm::Twine& name, bool indirect = false); Value* ConstantRead(Function* fun, param& p); Value* handleSpecial(Function* fun, param& p); bool isSpecialType(Type*); string getSpecialTypeName(Type*); public: static char ID; R600KernelParameters() : FunctionPass(ID) {}; R600KernelParameters(const llvm::TargetData* TD) : FunctionPass(ID), TD(TD) {} // bool runOnFunction (llvm::Function &F); bool runOnFunction (llvm::Function &F); void getAnalysisUsage(AnalysisUsage &AU) const; const char *getPassName() const; bool doInitialization(Module &M); bool doFinalization(Module &M); }; char R600KernelParameters::ID = 0; static RegisterPass X("kerparam", "OpenCL Kernel Parameter conversion", false, false); int R600KernelParameters::getLastSpecialID(const string& TypeName) { int lastID = -1; for (vector::iterator i = params.begin(); i != params.end(); i++) { if (i->specialType == TypeName) { lastID = i->specialID; } } return lastID; } int R600KernelParameters::getListSize() { if (params.size() == 0) { return 0; } return params.back().end(); } bool R600KernelParameters::isIndirect(Value* val, set& visited) { if (isa(val)) { return false; } if (isa(val->getType())) { assert(0 and "Internal error"); return false; } if (visited.count(val)) { return false; } visited.insert(val); if (isa(val)) { GetElementPtrInst* GEP = dyn_cast(val); GetElementPtrInst::op_iterator i = GEP->op_begin(); for (i++; i != GEP->op_end(); i++) { if (!isa(*i)) { return true; } } } for (Value::use_iterator i = val->use_begin(); i != val->use_end(); i++) { Value* v2 = dyn_cast(*i); if (v2) { if (isIndirect(v2, visited)) { return true; } } } return false; } void R600KernelParameters::AddParam(llvm::Argument* arg) { param p; p.val = dyn_cast(arg); p.offset_in_dw = getListSize(); p.size_in_dw = calculateArgumentSize(arg); if (isa(arg->getType()) and arg->hasByValAttr()) { set visited; p.indirect = isIndirect(p.val, visited); } params.push_back(p); } int R600KernelParameters::calculateArgumentSize(llvm::Argument* arg) { Type* t = arg->getType(); if (arg->hasByValAttr() and dyn_cast(t)) { t = dyn_cast(t)->getElementType(); } int store_size_in_dw = (TD->getTypeStoreSize(t) + 3)/4; assert(store_size_in_dw); return store_size_in_dw; } void R600KernelParameters::RunAna(llvm::Function* fun) { assert(isOpenCLKernel(fun)); for (Function::arg_iterator i = fun->arg_begin(); i != fun->arg_end(); i++) { AddParam(i); } } void R600KernelParameters::Replace(llvm::Function* fun) { for (std::vector::iterator i = params.begin(); i != params.end(); i++) { Value *new_val; if (isSpecialType(i->val->getType())) { new_val = handleSpecial(fun, *i); } else { new_val = ConstantRead(fun, *i); } if (new_val) { i->val->replaceAllUsesWith(new_val); } } } void R600KernelParameters::Propagate(llvm::Function* fun) { for (std::vector::iterator i = params.begin(); i != params.end(); i++) { if (i->ptr_val) { Propagate(i->ptr_val, i->val->getName(), i->indirect); } } } void R600KernelParameters::Propagate(Value* v, const Twine& name, bool indirect) { LoadInst* load = dyn_cast(v); GetElementPtrInst *GEP = dyn_cast(v); unsigned addrspace; if (indirect) { addrspace = AMDILAS::PARAM_I_ADDRESS; } else { addrspace = AMDILAS::PARAM_D_ADDRESS; } if (GEP and GEP->getType()->getAddressSpace() != addrspace) { Value* op = GEP->getPointerOperand(); if (dyn_cast(op->getType())->getAddressSpace() != addrspace) { op = new BitCastInst(op, PointerType::get(dyn_cast(op->getType())->getElementType(), addrspace), name, dyn_cast(v)); } vector params(GEP->idx_begin(), GEP->idx_end()); GetElementPtrInst* GEP2 = GetElementPtrInst::Create(op, params, name, dyn_cast(v)); GEP2->setIsInBounds(GEP->isInBounds()); v = dyn_cast(GEP2); GEP->replaceAllUsesWith(GEP2); GEP->eraseFromParent(); load = NULL; } if (load) { if (load->getPointerAddressSpace() != addrspace) ///normally at this point we have the right address space { Value *orig_ptr = load->getPointerOperand(); PointerType *orig_ptr_type = dyn_cast(orig_ptr->getType()); Type* new_ptr_type = PointerType::get(orig_ptr_type->getElementType(), addrspace); Value* new_ptr = orig_ptr; if (orig_ptr->getType() != new_ptr_type) { new_ptr = new BitCastInst(orig_ptr, new_ptr_type, "prop_cast", load); } Value* new_load = new LoadInst(new_ptr, name, load); load->replaceAllUsesWith(new_load); load->eraseFromParent(); } return; } vector users(v->use_begin(), v->use_end()); for (int i = 0; i < int(users.size()); i++) { Value* v2 = dyn_cast(users[i]); if (v2) { Propagate(v2, name, indirect); } } } Value* R600KernelParameters::ConstantRead(Function* fun, param& p) { assert(fun->front().begin() != fun->front().end()); Instruction *first_inst = fun->front().begin(); IRBuilder <> builder (first_inst); /* First 3 dwords are reserved for the dimmension info */ if (!p.val->hasNUsesOrMore(1)) { return NULL; } unsigned addrspace; if (p.indirect) { addrspace = AMDILAS::PARAM_I_ADDRESS; } else { addrspace = AMDILAS::PARAM_D_ADDRESS; } Argument *arg = dyn_cast(p.val); Type * argType = p.val->getType(); PointerType * argPtrType = dyn_cast(p.val->getType()); if (argPtrType and arg->hasByValAttr()) { Value* param_addr_space_ptr = ConstantPointerNull::get(PointerType::get(Type::getInt32Ty(*Context), addrspace)); Value* param_ptr = GetElementPtrInst::Create(param_addr_space_ptr, ConstantInt::get(Type::getInt32Ty(*Context), p.get_rat_offset()), arg->getName(), first_inst); param_ptr = new BitCastInst(param_ptr, PointerType::get(argPtrType->getElementType(), addrspace), arg->getName(), first_inst); p.ptr_val = param_ptr; return param_ptr; } else { Value* param_addr_space_ptr = ConstantPointerNull::get(PointerType::get(argType, addrspace)); Value* param_ptr = builder.CreateGEP(param_addr_space_ptr, ConstantInt::get(Type::getInt32Ty(*Context), p.get_rat_offset()), arg->getName()); Value* param_value = builder.CreateLoad(param_ptr, arg->getName()); return param_value; } } Value* R600KernelParameters::handleSpecial(Function* fun, param& p) { string name = getSpecialTypeName(p.val->getType()); int ID; assert(!name.empty()); if (name == "image2d_t" or name == "image3d_t") { int lastID = max(getLastSpecialID("image2d_t"), getLastSpecialID("image3d_t")); if (lastID == -1) { ID = 2; ///ID0 and ID1 are used internally by the driver } else { ID = lastID + 1; } } else if (name == "sampler_t") { int lastID = getLastSpecialID("sampler_t"); if (lastID == -1) { ID = 0; } else { ID = lastID + 1; } } else { ///TODO: give some error message return NULL; } p.specialType = name; p.specialID = ID; Instruction *first_inst = fun->front().begin(); return new IntToPtrInst(ConstantInt::get(Type::getInt32Ty(*Context), p.specialID), p.val->getType(), "resourceID", first_inst); } bool R600KernelParameters::isSpecialType(Type* t) { return !getSpecialTypeName(t).empty(); } string R600KernelParameters::getSpecialTypeName(Type* t) { PointerType *pt = dyn_cast(t); StructType *st = NULL; if (pt) { st = dyn_cast(pt->getElementType()); } if (st) { string prefix = "struct.opencl_builtin_type_"; string name = st->getName().str(); if (name.substr(0, prefix.length()) == prefix) { return name.substr(prefix.length(), name.length()); } } return ""; } bool R600KernelParameters::runOnFunction (Function &F) { if (!isOpenCLKernel(&F)) { return false; } // F.dump(); RunAna(&F); Replace(&F); Propagate(&F); mod->dump(); return false; } void R600KernelParameters::getAnalysisUsage(AnalysisUsage &AU) const { // AU.addRequired(); FunctionPass::getAnalysisUsage(AU); AU.setPreservesAll(); } const char *R600KernelParameters::getPassName() const { return "OpenCL Kernel parameter conversion to memory"; } bool R600KernelParameters::doInitialization(Module &M) { Context = &M.getContext(); mod = &M; return false; } bool R600KernelParameters::doFinalization(Module &M) { return false; } llvm::FunctionPass* createR600KernelParametersPass(const llvm::TargetData* TD) { FunctionPass *p = new R600KernelParameters(TD); return p; }