/* * Copyright 2014 Advanced Micro Devices, Inc. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the * "Software"), to deal in the Software without restriction, including * without limitation the rights to use, copy, modify, merge, publish, * distribute, sub license, and/or sell copies of the Software, and to * permit persons to whom the Software is furnished to do so, subject to * the following conditions: * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE * USE OR OTHER DEALINGS IN THE SOFTWARE. * * The above copyright notice and this permission notice (including the * next paragraph) shall be included in all copies or substantial portions * of the Software. * */ /* based on Marek's patch to lp_bld_misc.cpp */ // Workaround http://llvm.org/PR23628 #pragma push_macro("DEBUG") #undef DEBUG #include "ac_binary.h" #include "ac_llvm_util.h" #include "ac_llvm_build.h" #include #include #include #include #include #include void ac_add_attr_dereferenceable(LLVMValueRef val, uint64_t bytes) { llvm::Argument *A = llvm::unwrap(val); A->addAttr(llvm::Attribute::getWithDereferenceableBytes(A->getContext(), bytes)); } bool ac_is_sgpr_param(LLVMValueRef arg) { llvm::Argument *A = llvm::unwrap(arg); llvm::AttributeList AS = A->getParent()->getAttributes(); unsigned ArgNo = A->getArgNo(); return AS.hasAttribute(ArgNo + 1, llvm::Attribute::InReg); } LLVMValueRef ac_llvm_get_called_value(LLVMValueRef call) { return LLVMGetCalledValue(call); } bool ac_llvm_is_function(LLVMValueRef v) { return LLVMGetValueKind(v) == LLVMFunctionValueKind; } LLVMModuleRef ac_create_module(LLVMTargetMachineRef tm, LLVMContextRef ctx) { llvm::TargetMachine *TM = reinterpret_cast(tm); LLVMModuleRef module = LLVMModuleCreateWithNameInContext("mesa-shader", ctx); llvm::unwrap(module)->setTargetTriple(TM->getTargetTriple().getTriple()); llvm::unwrap(module)->setDataLayout(TM->createDataLayout()); return module; } LLVMBuilderRef ac_create_builder(LLVMContextRef ctx, enum ac_float_mode float_mode) { LLVMBuilderRef builder = LLVMCreateBuilderInContext(ctx); llvm::FastMathFlags flags; switch (float_mode) { case AC_FLOAT_MODE_DEFAULT: break; case AC_FLOAT_MODE_NO_SIGNED_ZEROS_FP_MATH: flags.setNoSignedZeros(); llvm::unwrap(builder)->setFastMathFlags(flags); break; case AC_FLOAT_MODE_UNSAFE_FP_MATH: flags.setFast(); llvm::unwrap(builder)->setFastMathFlags(flags); break; } return builder; } LLVMTargetLibraryInfoRef ac_create_target_library_info(const char *triple) { return reinterpret_cast(new llvm::TargetLibraryInfoImpl(llvm::Triple(triple))); } void ac_dispose_target_library_info(LLVMTargetLibraryInfoRef library_info) { delete reinterpret_cast(library_info); } /* The LLVM compiler is represented as a pass manager containing passes for * optimizations, instruction selection, and code generation. */ struct ac_compiler_passes { ac_compiler_passes(): ostream(code_string) {} llvm::SmallString<0> code_string; /* ELF shader binary */ llvm::raw_svector_ostream ostream; /* stream for appending data to the binary */ llvm::legacy::PassManager passmgr; /* list of passes */ }; struct ac_compiler_passes *ac_create_llvm_passes(LLVMTargetMachineRef tm) { struct ac_compiler_passes *p = new ac_compiler_passes(); if (!p) return NULL; llvm::TargetMachine *TM = reinterpret_cast(tm); if (TM->addPassesToEmitFile(p->passmgr, p->ostream, nullptr, llvm::TargetMachine::CGFT_ObjectFile)) { fprintf(stderr, "amd: TargetMachine can't emit a file of this type!\n"); delete p; return NULL; } return p; } void ac_destroy_llvm_passes(struct ac_compiler_passes *p) { delete p; } /* This returns false on failure. */ bool ac_compile_module_to_binary(struct ac_compiler_passes *p, LLVMModuleRef module, struct ac_shader_binary *binary) { p->passmgr.run(*llvm::unwrap(module)); llvm::StringRef data = p->ostream.str(); bool success = ac_elf_read(data.data(), data.size(), binary); p->code_string = ""; /* release the ELF shader binary */ if (!success) fprintf(stderr, "amd: cannot read an ELF shader binary\n"); return success; } void ac_llvm_add_barrier_noop_pass(LLVMPassManagerRef passmgr) { llvm::unwrap(passmgr)->add(llvm::createBarrierNoopPass()); } void ac_enable_global_isel(LLVMTargetMachineRef tm) { reinterpret_cast(tm)->setGlobalISel(true); } LLVMValueRef ac_build_atomic_rmw(struct ac_llvm_context *ctx, LLVMAtomicRMWBinOp op, LLVMValueRef ptr, LLVMValueRef val, const char *sync_scope) { llvm::AtomicRMWInst::BinOp binop; switch (op) { case LLVMAtomicRMWBinOpXchg: binop = llvm::AtomicRMWInst::Xchg; break; case LLVMAtomicRMWBinOpAdd: binop = llvm::AtomicRMWInst::Add; break; case LLVMAtomicRMWBinOpSub: binop = llvm::AtomicRMWInst::Sub; break; case LLVMAtomicRMWBinOpAnd: binop = llvm::AtomicRMWInst::And; break; case LLVMAtomicRMWBinOpNand: binop = llvm::AtomicRMWInst::Nand; break; case LLVMAtomicRMWBinOpOr: binop = llvm::AtomicRMWInst::Or; break; case LLVMAtomicRMWBinOpXor: binop = llvm::AtomicRMWInst::Xor; break; case LLVMAtomicRMWBinOpMax: binop = llvm::AtomicRMWInst::Max; break; case LLVMAtomicRMWBinOpMin: binop = llvm::AtomicRMWInst::Min; break; case LLVMAtomicRMWBinOpUMax: binop = llvm::AtomicRMWInst::UMax; break; case LLVMAtomicRMWBinOpUMin: binop = llvm::AtomicRMWInst::UMin; break; default: unreachable(!"invalid LLVMAtomicRMWBinOp"); break; } unsigned SSID = llvm::unwrap(ctx->context)->getOrInsertSyncScopeID(sync_scope); return llvm::wrap(llvm::unwrap(ctx->builder)->CreateAtomicRMW( binop, llvm::unwrap(ptr), llvm::unwrap(val), llvm::AtomicOrdering::SequentiallyConsistent, SSID)); } LLVMValueRef ac_build_atomic_cmp_xchg(struct ac_llvm_context *ctx, LLVMValueRef ptr, LLVMValueRef cmp, LLVMValueRef val, const char *sync_scope) { unsigned SSID = llvm::unwrap(ctx->context)->getOrInsertSyncScopeID(sync_scope); return llvm::wrap(llvm::unwrap(ctx->builder)->CreateAtomicCmpXchg( llvm::unwrap(ptr), llvm::unwrap(cmp), llvm::unwrap(val), llvm::AtomicOrdering::SequentiallyConsistent, llvm::AtomicOrdering::SequentiallyConsistent, SSID)); }