// // Copyright 2012 Francisco Jerez // // Permission is hereby granted, free of charge, to any person obtaining a // copy of this software and associated documentation files (the "Software"), // to deal in the Software without restriction, including without limitation // the rights to use, copy, modify, merge, publish, distribute, sublicense, // and/or sell copies of the Software, and to permit persons to whom the // Software is furnished to do so, subject to the following conditions: // // The above copyright notice and this permission notice shall be included in // all copies or substantial portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL // THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR // OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, // ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR // OTHER DEALINGS IN THE SOFTWARE. // #include "core/compiler.hpp" #include #include #include #include #include #include #include #if HAVE_LLVM < 0x0305 #include #else #include #endif #if HAVE_LLVM < 0x0303 #include #include #include #else #include #include #include #include #include #endif #include #include #include #if HAVE_LLVM < 0x0303 #include #endif #include #include #if HAVE_LLVM < 0x0302 #include #elif HAVE_LLVM < 0x0303 #include #else #include #endif #include "pipe/p_state.h" #include "util/u_memory.h" #include "util/u_math.h" #include #include #include #include #include using namespace clover; namespace { #if 0 void build_binary(const std::string &source, const std::string &target, const std::string &name) { clang::CompilerInstance c; clang::EmitObjAction act(&llvm::getGlobalContext()); std::string log; llvm::raw_string_ostream s_log(log); LLVMInitializeTGSITarget(); LLVMInitializeTGSITargetInfo(); LLVMInitializeTGSITargetMC(); LLVMInitializeTGSIAsmPrinter(); c.getFrontendOpts().Inputs.push_back( std::make_pair(clang::IK_OpenCL, name)); c.getHeaderSearchOpts().UseBuiltinIncludes = false; c.getHeaderSearchOpts().UseStandardIncludes = false; c.getLangOpts().NoBuiltin = true; c.getTargetOpts().Triple = target; c.getInvocation().setLangDefaults(clang::IK_OpenCL); c.createDiagnostics(0, NULL, new clang::TextDiagnosticPrinter( s_log, c.getDiagnosticOpts())); c.getPreprocessorOpts().addRemappedFile( name, llvm::MemoryBuffer::getMemBuffer(source)); if (!c.ExecuteAction(act)) throw build_error(log); } module load_binary(const char *name) { std::ifstream fs((name)); std::vector str((std::istreambuf_iterator(fs)), (std::istreambuf_iterator())); compat::istream cs(str); return module::deserialize(cs); } #endif llvm::Module * compile(llvm::LLVMContext &llvm_ctx, const std::string &source, const std::string &name, const std::string &triple, const std::string &processor, const std::string &opts, clang::LangAS::Map& address_spaces, compat::string &r_log) { clang::CompilerInstance c; clang::EmitLLVMOnlyAction act(&llvm_ctx); std::string log; llvm::raw_string_ostream s_log(log); std::string libclc_path = LIBCLC_LIBEXECDIR + processor + "-" + triple + ".bc"; // Parse the compiler options: std::vector opts_array; std::istringstream ss(opts); while (!ss.eof()) { std::string opt; getline(ss, opt, ' '); opts_array.push_back(opt); } opts_array.push_back(name); std::vector opts_carray; for (unsigned i = 0; i < opts_array.size(); i++) { opts_carray.push_back(opts_array.at(i).c_str()); } llvm::IntrusiveRefCntPtr DiagID; llvm::IntrusiveRefCntPtr DiagOpts; clang::TextDiagnosticBuffer *DiagsBuffer; DiagID = new clang::DiagnosticIDs(); DiagOpts = new clang::DiagnosticOptions(); DiagsBuffer = new clang::TextDiagnosticBuffer(); clang::DiagnosticsEngine Diags(DiagID, &*DiagOpts, DiagsBuffer); bool Success; Success = clang::CompilerInvocation::CreateFromArgs(c.getInvocation(), opts_carray.data(), opts_carray.data() + opts_carray.size(), Diags); if (!Success) { throw error(CL_INVALID_BUILD_OPTIONS); } c.getFrontendOpts().ProgramAction = clang::frontend::EmitLLVMOnly; c.getHeaderSearchOpts().UseBuiltinIncludes = true; c.getHeaderSearchOpts().UseStandardSystemIncludes = true; c.getHeaderSearchOpts().ResourceDir = CLANG_RESOURCE_DIR; // Add libclc generic search path c.getHeaderSearchOpts().AddPath(LIBCLC_INCLUDEDIR, clang::frontend::Angled, false, false #if HAVE_LLVM < 0x0303 , false #endif ); // Add libclc include c.getPreprocessorOpts().Includes.push_back("clc/clc.h"); // clc.h requires that this macro be defined: c.getPreprocessorOpts().addMacroDef("cl_clang_storage_class_specifiers"); c.getPreprocessorOpts().addMacroDef("cl_khr_fp64"); c.getLangOpts().NoBuiltin = true; c.getTargetOpts().Triple = triple; c.getTargetOpts().CPU = processor; // This is a workaround for a Clang bug which causes the number // of warnings and errors to be printed to stderr. // http://www.llvm.org/bugs/show_bug.cgi?id=19735 c.getDiagnosticOpts().ShowCarets = false; #if HAVE_LLVM <= 0x0301 c.getInvocation().setLangDefaults(clang::IK_OpenCL); #else c.getInvocation().setLangDefaults(c.getLangOpts(), clang::IK_OpenCL, clang::LangStandard::lang_opencl11); #endif c.createDiagnostics( #if HAVE_LLVM < 0x0303 0, NULL, #endif new clang::TextDiagnosticPrinter( s_log, #if HAVE_LLVM <= 0x0301 c.getDiagnosticOpts())); #else &c.getDiagnosticOpts())); #endif c.getPreprocessorOpts().addRemappedFile(name, llvm::MemoryBuffer::getMemBuffer(source)); // Setting this attribute tells clang to link this file before // performing any optimizations. This is required so that // we can replace calls to the OpenCL C barrier() builtin // with calls to target intrinsics that have the noduplicate // attribute. This attribute will prevent Clang from creating // illegal uses of barrier() (e.g. Moving barrier() inside a conditional // that is no executed by all threads) during its optimizaton passes. c.getCodeGenOpts().LinkBitcodeFile = libclc_path; // Compile the code bool ExecSuccess = c.ExecuteAction(act); r_log = log; if (!ExecSuccess) throw build_error(); // Get address spaces map to be able to find kernel argument address space memcpy(address_spaces, c.getTarget().getAddressSpaceMap(), sizeof(address_spaces)); #if HAVE_LLVM >= 0x0306 return act.takeModule().release(); #else return act.takeModule(); #endif } void find_kernels(llvm::Module *mod, std::vector &kernels) { const llvm::NamedMDNode *kernel_node = mod->getNamedMetadata("opencl.kernels"); // This means there are no kernels in the program. The spec does not // require that we return an error here, but there will be an error if // the user tries to pass this program to a clCreateKernel() call. if (!kernel_node) { return; } for (unsigned i = 0; i < kernel_node->getNumOperands(); ++i) { kernels.push_back(llvm::dyn_cast( kernel_node->getOperand(i)->getOperand(0))); } } void internalize_functions(llvm::Module *mod, const std::vector &kernels) { llvm::PassManager PM; // Add a function internalizer pass. // // By default, the function internalizer pass will look for a function // called "main" and then mark all other functions as internal. Marking // functions as internal enables the optimizer to perform optimizations // like function inlining and global dead-code elimination. // // When there is no "main" function in a module, the internalize pass will // treat the module like a library, and it won't internalize any functions. // Since there is no "main" function in our kernels, we need to tell // the internalizer pass that this module is not a library by passing a // list of kernel functions to the internalizer. The internalizer will // treat the functions in the list as "main" functions and internalize // all of the other functions. std::vector export_list; for (std::vector::const_iterator I = kernels.begin(), E = kernels.end(); I != E; ++I) { llvm::Function *kernel = *I; export_list.push_back(kernel->getName().data()); } PM.add(llvm::createInternalizePass(export_list)); PM.run(*mod); } module build_module_llvm(llvm::Module *mod, const std::vector &kernels, clang::LangAS::Map& address_spaces) { module m; struct pipe_llvm_program_header header; llvm::SmallVector llvm_bitcode; llvm::raw_svector_ostream bitcode_ostream(llvm_bitcode); llvm::BitstreamWriter writer(llvm_bitcode); llvm::WriteBitcodeToFile(mod, bitcode_ostream); bitcode_ostream.flush(); for (unsigned i = 0; i < kernels.size(); ++i) { llvm::Function *kernel_func; std::string kernel_name; compat::vector args; kernel_func = kernels[i]; kernel_name = kernel_func->getName(); for (llvm::Function::arg_iterator I = kernel_func->arg_begin(), E = kernel_func->arg_end(); I != E; ++I) { llvm::Argument &arg = *I; #if HAVE_LLVM < 0x0302 llvm::TargetData TD(kernel_func->getParent()); #elif HAVE_LLVM < 0x0305 llvm::DataLayout TD(kernel_func->getParent()->getDataLayout()); #else llvm::DataLayout TD(mod); #endif llvm::Type *arg_type = arg.getType(); const unsigned arg_store_size = TD.getTypeStoreSize(arg_type); // OpenCL 1.2 specification, Ch. 6.1.5: "A built-in data // type that is not a power of two bytes in size must be // aligned to the next larger power of two". We need this // alignment for three element vectors, which have // non-power-of-2 store size. const unsigned arg_api_size = util_next_power_of_two(arg_store_size); llvm::Type *target_type = arg_type->isIntegerTy() ? TD.getSmallestLegalIntType(mod->getContext(), arg_store_size * 8) : arg_type; unsigned target_size = TD.getTypeStoreSize(target_type); unsigned target_align = TD.getABITypeAlignment(target_type); if (llvm::isa(arg_type) && arg.hasByValAttr()) { arg_type = llvm::dyn_cast(arg_type)->getElementType(); } if (arg_type->isPointerTy()) { unsigned address_space = llvm::cast(arg_type)->getAddressSpace(); if (address_space == address_spaces[clang::LangAS::opencl_local - clang::LangAS::Offset]) { args.push_back(module::argument(module::argument::local, arg_api_size, target_size, target_align, module::argument::zero_ext)); } else { // XXX: Correctly handle constant address space. There is no // way for r600g to pass a handle for constant buffers back // to clover like it can for global buffers, so // creating constant arguments will break r600g. For now, // continue treating constant buffers as global buffers // until we can come up with a way to create handles for // constant buffers. args.push_back(module::argument(module::argument::global, arg_api_size, target_size, target_align, module::argument::zero_ext)); } } else { llvm::AttributeSet attrs = kernel_func->getAttributes(); enum module::argument::ext_type ext_type = (attrs.hasAttribute(arg.getArgNo() + 1, llvm::Attribute::SExt) ? module::argument::sign_ext : module::argument::zero_ext); args.push_back( module::argument(module::argument::scalar, arg_api_size, target_size, target_align, ext_type)); } } m.syms.push_back(module::symbol(kernel_name, 0, i, args )); } header.num_bytes = llvm_bitcode.size(); std::string data; data.insert(0, (char*)(&header), sizeof(header)); data.insert(data.end(), llvm_bitcode.begin(), llvm_bitcode.end()); m.secs.push_back(module::section(0, module::section::text, header.num_bytes, data)); return m; } } // End anonymous namespace module clover::compile_program_llvm(const compat::string &source, enum pipe_shader_ir ir, const compat::string &target, const compat::string &opts, compat::string &r_log) { std::vector kernels; size_t processor_str_len = std::string(target.begin()).find_first_of("-"); std::string processor(target.begin(), 0, processor_str_len); std::string triple(target.begin(), processor_str_len + 1, target.size() - processor_str_len - 1); clang::LangAS::Map address_spaces; llvm::LLVMContext llvm_ctx; // The input file name must have the .cl extension in order for the // CompilerInvocation class to recognize it as an OpenCL source file. llvm::Module *mod = compile(llvm_ctx, source, "input.cl", triple, processor, opts, address_spaces, r_log); find_kernels(mod, kernels); internalize_functions(mod, kernels); module m; // Build the clover::module switch (ir) { case PIPE_SHADER_IR_TGSI: //XXX: Handle TGSI assert(0); m = module(); break; default: m = build_module_llvm(mod, kernels, address_spaces); break; } #if HAVE_LLVM >= 0x0306 // LLVM 3.6 and newer, the user takes ownership of the module. delete mod; #endif return m; }