// // Copyright 2012-2016 Francisco Jerez // Copyright 2012-2016 Advanced Micro Devices, Inc. // Copyright 2014-2016 Jan Vesely // Copyright 2014-2015 Serge Martin // Copyright 2015 Zoltan Gilian // // Permission is hereby granted, free of charge, to any person obtaining a // copy of this software and associated documentation files (the "Software"), // to deal in the Software without restriction, including without limitation // the rights to use, copy, modify, merge, publish, distribute, sublicense, // and/or sell copies of the Software, and to permit persons to whom the // Software is furnished to do so, subject to the following conditions: // // The above copyright notice and this permission notice shall be included in // all copies or substantial portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL // THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR // OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, // ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR // OTHER DEALINGS IN THE SOFTWARE. // #include #include #include #include #include #include #ifdef HAVE_CLOVER_SPIRV #include #endif #include #include #include #include #include // We need to include internal headers last, because the internal headers // include CL headers which have #define's like: // //#define cl_khr_gl_sharing 1 //#define cl_khr_icd 1 // // Which will break the compilation of clang/Basic/OpenCLOptions.h #include "core/error.hpp" #include "llvm/codegen.hpp" #include "llvm/compat.hpp" #include "llvm/invocation.hpp" #include "llvm/metadata.hpp" #include "llvm/util.hpp" #ifdef HAVE_CLOVER_SPIRV #include "spirv/invocation.hpp" #endif #include "util/algorithm.hpp" using clover::binary; using clover::device; using clover::build_error; using clover::invalid_build_options_error; using clover::map; using clover::header_map; using namespace clover::llvm; using ::llvm::Function; using ::llvm::LLVMContext; using ::llvm::Module; using ::llvm::raw_string_ostream; namespace { static const cl_version ANY_VERSION = CL_MAKE_VERSION(9, 9, 9); const cl_version cl_versions[] = { CL_MAKE_VERSION(1, 1, 0), CL_MAKE_VERSION(1, 2, 0), CL_MAKE_VERSION(2, 0, 0), CL_MAKE_VERSION(2, 1, 0), CL_MAKE_VERSION(2, 2, 0), CL_MAKE_VERSION(3, 0, 0), }; struct clc_version_lang_std { cl_version version_number; // CLC Version clang::LangStandard::Kind clc_lang_standard; }; const clc_version_lang_std cl_version_lang_stds[] = { { CL_MAKE_VERSION(1, 0, 0), clang::LangStandard::lang_opencl10}, { CL_MAKE_VERSION(1, 1, 0), clang::LangStandard::lang_opencl11}, { CL_MAKE_VERSION(1, 2, 0), clang::LangStandard::lang_opencl12}, { CL_MAKE_VERSION(2, 0, 0), clang::LangStandard::lang_opencl20}, #if LLVM_VERSION_MAJOR >= 12 { CL_MAKE_VERSION(3, 0, 0), clang::LangStandard::lang_opencl30}, #endif }; bool are_equal(cl_version_khr version1, cl_version_khr version2, bool ignore_patch_version = false) { if (ignore_patch_version) { version1 &= ~CL_VERSION_PATCH_MASK_KHR; version2 &= ~CL_VERSION_PATCH_MASK_KHR; } return version1 == version2; } void init_targets() { static bool targets_initialized = false; if (!targets_initialized) { LLVMInitializeAllTargets(); LLVMInitializeAllTargetInfos(); LLVMInitializeAllTargetMCs(); LLVMInitializeAllAsmParsers(); LLVMInitializeAllAsmPrinters(); targets_initialized = true; } } void diagnostic_handler(const ::llvm::DiagnosticInfo &di, void *data) { if (di.getSeverity() == ::llvm::DS_Error) { raw_string_ostream os { *reinterpret_cast(data) }; ::llvm::DiagnosticPrinterRawOStream printer { os }; di.print(printer); throw build_error(); } } std::unique_ptr create_context(std::string &r_log) { init_targets(); std::unique_ptr ctx { new LLVMContext }; ctx->setDiagnosticHandlerCallBack(diagnostic_handler, &r_log); return ctx; } const struct clc_version_lang_std& get_cl_lang_standard(unsigned requested, unsigned max = ANY_VERSION) { for (const struct clc_version_lang_std &version : cl_version_lang_stds) { if (version.version_number == max || version.version_number == requested) { return version; } } throw build_error("Unknown/Unsupported language version"); } const cl_version get_cl_version(cl_version requested, cl_version max = ANY_VERSION) { for (const auto &version : cl_versions) { if (are_equal(version, max, true) || are_equal(version, requested, true)) { return version; } } throw build_error("Unknown/Unsupported language version"); } clang::LangStandard::Kind get_lang_standard_from_version(const cl_version input_version, bool is_build_opt = false) { //Per CL 2.0 spec, section 5.8.4.5: // If it's an option, use the value directly. // If it's a device version, clamp to max 1.x version, a.k.a. 1.2 const cl_version version = get_cl_version(input_version, is_build_opt ? ANY_VERSION : 120); const struct clc_version_lang_std standard = get_cl_lang_standard(version); return standard.clc_lang_standard; } clang::LangStandard::Kind get_language_version(const std::vector &opts, const cl_version device_version) { const std::string search = "-cl-std=CL"; for (auto &opt: opts) { auto pos = opt.find(search); if (pos == 0){ std::stringstream ver_str(opt.substr(pos + search.size())); unsigned int ver_major = 0; char separator = '\0'; unsigned int ver_minor = 0; ver_str >> ver_major >> separator >> ver_minor; if (ver_str.fail() || ver_str.bad() || !ver_str.eof() || separator != '.') { throw build_error(); } const auto ver = CL_MAKE_VERSION_KHR(ver_major, ver_minor, 0); const auto device_ver = get_cl_version(device_version); const auto requested = get_cl_version(ver); if (requested > device_ver) { throw build_error(); } return get_lang_standard_from_version(ver, true); } } return get_lang_standard_from_version(device_version); } std::unique_ptr create_compiler_instance(const device &dev, const std::string& ir_target, const std::vector &opts, std::string &r_log) { std::unique_ptr c { new clang::CompilerInstance }; clang::TextDiagnosticBuffer *diag_buffer = new clang::TextDiagnosticBuffer; clang::DiagnosticsEngine diag { new clang::DiagnosticIDs, new clang::DiagnosticOptions, diag_buffer }; // Parse the compiler options. A file name should be present at the end // and must have the .cl extension in order for the CompilerInvocation // class to recognize it as an OpenCL source file. #if LLVM_VERSION_MAJOR >= 12 std::vector copts; for (auto &opt : opts) { if (opt == "-cl-denorms-are-zero") copts.push_back("-fdenormal-fp-math=positive-zero"); else copts.push_back(opt.c_str()); } #else const std::vector copts = map(std::mem_fn(&std::string::c_str), opts); #endif const target &target = ir_target; const cl_version device_clc_version = dev.device_clc_version(); if (!compat::create_compiler_invocation_from_args( c->getInvocation(), copts, diag)) throw invalid_build_options_error(); diag_buffer->FlushDiagnostics(diag); if (diag.hasErrorOccurred()) throw invalid_build_options_error(); c->getTargetOpts().CPU = target.cpu; c->getTargetOpts().Triple = target.triple; c->getLangOpts().NoBuiltin = true; #if LLVM_VERSION_MAJOR >= 13 c->getTargetOpts().OpenCLExtensionsAsWritten.push_back("-__opencl_c_generic_address_space"); c->getTargetOpts().OpenCLExtensionsAsWritten.push_back("-__opencl_c_pipes"); c->getTargetOpts().OpenCLExtensionsAsWritten.push_back("-__opencl_c_device_enqueue"); c->getTargetOpts().OpenCLExtensionsAsWritten.push_back("-__opencl_c_program_scope_global_variables"); c->getTargetOpts().OpenCLExtensionsAsWritten.push_back("-__opencl_c_subgroups"); c->getTargetOpts().OpenCLExtensionsAsWritten.push_back("-__opencl_c_work_group_collective_functions"); c->getTargetOpts().OpenCLExtensionsAsWritten.push_back("-__opencl_c_atomic_scope_device"); c->getTargetOpts().OpenCLExtensionsAsWritten.push_back("-__opencl_c_atomic_order_seq_cst"); #endif // This is a workaround for a Clang bug which causes the number // of warnings and errors to be printed to stderr. // http://www.llvm.org/bugs/show_bug.cgi?id=19735 c->getDiagnosticOpts().ShowCarets = false; compat::compiler_set_lang_defaults(c, compat::ik_opencl, ::llvm::Triple(target.triple), get_language_version(opts, device_clc_version)); c->createDiagnostics(new clang::TextDiagnosticPrinter( *new raw_string_ostream(r_log), &c->getDiagnosticOpts(), true)); c->setTarget(clang::TargetInfo::CreateTargetInfo( c->getDiagnostics(), c->getInvocation().TargetOpts)); return c; } std::unique_ptr compile(LLVMContext &ctx, clang::CompilerInstance &c, const std::string &name, const std::string &source, const header_map &headers, const device &dev, const std::string &opts, bool use_libclc, std::string &r_log) { c.getFrontendOpts().ProgramAction = clang::frontend::EmitLLVMOnly; c.getHeaderSearchOpts().UseBuiltinIncludes = true; c.getHeaderSearchOpts().UseStandardSystemIncludes = true; c.getHeaderSearchOpts().ResourceDir = CLANG_RESOURCE_DIR; if (use_libclc) { // Add libclc generic search path c.getHeaderSearchOpts().AddPath(LIBCLC_INCLUDEDIR, clang::frontend::Angled, false, false); // Add libclc include c.getPreprocessorOpts().Includes.push_back("clc/clc.h"); } else { // Add opencl-c generic search path c.getHeaderSearchOpts().AddPath(CLANG_RESOURCE_DIR, clang::frontend::Angled, false, false); // Add opencl include c.getPreprocessorOpts().Includes.push_back("opencl-c.h"); } // Add definition for the OpenCL version const auto dev_version = dev.device_version(); c.getPreprocessorOpts().addMacroDef("__OPENCL_VERSION__=" + std::to_string(CL_VERSION_MAJOR_KHR(dev_version)) + std::to_string(CL_VERSION_MINOR_KHR(dev_version)) + "0"); if (CL_VERSION_MAJOR(dev.version) >= 3) { const auto features = dev.opencl_c_features(); for (const auto &feature : features) c.getPreprocessorOpts().addMacroDef(feature.name); } // clc.h requires that this macro be defined: c.getPreprocessorOpts().addMacroDef("cl_clang_storage_class_specifiers"); c.getPreprocessorOpts().addRemappedFile( name, ::llvm::MemoryBuffer::getMemBuffer(source).release()); if (headers.size()) { const std::string tmp_header_path = "/tmp/clover/"; c.getHeaderSearchOpts().AddPath(tmp_header_path, clang::frontend::Angled, false, false); for (const auto &header : headers) c.getPreprocessorOpts().addRemappedFile( tmp_header_path + header.first, ::llvm::MemoryBuffer::getMemBuffer(header.second).release()); } // Tell clang to link this file before performing any // optimizations. This is required so that we can replace calls // to the OpenCL C barrier() builtin with calls to target // intrinsics that have the noduplicate attribute. This // attribute will prevent Clang from creating illegal uses of // barrier() (e.g. Moving barrier() inside a conditional that is // no executed by all threads) during its optimizaton passes. if (use_libclc) { clang::CodeGenOptions::BitcodeFileToLink F; F.Filename = LIBCLC_LIBEXECDIR + dev.ir_target() + ".bc"; F.PropagateAttrs = true; F.LinkFlags = ::llvm::Linker::Flags::None; c.getCodeGenOpts().LinkBitcodeFiles.emplace_back(F); } // undefine __IMAGE_SUPPORT__ for device without image support if (!dev.image_support()) c.getPreprocessorOpts().addMacroUndef("__IMAGE_SUPPORT__"); // Compile the code clang::EmitLLVMOnlyAction act(&ctx); if (!c.ExecuteAction(act)) throw build_error(); return act.takeModule(); } #ifdef HAVE_CLOVER_SPIRV SPIRV::TranslatorOpts get_spirv_translator_options(const device &dev) { const auto supported_versions = clover::spirv::supported_versions(); const auto max_supported = clover::spirv::to_spirv_version_encoding(supported_versions.back().version); const auto maximum_spirv_version = std::min(static_cast(max_supported), SPIRV::VersionNumber::MaximumVersion); SPIRV::TranslatorOpts::ExtensionsStatusMap spirv_extensions; for (auto &ext : clover::spirv::supported_extensions()) { #define EXT(X) if (ext == #X) spirv_extensions.insert({ SPIRV::ExtensionID::X, true }); #include #undef EXT } return SPIRV::TranslatorOpts(maximum_spirv_version, spirv_extensions); } #endif } binary clover::llvm::compile_program(const std::string &source, const header_map &headers, const device &dev, const std::string &opts, std::string &r_log) { if (has_flag(debug::clc)) debug::log(".cl", "// Options: " + opts + '\n' + source); auto ctx = create_context(r_log); auto c = create_compiler_instance(dev, dev.ir_target(), tokenize(opts + " input.cl"), r_log); auto mod = compile(*ctx, *c, "input.cl", source, headers, dev, opts, true, r_log); if (has_flag(debug::llvm)) debug::log(".ll", print_module_bitcode(*mod)); return build_module_library(*mod, binary::section::text_intermediate); } namespace { void optimize(Module &mod, unsigned optimization_level, bool internalize_symbols) { ::llvm::legacy::PassManager pm; // By default, the function internalizer pass will look for a function // called "main" and then mark all other functions as internal. Marking // functions as internal enables the optimizer to perform optimizations // like function inlining and global dead-code elimination. // // When there is no "main" function in a binary, the internalize pass will // treat the binary like a library, and it won't internalize any functions. // Since there is no "main" function in our kernels, we need to tell // the internalizer pass that this binary is not a library by passing a // list of kernel functions to the internalizer. The internalizer will // treat the functions in the list as "main" functions and internalize // all of the other functions. if (internalize_symbols) { std::vector names = map(std::mem_fn(&Function::getName), get_kernels(mod)); pm.add(::llvm::createInternalizePass( [=](const ::llvm::GlobalValue &gv) { return std::find(names.begin(), names.end(), gv.getName()) != names.end(); })); } ::llvm::PassManagerBuilder pmb; pmb.OptLevel = optimization_level; pmb.LibraryInfo = new ::llvm::TargetLibraryInfoImpl( ::llvm::Triple(mod.getTargetTriple())); pmb.populateModulePassManager(pm); pm.run(mod); } std::unique_ptr link(LLVMContext &ctx, const clang::CompilerInstance &c, const std::vector &binaries, std::string &r_log) { std::unique_ptr mod { new Module("link", ctx) }; std::unique_ptr< ::llvm::Linker> linker { new ::llvm::Linker(*mod) }; for (auto &b : binaries) { if (linker->linkInModule(parse_module_library(b, ctx, r_log))) throw build_error(); } return mod; } } binary clover::llvm::link_program(const std::vector &binaries, const device &dev, const std::string &opts, std::string &r_log) { std::vector options = tokenize(opts + " input.cl"); const bool create_library = count("-create-library", options); erase_if(equals("-create-library"), options); auto ctx = create_context(r_log); auto c = create_compiler_instance(dev, dev.ir_target(), options, r_log); auto mod = link(*ctx, *c, binaries, r_log); optimize(*mod, c->getCodeGenOpts().OptimizationLevel, !create_library); static std::atomic_uint seq(0); const std::string id = "." + mod->getModuleIdentifier() + "-" + std::to_string(seq++); if (has_flag(debug::llvm)) debug::log(id + ".ll", print_module_bitcode(*mod)); if (create_library) { return build_module_library(*mod, binary::section::text_library); } else if (dev.ir_format() == PIPE_SHADER_IR_NATIVE) { if (has_flag(debug::native)) debug::log(id + ".asm", print_module_native(*mod, dev.ir_target())); return build_module_native(*mod, dev.ir_target(), *c, r_log); } else { unreachable("Unsupported IR."); } } #ifdef HAVE_CLOVER_SPIRV binary clover::llvm::compile_to_spirv(const std::string &source, const header_map &headers, const device &dev, const std::string &opts, std::string &r_log) { if (has_flag(debug::clc)) debug::log(".cl", "// Options: " + opts + '\n' + source); auto ctx = create_context(r_log); const std::string target = dev.address_bits() == 32u ? "-spir-unknown-unknown" : "-spir64-unknown-unknown"; auto c = create_compiler_instance(dev, target, tokenize(opts + " -O0 -fgnu89-inline input.cl"), r_log); auto mod = compile(*ctx, *c, "input.cl", source, headers, dev, opts, false, r_log); if (has_flag(debug::llvm)) debug::log(".ll", print_module_bitcode(*mod)); const auto spirv_options = get_spirv_translator_options(dev); std::string error_msg; std::ostringstream os; if (!::llvm::writeSpirv(mod.get(), spirv_options, os, error_msg)) { r_log += "Translation from LLVM IR to SPIR-V failed: " + error_msg + ".\n"; throw error(CL_INVALID_VALUE); } const std::string osContent = os.str(); std::string binary(osContent.begin(), osContent.end()); if (binary.empty()) { r_log += "Failed to retrieve SPIR-V binary.\n"; throw error(CL_INVALID_VALUE); } if (has_flag(debug::spirv)) debug::log(".spvasm", spirv::print_module(binary, dev.device_version())); return spirv::compile_program(binary, dev, r_log); } #endif