e682abb47e
SWDEV-94610 - Code provided by Wilkin - Implement the roc Program Manager to call the Lightning Compiler instead of the compiler library. - Embed and use the pre-compiled header generated by the built-in library build - If LLVM_BIN is not set, try to find Clang from the libamdocl path Testing: http://ocltc.amd.com:8111/viewModification.html?modId=75068&personal=true&buildTypeId=&tab=vcsModificationBuilds&show_all_builds=true Affected files ... ... //depot/stg/opencl/drivers/opencl/compiler/lib/loaders/elf/elf.cpp#35 edit ... //depot/stg/opencl/drivers/opencl/compiler/lib/loaders/elf/elf.hpp#24 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/blitcl.cpp#9 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/device.cpp#200 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/build/Makefile.oclrocm#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/roccompiler.cpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocdevice.cpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rockernel.cpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rockernel.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocmetadata.cpp#1 add ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocmetadata.hpp#1 add ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocprogram.cpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocprogram.hpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocvirtual.cpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/program.cpp#81 edit
1326 lines
50 KiB
C++
1326 lines
50 KiB
C++
//
|
|
// Copyright (c) 2008 Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
|
|
|
|
#ifndef WITHOUT_HSA_BACKEND
|
|
|
|
#include "rocprogram.hpp"
|
|
|
|
#include "compiler/lib/loaders/elf/elf.hpp"
|
|
#include "compiler/lib/utils/options.hpp"
|
|
#include "rockernel.hpp"
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
#include "driver/AmdCompiler.h"
|
|
#include "opencl-c.amdgcn.inc"
|
|
#include "builtins-irif.amdgcn.inc"
|
|
#include "builtins-ockl.amdgcn.inc"
|
|
#include "builtins-ocml.amdgcn.inc"
|
|
#include "builtins-opencl.amdgcn.inc"
|
|
#include "correctly_rounded_sqrt_off.amdgcn.inc"
|
|
#include "correctly_rounded_sqrt_on.amdgcn.inc"
|
|
#include "daz_opt_off.amdgcn.inc"
|
|
#include "daz_opt_on.amdgcn.inc"
|
|
#include "finite_only_off.amdgcn.inc"
|
|
#include "finite_only_on.amdgcn.inc"
|
|
#include "isa_version_701.amdgcn.inc"
|
|
#include "isa_version_800.amdgcn.inc"
|
|
#include "isa_version_801.amdgcn.inc"
|
|
#include "isa_version_802.amdgcn.inc"
|
|
#include "isa_version_803.amdgcn.inc"
|
|
#include "isa_version_804.amdgcn.inc"
|
|
#include "isa_version_810.amdgcn.inc"
|
|
#include "unsafe_math_off.amdgcn.inc"
|
|
#include "unsafe_math_on.amdgcn.inc"
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
#include "roccompilerlib.hpp"
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
#include "utils/bif_section_labels.hpp"
|
|
|
|
#include <string>
|
|
#include <vector>
|
|
#include <cstring>
|
|
#include <fstream>
|
|
#include <sstream>
|
|
#include <iostream>
|
|
#include <istream>
|
|
|
|
|
|
#endif // WITHOUT_HSA_BACKEND
|
|
|
|
namespace roc {
|
|
#ifndef WITHOUT_HSA_BACKEND
|
|
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
static hsa_status_t GetKernelNamesCallback(
|
|
hsa_executable_t exec,
|
|
hsa_executable_symbol_t symbol,
|
|
void *data ) {
|
|
std::vector<std::string>* symNameList = (reinterpret_cast<std::vector<std::string> *>(data));
|
|
|
|
hsa_symbol_kind_t sym_type;
|
|
hsa_executable_symbol_get_info(symbol, HSA_EXECUTABLE_SYMBOL_INFO_TYPE, &sym_type);
|
|
|
|
if (sym_type == HSA_SYMBOL_KIND_KERNEL) {
|
|
uint32_t len;
|
|
hsa_executable_symbol_get_info(symbol, HSA_EXECUTABLE_SYMBOL_INFO_NAME_LENGTH, &len);
|
|
|
|
char* symName = (char*) malloc(len);
|
|
hsa_executable_symbol_get_info(symbol, HSA_EXECUTABLE_SYMBOL_INFO_NAME, symName);
|
|
|
|
std::string kernelName(symName,len);
|
|
symNameList->push_back(kernelName);
|
|
|
|
free(symName);
|
|
}
|
|
|
|
return HSA_STATUS_SUCCESS;
|
|
}
|
|
#endif // defined(WITH_LIGHTNING_COMPILER)
|
|
|
|
/* Temporary log function for the compiler library */
|
|
static void logFunction(const char *msg, size_t size) {
|
|
std::cout << "Compiler Library log :" << msg << std::endl;
|
|
}
|
|
|
|
HSAILProgram::~HSAILProgram() {
|
|
acl_error error;
|
|
// Free the elf binary
|
|
if (binaryElf_ != NULL) {
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
if (lcBinaryElf_) {
|
|
free(lcBinaryElf_);
|
|
}
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
error = g_complibApi._aclBinaryFini(binaryElf_);
|
|
if (error != ACL_SUCCESS) {
|
|
LogWarning( "Error while destroying the acl binary \n" );
|
|
}
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
}
|
|
// Destroy the executable.
|
|
if (hsaExecutable_.handle != 0) {
|
|
hsa_executable_destroy(hsaExecutable_);
|
|
}
|
|
// Destroy the code object.
|
|
if (hsaProgramCodeObject_.handle != 0) {
|
|
hsa_code_object_destroy(hsaProgramCodeObject_);
|
|
}
|
|
// Destroy the program handle.
|
|
if (hsaProgramHandle_.handle != 0) {
|
|
hsa_ext_program_destroy(hsaProgramHandle_);
|
|
}
|
|
destroyBrigModule();
|
|
destroyBrigContainer();
|
|
releaseClBinary();
|
|
}
|
|
|
|
HSAILProgram::HSAILProgram(roc::NullDevice& device): device::Program(device),
|
|
llvmBinary_(),
|
|
binaryElf_(NULL),
|
|
device_(device),
|
|
brigModule_(NULL),
|
|
hsaBrigContainer_(NULL)
|
|
{
|
|
memset(&binOpts_, 0, sizeof(binOpts_));
|
|
binOpts_.struct_size = sizeof(binOpts_);
|
|
//binOpts_.elfclass = LP64_SWITCH( ELFCLASS32, ELFCLASS64 );
|
|
//Setting as 32 bit because hsail64 returns an invalid aclTargetInfo
|
|
//when aclGetTargetInfo is called - EPR# 377910
|
|
binOpts_.elfclass = ELFCLASS32;
|
|
binOpts_.bitness = ELFDATA2LSB;
|
|
binOpts_.alloc = &::malloc;
|
|
binOpts_.dealloc = &::free;
|
|
hsaProgramHandle_.handle = 0;
|
|
hsaProgramCodeObject_.handle = 0;
|
|
hsaExecutable_.handle = 0;
|
|
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
lcProgramCodeObject_.handle = 0;
|
|
lcExecutable_.handle = 0;
|
|
codeObjBinary_ = NULL;
|
|
lcBinaryElf_ = NULL;
|
|
lcBinaryElfSize_ = 0;
|
|
#endif // defined(WITH_LIGHTNING_COMPILER)
|
|
}
|
|
|
|
bool HSAILProgram::initClBinary(char *binaryIn, size_t size) { // Save the
|
|
// original
|
|
// binary that
|
|
// isn't owned
|
|
// by ClBinary
|
|
clBinary()->saveOrigBinary(binaryIn, size);
|
|
|
|
char *bin = binaryIn;
|
|
size_t sz = size;
|
|
|
|
int encryptCode;
|
|
|
|
char *decryptedBin;
|
|
size_t decryptedSize;
|
|
if (!clBinary()->decryptElf(binaryIn, size,
|
|
&decryptedBin, &decryptedSize, &encryptCode)) {
|
|
return false;
|
|
}
|
|
if (decryptedBin != NULL) {
|
|
// It is decrypted binary.
|
|
bin = decryptedBin;
|
|
sz = decryptedSize;
|
|
}
|
|
|
|
// Both 32-bit and 64-bit are allowed!
|
|
if (!amd::isElfMagic(bin)) {
|
|
// Invalid binary.
|
|
if (decryptedBin != NULL) {
|
|
delete[]decryptedBin;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
clBinary()->setFlags(encryptCode);
|
|
|
|
return clBinary()->setBinary(bin, sz, (decryptedBin != NULL));
|
|
}
|
|
|
|
|
|
bool HSAILProgram::initBuild(amd::option::Options *options) {
|
|
compileOptions_ = options->origOptionStr;
|
|
|
|
if (!device::Program::initBuild(options)) {
|
|
return false;
|
|
}
|
|
// Elf Binary setup
|
|
std::string outFileName;
|
|
|
|
// true means hsail required
|
|
clBinary()->init(options, true);
|
|
if (options->isDumpFlagSet(amd::option::DUMP_BIF)) {
|
|
outFileName = options->getDumpFileName(".bin");
|
|
}
|
|
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
bool useELF64 = true;
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
bool useELF64 = getCompilerOptions()->oVariables->EnableGpuElf64;
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
if (!clBinary()->setElfOut(useELF64 ? ELFCLASS64 : ELFCLASS32,
|
|
(outFileName.size() >
|
|
0) ? outFileName.c_str() : NULL)) {
|
|
LogError("Setup elf out for gpu failed");
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
// ! post-compile setup for GPU
|
|
bool HSAILProgram::finiBuild(bool isBuildGood) {
|
|
clBinary()->resetElfOut();
|
|
clBinary()->resetElfIn();
|
|
|
|
if (!isBuildGood) {
|
|
// Prevent the encrypted binary form leaking out
|
|
clBinary()->setBinary(NULL, 0);
|
|
|
|
}
|
|
|
|
return device::Program::finiBuild(isBuildGood);
|
|
}
|
|
|
|
static char *readFile(std::string source_filename, size_t &size) {
|
|
FILE *fp = ::fopen(source_filename.c_str(), "rb");
|
|
unsigned int length;
|
|
size_t offset = 0;
|
|
char *ptr;
|
|
|
|
if (!fp) {
|
|
return NULL;
|
|
}
|
|
|
|
// obtain file size.
|
|
::fseek(fp, 0, SEEK_END);
|
|
length = ::ftell(fp);
|
|
::rewind(fp);
|
|
|
|
ptr = reinterpret_cast<char *>(malloc(offset + length + 1));
|
|
if (length != fread(&ptr[offset], 1, length, fp)) {
|
|
free(ptr);
|
|
return NULL;
|
|
}
|
|
|
|
ptr[offset + length] = '\0';
|
|
size = offset + length;
|
|
::fclose(fp);
|
|
return ptr;
|
|
}
|
|
|
|
aclType HSAILProgram::getCompilationStagesFromBinary(std::vector<aclType>& completeStages, bool& needOptionsCheck)
|
|
{
|
|
acl_error errorCode;
|
|
size_t secSize = 0;
|
|
completeStages.clear();
|
|
aclType from = ACL_TYPE_DEFAULT;
|
|
needOptionsCheck = true;
|
|
size_t boolSize = sizeof(bool);
|
|
//! @todo Should we also check for ACL_TYPE_OPENCL & ACL_TYPE_LLVMIR_TEXT?
|
|
// Checking llvmir in .llvmir section
|
|
bool containsLlvmirText = true;
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
// TODO:FIXME_Wilkin - Query
|
|
bool containsOpts = false;
|
|
bool containsHsailText = false;
|
|
bool containsBrig = false;
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
errorCode = g_complibApi._aclQueryInfo(device().compiler(), binaryElf_, RT_CONTAINS_LLVMIR, NULL, &containsLlvmirText, &boolSize);
|
|
if (errorCode != ACL_SUCCESS) {
|
|
containsLlvmirText = false;
|
|
}
|
|
// Checking compile & link options in .comment section
|
|
bool containsOpts = true;
|
|
errorCode = g_complibApi._aclQueryInfo(device().compiler(), binaryElf_, RT_CONTAINS_OPTIONS, NULL, &containsOpts, &boolSize);
|
|
if (errorCode != ACL_SUCCESS) {
|
|
containsOpts = false;
|
|
}
|
|
if (containsLlvmirText && containsOpts) {
|
|
completeStages.push_back(from);
|
|
from = ACL_TYPE_LLVMIR_BINARY;
|
|
}
|
|
// Checking HSAIL in .cg section
|
|
bool containsHsailText = true;
|
|
errorCode = g_complibApi._aclQueryInfo(device().compiler(), binaryElf_, RT_CONTAINS_HSAIL, NULL, &containsHsailText, &boolSize);
|
|
if (errorCode != ACL_SUCCESS) {
|
|
containsHsailText = false;
|
|
}
|
|
// Checking BRIG sections
|
|
bool containsBrig = true;
|
|
errorCode = g_complibApi._aclQueryInfo(device().compiler(), binaryElf_, RT_CONTAINS_BRIG, NULL, &containsBrig, &boolSize);
|
|
if (errorCode != ACL_SUCCESS) {
|
|
containsBrig = false;
|
|
}
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
if (containsBrig) {
|
|
completeStages.push_back(from);
|
|
from = ACL_TYPE_HSAIL_BINARY;
|
|
// Here we should check that CG stage was done.
|
|
// Right now there are 2 criterions to check it (besides BRIG itself):
|
|
// 1. matadata symbols symOpenclKernel for every kernel.
|
|
// 2. HSAIL text in aclCODEGEN section.
|
|
// Unfortunately there is no appropriate way in Compiler Lib to check 1.
|
|
// because kernel names are unknown here, therefore only 2.
|
|
if (containsHsailText) {
|
|
completeStages.push_back(from);
|
|
from = ACL_TYPE_CG;
|
|
}
|
|
}
|
|
else if (containsHsailText) {
|
|
completeStages.push_back(from);
|
|
from = ACL_TYPE_HSAIL_TEXT;
|
|
}
|
|
// Checking ISA in .text section
|
|
bool containsShaderIsa = true;
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
assert(!"FIXME_Wilkin");
|
|
errorCode = ACL_ERROR;
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
errorCode = g_complibApi._aclQueryInfo(device().compiler(), binaryElf_, RT_CONTAINS_ISA, NULL, &containsShaderIsa, &boolSize);
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
if (errorCode != ACL_SUCCESS) {
|
|
containsShaderIsa = false;
|
|
}
|
|
if (containsShaderIsa) {
|
|
completeStages.push_back(from);
|
|
from = ACL_TYPE_ISA;
|
|
}
|
|
std::string sCurOptions = compileOptions_ + linkOptions_;
|
|
amd::option::Options curOptions;
|
|
if (!amd::option::parseAllOptions(sCurOptions, curOptions)) {
|
|
buildLog_ += curOptions.optionsLog();
|
|
LogError("Parsing compile options failed.");
|
|
return ACL_TYPE_DEFAULT;
|
|
}
|
|
switch (from) {
|
|
// compile from HSAIL text, no matter prev. stages and options
|
|
case ACL_TYPE_HSAIL_TEXT:
|
|
needOptionsCheck = false;
|
|
break;
|
|
case ACL_TYPE_HSAIL_BINARY:
|
|
case ACL_TYPE_CG:
|
|
// do not check options, if LLVMIR is absent or might be absent or options are absent
|
|
if (curOptions.oVariables->BinLLVMIR || !containsLlvmirText || !containsOpts) {
|
|
needOptionsCheck = false;
|
|
}
|
|
break;
|
|
case ACL_TYPE_ISA:
|
|
// do not check options, if LLVMIR is absent or might be absent or options are absent
|
|
if (curOptions.oVariables->BinLLVMIR || !containsLlvmirText || !containsOpts) {
|
|
needOptionsCheck = false;
|
|
}
|
|
if (containsBrig && containsHsailText && curOptions.oVariables->BinHSAIL) {
|
|
needOptionsCheck = false;
|
|
// recompile from prev. stage, if BRIG || HSAIL are absent
|
|
} else {
|
|
from = completeStages.back();
|
|
completeStages.pop_back();
|
|
needOptionsCheck = true;
|
|
}
|
|
break;
|
|
// recompilation might be needed
|
|
case ACL_TYPE_LLVMIR_BINARY:
|
|
case ACL_TYPE_DEFAULT:
|
|
default:
|
|
break;
|
|
}
|
|
return from;
|
|
}
|
|
|
|
aclType HSAILProgram::getNextCompilationStageFromBinary(amd::option::Options* options) {
|
|
aclType continueCompileFrom = ACL_TYPE_DEFAULT;
|
|
binary_t binary = this->binary();
|
|
// If the binary already exists
|
|
if ((binary.first != NULL) && (binary.second > 0)) {
|
|
void *mem = const_cast<void *>(binary.first);
|
|
acl_error errorCode;
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
// TODO: FIXME_Wilkin
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
binaryElf_ = g_complibApi._aclReadFromMem(mem, binary.second, &errorCode);
|
|
if (errorCode != ACL_SUCCESS) {
|
|
buildLog_ += "Error while BRIG Codegen phase: aclReadFromMem failure \n" ;
|
|
return continueCompileFrom;
|
|
}
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
// Calculate the next stage to compile from, based on sections in binaryElf_;
|
|
// No any validity checks here
|
|
std::vector<aclType> completeStages;
|
|
bool needOptionsCheck = true;
|
|
continueCompileFrom = getCompilationStagesFromBinary(completeStages, needOptionsCheck);
|
|
// Saving binary in the interface class,
|
|
// which also load compile & link options from binary
|
|
setBinary(static_cast<char*>(mem), binary.second);
|
|
if (!options || !needOptionsCheck) {
|
|
return continueCompileFrom;
|
|
}
|
|
bool recompile = false;
|
|
//! @todo Should we also check for ACL_TYPE_OPENCL & ACL_TYPE_LLVMIR_TEXT?
|
|
switch (continueCompileFrom) {
|
|
case ACL_TYPE_HSAIL_BINARY:
|
|
case ACL_TYPE_CG:
|
|
case ACL_TYPE_ISA: {
|
|
// Compare options loaded from binary with current ones, recompile if differ;
|
|
// If compile options are absent in binary, do not compare and recompile
|
|
if (compileOptions_.empty())
|
|
break;
|
|
const oclBIFSymbolStruct* symbol = findBIF30SymStruct(symOpenclCompilerOptions);
|
|
assert(symbol && "symbol not found");
|
|
std::string symName = std::string(symbol->str[bif::PRE]) + std::string(symbol->str[bif::POST]);
|
|
size_t symSize = 0;
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
assert(!"FIXME_Wilkin");
|
|
const void *opts = NULL;
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
const void *opts = g_complibApi._aclExtractSymbol(device().compiler(),
|
|
binaryElf_, &symSize, aclCOMMENT, symName.c_str(), &errorCode);
|
|
if (errorCode != ACL_SUCCESS) {
|
|
recompile = true;
|
|
break;
|
|
}
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
std::string sBinOptions = std::string((char*)opts, symSize);
|
|
std::string sCurOptions = compileOptions_ + linkOptions_;
|
|
amd::option::Options curOptions, binOptions;
|
|
if (!amd::option::parseAllOptions(sBinOptions, binOptions)) {
|
|
buildLog_ += binOptions.optionsLog();
|
|
LogError("Parsing compile options from binary failed.");
|
|
return ACL_TYPE_DEFAULT;
|
|
}
|
|
if (!amd::option::parseAllOptions(sCurOptions, curOptions)) {
|
|
buildLog_ += curOptions.optionsLog();
|
|
LogError("Parsing compile options failed.");
|
|
return ACL_TYPE_DEFAULT;
|
|
}
|
|
if (!curOptions.equals(binOptions)) {
|
|
recompile = true;
|
|
}
|
|
break;
|
|
}
|
|
default:
|
|
break;
|
|
}
|
|
if (recompile) {
|
|
while (!completeStages.empty()) {
|
|
continueCompileFrom = completeStages.back();
|
|
if (continueCompileFrom == ACL_TYPE_LLVMIR_BINARY ||
|
|
continueCompileFrom == ACL_TYPE_DEFAULT) {
|
|
break;
|
|
}
|
|
completeStages.pop_back();
|
|
}
|
|
}
|
|
}
|
|
return continueCompileFrom;
|
|
}
|
|
|
|
bool HSAILProgram::saveBinaryAndSetType(type_t type) {
|
|
//Write binary to memory
|
|
void *rawBinary = NULL;
|
|
size_t size = 0;
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
rawBinary = codeObjBinary_->Binary();
|
|
size = codeObjBinary_->BinarySize();
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
if (g_complibApi._aclWriteToMem(binaryElf_, &rawBinary, &size)
|
|
!= ACL_SUCCESS) {
|
|
buildLog_ += "Failed to write binary to memory \n";
|
|
return false;
|
|
}
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
clBinary()->saveBIFBinary((char*)rawBinary, size);
|
|
//Set the type of binary
|
|
setType(type);
|
|
#if !defined(WITH_LIGHTNING_COMPILER)
|
|
//Free memory containing rawBinary
|
|
binaryElf_->binOpts.dealloc(rawBinary);
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
return true;
|
|
}
|
|
|
|
bool HSAILProgram::linkImpl(const std::vector<Program *> &inputPrograms,
|
|
amd::option::Options *options,
|
|
bool createLibrary) {
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
assert(!"FIXME_Wilkin");
|
|
return false;
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
std::vector<device::Program *>::const_iterator it
|
|
= inputPrograms.begin();
|
|
std::vector<device::Program *>::const_iterator itEnd
|
|
= inputPrograms.end();
|
|
acl_error errorCode;
|
|
|
|
// For each program we need to extract the LLVMIR and create
|
|
// aclBinary for each
|
|
std::vector<aclBinary *> binaries_to_link;
|
|
|
|
for (size_t i = 0; it != itEnd; ++it, ++i) {
|
|
HSAILProgram *program = (HSAILProgram *)*it;
|
|
// Check if the program was created with clCreateProgramWIthBinary
|
|
binary_t binary = program->binary();
|
|
if ((binary.first != NULL) && (binary.second > 0)) {
|
|
// Binary already exists -- we can also check if there is no
|
|
// opencl source code
|
|
// Need to check if LLVMIR exists in the binary
|
|
// If LLVMIR does not exist then is it valid
|
|
// We need to pull out all the compiled kernels
|
|
// We cannot do this at present because we need at least
|
|
// Hsail text to pull the kernels oout
|
|
void *mem = const_cast<void *>(binary.first);
|
|
binaryElf_ = g_complibApi._aclReadFromMem(mem,
|
|
binary.second,
|
|
&errorCode);
|
|
|
|
if (errorCode != ACL_SUCCESS) {
|
|
LogWarning("Error while linking : Could not read from raw binary");
|
|
return false;
|
|
}
|
|
}
|
|
// At this stage each HSAILProgram contains a valid binary_elf
|
|
// Check if LLVMIR is in the binary
|
|
size_t boolSize = sizeof(bool);
|
|
bool containsLLLVMIR = false;
|
|
errorCode = g_complibApi._aclQueryInfo(device().compiler(), binaryElf_,
|
|
RT_CONTAINS_LLVMIR, NULL, &containsLLLVMIR, &boolSize);
|
|
if (errorCode != ACL_SUCCESS || !containsLLLVMIR) {
|
|
buildLog_ +="Error while linking : Invalid binary (Missing LLVMIR section)";
|
|
return false;
|
|
}
|
|
// Create a new aclBinary for each LLVMIR and save it in a list
|
|
aclBIFVersion ver = g_complibApi._aclBinaryVersion(binaryElf_);
|
|
aclBinary *bin = g_complibApi._aclCreateFromBinary(binaryElf_, ver);
|
|
binaries_to_link.push_back(bin);
|
|
}
|
|
|
|
// At this stage each HSAILProgram in the list has an aclBinary initialized
|
|
// and contains LLVMIR
|
|
// We can now go ahead and link them.
|
|
if (binaries_to_link.size() > 1) {
|
|
errorCode = g_complibApi._aclLink(device().compiler(),
|
|
binaries_to_link[0],
|
|
binaries_to_link.size() - 1,
|
|
&binaries_to_link[1],
|
|
ACL_TYPE_LLVMIR_BINARY,
|
|
"-create-library",
|
|
NULL);
|
|
}
|
|
else {
|
|
errorCode = g_complibApi._aclLink(device().compiler(),
|
|
binaries_to_link[0],
|
|
0,
|
|
NULL,
|
|
ACL_TYPE_LLVMIR_BINARY,
|
|
"-create-library",
|
|
NULL);
|
|
}
|
|
if (errorCode != ACL_SUCCESS) {
|
|
buildLog_ += "Failed to link programs";
|
|
return false;
|
|
}
|
|
// Store the newly linked aclBinary for this program.
|
|
binaryElf_ = binaries_to_link[0];
|
|
// Free all the other aclBinaries
|
|
for (size_t i = 1; i < binaries_to_link.size(); i++) {
|
|
g_complibApi._aclBinaryFini(binaries_to_link[i]);
|
|
}
|
|
if (createLibrary) {
|
|
saveBinaryAndSetType(TYPE_LIBRARY);
|
|
return true;
|
|
}
|
|
|
|
// Now call linkImpl with the new options
|
|
return linkImpl(options);
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
}
|
|
|
|
bool HSAILProgram::initBrigModule() {
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
brigModule_ = NULL;
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
const char *symbol_name = "__BRIG__";
|
|
BrigModuleHeader* brig;
|
|
acl_error error_code;
|
|
size_t size;
|
|
const void* symbol_data = g_complibApi._aclExtractSymbol(
|
|
device().compiler(),
|
|
binaryElf_,
|
|
&size,
|
|
aclBRIG,
|
|
symbol_name,
|
|
&error_code);
|
|
if (error_code != ACL_SUCCESS) {
|
|
std::string error = "Could not find Brig in BIF: ";
|
|
error += symbol_name;
|
|
LogError(error.c_str());
|
|
buildLog_ += error;
|
|
return false;
|
|
}
|
|
brig = (BrigModuleHeader*)malloc(size);
|
|
memcpy(brig, symbol_data, size);
|
|
brigModule_ = brig;
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
return true;
|
|
}
|
|
void HSAILProgram::destroyBrigModule() {
|
|
if (brigModule_ != NULL) {
|
|
free(brigModule_);
|
|
}
|
|
}
|
|
bool HSAILProgram::initBrigContainer() {
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
hsaBrigContainer_ = NULL;
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
assert(brigModule_ != NULL);
|
|
|
|
//Create a BRIG container
|
|
hsaBrigContainer_ = new BrigContainer(brigModule_);
|
|
if (!hsaBrigContainer_) {
|
|
return false;
|
|
}
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
return true;
|
|
}
|
|
|
|
void HSAILProgram::destroyBrigContainer() {
|
|
delete (hsaBrigContainer_);
|
|
}
|
|
|
|
|
|
void HSAILProgram::hsaError(const char *msg, hsa_status_t status) {
|
|
std::string fmsg;
|
|
fmsg += msg;
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
const char *hmsg = 0;
|
|
hsa_status_string(status, &hmsg);
|
|
if (hmsg) {
|
|
fmsg += ": ";
|
|
fmsg += hmsg;
|
|
}
|
|
}
|
|
LogError(fmsg.c_str());
|
|
buildLog_ += fmsg;
|
|
}
|
|
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
bool HSAILProgram::linkImpl_LC(amd::option::Options *options) {
|
|
// call LinkLLVMBitcode
|
|
std::vector<amd::opencl_driver::Data*> inputs;
|
|
|
|
amd::opencl_driver::Data* opencl_bc = device().compiler()->NewBufferReference(
|
|
amd::opencl_driver::DT_LLVM_BC,
|
|
(const char*) builtins_opencl_amdgcn,
|
|
builtins_opencl_amdgcn_size);
|
|
if (opencl_bc == NULL) {
|
|
buildLog_ += "Error while open opencl library bitcode ";
|
|
return false;
|
|
}
|
|
|
|
amd::opencl_driver::Data* ocml_bc = device().compiler()->NewBufferReference(
|
|
amd::opencl_driver::DT_LLVM_BC,
|
|
(const char*) builtins_ocml_amdgcn,
|
|
builtins_ocml_amdgcn_size);
|
|
if (ocml_bc == NULL) {
|
|
buildLog_ += "Error while open ocml library bitcode ";
|
|
return false;
|
|
}
|
|
amd::opencl_driver::Data* ockl_bc = device().compiler()->NewBufferReference(
|
|
amd::opencl_driver::DT_LLVM_BC,
|
|
(const char*) builtins_ockl_amdgcn,
|
|
builtins_ockl_amdgcn_size);
|
|
if (ockl_bc == NULL) {
|
|
buildLog_ += "Error while open ockl library bitcode ";
|
|
return false;
|
|
}
|
|
|
|
amd::opencl_driver::Data* irif_bc = device().compiler()->NewBufferReference(
|
|
amd::opencl_driver::DT_LLVM_BC,
|
|
(const char*) builtins_irif_amdgcn,
|
|
builtins_irif_amdgcn_size);
|
|
if (irif_bc == NULL) {
|
|
buildLog_ += "Error while open irif (llvm) library bitcode ";
|
|
return false;
|
|
}
|
|
|
|
const std::string llvmIR = codeObjBinary_->getLlvmIR();
|
|
amd::opencl_driver::Data* llvm_src = device().compiler()->NewBufferReference(
|
|
amd::opencl_driver::DT_LLVM_BC,
|
|
llvmIR.c_str(),
|
|
llvmIR.length());
|
|
if (llvm_src == NULL) {
|
|
buildLog_ += "Error while creating data from LLVM bitcode";
|
|
return false;
|
|
}
|
|
|
|
inputs.push_back(llvm_src);
|
|
inputs.push_back(opencl_bc);
|
|
inputs.push_back(ocml_bc);
|
|
inputs.push_back(ockl_bc);
|
|
inputs.push_back(irif_bc);
|
|
|
|
std::vector<std::string> linkOptions;
|
|
amd::opencl_driver::Data* linked_bc = device().compiler()->NewBuffer(
|
|
amd::opencl_driver::DT_LLVM_BC);
|
|
if (!device().compiler()->LinkLLVMBitcode(inputs, linked_bc, linkOptions)) {
|
|
buildLog_ += "Error while linking source & LLVM library: linking source & IR library";
|
|
#if 0
|
|
std::cerr << "\n**** Compiler Output After LinkLLVMBitcode ****\n";
|
|
std::cerr << device().compiler()->Output().c_str();
|
|
std::cerr << "***********************************************\n\n";
|
|
#endif
|
|
return false;
|
|
}
|
|
|
|
|
|
// convert option string into vector here as clang treats option
|
|
// with leading space as file name
|
|
std::vector<std::string> complibOptions;
|
|
if (!options->origOptionStr.empty())
|
|
{
|
|
std::istringstream buf(options->origOptionStr);
|
|
std::istream_iterator<std::string> beg(buf), end;
|
|
std::vector<std::string> origOptions(beg, end);
|
|
|
|
complibOptions.insert( complibOptions.end(),
|
|
origOptions.begin(),
|
|
origOptions.end());
|
|
}
|
|
|
|
appendHsailOptions(complibOptions);
|
|
complibOptions.push_back("-mcpu=fiji");
|
|
|
|
inputs.clear();
|
|
inputs.push_back(linked_bc);
|
|
|
|
amd::opencl_driver::Buffer* out_exec = device().compiler()->NewBuffer(
|
|
amd::opencl_driver::DT_EXECUTABLE);
|
|
if (out_exec == NULL) {
|
|
buildLog_ += "Error while creating output file for the executable";
|
|
return false;
|
|
}
|
|
|
|
if (!device().compiler()->CompileAndLinkExecutable(inputs,
|
|
(amd::opencl_driver::Data*) out_exec,
|
|
complibOptions))
|
|
{
|
|
buildLog_ += "Error while creating executable: Compiling LLVM IRs to exe";
|
|
#if 0
|
|
std::cerr << "\n**** Compiler Output After CompileAndLinkExecutable ****\n";
|
|
std::cerr << device().compiler()->Output().c_str();
|
|
std::cerr << "********************************************************\n\n";
|
|
#endif
|
|
return false;
|
|
}
|
|
|
|
|
|
// allocate memory and store the ELF code object
|
|
lcBinaryElfSize_ = out_exec->Size();
|
|
// lcBinaryElf_ = (void *)malloc(lcBinaryElfSize_);
|
|
// memcpy(lcBinaryElf_, (void *) out_exec->Buf().data(), lcBinaryElfSize_);
|
|
|
|
hsa_status_t status;
|
|
status = hsa_code_object_deserialize( out_exec->Buf().data(),
|
|
out_exec->Size(),
|
|
NULL, &lcProgramCodeObject_ );
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to deserialize code object from a buffer.");
|
|
return false;
|
|
}
|
|
|
|
status = hsa_executable_create( HSA_PROFILE_FULL,
|
|
HSA_EXECUTABLE_STATE_UNFROZEN,
|
|
NULL, &lcExecutable_ );
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to create executable", status);
|
|
return false;
|
|
}
|
|
|
|
// Load the code object.
|
|
hsa_agent_t hsaDevice = dev().getBackendDevice();
|
|
status = hsa_executable_load_code_object( lcExecutable_, hsaDevice,
|
|
lcProgramCodeObject_, NULL );
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to load code object", status);
|
|
return false;
|
|
}
|
|
|
|
// Freeze the executable.
|
|
status = hsa_executable_freeze( lcExecutable_, NULL );
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to freeze executable");
|
|
return false;
|
|
}
|
|
|
|
//TODO: WC - use the proper target code based on the agent
|
|
std::string target = "AMD:AMDGPU:8:0:3";
|
|
codeObjBinary_->init( target, out_exec->Buf().data(), out_exec->Size());
|
|
saveBinaryAndSetType(TYPE_EXECUTABLE);
|
|
|
|
buildLog_ += device().compiler()->Output();
|
|
|
|
// Get the list of kernels
|
|
std::vector<std::string> kernelNameList;
|
|
status = hsa_executable_iterate_symbols( lcExecutable_, GetKernelNamesCallback,
|
|
(void *) &kernelNameList );
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to get kernel names");
|
|
return false;
|
|
}
|
|
|
|
for ( auto &kernelName : kernelNameList )
|
|
{
|
|
hsa_executable_symbol_t kernelSymbol;
|
|
hsa_executable_get_symbol ( lcExecutable_, "", kernelName.c_str(),
|
|
hsaDevice, 0, &kernelSymbol );
|
|
|
|
uint64_t kernelCodeHandle;
|
|
status = hsa_executable_symbol_get_info(
|
|
kernelSymbol,
|
|
HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_OBJECT,
|
|
&kernelCodeHandle);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to get the kernel code", status);
|
|
return false;
|
|
}
|
|
|
|
uint32_t workgroupGroupSegmentByteSize;
|
|
status = hsa_executable_symbol_get_info(
|
|
kernelSymbol,
|
|
HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_GROUP_SEGMENT_SIZE,
|
|
&workgroupGroupSegmentByteSize);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to get group segment size info", status);
|
|
return false;
|
|
}
|
|
|
|
uint32_t workitemPrivateSegmentByteSize;
|
|
status = hsa_executable_symbol_get_info(
|
|
kernelSymbol,
|
|
HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_PRIVATE_SEGMENT_SIZE,
|
|
&workitemPrivateSegmentByteSize);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to get private segment size info", status);
|
|
return false;
|
|
}
|
|
|
|
uint32_t kernargSegmentByteSize;
|
|
status = hsa_executable_symbol_get_info(
|
|
kernelSymbol,
|
|
HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_KERNARG_SEGMENT_SIZE,
|
|
&kernargSegmentByteSize);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to get kernarg segment size info", status);
|
|
return false;
|
|
}
|
|
|
|
uint32_t kernargSegmentAlignment;
|
|
status = hsa_executable_symbol_get_info(
|
|
kernelSymbol,
|
|
HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_KERNARG_SEGMENT_ALIGNMENT,
|
|
&kernargSegmentAlignment);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to get kernarg segment alignment info", status);
|
|
return false;
|
|
}
|
|
|
|
// for OpenCL default hidden kernel arguments assuming there is no printf
|
|
size_t numHiddenKernelArgs = 0; // FIXME_lmoriche:3;
|
|
|
|
// Fix the kernel name issue that causes string comparison does not work
|
|
// due to an extra character at the end
|
|
// TODO: find out the root cause
|
|
kernelName.resize(kernelName.length()-1);
|
|
|
|
Kernel *aKernel = new roc::Kernel(
|
|
kernelName,
|
|
this,
|
|
kernelCodeHandle,
|
|
workgroupGroupSegmentByteSize,
|
|
workitemPrivateSegmentByteSize,
|
|
// TODO: remove the workaround
|
|
// add 24 bytes for global offsets as workaround for LC reporting
|
|
// excluded the hidden arguments
|
|
kernargSegmentByteSize /* FIXME_lmoriche:+24*/,
|
|
kernargSegmentAlignment,
|
|
numHiddenKernelArgs
|
|
);
|
|
if (!aKernel->init()) {
|
|
return false;
|
|
}
|
|
aKernel->setUniformWorkGroupSize(options->oVariables->UniformWorkGroupSize);
|
|
kernels()[kernelName] = aKernel;
|
|
}
|
|
|
|
#if 0
|
|
// Cleaning up
|
|
status = hsa_code_object_destroy( lcProgramCodeObject_ );
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to destory the code object", status);
|
|
return false;
|
|
}
|
|
|
|
status = hsa_executable_destroy( lcExecutable_ );
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to destory the executable", status);
|
|
return false;
|
|
}
|
|
#endif
|
|
return true;
|
|
}
|
|
#endif // defined(WITH_LIGHTNING_COMPILER)
|
|
|
|
bool HSAILProgram::linkImpl(amd::option::Options *options) {
|
|
acl_error errorCode;
|
|
aclType continueCompileFrom = ACL_TYPE_LLVMIR_BINARY;
|
|
bool finalize = true;
|
|
// If !binaryElf_ then program must have been created using clCreateProgramWithBinary
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
if (!codeObjBinary_)
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
if (!binaryElf_)
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
{
|
|
continueCompileFrom = getNextCompilationStageFromBinary(options);
|
|
}
|
|
switch (continueCompileFrom) {
|
|
// Compilation from ACL_TYPE_LLVMIR_BINARY to ACL_TYPE_CG in cases:
|
|
// 1. if the program is not created with binary;
|
|
// 2. if the program is created with binary and contains only .llvmir & .comment
|
|
// 3. if the program is created with binary, contains .llvmir, .comment, brig sections,
|
|
// but the binary's compile & link options differ from current ones (recompilation);
|
|
case ACL_TYPE_LLVMIR_BINARY:
|
|
// Compilation from ACL_TYPE_HSAIL_BINARY to ACL_TYPE_CG in cases:
|
|
// 1. if the program is created with binary and contains only brig sections
|
|
case ACL_TYPE_HSAIL_BINARY:
|
|
// Compilation from ACL_TYPE_HSAIL_TEXT to ACL_TYPE_CG in cases:
|
|
// 1. if the program is created with binary and contains only hsail text
|
|
case ACL_TYPE_HSAIL_TEXT: {
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
if (!linkImpl_LC(options)) {
|
|
return false;
|
|
}
|
|
#else // !defined(WITH_LIGHTNING_COMPILER)
|
|
std::string curOptions = options->origOptionStr + hsailOptions();
|
|
errorCode = g_complibApi._aclCompile(device().compiler(), binaryElf_,
|
|
curOptions.c_str(), continueCompileFrom, ACL_TYPE_CG, logFunction);
|
|
buildLog_ += g_complibApi._aclGetCompilerLog(device().compiler());
|
|
if (errorCode != ACL_SUCCESS) {
|
|
buildLog_ += "Error while BRIG Codegen phase: compilation error \n" ;
|
|
return false;
|
|
}
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
break;
|
|
}
|
|
case ACL_TYPE_CG:
|
|
break;
|
|
case ACL_TYPE_ISA:
|
|
finalize = false;
|
|
break;
|
|
default:
|
|
buildLog_ += "Error while BRIG Codegen phase: the binary is incomplete \n" ;
|
|
return false;
|
|
}
|
|
//Stop compilation if it is an offline device - HSA runtime does not
|
|
//support ISA compiled offline
|
|
if (!dev().isOnline()) {
|
|
return true;
|
|
}
|
|
|
|
#if !defined(WITH_LIGHTNING_COMPILER)
|
|
hsa_agent_t hsaDevice = dev().getBackendDevice();
|
|
if (!initBrigModule()) {
|
|
hsaError("Failed to create Brig Module");
|
|
return false;
|
|
}
|
|
|
|
// Create a BrigContainer.
|
|
if (!initBrigContainer()) {
|
|
hsaError("Failed to create Brig Container");
|
|
return false;
|
|
}
|
|
// Create a program.
|
|
hsa_status_t status = hsa_ext_program_create(
|
|
HSA_MACHINE_MODEL_LARGE,
|
|
HSA_PROFILE_FULL,
|
|
HSA_DEFAULT_FLOAT_ROUNDING_MODE_ZERO,
|
|
NULL,
|
|
&hsaProgramHandle_
|
|
);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to create hsail program", status);
|
|
return false;
|
|
}
|
|
|
|
// Add module to a program.
|
|
hsa_ext_module_t programModule =
|
|
reinterpret_cast<hsa_ext_module_t>(brigModule_);
|
|
status = hsa_ext_program_add_module(
|
|
hsaProgramHandle_, programModule
|
|
);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to add a module to the program", status);
|
|
return false;
|
|
}
|
|
|
|
// Obtain agent's Isa.
|
|
hsa_isa_t hsaDeviceIsa;
|
|
status = hsa_agent_get_info(
|
|
hsaDevice, HSA_AGENT_INFO_ISA, &hsaDeviceIsa
|
|
);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to create hsail program", status);
|
|
return false;
|
|
}
|
|
|
|
// Finalize a program.
|
|
hsa_ext_control_directives_t hsaControlDirectives;
|
|
memset(&hsaControlDirectives, 0, sizeof(hsa_ext_control_directives_t));
|
|
status = hsa_ext_program_finalize(
|
|
hsaProgramHandle_,
|
|
hsaDeviceIsa,
|
|
0,
|
|
hsaControlDirectives,
|
|
NULL,
|
|
HSA_CODE_OBJECT_TYPE_PROGRAM,
|
|
&hsaProgramCodeObject_
|
|
);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to finalize hsail program", status);
|
|
return false;
|
|
}
|
|
|
|
// HLC always generates full profile
|
|
hsa_profile_t profile = HSA_PROFILE_FULL;
|
|
|
|
// Create an executable.
|
|
status = hsa_executable_create(
|
|
profile,
|
|
HSA_EXECUTABLE_STATE_UNFROZEN,
|
|
"",
|
|
&hsaExecutable_
|
|
);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to create executable", status);
|
|
return false;
|
|
}
|
|
|
|
// Load the code object.
|
|
status = hsa_executable_load_code_object(
|
|
hsaExecutable_, hsaDevice, hsaProgramCodeObject_, NULL
|
|
);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to load code object", status);
|
|
return false;
|
|
}
|
|
|
|
// Freeze the executable.
|
|
status = hsa_executable_freeze(hsaExecutable_, NULL);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to freeze executable", status);
|
|
return false;
|
|
}
|
|
|
|
Code first_d = hsaBrigContainer_->code().begin();
|
|
Code last_d = hsaBrigContainer_->code().end();
|
|
//Iterate through the symbols using brig assembler
|
|
for (;first_d != last_d;first_d = first_d.next()) {
|
|
if (DirectiveExecutable de = first_d) {
|
|
// Disable function compilation unconditionally.
|
|
// TODO: May remove this after the finalizer supports function compilation.
|
|
if (DirectiveFunction df = first_d) {
|
|
continue;
|
|
}
|
|
|
|
std::string kernelName = (SRef)de.name();
|
|
if (de.linkage() != BRIG_LINKAGE_PROGRAM) {
|
|
kernelName.insert(0, "am::");
|
|
}
|
|
// Query symbol handle for this symbol.
|
|
hsa_executable_symbol_t kernelSymbol;
|
|
status = hsa_executable_get_symbol(
|
|
hsaExecutable_, NULL, kernelName.c_str(), hsaDevice, 0, &kernelSymbol
|
|
);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to get executable symbol", status);
|
|
return false;
|
|
}
|
|
|
|
// Query code handle for this symbol.
|
|
uint64_t kernelCodeHandle;
|
|
status = hsa_executable_symbol_get_info(
|
|
kernelSymbol, HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_OBJECT, &kernelCodeHandle
|
|
);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to get executable symbol info", status);
|
|
return false;
|
|
}
|
|
|
|
std::string openclKernelName = kernelName;
|
|
// Strip the opencl and kernel name
|
|
kernelName = kernelName.substr(strlen("&__OpenCL_"), kernelName.size());
|
|
kernelName = kernelName.substr(0,kernelName.size() - strlen("_kernel"));
|
|
aclMetadata md;
|
|
md.numHiddenKernelArgs = 0;
|
|
|
|
size_t sizeOfnumHiddenKernelArgs = sizeof(md.numHiddenKernelArgs);
|
|
errorCode = g_complibApi._aclQueryInfo(device().compiler(), binaryElf_, RT_NUM_KERNEL_HIDDEN_ARGS,
|
|
openclKernelName.c_str(), &md.numHiddenKernelArgs, &sizeOfnumHiddenKernelArgs);
|
|
if (errorCode != ACL_SUCCESS) {
|
|
buildLog_ += "Error while Finalization phase: Kernel extra arguments count querying from the ELF failed\n";
|
|
return false;
|
|
}
|
|
|
|
uint32_t workgroupGroupSegmentByteSize;
|
|
status = hsa_executable_symbol_get_info(
|
|
kernelSymbol,
|
|
HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_GROUP_SEGMENT_SIZE,
|
|
&workgroupGroupSegmentByteSize);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to get group segment size info", status);
|
|
return false;
|
|
}
|
|
|
|
uint32_t workitemPrivateSegmentByteSize;
|
|
status = hsa_executable_symbol_get_info(
|
|
kernelSymbol,
|
|
HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_PRIVATE_SEGMENT_SIZE,
|
|
&workitemPrivateSegmentByteSize);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to get private segment size info", status);
|
|
return false;
|
|
}
|
|
|
|
uint32_t kernargSegmentByteSize;
|
|
status = hsa_executable_symbol_get_info(
|
|
kernelSymbol,
|
|
HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_KERNARG_SEGMENT_SIZE,
|
|
&kernargSegmentByteSize);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to get kernarg segment size info", status);
|
|
return false;
|
|
}
|
|
|
|
uint32_t kernargSegmentAlignment;
|
|
status = hsa_executable_symbol_get_info(
|
|
kernelSymbol,
|
|
HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_KERNARG_SEGMENT_ALIGNMENT,
|
|
&kernargSegmentAlignment);
|
|
if (status != HSA_STATUS_SUCCESS) {
|
|
hsaError("Failed to get kernarg segment alignment info", status);
|
|
return false;
|
|
}
|
|
|
|
Kernel *aKernel = new roc::Kernel(
|
|
kernelName,
|
|
this,
|
|
kernelCodeHandle,
|
|
workgroupGroupSegmentByteSize,
|
|
workitemPrivateSegmentByteSize,
|
|
kernargSegmentByteSize,
|
|
kernargSegmentAlignment,
|
|
md.numHiddenKernelArgs
|
|
);
|
|
if (!aKernel->init()) {
|
|
return false;
|
|
}
|
|
aKernel->setUniformWorkGroupSize(options->oVariables->UniformWorkGroupSize);
|
|
kernels()[kernelName] = aKernel;
|
|
}
|
|
}
|
|
saveBinaryAndSetType(TYPE_EXECUTABLE);
|
|
buildLog_ += g_complibApi._aclGetCompilerLog(device().compiler());
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
return true;
|
|
}
|
|
|
|
bool HSAILProgram::createBinary(amd::option::Options *options) {
|
|
return false;
|
|
}
|
|
|
|
bool HSAILProgram::initClBinary() {
|
|
if (clBinary_ == NULL) {
|
|
clBinary_ = new ClBinary(static_cast<const Device &>(device()));
|
|
if (clBinary_ == NULL) {
|
|
return false;
|
|
}
|
|
}
|
|
return true;
|
|
}
|
|
|
|
void HSAILProgram::releaseClBinary() {
|
|
if (clBinary_ != NULL) {
|
|
delete clBinary_;
|
|
clBinary_ = NULL;
|
|
}
|
|
}
|
|
|
|
std::string HSAILProgram::hsailOptions() {
|
|
std::string hsailOptions;
|
|
//Set options for the standard device specific options
|
|
//This is just for legacy compiler code
|
|
// All our devices support these options now
|
|
hsailOptions.append(" -DFP_FAST_FMAF=1");
|
|
hsailOptions.append(" -DFP_FAST_FMA=1");
|
|
//TODO: this is a quick fix to restore original f32 denorm flushing
|
|
//Make this target/option dependent
|
|
#if !defined(WITH_LIGHTNING_COMPILER) // TODO: WC
|
|
hsailOptions.append(" -cl-denorms-are-zero");
|
|
#endif // !defined(WITH_LIGHTNING_COMPILER)
|
|
//TODO(sramalin) : Query the device for opencl version
|
|
// and only set if -cl-std wasn't specified in
|
|
// original build options (app)
|
|
//hsailOptions.append(" -cl-std=CL1.2");
|
|
//check if the host is 64 bit or 32 bit
|
|
LP64_ONLY(hsailOptions.append(" -m64"));
|
|
//Now append each extension supported by the device
|
|
// one by one
|
|
std::string token;
|
|
std::istringstream iss("");
|
|
iss.str(device().info().extensions_);
|
|
while (getline(iss, token, ' ')) {
|
|
if (!token.empty()) {
|
|
hsailOptions.append(" -D");
|
|
hsailOptions.append(token);
|
|
hsailOptions.append("=1");
|
|
}
|
|
}
|
|
return hsailOptions;
|
|
}
|
|
|
|
#if defined(WITH_LIGHTNING_COMPILER)
|
|
void HSAILProgram::appendHsailOptions(std::vector<std::string>& options)
|
|
{
|
|
//TODO: this is a quick fix to restore original f32 denorm flushing
|
|
//Make this target/option dependent
|
|
options.push_back("-Xclang");
|
|
options.push_back("-cl-denorms-are-zero");
|
|
#if 0
|
|
// option to debug metadata section
|
|
|
|
options.push_back("-Xclang");
|
|
options.push_back("-backend-option");
|
|
|
|
options.push_back("-Xclang");
|
|
options.push_back("-print-after-all");
|
|
#endif
|
|
//options.push_back("-mcpu=fiji");
|
|
//options.push_back("-include"); options.push_back("opencl-c.h");
|
|
|
|
//Set options for the standard device specific options
|
|
//This is just for legacy compiler code
|
|
// All our devices support these options now
|
|
options.push_back("-DFP_FAST_FMAF=1");
|
|
options.push_back("-DFP_FAST_FMA=1");
|
|
|
|
//TODO(sramalin) : Query the device for opencl version
|
|
// and only set if -cl-std wasn't specified in
|
|
// original build options (app)
|
|
//options.push_back(" -cl-std=CL1.2");
|
|
|
|
//check if the host is 64 bit or 32 bit
|
|
LP64_ONLY(options.push_back("-m64"));
|
|
|
|
//Now append each extension supported by the device
|
|
// one by one
|
|
std::string token;
|
|
std::istringstream iss("");
|
|
iss.str(device().info().extensions_);
|
|
while (getline(iss, token, ' ')) {
|
|
if (!token.empty()) {
|
|
options.push_back("-D"+token+"=1");
|
|
}
|
|
}
|
|
return;
|
|
}
|
|
|
|
void CodeObjBinary::init(std::string& target, void* binary, size_t binarySize)
|
|
{
|
|
target_ = target;
|
|
binary_ = binary;
|
|
binarySize_ = binarySize;
|
|
|
|
oclElf_ = new amd::OclElf(ELFCLASS64, (char *)binary_, binarySize_, NULL, ELF_C_READ);
|
|
|
|
// load the runtime metadata
|
|
runtimeMD_ = new roc::RuntimeMD::Program::Metadata();
|
|
}
|
|
|
|
void CodeObjBinary::fini()
|
|
{
|
|
if (oclElf_) {
|
|
delete oclElf_;
|
|
}
|
|
|
|
if (runtimeMD_) {
|
|
delete runtimeMD_;
|
|
}
|
|
|
|
target_ = "";
|
|
binary_ = NULL;
|
|
binarySize_ = 0;
|
|
}
|
|
|
|
const RuntimeMD::Program::Metadata* CodeObjBinary::GetProgramMetadata() const
|
|
{
|
|
char* metaData;
|
|
size_t metaSize;
|
|
if (!oclElf_->getSection(amd::OclElf::RUNTIME_METADATA, &metaData, &metaSize)) {
|
|
LogWarning( "Error while access runtime metadata section from the binary \n" );
|
|
}
|
|
|
|
if (!runtimeMD_->ReadFrom((void *) metaData, metaSize)) {
|
|
LogWarning( "Error while parsing runtime metadata \n" );
|
|
}
|
|
|
|
return runtimeMD_;
|
|
}
|
|
#endif // defined(WITH_LIGHTNING_COMPILER)
|
|
#endif // WITHOUT_HSA_BACKEND
|
|
} // namespace roc
|
|
|