diff options
Diffstat (limited to 'lld/ELF/Arch/AMDGPU.cpp')
-rw-r--r-- | lld/ELF/Arch/AMDGPU.cpp | 75 |
1 files changed, 73 insertions, 2 deletions
diff --git a/lld/ELF/Arch/AMDGPU.cpp b/lld/ELF/Arch/AMDGPU.cpp
index 4f4ce0094bbf..466ad81922d0 100644
--- a/lld/ELF/Arch/AMDGPU.cpp
+++ b/lld/ELF/Arch/AMDGPU.cpp
@@ -22,6 +22,10 @@ using namespace lld::elf;
 
 namespace {
 class AMDGPU final : public TargetInfo {
+private:
+  uint32_t calcEFlagsV3() const;
+  uint32_t calcEFlagsV4() const;
+
 public:
   AMDGPU();
   uint32_t calcEFlags() const override;
@@ -44,8 +48,7 @@ static uint32_t getEFlags(InputFile *file) {
   return cast<ObjFile<ELF64LE>>(file)->getObj().getHeader().e_flags;
 }
 
-uint32_t AMDGPU::calcEFlags() const {
-  assert(!objectFiles.empty());
+uint32_t AMDGPU::calcEFlagsV3() const {
   uint32_t ret = getEFlags(objectFiles[0]);
 
   // Verify that all input files have the same e_flags.
@@ -58,6 +61,67 @@ uint32_t AMDGPU::calcEFlags() const {
   return ret;
 }
 
+uint32_t AMDGPU::calcEFlagsV4() const {
+  uint32_t retMach = getEFlags(objectFiles[0]) & EF_AMDGPU_MACH;
+  uint32_t retXnack = getEFlags(objectFiles[0]) & EF_AMDGPU_FEATURE_XNACK_V4;
+  uint32_t retSramEcc =
+      getEFlags(objectFiles[0]) & EF_AMDGPU_FEATURE_SRAMECC_V4;
+
+  // Verify that all input files have compatible e_flags (same mach, all
+  // features in the same category are either ANY, ANY and ON, or ANY and OFF).
+  for (InputFile *f : makeArrayRef(objectFiles).slice(1)) {
+    if (retMach != (getEFlags(f) & EF_AMDGPU_MACH)) {
+      error("incompatible mach: " + toString(f));
+      return 0;
+    }
+
+    if (retXnack == EF_AMDGPU_FEATURE_XNACK_UNSUPPORTED_V4 ||
+        (retXnack != EF_AMDGPU_FEATURE_XNACK_ANY_V4 &&
+         (getEFlags(f) & EF_AMDGPU_FEATURE_XNACK_V4)
+             != EF_AMDGPU_FEATURE_XNACK_ANY_V4)) {
+      if (retXnack != (getEFlags(f) & EF_AMDGPU_FEATURE_XNACK_V4)) {
+        error("incompatible xnack: " + toString(f));
+        return 0;
+      }
+    } else {
+      if (retXnack == EF_AMDGPU_FEATURE_XNACK_ANY_V4)
+        retXnack = getEFlags(f) & EF_AMDGPU_FEATURE_XNACK_V4;
+    }
+
+    if (retSramEcc == EF_AMDGPU_FEATURE_SRAMECC_UNSUPPORTED_V4 ||
+        (retSramEcc != EF_AMDGPU_FEATURE_SRAMECC_ANY_V4 &&
+         (getEFlags(f) & EF_AMDGPU_FEATURE_SRAMECC_V4) !=
+             EF_AMDGPU_FEATURE_SRAMECC_ANY_V4)) {
+      if (retSramEcc != (getEFlags(f) & EF_AMDGPU_FEATURE_SRAMECC_V4)) {
+        error("incompatible sramecc: " + toString(f));
+        return 0;
+      }
+    } else {
+      if (retSramEcc == EF_AMDGPU_FEATURE_SRAMECC_ANY_V4)
+        retSramEcc = getEFlags(f) & EF_AMDGPU_FEATURE_SRAMECC_V4;
+    }
+  }
+
+  return retMach | retXnack | retSramEcc;
+}
+
+uint32_t AMDGPU::calcEFlags() const {
+  assert(!objectFiles.empty());
+
+  uint8_t abiVersion = cast<ObjFile<ELF64LE>>(objectFiles[0])->getObj()
+      .getHeader().e_ident[EI_ABIVERSION];
+  switch (abiVersion) {
+  case ELFABIVERSION_AMDGPU_HSA_V2:
+  case ELFABIVERSION_AMDGPU_HSA_V3:
+    return calcEFlagsV3();
+  case ELFABIVERSION_AMDGPU_HSA_V4:
+    return calcEFlagsV4();
+  default:
+    error("unknown abi version: " + Twine(static_cast<unsigned>(abiVersion)));
+    return 0;
+  }
+}
+
 void AMDGPU::relocate(uint8_t *loc, const Relocation &rel, uint64_t val) const {
   switch (rel.type) {
   case R_AMDGPU_ABS32:
@@ -75,6 +139,12 @@ void AMDGPU::relocate(uint8_t *loc, const Relocation &rel, uint64_t val) const {
   case R_AMDGPU_REL32_HI:
     write32le(loc, val >> 32);
     break;
+  case R_AMDGPU_REL16: {
+    int64_t simm = (static_cast<int64_t>(val) - 4) / 4;
+    checkInt(loc, simm, 16, rel);
+    write16le(loc, simm);
+    break;
+  }
   default:
     llvm_unreachable("unknown relocation");
   }
@@ -90,6 +160,7 @@ RelExpr AMDGPU::getRelExpr(RelType type, const Symbol &s,
   case R_AMDGPU_REL32_LO:
   case R_AMDGPU_REL32_HI:
   case R_AMDGPU_REL64:
+  case R_AMDGPU_REL16:
     return R_PC;
   case R_AMDGPU_GOTPCREL:
   case R_AMDGPU_GOTPCREL32_LO: