|
| 1 | +//===---- ObjectUtilities.cpp - AMDGPU ELF utilities -------------- C++ -*-===// |
| 2 | +// |
| 3 | +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | +// See https://llvm.org/LICENSE.txt for license information. |
| 5 | +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | +// |
| 7 | +//===----------------------------------------------------------------------===// |
| 8 | +// |
| 9 | +// This file defines AMDGPU ELF related utilities. |
| 10 | +// |
| 11 | +//===----------------------------------------------------------------------===// |
| 12 | + |
| 13 | +#include "llvm/Frontend/Offloading/AMDGPU/ObjectUtilities.h" |
| 14 | + |
| 15 | +#include "llvm/BinaryFormat/AMDGPUMetadataVerifier.h" |
| 16 | +#include "llvm/BinaryFormat/ELF.h" |
| 17 | +#include "llvm/BinaryFormat/MsgPackDocument.h" |
| 18 | +#include "llvm/Object/ELFObjectFile.h" |
| 19 | +#include "llvm/Support/MemoryBufferRef.h" |
| 20 | +#include "llvm/Support/YAMLTraits.h" |
| 21 | + |
| 22 | +using namespace llvm; |
| 23 | +using namespace llvm::ELF; |
| 24 | +using namespace llvm::offloading::amdgpu; |
| 25 | + |
| 26 | +bool llvm::offloading::amdgpu::isImageCompatibleWithEnv(StringRef ImageArch, |
| 27 | + uint32_t ImageFlags, |
| 28 | + StringRef EnvTargetID) { |
| 29 | + StringRef EnvArch = EnvTargetID.split(":").first; |
| 30 | + |
| 31 | + // Trivial check if the base processors match. |
| 32 | + if (EnvArch != ImageArch) |
| 33 | + return false; |
| 34 | + |
| 35 | + // Check if the image is requesting xnack on or off. |
| 36 | + switch (ImageFlags & EF_AMDGPU_FEATURE_XNACK_V4) { |
| 37 | + case EF_AMDGPU_FEATURE_XNACK_OFF_V4: |
| 38 | + // The image is 'xnack-' so the environment must be 'xnack-'. |
| 39 | + if (!EnvTargetID.contains("xnack-")) |
| 40 | + return false; |
| 41 | + break; |
| 42 | + case EF_AMDGPU_FEATURE_XNACK_ON_V4: |
| 43 | + // The image is 'xnack+' so the environment must be 'xnack+'. |
| 44 | + if (!EnvTargetID.contains("xnack+")) |
| 45 | + return false; |
| 46 | + break; |
| 47 | + case EF_AMDGPU_FEATURE_XNACK_UNSUPPORTED_V4: |
| 48 | + case EF_AMDGPU_FEATURE_XNACK_ANY_V4: |
| 49 | + default: |
| 50 | + break; |
| 51 | + } |
| 52 | + |
| 53 | + // Check if the image is requesting sramecc on or off. |
| 54 | + switch (ImageFlags & EF_AMDGPU_FEATURE_SRAMECC_V4) { |
| 55 | + case EF_AMDGPU_FEATURE_SRAMECC_OFF_V4: |
| 56 | + // The image is 'sramecc-' so the environment must be 'sramecc-'. |
| 57 | + if (!EnvTargetID.contains("sramecc-")) |
| 58 | + return false; |
| 59 | + break; |
| 60 | + case EF_AMDGPU_FEATURE_SRAMECC_ON_V4: |
| 61 | + // The image is 'sramecc+' so the environment must be 'sramecc+'. |
| 62 | + if (!EnvTargetID.contains("sramecc+")) |
| 63 | + return false; |
| 64 | + break; |
| 65 | + case EF_AMDGPU_FEATURE_SRAMECC_UNSUPPORTED_V4: |
| 66 | + case EF_AMDGPU_FEATURE_SRAMECC_ANY_V4: |
| 67 | + break; |
| 68 | + } |
| 69 | + |
| 70 | + return true; |
| 71 | +} |
| 72 | + |
| 73 | +namespace { |
| 74 | +/// Reads the AMDGPU specific per-kernel-metadata from an image. |
| 75 | +class KernelInfoReader { |
| 76 | +public: |
| 77 | + KernelInfoReader(StringMap<offloading::amdgpu::AMDGPUKernelMetaData> &KIM) |
| 78 | + : KernelInfoMap(KIM) {} |
| 79 | + |
| 80 | + /// Process ELF note to read AMDGPU metadata from respective information |
| 81 | + /// fields. |
| 82 | + Error processNote(const llvm::object::ELF64LE::Note &Note, size_t Align) { |
| 83 | + if (Note.getName() != "AMDGPU") |
| 84 | + return Error::success(); // We are not interested in other things |
| 85 | + |
| 86 | + assert(Note.getType() == ELF::NT_AMDGPU_METADATA && |
| 87 | + "Parse AMDGPU MetaData"); |
| 88 | + auto Desc = Note.getDesc(Align); |
| 89 | + StringRef MsgPackString = |
| 90 | + StringRef(reinterpret_cast<const char *>(Desc.data()), Desc.size()); |
| 91 | + msgpack::Document MsgPackDoc; |
| 92 | + if (!MsgPackDoc.readFromBlob(MsgPackString, /*Multi=*/false)) |
| 93 | + return Error::success(); |
| 94 | + |
| 95 | + AMDGPU::HSAMD::V3::MetadataVerifier Verifier(true); |
| 96 | + if (!Verifier.verify(MsgPackDoc.getRoot())) |
| 97 | + return Error::success(); |
| 98 | + |
| 99 | + auto RootMap = MsgPackDoc.getRoot().getMap(true); |
| 100 | + |
| 101 | + if (auto Err = iterateAMDKernels(RootMap)) |
| 102 | + return Err; |
| 103 | + |
| 104 | + return Error::success(); |
| 105 | + } |
| 106 | + |
| 107 | +private: |
| 108 | + /// Extracts the relevant information via simple string look-up in the msgpack |
| 109 | + /// document elements. |
| 110 | + Error |
| 111 | + extractKernelData(msgpack::MapDocNode::MapTy::value_type V, |
| 112 | + std::string &KernelName, |
| 113 | + offloading::amdgpu::AMDGPUKernelMetaData &KernelData) { |
| 114 | + if (!V.first.isString()) |
| 115 | + return Error::success(); |
| 116 | + |
| 117 | + const auto IsKey = [](const msgpack::DocNode &DK, StringRef SK) { |
| 118 | + return DK.getString() == SK; |
| 119 | + }; |
| 120 | + |
| 121 | + const auto GetSequenceOfThreeInts = [](msgpack::DocNode &DN, |
| 122 | + uint32_t *Vals) { |
| 123 | + assert(DN.isArray() && "MsgPack DocNode is an array node"); |
| 124 | + auto DNA = DN.getArray(); |
| 125 | + assert(DNA.size() == 3 && "ArrayNode has at most three elements"); |
| 126 | + |
| 127 | + int I = 0; |
| 128 | + for (auto DNABegin = DNA.begin(), DNAEnd = DNA.end(); DNABegin != DNAEnd; |
| 129 | + ++DNABegin) { |
| 130 | + Vals[I++] = DNABegin->getUInt(); |
| 131 | + } |
| 132 | + }; |
| 133 | + |
| 134 | + if (IsKey(V.first, ".name")) { |
| 135 | + KernelName = V.second.toString(); |
| 136 | + } else if (IsKey(V.first, ".sgpr_count")) { |
| 137 | + KernelData.SGPRCount = V.second.getUInt(); |
| 138 | + } else if (IsKey(V.first, ".sgpr_spill_count")) { |
| 139 | + KernelData.SGPRSpillCount = V.second.getUInt(); |
| 140 | + } else if (IsKey(V.first, ".vgpr_count")) { |
| 141 | + KernelData.VGPRCount = V.second.getUInt(); |
| 142 | + } else if (IsKey(V.first, ".vgpr_spill_count")) { |
| 143 | + KernelData.VGPRSpillCount = V.second.getUInt(); |
| 144 | + } else if (IsKey(V.first, ".agpr_count")) { |
| 145 | + KernelData.AGPRCount = V.second.getUInt(); |
| 146 | + } else if (IsKey(V.first, ".private_segment_fixed_size")) { |
| 147 | + KernelData.PrivateSegmentSize = V.second.getUInt(); |
| 148 | + } else if (IsKey(V.first, ".group_segment_fixed_size")) { |
| 149 | + KernelData.GroupSegmentList = V.second.getUInt(); |
| 150 | + } else if (IsKey(V.first, ".reqd_workgroup_size")) { |
| 151 | + GetSequenceOfThreeInts(V.second, KernelData.RequestedWorkgroupSize); |
| 152 | + } else if (IsKey(V.first, ".workgroup_size_hint")) { |
| 153 | + GetSequenceOfThreeInts(V.second, KernelData.WorkgroupSizeHint); |
| 154 | + } else if (IsKey(V.first, ".wavefront_size")) { |
| 155 | + KernelData.WavefrontSize = V.second.getUInt(); |
| 156 | + } else if (IsKey(V.first, ".max_flat_workgroup_size")) { |
| 157 | + KernelData.MaxFlatWorkgroupSize = V.second.getUInt(); |
| 158 | + } |
| 159 | + |
| 160 | + return Error::success(); |
| 161 | + } |
| 162 | + |
| 163 | + /// Get the "amdhsa.kernels" element from the msgpack Document |
| 164 | + Expected<msgpack::ArrayDocNode> getAMDKernelsArray(msgpack::MapDocNode &MDN) { |
| 165 | + auto Res = MDN.find("amdhsa.kernels"); |
| 166 | + if (Res == MDN.end()) |
| 167 | + return createStringError(inconvertibleErrorCode(), |
| 168 | + "Could not find amdhsa.kernels key"); |
| 169 | + |
| 170 | + auto Pair = *Res; |
| 171 | + assert(Pair.second.isArray() && |
| 172 | + "AMDGPU kernel entries are arrays of entries"); |
| 173 | + |
| 174 | + return Pair.second.getArray(); |
| 175 | + } |
| 176 | + |
| 177 | + /// Iterate all entries for one "amdhsa.kernels" entry. Each entry is a |
| 178 | + /// MapDocNode that either maps a string to a single value (most of them) or |
| 179 | + /// to another array of things. Currently, we only handle the case that maps |
| 180 | + /// to scalar value. |
| 181 | + Error generateKernelInfo(msgpack::ArrayDocNode::ArrayTy::iterator It) { |
| 182 | + offloading::amdgpu::AMDGPUKernelMetaData KernelData; |
| 183 | + std::string KernelName; |
| 184 | + auto Entry = (*It).getMap(); |
| 185 | + for (auto MI = Entry.begin(), E = Entry.end(); MI != E; ++MI) |
| 186 | + if (auto Err = extractKernelData(*MI, KernelName, KernelData)) |
| 187 | + return Err; |
| 188 | + |
| 189 | + KernelInfoMap.insert({KernelName, KernelData}); |
| 190 | + return Error::success(); |
| 191 | + } |
| 192 | + |
| 193 | + /// Go over the list of AMD kernels in the "amdhsa.kernels" entry |
| 194 | + Error iterateAMDKernels(msgpack::MapDocNode &MDN) { |
| 195 | + auto KernelsOrErr = getAMDKernelsArray(MDN); |
| 196 | + if (auto Err = KernelsOrErr.takeError()) |
| 197 | + return Err; |
| 198 | + |
| 199 | + auto KernelsArr = *KernelsOrErr; |
| 200 | + for (auto It = KernelsArr.begin(), E = KernelsArr.end(); It != E; ++It) { |
| 201 | + if (!It->isMap()) |
| 202 | + continue; // we expect <key,value> pairs |
| 203 | + |
| 204 | + // Obtain the value for the different entries. Each array entry is a |
| 205 | + // MapDocNode |
| 206 | + if (auto Err = generateKernelInfo(It)) |
| 207 | + return Err; |
| 208 | + } |
| 209 | + return Error::success(); |
| 210 | + } |
| 211 | + |
| 212 | + // Kernel names are the keys |
| 213 | + StringMap<offloading::amdgpu::AMDGPUKernelMetaData> &KernelInfoMap; |
| 214 | +}; |
| 215 | +} // namespace |
| 216 | + |
| 217 | +Error llvm::offloading::amdgpu::getAMDGPUMetaDataFromImage( |
| 218 | + MemoryBufferRef MemBuffer, |
| 219 | + StringMap<offloading::amdgpu::AMDGPUKernelMetaData> &KernelInfoMap, |
| 220 | + uint16_t &ELFABIVersion) { |
| 221 | + Error Err = Error::success(); // Used later as out-parameter |
| 222 | + |
| 223 | + auto ELFOrError = object::ELF64LEFile::create(MemBuffer.getBuffer()); |
| 224 | + if (auto Err = ELFOrError.takeError()) |
| 225 | + return Err; |
| 226 | + |
| 227 | + const object::ELF64LEFile ELFObj = ELFOrError.get(); |
| 228 | + Expected<ArrayRef<object::ELF64LE::Shdr>> Sections = ELFObj.sections(); |
| 229 | + if (!Sections) |
| 230 | + return Sections.takeError(); |
| 231 | + KernelInfoReader Reader(KernelInfoMap); |
| 232 | + |
| 233 | + // Read the code object version from ELF image header |
| 234 | + auto Header = ELFObj.getHeader(); |
| 235 | + ELFABIVersion = (uint8_t)(Header.e_ident[ELF::EI_ABIVERSION]); |
| 236 | + for (const auto &S : *Sections) { |
| 237 | + if (S.sh_type != ELF::SHT_NOTE) |
| 238 | + continue; |
| 239 | + |
| 240 | + for (const auto N : ELFObj.notes(S, Err)) { |
| 241 | + if (Err) |
| 242 | + return Err; |
| 243 | + // Fills the KernelInfoTabel entries in the reader |
| 244 | + if ((Err = Reader.processNote(N, S.sh_addralign))) |
| 245 | + return Err; |
| 246 | + } |
| 247 | + } |
| 248 | + return Error::success(); |
| 249 | +} |
0 commit comments