Skip to content

Commit a9b542a

Browse files
committed
[lldb] Parse and display register field enums
This teaches lldb to parse the enum XML elements sent by lldb-server, and to make use of that information in `register read` and `register info`. The format is described in https://sourceware.org/gdb/current/onlinedocs/gdb.html/Enum-Target-Types.html. The target XML parser drops any invalid enum or evalue. If we find multiple evalues for the same value, we use the last one we find. The order of evalues from the XML is preserved, as there may be a good reason they are not in numerical order.
1 parent 79e668f commit a9b542a

File tree

8 files changed

+573
-22
lines changed

8 files changed

+573
-22
lines changed

lldb/include/lldb/Target/RegisterFlags.h

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -32,10 +32,15 @@ class FieldEnum {
3232
: m_value(value), m_name(std::move(name)) {}
3333

3434
void ToXML(Stream &strm) const;
35+
36+
void log(Log *log) const;
3537
};
3638

3739
typedef std::vector<Enumerator> Enumerators;
3840

41+
// GDB also includes a "size" that is the size of the underlying register.
42+
// We will not store that here but instead use the size of the register
43+
// this gets attached to when emitting XML.
3944
FieldEnum(std::string id, const Enumerators &enumerators);
4045

4146
const Enumerators &GetEnumerators() const { return m_enumerators; }
@@ -44,6 +49,8 @@ class FieldEnum {
4449

4550
void ToXML(Stream &strm, unsigned size) const;
4651

52+
void log(Log *log) const;
53+
4754
private:
4855
std::string m_id;
4956
Enumerators m_enumerators;

lldb/source/Core/DumpRegisterInfo.cpp

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -111,6 +111,11 @@ void lldb_private::DoDumpRegisterInfo(
111111
};
112112
DumpList(strm, " In sets: ", in_sets, emit_set);
113113

114-
if (flags_type)
114+
if (flags_type) {
115115
strm.Printf("\n\n%s", flags_type->AsTable(terminal_width).c_str());
116+
117+
std::string enumerators = flags_type->DumpEnums(terminal_width);
118+
if (enumerators.size())
119+
strm << "\n\n" << enumerators;
120+
}
116121
}

lldb/source/Plugins/Process/gdb-remote/ProcessGDBRemote.cpp

Lines changed: 170 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -4179,21 +4179,124 @@ struct GdbServerTargetInfo {
41794179
RegisterSetMap reg_set_map;
41804180
};
41814181

4182-
static std::vector<RegisterFlags::Field> ParseFlagsFields(XMLNode flags_node,
4183-
unsigned size) {
4182+
/// Parse the <evalue> children of an <enum> element from the target XML.
///
/// An <evalue> is kept only if it has a non-empty "name" attribute and a
/// "value" attribute that parses as an unsigned 64 bit integer. Anything else
/// is logged and dropped.
///
/// \param enum_node The <enum> element whose <evalue> children are walked.
///
/// \return The accepted enumerators in the order they were declared in the
///   XML. If a value is declared more than once only the last declaration is
///   kept. Empty if no valid <evalue> was found.
static FieldEnum::Enumerators ParseEnumEvalues(const XMLNode &enum_node) {
  Log *log(GetLog(GDBRLog::Process));

  // We use the last instance of each value and preserve the order of
  // declaration in the XML, as it may not be numerical. A container keyed on
  // the value would silently re-sort the enumerators, so the accepted
  // (value, name) pairs are kept in a plain list instead.
  std::vector<std::pair<uint64_t, std::string>> declared;

  enum_node.ForEachChildElementWithName(
      "evalue", [&declared, log](const XMLNode &enumerator_node) {
        std::optional<llvm::StringRef> name;
        std::optional<uint64_t> value;

        enumerator_node.ForEachAttribute(
            [&name, &value, log](const llvm::StringRef &attr_name,
                                 const llvm::StringRef &attr_value) {
              // The StringRefs are logged directly rather than via data(),
              // which is not guaranteed to be null terminated.
              if (attr_name == "name") {
                if (attr_value.size())
                  name = attr_value;
                else
                  LLDB_LOG(log, "ProcessGDBRemote::ParseEnumEvalues "
                                "Ignoring empty name in evalue");
              } else if (attr_name == "value") {
                uint64_t parsed_value = 0;
                if (llvm::to_integer(attr_value, parsed_value))
                  value = parsed_value;
                else
                  LLDB_LOG(log,
                           "ProcessGDBRemote::ParseEnumEvalues "
                           "Invalid value \"{0}\" in "
                           "evalue",
                           attr_value);
              } else
                LLDB_LOG(log,
                         "ProcessGDBRemote::ParseEnumEvalues Ignoring "
                         "unknown attribute "
                         "\"{0}\" in evalue",
                         attr_name);

              // Keep walking attributes.
              return true;
            });

        if (value && name) {
          // A later declaration replaces an earlier one for the same value.
          // The earlier entry is removed so that the survivor sits where the
          // last declaration appeared. Enums are small, a linear scan is fine.
          for (auto it = declared.begin(); it != declared.end(); ++it) {
            if (it->first == *value) {
              declared.erase(it);
              break;
            }
          }
          declared.emplace_back(*value, name->str());
        }

        // Find all evalue elements.
        return true;
      });

  FieldEnum::Enumerators final_enumerators;
  final_enumerators.reserve(declared.size());
  for (auto &[enumerator_value, enumerator_name] : declared)
    final_enumerators.push_back(
        FieldEnum::Enumerator(enumerator_value, std::move(enumerator_name)));

  return final_enumerators;
}
4237+
4238+
static void
4239+
ParseEnums(XMLNode feature_node,
4240+
llvm::StringMap<std::unique_ptr<FieldEnum>> &registers_enum_types) {
4241+
Log *log(GetLog(GDBRLog::Process));
4242+
4243+
// The top level element is "<enum...".
4244+
feature_node.ForEachChildElementWithName(
4245+
"enum", [log, &registers_enum_types](const XMLNode &enum_node) {
4246+
std::string id;
4247+
4248+
enum_node.ForEachAttribute([&id](const llvm::StringRef &attr_name,
4249+
const llvm::StringRef &attr_value) {
4250+
if (attr_name == "id")
4251+
id = attr_value;
4252+
4253+
// There is also a "size" attribute that is supposed to be the size in
4254+
// bytes of the register this applies to. However:
4255+
// * LLDB doesn't need this information.
4256+
// * It is difficult to verify because you have to wait until the
4257+
// enum is applied to a field.
4258+
//
4259+
// So we will emit this attribute in XML for GDB's sake, but will not
4260+
// bother ingesting it.
4261+
4262+
// Walk all attributes.
4263+
return true;
4264+
});
4265+
4266+
if (!id.empty()) {
4267+
FieldEnum::Enumerators enumerators = ParseEnumEvalues(enum_node);
4268+
if (!enumerators.empty()) {
4269+
LLDB_LOG(log,
4270+
"ProcessGDBRemote::ParseEnums Found enum type \"{0}\"",
4271+
id);
4272+
registers_enum_types.insert_or_assign(
4273+
id, std::make_unique<FieldEnum>(id, enumerators));
4274+
}
4275+
}
4276+
4277+
// Find all <enum> elements.
4278+
return true;
4279+
});
4280+
}
4281+
4282+
static std::vector<RegisterFlags::Field> ParseFlagsFields(
4283+
XMLNode flags_node, unsigned size,
4284+
const llvm::StringMap<std::unique_ptr<FieldEnum>> &registers_enum_types) {
41844285
Log *log(GetLog(GDBRLog::Process));
41854286
const unsigned max_start_bit = size * 8 - 1;
41864287

41874288
// Process the fields of this set of flags.
41884289
std::vector<RegisterFlags::Field> fields;
4189-
flags_node.ForEachChildElementWithName("field", [&fields, max_start_bit,
4190-
&log](const XMLNode
4191-
&field_node) {
4290+
flags_node.ForEachChildElementWithName("field", [&fields, max_start_bit, &log,
4291+
&registers_enum_types](
4292+
const XMLNode
4293+
&field_node) {
41924294
std::optional<llvm::StringRef> name;
41934295
std::optional<unsigned> start;
41944296
std::optional<unsigned> end;
4297+
std::optional<llvm::StringRef> type;
41954298

4196-
field_node.ForEachAttribute([&name, &start, &end, max_start_bit,
4299+
field_node.ForEachAttribute([&name, &start, &end, &type, max_start_bit,
41974300
&log](const llvm::StringRef &attr_name,
41984301
const llvm::StringRef &attr_value) {
41994302
// Note that XML in general requires that each of these attributes only
@@ -4240,8 +4343,7 @@ static std::vector<RegisterFlags::Field> ParseFlagsFields(XMLNode flags_node,
42404343
attr_value.data());
42414344
}
42424345
} else if (attr_name == "type") {
4243-
// Type is a known attribute but we do not currently use it and it is
4244-
// not required.
4346+
type = attr_value;
42454347
} else {
42464348
LLDB_LOG(
42474349
log,
@@ -4254,14 +4356,55 @@ static std::vector<RegisterFlags::Field> ParseFlagsFields(XMLNode flags_node,
42544356
});
42554357

42564358
if (name && start && end) {
4257-
if (*start > *end) {
4359+
if (*start > *end)
42584360
LLDB_LOG(
42594361
log,
42604362
"ProcessGDBRemote::ParseFlagsFields Start {0} > end {1} in field "
42614363
"\"{2}\", ignoring",
42624364
*start, *end, name->data());
4263-
} else {
4264-
fields.push_back(RegisterFlags::Field(name->str(), *start, *end));
4365+
else {
4366+
if (RegisterFlags::Field::GetSizeInBits(*start, *end) > 64)
4367+
LLDB_LOG(log,
4368+
"ProcessGDBRemote::ParseFlagsFields Ignoring field \"{2}\" "
4369+
"that has "
4370+
" size > 64 bits, this is not supported",
4371+
name->data());
4372+
else {
4373+
// A field's type may be set to the name of an enum type.
4374+
const FieldEnum *enum_type = nullptr;
4375+
if (type && !type->empty()) {
4376+
auto found = registers_enum_types.find(*type);
4377+
if (found != registers_enum_types.end()) {
4378+
enum_type = found->second.get();
4379+
4380+
// No enumerator can exceed the range of the field itself.
4381+
uint64_t max_value =
4382+
RegisterFlags::Field::GetMaxValue(*start, *end);
4383+
for (const auto &enumerator : enum_type->GetEnumerators()) {
4384+
if (enumerator.m_value > max_value) {
4385+
enum_type = nullptr;
4386+
LLDB_LOG(
4387+
log,
4388+
"ProcessGDBRemote::ParseFlagsFields In enum \"{0}\" "
4389+
"evalue \"{1}\" with value {2} exceeds the maximum value "
4390+
"of field \"{3}\" ({4}), ignoring enum",
4391+
type->data(), enumerator.m_name, enumerator.m_value,
4392+
name->data(), max_value);
4393+
break;
4394+
}
4395+
}
4396+
} else {
4397+
LLDB_LOG(log,
4398+
"ProcessGDBRemote::ParseFlagsFields Could not find type "
4399+
"\"{0}\" "
4400+
"for field \"{1}\", ignoring",
4401+
type->data(), name->data());
4402+
}
4403+
}
4404+
4405+
fields.push_back(
4406+
RegisterFlags::Field(name->str(), *start, *end, enum_type));
4407+
}
42654408
}
42664409
}
42674410

@@ -4272,12 +4415,14 @@ static std::vector<RegisterFlags::Field> ParseFlagsFields(XMLNode flags_node,
42724415

42734416
void ParseFlags(
42744417
XMLNode feature_node,
4275-
llvm::StringMap<std::unique_ptr<RegisterFlags>> &registers_flags_types) {
4418+
llvm::StringMap<std::unique_ptr<RegisterFlags>> &registers_flags_types,
4419+
const llvm::StringMap<std::unique_ptr<FieldEnum>> &registers_enum_types) {
42764420
Log *log(GetLog(GDBRLog::Process));
42774421

42784422
feature_node.ForEachChildElementWithName(
42794423
"flags",
4280-
[&log, &registers_flags_types](const XMLNode &flags_node) -> bool {
4424+
[&log, &registers_flags_types,
4425+
&registers_enum_types](const XMLNode &flags_node) -> bool {
42814426
LLDB_LOG(log, "ProcessGDBRemote::ParseFlags Found flags node \"{0}\"",
42824427
flags_node.GetAttributeValue("id").c_str());
42834428

@@ -4310,7 +4455,7 @@ void ParseFlags(
43104455
if (id && size) {
43114456
// Process the fields of this set of flags.
43124457
std::vector<RegisterFlags::Field> fields =
4313-
ParseFlagsFields(flags_node, *size);
4458+
ParseFlagsFields(flags_node, *size, registers_enum_types);
43144459
if (fields.size()) {
43154460
// Sort so that the fields with the MSBs are first.
43164461
std::sort(fields.rbegin(), fields.rend());
@@ -4375,13 +4520,19 @@ void ParseFlags(
43754520
bool ParseRegisters(
43764521
XMLNode feature_node, GdbServerTargetInfo &target_info,
43774522
std::vector<DynamicRegisterInfo::Register> &registers,
4378-
llvm::StringMap<std::unique_ptr<RegisterFlags>> &registers_flags_types) {
4523+
llvm::StringMap<std::unique_ptr<RegisterFlags>> &registers_flags_types,
4524+
llvm::StringMap<std::unique_ptr<FieldEnum>> &registers_enum_types) {
43794525
if (!feature_node)
43804526
return false;
43814527

43824528
Log *log(GetLog(GDBRLog::Process));
43834529

4384-
ParseFlags(feature_node, registers_flags_types);
4530+
// Enums first because they are referenced by fields in the flags.
4531+
ParseEnums(feature_node, registers_enum_types);
4532+
for (const auto &enum_type : registers_enum_types)
4533+
enum_type.second->log(log);
4534+
4535+
ParseFlags(feature_node, registers_flags_types, registers_enum_types);
43854536
for (const auto &flags : registers_flags_types)
43864537
flags.second->log(log);
43874538

@@ -4643,7 +4794,7 @@ bool ProcessGDBRemote::GetGDBServerRegisterInfoXMLAndProcess(
46434794
if (arch_to_use.IsValid()) {
46444795
for (auto &feature_node : feature_nodes) {
46454796
ParseRegisters(feature_node, target_info, registers,
4646-
m_registers_flags_types);
4797+
m_registers_flags_types, m_registers_enum_types);
46474798
}
46484799

46494800
for (const auto &include : target_info.includes) {
@@ -4708,13 +4859,14 @@ bool ProcessGDBRemote::GetGDBServerRegisterInfo(ArchSpec &arch_to_use) {
47084859
if (!m_gdb_comm.GetQXferFeaturesReadSupported())
47094860
return false;
47104861

4711-
// This holds register flags information for the whole of target.xml.
4862+
// These hold register type information for the whole of target.xml.
47124863
// target.xml may include further documents that
47134864
// GetGDBServerRegisterInfoXMLAndProcess will recurse to fetch and process.
47144865
// That's why we clear the cache here, and not in
47154866
// GetGDBServerRegisterInfoXMLAndProcess. To prevent it being cleared on every
47164867
// include read.
47174868
m_registers_flags_types.clear();
4869+
m_registers_enum_types.clear();
47184870
std::vector<DynamicRegisterInfo::Register> registers;
47194871
if (GetGDBServerRegisterInfoXMLAndProcess(arch_to_use, "target.xml",
47204872
registers))

lldb/source/Plugins/Process/gdb-remote/ProcessGDBRemote.h

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -484,6 +484,11 @@ class ProcessGDBRemote : public Process,
484484
// entries are added. Which would invalidate any pointers set in the register
485485
// info up to that point.
486486
llvm::StringMap<std::unique_ptr<RegisterFlags>> m_registers_flags_types;
487+
488+
// Enum types are referenced by register fields. This does not store the data
489+
// directly because the map may reallocate. Pointers to these are contained
490+
// within instances of RegisterFlags.
491+
llvm::StringMap<std::unique_ptr<FieldEnum>> m_registers_enum_types;
487492
};
488493

489494
} // namespace process_gdb_remote

lldb/source/Plugins/RegisterTypeBuilder/RegisterTypeBuilderClang.cpp

Lines changed: 27 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -43,8 +43,7 @@ CompilerType RegisterTypeBuilderClang::GetRegisterType(
4343
ScratchTypeSystemClang::GetForTarget(m_target);
4444
assert(type_system);
4545

46-
std::string register_type_name = "__lldb_register_fields_";
47-
register_type_name += name;
46+
std::string register_type_name = "__lldb_register_fields_" + name;
4847
// See if we have made this type before and can reuse it.
4948
CompilerType fields_type =
5049
type_system->GetTypeForIdentifier<clang::CXXRecordDecl>(
@@ -67,8 +66,33 @@ CompilerType RegisterTypeBuilderClang::GetRegisterType(
6766
// We assume that RegisterFlags has padded and sorted the fields
6867
// already.
6968
for (const RegisterFlags::Field &field : flags.GetFields()) {
69+
CompilerType field_type = field_uint_type;
70+
71+
if (const FieldEnum *enum_type = field.GetEnum()) {
72+
const FieldEnum::Enumerators &enumerators = enum_type->GetEnumerators();
73+
74+
if (enumerators.empty())
75+
continue;
76+
77+
std::string enum_type_name =
78+
register_type_name + "_" + field.GetName() + "_enum";
79+
field_type = type_system->CreateEnumerationType(
80+
enum_type_name, type_system->GetTranslationUnitDecl(),
81+
OptionalClangModuleID(), Declaration(), field_uint_type, false);
82+
83+
type_system->StartTagDeclarationDefinition(field_type);
84+
85+
Declaration decl;
86+
for (auto enumerator : enumerators)
87+
type_system->AddEnumerationValueToEnumerationType(
88+
field_type, decl, enumerator.m_name.c_str(), enumerator.m_value,
89+
byte_size * 8);
90+
91+
type_system->CompleteTagDeclarationDefinition(field_type);
92+
}
93+
7094
type_system->AddFieldToRecordType(fields_type, field.GetName(),
71-
field_uint_type, lldb::eAccessPublic,
95+
field_type, lldb::eAccessPublic,
7296
field.GetSizeInBits());
7397
}
7498

lldb/source/Target/RegisterFlags.cpp

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -370,6 +370,16 @@ void FieldEnum::Enumerator::ToXML(Stream &strm) const {
370370
escaped_name.c_str(), m_value);
371371
}
372372

373+
/// Write this enumerator's name and value to \p log as a single message.
void FieldEnum::Enumerator::log(Log *log) const {
  LLDB_LOG(log, " Name: \"{0}\" Value: {1}", m_name, m_value);
}
376+
377+
/// Write this enum's id to \p log, followed by one message per enumerator in
/// stored order.
void FieldEnum::log(Log *log) const {
  LLDB_LOG(log, "ID: \"{0}\"", m_id.c_str());

  for (const Enumerator &entry : m_enumerators)
    entry.log(log);
}
382+
373383
void RegisterFlags::ToXML(Stream &strm) const {
374384
// Example XML:
375385
// <flags id="cpsr_flags" size="4">

0 commit comments

Comments
 (0)