From c7fdac09d919aaf86d302e6c622de6ee000c1b7c Mon Sep 17 00:00:00 2001 From: Alan Modra Date: Wed, 20 Oct 2021 09:12:48 +1030 Subject: [PATCH] Re: PR27625, powerpc64 gold __tls_get_addr calls My previous PR27625 patch had a problem or two. For one, the error "__tls_get_addr call lacks marker reloc" on processing some calls before hitting a call without markers typically isn't seen. Instead a gold assertion fails. Either way it would be a hard error, which triggers on a file contained in libphobos.a when running the gcc testsuite. A warning isn't even appropriate since the call involved is one built by hand without any of the arg setup relocations that might result in linker optimisation. So this patch reverts most of commit 0af4fcc25dd5, instead entirely ignoring the problem of mis-optimising old-style __tls_get_addr calls without marker relocs. We can't handle them gracefully without another pass over relocations before decisions are made about GOT entries in Scan::global or Scan::local. That seems too costly, just to link object files from 2009. What's more, there doesn't seem to be any way to allow the libphobos explicit __tls_get_addr call, but not old TLS sequences without marker relocs. Examining instructions before the __tls_get_addr call is out of the question: program flow might reach the call via a branch. Putting an R_PPC64_TLSGD marker with zero sym on the call might be a solution, but current linkers will then merrily optimise away the call! PR gold/27625 * powerpc.cc (Powerpc_relobj): Delete no_tls_marker_, tls_marker_, and tls_opt_error_ variables and accessors. Remove all uses. --- gold/powerpc.cc | 192 +++++++++--------------------------------------- 1 file changed, 36 insertions(+), 156 deletions(-) diff --git a/gold/powerpc.cc b/gold/powerpc.cc index 4266268d639..3a6d3c6f612 100644 --- a/gold/powerpc.cc +++ b/gold/powerpc.cc @@ -101,7 +101,6 @@ public: : Sized_relobj_file(name, input_file, offset, ehdr), uniq_(object_id++), special_(0), relatoc_(0), toc_(0), has_small_toc_reloc_(false), opd_valid_(false), - no_tls_marker_(false), tls_marker_(false), tls_opt_error_(false), e_flags_(ehdr.get_e_flags()), no_toc_opt_(), opd_ent_(), access_from_map_(), has14_(), stub_table_index_(), st_other_(), attributes_section_data_(NULL) @@ -162,30 +161,6 @@ public: return this->no_toc_opt_[off]; } - void - set_no_tls_marker() - { - if (!this->no_tls_marker_ && this->tls_marker_) - this->tls_opt_error_ = true; - this->no_tls_marker_ = true; - } - - bool - no_tls_marker() const - { return this->no_tls_marker_; } - - void - set_tls_marker() - { this->tls_marker_ = true; } - - bool - tls_marker() const - { return this->tls_marker_; } - - bool - tls_opt_error() const - { return this->tls_opt_error_; } - // The .got2 section shndx. unsigned int got2_shndx() const @@ -473,19 +448,6 @@ private: // access_from_map_. bool opd_valid_; - // Set when finding a __tls_get_addr call without marker relocs. - // Such a call disables GD and LD tls optimisations for the object file. - bool no_tls_marker_; - - // Set when finding a __tls_get_addr call with marker relocs, or - // when finding a relocation that needs __tls_get_addr calls with - // marker relocs. - bool tls_marker_; - - // Set when seeing a __tls_get_addr call without marker relocs after - // seeing some __tls_get_addr calls with marker relocs. - bool tls_opt_error_; - // Header e_flags elfcpp::Elf_Word e_flags_; @@ -7911,42 +7873,23 @@ Target_powerpc::Scan::local( Powerpc_relobj* ppc_object = static_cast*>(object); - switch (this->maybe_skip_tls_get_addr_call(target, r_type, NULL)) - { - case Track_tls::NOT_EXPECTED: - ppc_object->set_no_tls_marker(); - break; - default: - break; - } + this->maybe_skip_tls_get_addr_call(target, r_type, NULL); if ((size == 64 && r_type == elfcpp::R_PPC64_TLSGD) || (size == 32 && r_type == elfcpp::R_PPC_TLSGD)) { this->expect_tls_get_addr_call(); - if (!ppc_object->no_tls_marker()) - { - tls::Tls_optimization tls_type = target->optimize_tls_gd(true); - if (tls_type != tls::TLSOPT_NONE) - { - this->skip_next_tls_get_addr_call(); - ppc_object->set_tls_marker(); - } - } + tls::Tls_optimization tls_type = target->optimize_tls_gd(true); + if (tls_type != tls::TLSOPT_NONE) + this->skip_next_tls_get_addr_call(); } else if ((size == 64 && r_type == elfcpp::R_PPC64_TLSLD) || (size == 32 && r_type == elfcpp::R_PPC_TLSLD)) { this->expect_tls_get_addr_call(); - if (!ppc_object->no_tls_marker()) - { - tls::Tls_optimization tls_type = target->optimize_tls_ld(); - if (tls_type != tls::TLSOPT_NONE) - { - this->skip_next_tls_get_addr_call(); - ppc_object->set_tls_marker(); - } - } + tls::Tls_optimization tls_type = target->optimize_tls_ld(); + if (tls_type != tls::TLSOPT_NONE) + this->skip_next_tls_get_addr_call(); } if (is_discarded) @@ -8248,9 +8191,7 @@ Target_powerpc::Scan::local( case elfcpp::R_POWERPC_GOT_TLSGD16_HI: case elfcpp::R_POWERPC_GOT_TLSGD16_HA: { - tls::Tls_optimization tls_type = tls::TLSOPT_NONE; - if (!ppc_object->no_tls_marker()) - tls_type = target->optimize_tls_gd(true); + tls::Tls_optimization tls_type = target->optimize_tls_gd(true); if (tls_type == tls::TLSOPT_NONE) { Got_type got_type = ((size == 32 @@ -8268,7 +8209,6 @@ Target_powerpc::Scan::local( else if (tls_type == tls::TLSOPT_TO_LE) { // no GOT relocs needed for Local Exec. - ppc_object->set_tls_marker(); } else gold_unreachable(); @@ -8281,9 +8221,7 @@ Target_powerpc::Scan::local( case elfcpp::R_POWERPC_GOT_TLSLD16_HI: case elfcpp::R_POWERPC_GOT_TLSLD16_HA: { - tls::Tls_optimization tls_type = tls::TLSOPT_NONE; - if (!ppc_object->no_tls_marker()) - tls_type = target->optimize_tls_ld(); + tls::Tls_optimization tls_type = target->optimize_tls_ld(); if (tls_type == tls::TLSOPT_NONE) target->tlsld_got_offset(symtab, layout, object); else if (tls_type == tls::TLSOPT_TO_LE) @@ -8295,7 +8233,6 @@ Target_powerpc::Scan::local( gold_assert(os != NULL); os->set_needs_symtab_index(); } - ppc_object->set_tls_marker(); } else gold_unreachable(); @@ -8638,9 +8575,6 @@ Target_powerpc::Scan::global( switch (this->maybe_skip_tls_get_addr_call(target, r_type, gsym)) { - case Track_tls::NOT_EXPECTED: - ppc_object->set_no_tls_marker(); - break; case Track_tls::SKIP: return; default: @@ -8656,30 +8590,18 @@ Target_powerpc::Scan::global( || (size == 32 && r_type == elfcpp::R_PPC_TLSGD)) { this->expect_tls_get_addr_call(); - if (!ppc_object->no_tls_marker()) - { - bool final = gsym->final_value_is_known(); - tls::Tls_optimization tls_type = target->optimize_tls_gd(final); - if (tls_type != tls::TLSOPT_NONE) - { - this->skip_next_tls_get_addr_call(); - ppc_object->set_tls_marker(); - } - } + bool final = gsym->final_value_is_known(); + tls::Tls_optimization tls_type = target->optimize_tls_gd(final); + if (tls_type != tls::TLSOPT_NONE) + this->skip_next_tls_get_addr_call(); } else if ((size == 64 && r_type == elfcpp::R_PPC64_TLSLD) || (size == 32 && r_type == elfcpp::R_PPC_TLSLD)) { this->expect_tls_get_addr_call(); - if (!ppc_object->no_tls_marker()) - { - tls::Tls_optimization tls_type = target->optimize_tls_ld(); - if (tls_type != tls::TLSOPT_NONE) - { - this->skip_next_tls_get_addr_call(); - ppc_object->set_tls_marker(); - } - } + tls::Tls_optimization tls_type = target->optimize_tls_ld(); + if (tls_type != tls::TLSOPT_NONE) + this->skip_next_tls_get_addr_call(); } // A STT_GNU_IFUNC symbol may require a PLT entry. @@ -9061,12 +8983,8 @@ Target_powerpc::Scan::global( case elfcpp::R_POWERPC_GOT_TLSGD16_HI: case elfcpp::R_POWERPC_GOT_TLSGD16_HA: { - tls::Tls_optimization tls_type = tls::TLSOPT_NONE; - if (!ppc_object->no_tls_marker()) - { - bool final = gsym->final_value_is_known(); - tls_type = target->optimize_tls_gd(final); - } + bool final = gsym->final_value_is_known(); + tls::Tls_optimization tls_type = target->optimize_tls_gd(final); if (tls_type == tls::TLSOPT_NONE) { Got_type got_type = ((size == 32 @@ -9107,12 +9025,10 @@ Target_powerpc::Scan::global( got, off, addend); } } - ppc_object->set_tls_marker(); } else if (tls_type == tls::TLSOPT_TO_LE) { // no GOT relocs needed for Local Exec. - ppc_object->set_tls_marker(); } else gold_unreachable(); @@ -9125,9 +9041,7 @@ Target_powerpc::Scan::global( case elfcpp::R_POWERPC_GOT_TLSLD16_HI: case elfcpp::R_POWERPC_GOT_TLSLD16_HA: { - tls::Tls_optimization tls_type = tls::TLSOPT_NONE; - if (!ppc_object->no_tls_marker()) - tls_type = target->optimize_tls_ld(); + tls::Tls_optimization tls_type = target->optimize_tls_ld(); if (tls_type == tls::TLSOPT_NONE) target->tlsld_got_offset(symtab, layout, object); else if (tls_type == tls::TLSOPT_TO_LE) @@ -9139,7 +9053,6 @@ Target_powerpc::Scan::global( gold_assert(os != NULL); os->set_needs_symtab_index(); } - ppc_object->set_tls_marker(); } else gold_unreachable(); @@ -10515,20 +10428,11 @@ Target_powerpc::Relocate::relocate( switch (this->maybe_skip_tls_get_addr_call(target, r_type, gsym)) { case Track_tls::NOT_EXPECTED: - if (!parameters->options().shared() - && parameters->options().tls_optimize()) - { - // It is a hard error to see a __tls_get_addr call without - // marker relocs after seeing calls with marker relocs in the - // same object file, because dynamic relocation accounting - // will be wrong. - if (object->tls_opt_error()) - gold_error_at_location(relinfo, relnum, rela.get_r_offset(), - _("__tls_get_addr call lacks marker reloc")); - else - gold_warning_at_location(relinfo, relnum, rela.get_r_offset(), - _("__tls_get_addr call lacks marker reloc")); - } + // No warning. This will result in really old code without tls + // marker relocs being mis-optimised, but there shouldn't be too + // much of that code around. The problem with warning is that + // glibc and libphobos both construct direct calls to + // __tls_get_addr in a way that is harmless. break; case Track_tls::EXPECTED: // We have already complained. @@ -10807,12 +10711,8 @@ Target_powerpc::Relocate::relocate( || r_type == elfcpp::R_PPC64_GOT_TLSGD_PCREL34) { // First instruction of a global dynamic sequence, arg setup insn. - tls::Tls_optimization tls_type = tls::TLSOPT_NONE; - if (!object->no_tls_marker()) - { - bool final = gsym == NULL || gsym->final_value_is_known(); - tls_type = target->optimize_tls_gd(final); - } + bool final = gsym == NULL || gsym->final_value_is_known(); + tls::Tls_optimization tls_type = target->optimize_tls_gd(final); Got_type got_type = ((size == 32 || r_type == elfcpp::R_POWERPC_GOT_TLSGD16) ? GOT_TYPE_SMALL : GOT_TYPE_STANDARD); @@ -10914,9 +10814,7 @@ Target_powerpc::Relocate::relocate( || r_type == elfcpp::R_PPC64_GOT_TLSLD_PCREL34) { // First instruction of a local dynamic sequence, arg setup insn. - tls::Tls_optimization tls_type = tls::TLSOPT_NONE; - if (!object->no_tls_marker()) - tls_type = target->optimize_tls_ld(); + tls::Tls_optimization tls_type = target->optimize_tls_ld(); if (tls_type == tls::TLSOPT_NONE) { value = target->tlsld_got_offset(); @@ -11057,12 +10955,8 @@ Target_powerpc::Relocate::relocate( // Second instruction of a global dynamic sequence, // the __tls_get_addr call this->expect_tls_get_addr_call(relinfo, relnum, rela.get_r_offset()); - tls::Tls_optimization tls_type = tls::TLSOPT_NONE; - if (!object->no_tls_marker()) - { - bool final = gsym == NULL || gsym->final_value_is_known(); - tls_type = target->optimize_tls_gd(final); - } + bool final = gsym == NULL || gsym->final_value_is_known(); + tls::Tls_optimization tls_type = target->optimize_tls_gd(final); if (tls_type != tls::TLSOPT_NONE) { if (tls_type == tls::TLSOPT_TO_IE) @@ -11113,9 +11007,7 @@ Target_powerpc::Relocate::relocate( // Second instruction of a local dynamic sequence, // the __tls_get_addr call this->expect_tls_get_addr_call(relinfo, relnum, rela.get_r_offset()); - tls::Tls_optimization tls_type = tls::TLSOPT_NONE; - if (!object->no_tls_marker()) - tls_type = target->optimize_tls_ld(); + tls::Tls_optimization tls_type = target->optimize_tls_ld(); if (tls_type == tls::TLSOPT_TO_LE) { bool is_pcrel = false; @@ -12605,12 +12497,8 @@ Target_powerpc::relocate_relocs( { // First instruction of a global dynamic sequence, // arg setup insn. - tls::Tls_optimization tls_type = tls::TLSOPT_NONE; - if (!object->no_tls_marker()) - { - bool final = gsym == NULL || gsym->final_value_is_known(); - tls_type = this->optimize_tls_gd(final); - } + bool final = gsym == NULL || gsym->final_value_is_known(); + tls::Tls_optimization tls_type = this->optimize_tls_gd(final); switch (tls_type) { case tls::TLSOPT_TO_IE: @@ -12638,9 +12526,7 @@ Target_powerpc::relocate_relocs( { // First instruction of a local dynamic sequence, // arg setup insn. - tls::Tls_optimization tls_type = tls::TLSOPT_NONE; - if (!object->no_tls_marker()) - tls_type = this->optimize_tls_ld(); + tls::Tls_optimization tls_type = this->optimize_tls_ld(); if (tls_type == tls::TLSOPT_TO_LE) { if (r_type == elfcpp::R_POWERPC_GOT_TLSLD16 @@ -12685,12 +12571,8 @@ Target_powerpc::relocate_relocs( { // Second instruction of a global dynamic sequence, // the __tls_get_addr call - tls::Tls_optimization tls_type = tls::TLSOPT_NONE; - if (!object->no_tls_marker()) - { - bool final = gsym == NULL || gsym->final_value_is_known(); - tls_type = this->optimize_tls_gd(final); - } + bool final = gsym == NULL || gsym->final_value_is_known(); + tls::Tls_optimization tls_type = this->optimize_tls_gd(final); switch (tls_type) { case tls::TLSOPT_TO_IE: @@ -12711,9 +12593,7 @@ Target_powerpc::relocate_relocs( { // Second instruction of a local dynamic sequence, // the __tls_get_addr call - tls::Tls_optimization tls_type = tls::TLSOPT_NONE; - if (!object->no_tls_marker()) - tls_type = this->optimize_tls_ld(); + tls::Tls_optimization tls_type = this->optimize_tls_ld(); if (tls_type == tls::TLSOPT_TO_LE) { const Output_section* os = relinfo->layout->tls_segment() -- 2.30.2