Hi Marcus,

applied and pushed, after intensive testing with Qemu and
uClibc-ng-test.

 thanks
  Waldemar

Marcus Hähnel wrote,

> ... and here is the attachment ...
> 
> 
> 
> 
> On Thu, 2025-03-20 at 09:39 +0100, Marcus Hähnel wrote:
> > Dear List
> > 
> > So far, uclibc relied on the informal behaviour of GNU ld to put the link 
> > address of the _DYNAMIC symbol in the first GOT
> > entry. This does not work with LLVM lld which does not follow this 
> > convention. Consequently, glibc has abandoned its usage
> > in favour of using __ehdr_start as magic symbol to infer the load address 
> > [1]. 
> > 
> > Note that this implies that the link time address of __ehdr_start is 
> > *always* 0! So far, this seems to be the case on all
> > platforms.
> > 
> > We implemented this change only for the platforms which we actively support 
> > and test at Kernkonzept (arm64, arm, i386,
> > x86_64 and riscv). The riscv64 dl-sysdep.h already used the method we 
> > converted the others to. For the other platforms
> > we do not have the capacity to port this, but as long as no one wants to 
> > build them using lld this should not be an issue.
> > 
> > Please feel free to test this on the relevant platforms before merging, to 
> > be sure it works as intended with the upstream
> > version of the lib. 
> > 
> > Best regards,
> > 
> > - Marcus
> > 
> > 
> > [1] https://sourceware.org/bugzilla/show_bug.cgi?id=28203
> > 
> > 
> > 
> > 
> 
> -- 
> +++++++++++++++++++
> 
> 
> Register now for our workshop "Get to know L4Re in 3 days" on April 8-10. 
> Learn to design and deploy secure system
> architectures for your product with L4Re: 
> https://www.kernkonzept.com/workshop-getting-started-with-l4re/
> 
> +++++++++++++++++++
> 
> Kernkonzept GmbH
> Sitz: Dresden
> HRB 31129
> Geschäftsführer: Dr.-Ing. Michael Hohmuth
> 
> 

> From 9a4929ce522d34bed13c24e88c58ae48f1c538c5 Mon Sep 17 00:00:00 2001
> From: =?UTF-8?q?Jan=20Kl=C3=B6tzke?= <jan.kloet...@kernkonzept.com>
> Date: Tue, 18 Mar 2025 07:41:47 +0100
> Subject: [PATCH] Use __ehdr_start to compute load address
> 
> So far, uclibc relied on the informal behaviour of GNU ld to put the
> link address of the _DYNAMIC symbol in the first GOT entry. This does
> not work with LLVM lld which does not follow this convention.
> Consequently, glibc has abandoned its usage in favour of using
> __ehdr_start as magic symbol to infer the load address [1].
> 
> Note that this implies that the link time address of __ehdr_start is
> *always* 0! So far, this seems to be the case on all platforms.
> 
> [1] https://sourceware.org/bugzilla/show_bug.cgi?id=28203
> 
> Signed-off-by: Marcus Haehnel <marcus.haeh...@kernkonzept.com>
> ---
>  ldso/ldso/aarch64/dl-sysdep.h | 25 +++++--------
>  ldso/ldso/arm/dl-sysdep.h     | 69 +++++------------------------------
>  ldso/ldso/i386/dl-sysdep.h    | 27 +++++---------
>  ldso/ldso/riscv32/dl-sysdep.h | 22 +++++------
>  ldso/ldso/x86_64/dl-sysdep.h  | 45 +++++------------------
>  5 files changed, 48 insertions(+), 140 deletions(-)
> 
> diff --git a/ldso/ldso/aarch64/dl-sysdep.h b/ldso/ldso/aarch64/dl-sysdep.h
> index 6d9d2c1fb..3466920d9 100644
> --- a/ldso/ldso/aarch64/dl-sysdep.h
> +++ b/ldso/ldso/aarch64/dl-sysdep.h
> @@ -54,28 +54,21 @@ unsigned long _dl_linux_resolver(struct elf_resolve * 
> tpnt, int reloc_entry);
>       || (type) == R_AARCH64_TLSDESC) * ELF_RTYPE_CLASS_PLT)          \
>     | (((type) == R_AARCH64_COPY) * ELF_RTYPE_CLASS_COPY))
>  
> -/* Return the link-time address of _DYNAMIC.  Conveniently, this is the
> -   first element of the GOT. */
> -extern const ElfW(Addr) _GLOBAL_OFFSET_TABLE_[] attribute_hidden;
> -static __always_inline ElfW(Addr) __attribute__ ((unused))
> -elf_machine_dynamic (void)
> -{
> -  return _GLOBAL_OFFSET_TABLE_[0];
> -}
> -
>  /* Return the run-time load address of the shared object.  */
>  
>  static __always_inline ElfW(Addr) __attribute__ ((unused))
>  elf_machine_load_address (void)
>  {
> -  /* To figure out the load address we use the definition that for any 
> symbol:
> -     dynamic_addr(symbol) = static_addr(symbol) + load_addr
> -
> -    _DYNAMIC sysmbol is used here as its link-time address stored in
> -    the special unrelocated first GOT entry.  */
> +  extern const ElfW(Ehdr) __ehdr_start attribute_hidden;
> +  return (ElfW(Addr)) &__ehdr_start;
> +}
>  
> -    extern ElfW(Dyn) _DYNAMIC[] attribute_hidden;
> -    return (ElfW(Addr)) &_DYNAMIC - elf_machine_dynamic ();
> +/* Return the link-time address of _DYNAMIC. */
> +static __always_inline ElfW(Addr) __attribute__ ((unused))
> +elf_machine_dynamic (void)
> +{
> +  extern ElfW(Dyn) _DYNAMIC[] attribute_hidden;
> +  return (ElfW(Addr)) _DYNAMIC - elf_machine_load_address ();
>  }
>  
>  static __always_inline void
> diff --git a/ldso/ldso/arm/dl-sysdep.h b/ldso/ldso/arm/dl-sysdep.h
> index 0f783e1c4..93e36b694 100644
> --- a/ldso/ldso/arm/dl-sysdep.h
> +++ b/ldso/ldso/arm/dl-sysdep.h
> @@ -96,43 +96,6 @@ unsigned long _dl_linux_resolver(struct elf_resolve * 
> tpnt, int reloc_entry);
>     | (((type) == R_ARM_COPY) * ELF_RTYPE_CLASS_COPY))
>  #endif /* __FDPIC__ */
>  
> -/* Return the link-time address of _DYNAMIC.  Conveniently, this is the
> -   first element of the GOT.  We used to use the PIC register to do this
> -   without a constant pool reference, but GCC 4.2 will use a pseudo-register
> -   for the PIC base, so it may not be in r10.  */
> -static __always_inline Elf32_Addr __attribute__ ((unused))
> -elf_machine_dynamic (void)
> -{
> -  Elf32_Addr dynamic;
> -#if !defined __thumb__
> -  __asm__ ("ldr %0, 2f\n"
> -       "1: ldr %0, [pc, %0]\n"
> -       "b 3f\n"
> -       "2: .word _GLOBAL_OFFSET_TABLE_ - (1b+8)\n"
> -       "3:" : "=r" (dynamic));
> -#else
> -  int tmp;
> -  __asm__ (".align 2\n"
> -       "bx     pc\n"
> -       "nop\n"
> -       ".arm\n"
> -       "ldr %0, 2f\n"
> -       "1: ldr %0, [pc, %0]\n"
> -       "b 3f\n"
> -       "2: .word _GLOBAL_OFFSET_TABLE_ - (1b+8)\n"
> -       "3:"
> -       ".align  2\n"
> -        "orr     %1, pc, #1\n"
> -        "bx      %1\n"
> -        ".force_thumb\n"
> -       : "=r" (dynamic), "=&r" (tmp));
> -#endif
> -
> -  return dynamic;
> -}
> -
> -extern char __dl_start[] __asm__("_dl_start");
> -
>  #ifdef __FDPIC__
>  /* We must force strings used early in the bootstrap into the data
>     segment.  */
> @@ -148,28 +111,16 @@ extern char __dl_start[] __asm__("_dl_start");
>  static __always_inline Elf32_Addr __attribute__ ((unused))
>  elf_machine_load_address (void)
>  {
> -#if defined(__FDPIC__)
> -     return 0;
> -#else
> -     Elf32_Addr got_addr = (Elf32_Addr) &__dl_start;
> -     Elf32_Addr pcrel_addr;
> -#if defined __OPTIMIZE__ && !defined __thumb__
> -     __asm__ ("adr %0, _dl_start" : "=r" (pcrel_addr));
> -#else
> -     /* A simple adr does not work in Thumb mode because the offset is
> -        negative, and for debug builds may be too large.  */
> -     int tmp;
> -     __asm__ ("adr %1, 1f\n\t"
> -              "ldr %0, [%1]\n\t"
> -              "add %0, %0, %1\n\t"
> -              "b 2f\n\t"
> -              ".align 2\n\t"
> -              "1: .word _dl_start - 1b\n\t"
> -              "2:"
> -              : "=r" (pcrel_addr), "=r" (tmp));
> -#endif
> -     return pcrel_addr - got_addr;
> -#endif
> +  extern const Elf32_Ehdr __ehdr_start attribute_hidden;
> +  return (Elf32_Addr) &__ehdr_start;
> +}
> +
> +/* Return the link-time address of _DYNAMIC. */
> +static __always_inline Elf32_Addr __attribute__ ((unused))
> +elf_machine_dynamic (void)
> +{
> +  extern Elf32_Dyn _DYNAMIC[] attribute_hidden;
> +  return (Elf32_Addr) _DYNAMIC - elf_machine_load_address ();
>  }
>  
>  static __always_inline void
> diff --git a/ldso/ldso/i386/dl-sysdep.h b/ldso/ldso/i386/dl-sysdep.h
> index b95328df4..8fc80a145 100644
> --- a/ldso/ldso/i386/dl-sysdep.h
> +++ b/ldso/ldso/i386/dl-sysdep.h
> @@ -35,28 +35,21 @@ extern unsigned long _dl_linux_resolver(struct 
> elf_resolve * tpnt, int reloc_ent
>       || (type) == R_386_TLS_TPOFF) * ELF_RTYPE_CLASS_PLT)                    
>           \
>     | (((type) == R_386_COPY) * ELF_RTYPE_CLASS_COPY))
>  
> -/* Return the link-time address of _DYNAMIC.  Conveniently, this is the
> -   first element of the GOT, a special entry that is never relocated.  */
> -extern const Elf32_Addr _GLOBAL_OFFSET_TABLE_[] attribute_hidden;
> -static __always_inline Elf32_Addr __attribute__ ((unused, const))
> -elf_machine_dynamic (void)
> -{
> -     /* This produces a GOTOFF reloc that resolves to zero at link time, so 
> in
> -        fact just loads from the GOT register directly.  By doing it without
> -        an asm we can let the compiler choose any register.  */
> -     return _GLOBAL_OFFSET_TABLE_[0];
> -}
> -
>  
> -extern Elf32_Dyn bygotoff[] __asm__ ("_DYNAMIC") attribute_hidden;
>  /* Return the run-time load address of the shared object.  */
>  static __always_inline Elf32_Addr attribute_unused
>  elf_machine_load_address (void)
>  {
> -     /* Compute the difference between the runtime address of _DYNAMIC as 
> seen
> -        by a GOTOFF reference, and the link-time address found in the special
> -        unrelocated first GOT entry.  */
> -     return (Elf32_Addr) &bygotoff - elf_machine_dynamic ();
> +     extern const Elf32_Ehdr __ehdr_start attribute_hidden;
> +     return (Elf32_Addr) &__ehdr_start;
> +}
> +
> +/* Return the link-time address of _DYNAMIC. */
> +static __always_inline Elf32_Addr __attribute__ ((unused, const))
> +elf_machine_dynamic (void)
> +{
> +     extern Elf32_Dyn _DYNAMIC[] attribute_hidden;
> +     return (Elf32_Addr) _DYNAMIC - elf_machine_load_address ();
>  }
>  
>  static __always_inline void
> diff --git a/ldso/ldso/riscv32/dl-sysdep.h b/ldso/ldso/riscv32/dl-sysdep.h
> index e0a59fddd..02296b148 100644
> --- a/ldso/ldso/riscv32/dl-sysdep.h
> +++ b/ldso/ldso/riscv32/dl-sysdep.h
> @@ -59,22 +59,20 @@ unsigned long _dl_linux_resolver(struct elf_resolve * 
> tpnt, int reloc_entry);
>     | (ELF_RTYPE_CLASS_COPY * ((type) == R_RISCV_COPY)))
>  
>  
> -/* Return the link-time address of _DYNAMIC.  */
> -static inline ElfW(Addr)
> -elf_machine_dynamic (void)
> -{
> -  extern ElfW(Addr) _GLOBAL_OFFSET_TABLE_ __attribute__ ((visibility 
> ("hidden")));
> -  return _GLOBAL_OFFSET_TABLE_;
> -}
> -
> -
>  /* Return the run-time load address of the shared object.  */
>  static __always_inline ElfW(Addr) __attribute__ ((unused))
>  elf_machine_load_address (void)
>  {
> -  ElfW(Addr) load_addr;
> -  __asm__ ("lla %0, _DYNAMIC" : "=r" (load_addr));
> -  return load_addr - elf_machine_dynamic ();
> +  extern const ElfW(Ehdr) __ehdr_start attribute_hidden;
> +  return (ElfW(Addr)) &__ehdr_start;
> +}
> +
> +/* Return the link-time address of _DYNAMIC.  */
> +static inline ElfW(Addr)
> +elf_machine_dynamic (void)
> +{
> +  extern ElfW(Dyn) _DYNAMIC[] attribute_hidden;
> +  return (ElfW(Addr)) _DYNAMIC - elf_machine_load_address ();
>  }
>  
>  static __always_inline void
> diff --git a/ldso/ldso/x86_64/dl-sysdep.h b/ldso/ldso/x86_64/dl-sysdep.h
> index ccf9a8851..58447a951 100644
> --- a/ldso/ldso/x86_64/dl-sysdep.h
> +++ b/ldso/ldso/x86_64/dl-sysdep.h
> @@ -52,48 +52,21 @@ extern unsigned long _dl_linux_resolver(struct 
> elf_resolve * tpnt, int reloc_ent
>      * ELF_RTYPE_CLASS_PLT)                                                 \
>     | (((type) == R_X86_64_COPY) * ELF_RTYPE_CLASS_COPY))
>  
> -/* Return the link-time address of _DYNAMIC.  Conveniently, this is the
> -   first element of the GOT.  This must be inlined in a function which
> -   uses global data.  */
> -static __always_inline Elf64_Addr __attribute__ ((unused))
> -elf_machine_dynamic (void)
> -{
> -  Elf64_Addr addr;
> -
> -  /* This works because we have our GOT address available in the small PIC
> -     model.  */
> -  addr = (Elf64_Addr) &_DYNAMIC;
> -
> -  return addr;
> -}
> -
>  
>  /* Return the run-time load address of the shared object.  */
>  static __always_inline Elf64_Addr __attribute__ ((unused))
>  elf_machine_load_address (void)
>  {
> -  register Elf64_Addr addr, tmp;
> -
> -  /* The easy way is just the same as on x86:
> -       leaq _dl_start, %0
> -       leaq _dl_start(%%rip), %1
> -       subq %0, %1
> -     but this does not work with binutils since we then have
> -     a R_X86_64_32S relocation in a shared lib.
> -
> -     Instead we store the address of _dl_start in the data section
> -     and compare it with the current value that we can get via
> -     an RIP relative addressing mode.  */
> -
> -  __asm__ ("movq 1f(%%rip), %1\n"
> -       "0:\tleaq _dl_start(%%rip), %0\n\t"
> -       "subq %1, %0\n\t"
> -       ".section\t.data\n"
> -       "1:\t.quad _dl_start\n\t"
> -       ".previous\n\t"
> -       : "=r" (addr), "=r" (tmp) : : "cc");
> +  extern const Elf64_Ehdr __ehdr_start attribute_hidden;
> +  return (Elf64_Addr) &__ehdr_start;
> +}
>  
> -  return addr;
> +/* Return the link-time address of _DYNAMIC. */
> +static __always_inline Elf64_Addr __attribute__ ((unused))
> +elf_machine_dynamic (void)
> +{
> +  extern Elf64_Dyn _DYNAMIC[] attribute_hidden;
> +  return (Elf64_Addr) _DYNAMIC - elf_machine_load_address ();
>  }
>  
>  static __always_inline void
> -- 
> 2.47.1
> 




> _______________________________________________
> devel mailing list -- devel@uclibc-ng.org
> To unsubscribe send an email to devel-le...@uclibc-ng.org

_______________________________________________
devel mailing list -- devel@uclibc-ng.org
To unsubscribe send an email to devel-le...@uclibc-ng.org

Reply via email to