2015-04-13 09:56:26 +03:00
|
|
|
#include <stddef.h>
|
|
|
|
#include "dynlink.h"
|
2018-09-05 19:43:34 +03:00
|
|
|
#include "libc.h"
|
2015-04-13 09:56:26 +03:00
|
|
|
|
|
|
|
#ifndef START
|
|
|
|
#define START "_dlstart"
|
|
|
|
#endif
|
|
|
|
|
2016-02-18 07:13:05 +03:00
|
|
|
#define SHARED
|
|
|
|
|
2015-04-13 09:56:26 +03:00
|
|
|
#include "crt_arch.h"
|
|
|
|
|
2015-09-17 11:05:34 +03:00
|
|
|
#ifndef GETFUNCSYM
|
|
|
|
#define GETFUNCSYM(fp, sym, got) do { \
|
2018-09-05 19:43:34 +03:00
|
|
|
hidden void sym(); \
|
2015-09-17 11:05:34 +03:00
|
|
|
static void (*static_func_ptr)() = sym; \
|
|
|
|
__asm__ __volatile__ ( "" : "+m"(static_func_ptr) : : "memory"); \
|
|
|
|
*(fp) = static_func_ptr; } while(0)
|
|
|
|
#endif
|
|
|
|
|
2018-09-05 19:43:34 +03:00
|
|
|
hidden void _dlstart_c(size_t *sp, size_t *dynv)
|
2015-04-13 09:56:26 +03:00
|
|
|
{
|
|
|
|
size_t i, aux[AUX_CNT], dyn[DYN_CNT];
|
2015-09-21 23:42:44 +03:00
|
|
|
size_t *rel, rel_size, base;
|
2015-04-13 09:56:26 +03:00
|
|
|
|
|
|
|
int argc = *sp;
|
|
|
|
char **argv = (void *)(sp+1);
|
|
|
|
|
|
|
|
for (i=argc+1; argv[i]; i++);
|
|
|
|
size_t *auxv = (void *)(argv+i+1);
|
|
|
|
|
|
|
|
for (i=0; i<AUX_CNT; i++) aux[i] = 0;
|
|
|
|
for (i=0; auxv[i]; i+=2) if (auxv[i]<AUX_CNT)
|
|
|
|
aux[auxv[i]] = auxv[i+1];
|
|
|
|
|
2015-09-22 06:54:42 +03:00
|
|
|
#if DL_FDPIC
|
|
|
|
struct fdpic_loadseg *segs, fakeseg;
|
|
|
|
size_t j;
|
|
|
|
if (dynv) {
|
|
|
|
/* crt_arch.h entry point asm is responsible for reserving
|
|
|
|
* space and moving the extra fdpic arguments to the stack
|
|
|
|
* vector where they are easily accessible from C. */
|
|
|
|
segs = ((struct fdpic_loadmap *)(sp[-1] ? sp[-1] : sp[-2]))->segs;
|
|
|
|
} else {
|
|
|
|
/* If dynv is null, the entry point was started from loader
|
|
|
|
* that is not fdpic-aware. We can assume normal fixed-
|
|
|
|
* displacement ELF loading was performed, but when ldso was
|
|
|
|
* run as a command, finding the Ehdr is a heursitic: we
|
|
|
|
* have to assume Phdrs start in the first 4k of the file. */
|
|
|
|
base = aux[AT_BASE];
|
|
|
|
if (!base) base = aux[AT_PHDR] & -4096;
|
|
|
|
segs = &fakeseg;
|
|
|
|
segs[0].addr = base;
|
|
|
|
segs[0].p_vaddr = 0;
|
|
|
|
segs[0].p_memsz = -1;
|
|
|
|
Ehdr *eh = (void *)base;
|
|
|
|
Phdr *ph = (void *)(base + eh->e_phoff);
|
|
|
|
size_t phnum = eh->e_phnum;
|
|
|
|
size_t phent = eh->e_phentsize;
|
|
|
|
while (phnum-- && ph->p_type != PT_DYNAMIC)
|
|
|
|
ph = (void *)((size_t)ph + phent);
|
|
|
|
dynv = (void *)(base + ph->p_vaddr);
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2015-04-13 09:56:26 +03:00
|
|
|
for (i=0; i<DYN_CNT; i++) dyn[i] = 0;
|
|
|
|
for (i=0; dynv[i]; i+=2) if (dynv[i]<DYN_CNT)
|
|
|
|
dyn[dynv[i]] = dynv[i+1];
|
|
|
|
|
2015-09-22 06:54:42 +03:00
|
|
|
#if DL_FDPIC
|
|
|
|
for (i=0; i<DYN_CNT; i++) {
|
|
|
|
if (i==DT_RELASZ || i==DT_RELSZ) continue;
|
|
|
|
if (!dyn[i]) continue;
|
|
|
|
for (j=0; dyn[i]-segs[j].p_vaddr >= segs[j].p_memsz; j++);
|
|
|
|
dyn[i] += segs[j].addr - segs[j].p_vaddr;
|
|
|
|
}
|
|
|
|
base = 0;
|
|
|
|
|
|
|
|
const Sym *syms = (void *)dyn[DT_SYMTAB];
|
|
|
|
|
|
|
|
rel = (void *)dyn[DT_RELA];
|
|
|
|
rel_size = dyn[DT_RELASZ];
|
|
|
|
for (; rel_size; rel+=3, rel_size-=3*sizeof(size_t)) {
|
|
|
|
if (!IS_RELATIVE(rel[1], syms)) continue;
|
|
|
|
for (j=0; rel[0]-segs[j].p_vaddr >= segs[j].p_memsz; j++);
|
|
|
|
size_t *rel_addr = (void *)
|
|
|
|
(rel[0] + segs[j].addr - segs[j].p_vaddr);
|
|
|
|
if (R_TYPE(rel[1]) == REL_FUNCDESC_VAL) {
|
|
|
|
*rel_addr += segs[rel_addr[1]].addr
|
|
|
|
- segs[rel_addr[1]].p_vaddr
|
|
|
|
+ syms[R_SYM(rel[1])].st_value;
|
|
|
|
rel_addr[1] = dyn[DT_PLTGOT];
|
|
|
|
} else {
|
|
|
|
size_t val = syms[R_SYM(rel[1])].st_value;
|
|
|
|
for (j=0; val-segs[j].p_vaddr >= segs[j].p_memsz; j++);
|
|
|
|
*rel_addr = rel[2] + segs[j].addr - segs[j].p_vaddr + val;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
#else
|
2015-04-13 09:56:26 +03:00
|
|
|
/* If the dynamic linker is invoked as a command, its load
|
|
|
|
* address is not available in the aux vector. Instead, compute
|
|
|
|
* the load address as the difference between &_DYNAMIC and the
|
|
|
|
* virtual address in the PT_DYNAMIC program header. */
|
2015-09-21 23:42:44 +03:00
|
|
|
base = aux[AT_BASE];
|
2015-04-13 09:56:26 +03:00
|
|
|
if (!base) {
|
|
|
|
size_t phnum = aux[AT_PHNUM];
|
|
|
|
size_t phentsize = aux[AT_PHENT];
|
|
|
|
Phdr *ph = (void *)aux[AT_PHDR];
|
|
|
|
for (i=phnum; i--; ph = (void *)((char *)ph + phentsize)) {
|
|
|
|
if (ph->p_type == PT_DYNAMIC) {
|
2015-09-21 23:42:44 +03:00
|
|
|
base = (size_t)dynv - ph->p_vaddr;
|
2015-04-13 09:56:26 +03:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* MIPS uses an ugly packed form for GOT relocations. Since we
|
|
|
|
* can't make function calls yet and the code is tiny anyway,
|
|
|
|
* it's simply inlined here. */
|
|
|
|
if (NEED_MIPS_GOT_RELOCS) {
|
|
|
|
size_t local_cnt = 0;
|
|
|
|
size_t *got = (void *)(base + dyn[DT_PLTGOT]);
|
|
|
|
for (i=0; dynv[i]; i+=2) if (dynv[i]==DT_MIPS_LOCAL_GOTNO)
|
|
|
|
local_cnt = dynv[i+1];
|
2015-09-21 23:42:44 +03:00
|
|
|
for (i=0; i<local_cnt; i++) got[i] += base;
|
2015-04-13 09:56:26 +03:00
|
|
|
}
|
|
|
|
|
2015-05-25 07:32:37 +03:00
|
|
|
rel = (void *)(base+dyn[DT_REL]);
|
|
|
|
rel_size = dyn[DT_RELSZ];
|
|
|
|
for (; rel_size; rel+=2, rel_size-=2*sizeof(size_t)) {
|
2015-09-22 06:54:42 +03:00
|
|
|
if (!IS_RELATIVE(rel[1], 0)) continue;
|
2015-05-25 07:32:37 +03:00
|
|
|
size_t *rel_addr = (void *)(base + rel[0]);
|
2015-09-21 23:42:44 +03:00
|
|
|
*rel_addr += base;
|
2015-05-25 07:32:37 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
rel = (void *)(base+dyn[DT_RELA]);
|
|
|
|
rel_size = dyn[DT_RELASZ];
|
|
|
|
for (; rel_size; rel+=3, rel_size-=3*sizeof(size_t)) {
|
2015-09-22 06:54:42 +03:00
|
|
|
if (!IS_RELATIVE(rel[1], 0)) continue;
|
2015-05-25 07:32:37 +03:00
|
|
|
size_t *rel_addr = (void *)(base + rel[0]);
|
2015-09-21 23:42:44 +03:00
|
|
|
*rel_addr = base + rel[2];
|
2015-04-13 09:56:26 +03:00
|
|
|
}
|
2022-09-12 15:30:36 +03:00
|
|
|
|
|
|
|
rel = (void *)(base+dyn[DT_RELR]);
|
|
|
|
rel_size = dyn[DT_RELRSZ];
|
|
|
|
size_t *relr_addr = 0;
|
|
|
|
for (; rel_size; rel++, rel_size-=sizeof(size_t)) {
|
|
|
|
if ((rel[0]&1) == 0) {
|
|
|
|
relr_addr = (void *)(base + rel[0]);
|
|
|
|
*relr_addr++ += base;
|
|
|
|
} else {
|
|
|
|
for (size_t i=0, bitmap=rel[0]; bitmap>>=1; i++)
|
|
|
|
if (bitmap&1)
|
|
|
|
relr_addr[i] += base;
|
|
|
|
relr_addr += 8*sizeof(size_t)-1;
|
|
|
|
}
|
|
|
|
}
|
2015-09-22 06:54:42 +03:00
|
|
|
#endif
|
2015-04-13 09:56:26 +03:00
|
|
|
|
introduce new symbol-lookup-free rcrt1/dlstart stage chaining
previously, the call into stage 2 was made by looking up the symbol
name "__dls2" (which was chosen short to be easy to look up) from the
dynamic symbol table. this was no problem for the dynamic linker,
since it always exports all its symbols. in the case of the static pie
entry point, however, the dynamic symbol table does not contain the
necessary symbol unless -rdynamic/-E was used when linking. this
linking requirement is a major obstacle both to practical use of
static-pie as a nommu binary format (since it greatly enlarges the
file) and to upstream toolchain support for static-pie (adding -E to
default linking specs is not reasonable).
this patch replaces the runtime symbolic lookup with a link-time
lookup via an inline asm fragment, which reloc.h is responsible for
providing. in this initial commit, the asm is provided only for i386,
and the old lookup code is left in place as a fallback for archs that
have not yet transitioned.
modifying crt_arch.h to pass the stage-2 function pointer as an
argument was considered as an alternative, but such an approach would
not be compatible with fdpic, where it's impossible to compute
function pointers without already having performed relocations. it was
also deemed desirable to keep crt_arch.h as simple/minimal as
possible.
in principle, archs with pc-relative or got-relative addressing of
static variables could instead load the stage-2 function pointer from
a static volatile object. that does not work for fdpic, and is not
safe against reordering on mips-like archs that use got slots even for
static functions, but it's a valid on i386 and many others, and could
provide a reasonable default implementation in the future.
2015-09-17 09:30:55 +03:00
|
|
|
stage2_func dls2;
|
|
|
|
GETFUNCSYM(&dls2, __dls2, base+dyn[DT_PLTGOT]);
|
2015-09-21 23:42:44 +03:00
|
|
|
dls2((void *)base, sp);
|
2015-04-13 09:56:26 +03:00
|
|
|
}
|