mirror of
https://github.com/frida/tinycc
synced 2024-11-30 19:43:07 +03:00
3426 lines
110 KiB
C
3426 lines
110 KiB
C
/*
|
|
* ELF file handling for TCC
|
|
*
|
|
* Copyright (c) 2001-2004 Fabrice Bellard
|
|
*
|
|
* This library is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2 of the License, or (at your option) any later version.
|
|
*
|
|
* This library is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with this library; if not, write to the Free Software
|
|
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
*/
|
|
|
|
#include "tcc.h"
|
|
|
|
/* Define this to get some debug output during relocation processing. */
|
|
#undef DEBUG_RELOC
|
|
|
|
/********************************************************/
|
|
/* global variables */
|
|
|
|
ST_DATA Section *text_section, *data_section, *bss_section; /* predefined sections */
|
|
ST_DATA Section *common_section;
|
|
ST_DATA Section *cur_text_section; /* current section where function code is generated */
|
|
#ifdef CONFIG_TCC_ASM
|
|
ST_DATA Section *last_text_section; /* to handle .previous asm directive */
|
|
#endif
|
|
#ifdef CONFIG_TCC_BCHECK
|
|
/* bound check related sections */
|
|
ST_DATA Section *bounds_section; /* contains global data bound description */
|
|
ST_DATA Section *lbounds_section; /* contains local data bound description */
|
|
#endif
|
|
/* symbol sections */
|
|
ST_DATA Section *symtab_section;
|
|
/* debug sections */
|
|
ST_DATA Section *stab_section, *stabstr_section;
|
|
|
|
/* elf version information */
|
|
struct sym_version {
|
|
char *lib;
|
|
char *version;
|
|
int out_index;
|
|
int prev_same_lib;
|
|
};
|
|
static int nb_sym_versions;
|
|
static struct sym_version *sym_versions;
|
|
static int nb_sym_to_version;
|
|
static int *sym_to_version;
|
|
static int dt_verneednum;
|
|
static Section *versym_section;
|
|
static Section *verneed_section;
|
|
|
|
/* XXX: avoid static variable */
|
|
static int new_undef_sym = 0; /* Is there a new undefined sym since last new_undef_sym() */
|
|
|
|
/* special flag to indicate that the section should not be linked to the other ones */
|
|
#define SHF_PRIVATE 0x80000000
|
|
/* section is dynsymtab_section */
|
|
#define SHF_DYNSYM 0x40000000
|
|
|
|
/* ------------------------------------------------------------------------- */
|
|
|
|
ST_FUNC void tccelf_new(TCCState *s)
|
|
{
|
|
/* no section zero */
|
|
dynarray_add(&s->sections, &s->nb_sections, NULL);
|
|
|
|
/* create standard sections */
|
|
text_section = new_section(s, ".text", SHT_PROGBITS, SHF_ALLOC | SHF_EXECINSTR);
|
|
data_section = new_section(s, ".data", SHT_PROGBITS, SHF_ALLOC | SHF_WRITE);
|
|
bss_section = new_section(s, ".bss", SHT_NOBITS, SHF_ALLOC | SHF_WRITE);
|
|
versym_section = new_section(s, ".gnu.version", SHT_GNU_versym, SHF_ALLOC);
|
|
versym_section->sh_entsize = sizeof(ElfW(Half));
|
|
verneed_section = new_section(s, ".gnu.version_r", SHT_GNU_verneed, SHF_ALLOC);
|
|
common_section = new_section(s, ".common", SHT_NOBITS, SHF_PRIVATE);
|
|
common_section->sh_num = SHN_COMMON;
|
|
|
|
/* symbols are always generated for linking stage */
|
|
symtab_section = new_symtab(s, ".symtab", SHT_SYMTAB, 0,
|
|
".strtab",
|
|
".hashtab", SHF_PRIVATE);
|
|
s->symtab = symtab_section;
|
|
|
|
/* private symbol table for dynamic symbols */
|
|
s->dynsymtab_section = new_symtab(s, ".dynsymtab", SHT_SYMTAB, SHF_PRIVATE|SHF_DYNSYM,
|
|
".dynstrtab",
|
|
".dynhashtab", SHF_PRIVATE);
|
|
get_sym_attr(s, 0, 1);
|
|
}
|
|
|
|
#ifdef CONFIG_TCC_BCHECK
|
|
ST_FUNC void tccelf_bounds_new(TCCState *s)
|
|
{
|
|
/* create bounds sections */
|
|
bounds_section = new_section(s, ".bounds",
|
|
SHT_PROGBITS, SHF_ALLOC);
|
|
lbounds_section = new_section(s, ".lbounds",
|
|
SHT_PROGBITS, SHF_ALLOC);
|
|
}
|
|
#endif
|
|
|
|
ST_FUNC void tccelf_stab_new(TCCState *s)
|
|
{
|
|
stab_section = new_section(s, ".stab", SHT_PROGBITS, 0);
|
|
stab_section->sh_entsize = sizeof(Stab_Sym);
|
|
stabstr_section = new_section(s, ".stabstr", SHT_STRTAB, 0);
|
|
put_elf_str(stabstr_section, "");
|
|
stab_section->link = stabstr_section;
|
|
/* put first entry */
|
|
put_stabs("", 0, 0, 0, 0);
|
|
}
|
|
|
|
static void free_section(Section *s)
|
|
{
|
|
tcc_free(s->data);
|
|
}
|
|
|
|
ST_FUNC void tccelf_delete(TCCState *s1)
|
|
{
|
|
int i;
|
|
|
|
/* free symbol versions */
|
|
for (i = 0; i < nb_sym_versions; i++) {
|
|
tcc_free(sym_versions[i].version);
|
|
tcc_free(sym_versions[i].lib);
|
|
}
|
|
tcc_free(sym_versions);
|
|
sym_versions = NULL;
|
|
nb_sym_versions = 0;
|
|
tcc_free(sym_to_version);
|
|
sym_to_version = NULL;
|
|
nb_sym_to_version = 0;
|
|
|
|
/* free all sections */
|
|
for(i = 1; i < s1->nb_sections; i++)
|
|
free_section(s1->sections[i]);
|
|
dynarray_reset(&s1->sections, &s1->nb_sections);
|
|
|
|
for(i = 0; i < s1->nb_priv_sections; i++)
|
|
free_section(s1->priv_sections[i]);
|
|
dynarray_reset(&s1->priv_sections, &s1->nb_priv_sections);
|
|
|
|
/* free any loaded DLLs */
|
|
#ifdef TCC_IS_NATIVE
|
|
for ( i = 0; i < s1->nb_loaded_dlls; i++) {
|
|
DLLReference *ref = s1->loaded_dlls[i];
|
|
if ( ref->handle )
|
|
# ifdef _WIN32
|
|
FreeLibrary((HMODULE)ref->handle);
|
|
# else
|
|
dlclose(ref->handle);
|
|
# endif
|
|
}
|
|
#endif
|
|
/* free loaded dlls array */
|
|
dynarray_reset(&s1->loaded_dlls, &s1->nb_loaded_dlls);
|
|
tcc_free(s1->sym_attrs);
|
|
|
|
symtab_section = NULL; /* for tccrun.c:rt_printline() */
|
|
}
|
|
|
|
/* save section data state */
|
|
ST_FUNC void tccelf_begin_file(TCCState *s1)
|
|
{
|
|
Section *s; int i;
|
|
for (i = 1; i < s1->nb_sections; i++) {
|
|
s = s1->sections[i];
|
|
s->sh_offset = s->data_offset;
|
|
}
|
|
/* disable symbol hashing during compilation */
|
|
s = s1->symtab, s->reloc = s->hash, s->hash = NULL;
|
|
#if defined TCC_TARGET_X86_64 && defined TCC_TARGET_PE
|
|
s1->uw_sym = 0;
|
|
#endif
|
|
}
|
|
|
|
/* At the end of compilation, convert any UNDEF syms to global, and merge
|
|
with previously existing symbols */
|
|
ST_FUNC void tccelf_end_file(TCCState *s1)
|
|
{
|
|
Section *s = s1->symtab;
|
|
int first_sym, nb_syms, *tr, i;
|
|
|
|
first_sym = s->sh_offset / sizeof (ElfSym);
|
|
nb_syms = s->data_offset / sizeof (ElfSym) - first_sym;
|
|
s->data_offset = s->sh_offset;
|
|
s->link->data_offset = s->link->sh_offset;
|
|
s->hash = s->reloc, s->reloc = NULL;
|
|
tr = tcc_mallocz(nb_syms * sizeof *tr);
|
|
|
|
for (i = 0; i < nb_syms; ++i) {
|
|
ElfSym *sym = (ElfSym*)s->data + first_sym + i;
|
|
if (sym->st_shndx == SHN_UNDEF
|
|
&& ELFW(ST_BIND)(sym->st_info) == STB_LOCAL)
|
|
sym->st_info = ELFW(ST_INFO)(STB_GLOBAL, ELFW(ST_TYPE)(sym->st_info));
|
|
tr[i] = set_elf_sym(s, sym->st_value, sym->st_size, sym->st_info,
|
|
sym->st_other, sym->st_shndx, (char*)s->link->data + sym->st_name);
|
|
}
|
|
/* now update relocations */
|
|
for (i = 1; i < s1->nb_sections; i++) {
|
|
Section *sr = s1->sections[i];
|
|
if (sr->sh_type == SHT_RELX && sr->link == s) {
|
|
ElfW_Rel *rel = (ElfW_Rel*)(sr->data + sr->sh_offset);
|
|
ElfW_Rel *rel_end = (ElfW_Rel*)(sr->data + sr->data_offset);
|
|
for (; rel < rel_end; ++rel) {
|
|
int n = ELFW(R_SYM)(rel->r_info) - first_sym;
|
|
//if (n < 0) tcc_error("internal: invalid symbol index in relocation");
|
|
rel->r_info = ELFW(R_INFO)(tr[n], ELFW(R_TYPE)(rel->r_info));
|
|
}
|
|
}
|
|
}
|
|
tcc_free(tr);
|
|
}
|
|
|
|
ST_FUNC Section *new_section(TCCState *s1, const char *name, int sh_type, int sh_flags)
|
|
{
|
|
Section *sec;
|
|
|
|
sec = tcc_mallocz(sizeof(Section) + strlen(name));
|
|
strcpy(sec->name, name);
|
|
sec->sh_type = sh_type;
|
|
sec->sh_flags = sh_flags;
|
|
switch(sh_type) {
|
|
case SHT_GNU_versym:
|
|
sec->sh_addralign = 2;
|
|
break;
|
|
case SHT_HASH:
|
|
case SHT_REL:
|
|
case SHT_RELA:
|
|
case SHT_DYNSYM:
|
|
case SHT_SYMTAB:
|
|
case SHT_DYNAMIC:
|
|
case SHT_GNU_verneed:
|
|
case SHT_GNU_verdef:
|
|
sec->sh_addralign = PTR_SIZE;
|
|
break;
|
|
case SHT_STRTAB:
|
|
sec->sh_addralign = 1;
|
|
break;
|
|
default:
|
|
sec->sh_addralign = PTR_SIZE; /* gcc/pcc default alignment */
|
|
break;
|
|
}
|
|
|
|
if (sh_flags & SHF_PRIVATE) {
|
|
dynarray_add(&s1->priv_sections, &s1->nb_priv_sections, sec);
|
|
} else {
|
|
sec->sh_num = s1->nb_sections;
|
|
dynarray_add(&s1->sections, &s1->nb_sections, sec);
|
|
}
|
|
|
|
return sec;
|
|
}
|
|
|
|
ST_FUNC Section *new_symtab(TCCState *s1,
|
|
const char *symtab_name, int sh_type, int sh_flags,
|
|
const char *strtab_name,
|
|
const char *hash_name, int hash_sh_flags)
|
|
{
|
|
Section *symtab, *strtab, *hash;
|
|
int *ptr, nb_buckets;
|
|
|
|
symtab = new_section(s1, symtab_name, sh_type, sh_flags);
|
|
symtab->sh_entsize = sizeof(ElfW(Sym));
|
|
strtab = new_section(s1, strtab_name, SHT_STRTAB, sh_flags);
|
|
put_elf_str(strtab, "");
|
|
symtab->link = strtab;
|
|
put_elf_sym(symtab, 0, 0, 0, 0, 0, NULL);
|
|
|
|
nb_buckets = 1;
|
|
|
|
hash = new_section(s1, hash_name, SHT_HASH, hash_sh_flags);
|
|
hash->sh_entsize = sizeof(int);
|
|
symtab->hash = hash;
|
|
hash->link = symtab;
|
|
|
|
ptr = section_ptr_add(hash, (2 + nb_buckets + 1) * sizeof(int));
|
|
ptr[0] = nb_buckets;
|
|
ptr[1] = 1;
|
|
memset(ptr + 2, 0, (nb_buckets + 1) * sizeof(int));
|
|
return symtab;
|
|
}
|
|
|
|
/* realloc section and set its content to zero */
|
|
ST_FUNC void section_realloc(Section *sec, unsigned long new_size)
|
|
{
|
|
unsigned long size;
|
|
unsigned char *data;
|
|
|
|
size = sec->data_allocated;
|
|
if (size == 0)
|
|
size = 1;
|
|
while (size < new_size)
|
|
size = size * 2;
|
|
data = tcc_realloc(sec->data, size);
|
|
memset(data + sec->data_allocated, 0, size - sec->data_allocated);
|
|
sec->data = data;
|
|
sec->data_allocated = size;
|
|
}
|
|
|
|
/* reserve at least 'size' bytes aligned per 'align' in section
|
|
'sec' from current offset, and return the aligned offset */
|
|
ST_FUNC size_t section_add(Section *sec, addr_t size, int align)
|
|
{
|
|
size_t offset, offset1;
|
|
|
|
offset = (sec->data_offset + align - 1) & -align;
|
|
offset1 = offset + size;
|
|
if (sec->sh_type != SHT_NOBITS && offset1 > sec->data_allocated)
|
|
section_realloc(sec, offset1);
|
|
sec->data_offset = offset1;
|
|
if (align > sec->sh_addralign)
|
|
sec->sh_addralign = align;
|
|
return offset;
|
|
}
|
|
|
|
/* reserve at least 'size' bytes in section 'sec' from
|
|
sec->data_offset. */
|
|
ST_FUNC void *section_ptr_add(Section *sec, addr_t size)
|
|
{
|
|
size_t offset = section_add(sec, size, 1);
|
|
return sec->data + offset;
|
|
}
|
|
|
|
/* reserve at least 'size' bytes from section start */
|
|
ST_FUNC void section_reserve(Section *sec, unsigned long size)
|
|
{
|
|
if (size > sec->data_allocated)
|
|
section_realloc(sec, size);
|
|
if (size > sec->data_offset)
|
|
sec->data_offset = size;
|
|
}
|
|
|
|
static Section *find_section_create (TCCState *s1, const char *name, int create)
|
|
{
|
|
Section *sec;
|
|
int i;
|
|
for(i = 1; i < s1->nb_sections; i++) {
|
|
sec = s1->sections[i];
|
|
if (!strcmp(name, sec->name))
|
|
return sec;
|
|
}
|
|
/* sections are created as PROGBITS */
|
|
return create ? new_section(s1, name, SHT_PROGBITS, SHF_ALLOC) : NULL;
|
|
}
|
|
|
|
/* return a reference to a section, and create it if it does not
|
|
exists */
|
|
ST_FUNC Section *find_section(TCCState *s1, const char *name)
|
|
{
|
|
return find_section_create (s1, name, 1);
|
|
}
|
|
|
|
/* ------------------------------------------------------------------------- */
|
|
|
|
ST_FUNC int put_elf_str(Section *s, const char *sym)
|
|
{
|
|
int offset, len;
|
|
char *ptr;
|
|
|
|
len = strlen(sym) + 1;
|
|
offset = s->data_offset;
|
|
ptr = section_ptr_add(s, len);
|
|
memmove(ptr, sym, len);
|
|
return offset;
|
|
}
|
|
|
|
/* elf symbol hashing function */
|
|
static unsigned long elf_hash(const unsigned char *name)
|
|
{
|
|
unsigned long h = 0, g;
|
|
|
|
while (*name) {
|
|
h = (h << 4) + *name++;
|
|
g = h & 0xf0000000;
|
|
if (g)
|
|
h ^= g >> 24;
|
|
h &= ~g;
|
|
}
|
|
return h;
|
|
}
|
|
|
|
/* rebuild hash table of section s */
|
|
/* NOTE: we do factorize the hash table code to go faster */
|
|
static void rebuild_hash(Section *s, unsigned int nb_buckets)
|
|
{
|
|
ElfW(Sym) *sym;
|
|
int *ptr, *hash, nb_syms, sym_index, h;
|
|
unsigned char *strtab;
|
|
|
|
strtab = s->link->data;
|
|
nb_syms = s->data_offset / sizeof(ElfW(Sym));
|
|
|
|
if (!nb_buckets)
|
|
nb_buckets = ((int*)s->hash->data)[0];
|
|
|
|
s->hash->data_offset = 0;
|
|
ptr = section_ptr_add(s->hash, (2 + nb_buckets + nb_syms) * sizeof(int));
|
|
ptr[0] = nb_buckets;
|
|
ptr[1] = nb_syms;
|
|
ptr += 2;
|
|
hash = ptr;
|
|
memset(hash, 0, (nb_buckets + 1) * sizeof(int));
|
|
ptr += nb_buckets + 1;
|
|
|
|
sym = (ElfW(Sym) *)s->data + 1;
|
|
for(sym_index = 1; sym_index < nb_syms; sym_index++) {
|
|
if (ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
|
|
h = elf_hash(strtab + sym->st_name) % nb_buckets;
|
|
*ptr = hash[h];
|
|
hash[h] = sym_index;
|
|
} else {
|
|
*ptr = 0;
|
|
}
|
|
ptr++;
|
|
sym++;
|
|
}
|
|
}
|
|
|
|
/* return the symbol number */
|
|
ST_FUNC int put_elf_sym(Section *s, addr_t value, unsigned long size,
|
|
int info, int other, int shndx, const char *name)
|
|
{
|
|
int name_offset, sym_index;
|
|
int nbuckets, h;
|
|
ElfW(Sym) *sym;
|
|
Section *hs;
|
|
|
|
sym = section_ptr_add(s, sizeof(ElfW(Sym)));
|
|
if (name && name[0])
|
|
name_offset = put_elf_str(s->link, name);
|
|
else
|
|
name_offset = 0;
|
|
/* XXX: endianness */
|
|
sym->st_name = name_offset;
|
|
sym->st_value = value;
|
|
sym->st_size = size;
|
|
sym->st_info = info;
|
|
sym->st_other = other;
|
|
sym->st_shndx = shndx;
|
|
sym_index = sym - (ElfW(Sym) *)s->data;
|
|
hs = s->hash;
|
|
if (hs) {
|
|
int *ptr, *base;
|
|
ptr = section_ptr_add(hs, sizeof(int));
|
|
base = (int *)hs->data;
|
|
/* only add global or weak symbols. */
|
|
if (ELFW(ST_BIND)(info) != STB_LOCAL) {
|
|
/* add another hashing entry */
|
|
nbuckets = base[0];
|
|
h = elf_hash((unsigned char *)s->link->data + name_offset) % nbuckets;
|
|
*ptr = base[2 + h];
|
|
base[2 + h] = sym_index;
|
|
base[1]++;
|
|
/* we resize the hash table */
|
|
hs->nb_hashed_syms++;
|
|
if (hs->nb_hashed_syms > 2 * nbuckets) {
|
|
rebuild_hash(s, 2 * nbuckets);
|
|
}
|
|
} else {
|
|
*ptr = 0;
|
|
base[1]++;
|
|
}
|
|
}
|
|
return sym_index;
|
|
}
|
|
|
|
ST_FUNC int find_elf_sym(Section *s, const char *name)
|
|
{
|
|
ElfW(Sym) *sym;
|
|
Section *hs;
|
|
int nbuckets, sym_index, h;
|
|
const char *name1;
|
|
|
|
hs = s->hash;
|
|
if (!hs)
|
|
return 0;
|
|
nbuckets = ((int *)hs->data)[0];
|
|
h = elf_hash((unsigned char *) name) % nbuckets;
|
|
sym_index = ((int *)hs->data)[2 + h];
|
|
while (sym_index != 0) {
|
|
sym = &((ElfW(Sym) *)s->data)[sym_index];
|
|
name1 = (char *) s->link->data + sym->st_name;
|
|
if (!strcmp(name, name1))
|
|
return sym_index;
|
|
sym_index = ((int *)hs->data)[2 + nbuckets + sym_index];
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
/* return elf symbol value, signal error if 'err' is nonzero */
|
|
ST_FUNC addr_t get_elf_sym_addr(TCCState *s, const char *name, int err)
|
|
{
|
|
int sym_index;
|
|
ElfW(Sym) *sym;
|
|
|
|
sym_index = find_elf_sym(s->symtab, name);
|
|
sym = &((ElfW(Sym) *)s->symtab->data)[sym_index];
|
|
if (!sym_index || sym->st_shndx == SHN_UNDEF) {
|
|
if (err)
|
|
tcc_error("%s not defined", name);
|
|
return 0;
|
|
}
|
|
return sym->st_value;
|
|
}
|
|
|
|
/* list elf symbol names and values */
|
|
ST_FUNC void list_elf_symbols(TCCState *s, void *ctx,
|
|
void (*symbol_cb)(void *ctx, const char *name, const void *val))
|
|
{
|
|
ElfW(Sym) *sym;
|
|
Section *symtab;
|
|
int sym_index, end_sym;
|
|
const char *name;
|
|
unsigned char sym_vis, sym_bind;
|
|
|
|
symtab = s->symtab;
|
|
end_sym = symtab->data_offset / sizeof (ElfSym);
|
|
for (sym_index = 0; sym_index < end_sym; ++sym_index) {
|
|
sym = &((ElfW(Sym) *)symtab->data)[sym_index];
|
|
if (sym->st_value) {
|
|
name = (char *) symtab->link->data + sym->st_name;
|
|
sym_bind = ELFW(ST_BIND)(sym->st_info);
|
|
sym_vis = ELFW(ST_VISIBILITY)(sym->st_other);
|
|
if (sym_bind == STB_GLOBAL && sym_vis == STV_DEFAULT)
|
|
symbol_cb(ctx, name, (void*)(uintptr_t)sym->st_value);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* return elf symbol value */
|
|
LIBTCCAPI void *tcc_get_symbol(TCCState *s, const char *name)
|
|
{
|
|
return (void*)(uintptr_t)get_elf_sym_addr(s, name, 0);
|
|
}
|
|
|
|
/* list elf symbol names and values */
|
|
LIBTCCAPI void tcc_list_symbols(TCCState *s, void *ctx,
|
|
void (*symbol_cb)(void *ctx, const char *name, const void *val))
|
|
{
|
|
list_elf_symbols(s, ctx, symbol_cb);
|
|
}
|
|
|
|
#if defined TCC_IS_NATIVE || defined TCC_TARGET_PE
|
|
/* return elf symbol value or error */
|
|
ST_FUNC void* tcc_get_symbol_err(TCCState *s, const char *name)
|
|
{
|
|
return (void*)(uintptr_t)get_elf_sym_addr(s, name, 1);
|
|
}
|
|
#endif
|
|
|
|
static void
|
|
version_add (TCCState *s)
|
|
{
|
|
int i;
|
|
ElfW(Sym) *sym;
|
|
ElfW(Verneed) *vn = NULL;
|
|
Section *symtab;
|
|
int sym_index, end_sym, nb_versions = 2, nb_entries = 0;
|
|
ElfW(Half) *versym;
|
|
const char *name;
|
|
|
|
/* add needed symbols */
|
|
symtab = s->dynsym;
|
|
end_sym = symtab->data_offset / sizeof (ElfSym);
|
|
versym = section_ptr_add(versym_section, end_sym * sizeof(ElfW(Half)));
|
|
for (sym_index = 0; sym_index < end_sym; ++sym_index) {
|
|
int dllindex, verndx;
|
|
sym = &((ElfW(Sym) *)symtab->data)[sym_index];
|
|
name = (char *) symtab->link->data + sym->st_name;
|
|
dllindex = find_elf_sym(s->dynsymtab_section, name);
|
|
verndx = (dllindex && dllindex < nb_sym_to_version)
|
|
? sym_to_version[dllindex] : -1;
|
|
if (verndx >= 0) {
|
|
if (!sym_versions[verndx].out_index)
|
|
sym_versions[verndx].out_index = nb_versions++;
|
|
versym[sym_index] = sym_versions[verndx].out_index;
|
|
} else
|
|
versym[sym_index] = 0;
|
|
}
|
|
/* generate verneed section */
|
|
for (i = nb_sym_versions; i-- > 0;) {
|
|
struct sym_version *sv = &sym_versions[i];
|
|
int n_same_libs = 0, prev;
|
|
size_t vnofs;
|
|
ElfW(Vernaux) *vna = vna;
|
|
if (sv->out_index < 1)
|
|
continue;
|
|
vnofs = section_add(verneed_section, sizeof(*vn), 1);
|
|
vn = (ElfW(Verneed)*)(verneed_section->data + vnofs);
|
|
vn->vn_version = 1;
|
|
vn->vn_file = put_elf_str(verneed_section->link, sv->lib);
|
|
vn->vn_aux = sizeof (*vn);
|
|
do {
|
|
prev = sv->prev_same_lib;
|
|
if (sv->out_index > 0) {
|
|
vna = section_ptr_add(verneed_section, sizeof(*vna));
|
|
vna->vna_hash = elf_hash (sv->version);
|
|
vna->vna_flags = 0;
|
|
vna->vna_other = sv->out_index;
|
|
sv->out_index = -2;
|
|
vna->vna_name = put_elf_str(verneed_section->link, sv->version);
|
|
vna->vna_next = sizeof (*vna);
|
|
n_same_libs++;
|
|
}
|
|
sv = &sym_versions[prev];
|
|
} while(prev >= 0);
|
|
vna->vna_next = 0;
|
|
vn = (ElfW(Verneed)*)(verneed_section->data + vnofs);
|
|
vn->vn_cnt = n_same_libs;
|
|
vn->vn_next = sizeof(*vn) + n_same_libs * sizeof(*vna);
|
|
nb_entries++;
|
|
}
|
|
if (vn)
|
|
vn->vn_next = 0;
|
|
verneed_section->sh_info = nb_entries;
|
|
dt_verneednum = nb_entries;
|
|
}
|
|
|
|
/* add an elf symbol : check if it is already defined and patch
|
|
it. Return symbol index. NOTE that sh_num can be SHN_UNDEF. */
|
|
ST_FUNC int set_elf_sym(Section *s, addr_t value, unsigned long size,
|
|
int info, int other, int shndx, const char *name)
|
|
{
|
|
ElfW(Sym) *esym;
|
|
int sym_bind, sym_index, sym_type, esym_bind;
|
|
unsigned char sym_vis, esym_vis, new_vis;
|
|
|
|
sym_bind = ELFW(ST_BIND)(info);
|
|
sym_type = ELFW(ST_TYPE)(info);
|
|
sym_vis = ELFW(ST_VISIBILITY)(other);
|
|
|
|
if (sym_bind != STB_LOCAL) {
|
|
/* we search global or weak symbols */
|
|
sym_index = find_elf_sym(s, name);
|
|
if (!sym_index)
|
|
goto do_def;
|
|
esym = &((ElfW(Sym) *)s->data)[sym_index];
|
|
if (esym->st_value == value && esym->st_size == size && esym->st_info == info
|
|
&& esym->st_other == other && esym->st_shndx == shndx)
|
|
return sym_index;
|
|
if (esym->st_shndx != SHN_UNDEF) {
|
|
esym_bind = ELFW(ST_BIND)(esym->st_info);
|
|
/* propagate the most constraining visibility */
|
|
/* STV_DEFAULT(0)<STV_PROTECTED(3)<STV_HIDDEN(2)<STV_INTERNAL(1) */
|
|
esym_vis = ELFW(ST_VISIBILITY)(esym->st_other);
|
|
if (esym_vis == STV_DEFAULT) {
|
|
new_vis = sym_vis;
|
|
} else if (sym_vis == STV_DEFAULT) {
|
|
new_vis = esym_vis;
|
|
} else {
|
|
new_vis = (esym_vis < sym_vis) ? esym_vis : sym_vis;
|
|
}
|
|
esym->st_other = (esym->st_other & ~ELFW(ST_VISIBILITY)(-1))
|
|
| new_vis;
|
|
other = esym->st_other; /* in case we have to patch esym */
|
|
if (shndx == SHN_UNDEF) {
|
|
/* ignore adding of undefined symbol if the
|
|
corresponding symbol is already defined */
|
|
} else if (sym_bind == STB_GLOBAL && esym_bind == STB_WEAK) {
|
|
/* global overrides weak, so patch */
|
|
goto do_patch;
|
|
} else if (sym_bind == STB_WEAK && esym_bind == STB_GLOBAL) {
|
|
/* weak is ignored if already global */
|
|
} else if (sym_bind == STB_WEAK && esym_bind == STB_WEAK) {
|
|
/* keep first-found weak definition, ignore subsequents */
|
|
} else if (sym_vis == STV_HIDDEN || sym_vis == STV_INTERNAL) {
|
|
/* ignore hidden symbols after */
|
|
} else if ((esym->st_shndx == SHN_COMMON
|
|
|| esym->st_shndx == bss_section->sh_num)
|
|
&& (shndx < SHN_LORESERVE
|
|
&& shndx != bss_section->sh_num)) {
|
|
/* data symbol gets precedence over common/bss */
|
|
goto do_patch;
|
|
} else if (shndx == SHN_COMMON || shndx == bss_section->sh_num) {
|
|
/* data symbol keeps precedence over common/bss */
|
|
} else if (s->sh_flags & SHF_DYNSYM) {
|
|
/* we accept that two DLL define the same symbol */
|
|
} else if (esym->st_other & ST_ASM_SET) {
|
|
/* If the existing symbol came from an asm .set
|
|
we can override. */
|
|
goto do_patch;
|
|
} else {
|
|
#if 0
|
|
printf("new_bind=%x new_shndx=%x new_vis=%x old_bind=%x old_shndx=%x old_vis=%x\n",
|
|
sym_bind, shndx, new_vis, esym_bind, esym->st_shndx, esym_vis);
|
|
#endif
|
|
tcc_error_noabort("'%s' defined twice", name);
|
|
}
|
|
} else {
|
|
do_patch:
|
|
esym->st_info = ELFW(ST_INFO)(sym_bind, sym_type);
|
|
esym->st_shndx = shndx;
|
|
new_undef_sym = 1;
|
|
esym->st_value = value;
|
|
esym->st_size = size;
|
|
esym->st_other = other;
|
|
}
|
|
} else {
|
|
do_def:
|
|
sym_index = put_elf_sym(s, value, size,
|
|
ELFW(ST_INFO)(sym_bind, sym_type), other,
|
|
shndx, name);
|
|
}
|
|
return sym_index;
|
|
}
|
|
|
|
/* put relocation */
|
|
ST_FUNC void put_elf_reloca(Section *symtab, Section *s, unsigned long offset,
|
|
int type, int symbol, addr_t addend)
|
|
{
|
|
char buf[256];
|
|
Section *sr;
|
|
ElfW_Rel *rel;
|
|
|
|
sr = s->reloc;
|
|
if (!sr) {
|
|
/* if no relocation section, create it */
|
|
snprintf(buf, sizeof(buf), REL_SECTION_FMT, s->name);
|
|
/* if the symtab is allocated, then we consider the relocation
|
|
are also */
|
|
sr = new_section(tcc_state, buf, SHT_RELX, symtab->sh_flags);
|
|
sr->sh_entsize = sizeof(ElfW_Rel);
|
|
sr->link = symtab;
|
|
sr->sh_info = s->sh_num;
|
|
s->reloc = sr;
|
|
}
|
|
rel = section_ptr_add(sr, sizeof(ElfW_Rel));
|
|
rel->r_offset = offset;
|
|
rel->r_info = ELFW(R_INFO)(symbol, type);
|
|
#if SHT_RELX == SHT_RELA
|
|
rel->r_addend = addend;
|
|
#else
|
|
if (addend)
|
|
tcc_error("non-zero addend on REL architecture");
|
|
#endif
|
|
}
|
|
|
|
ST_FUNC void put_elf_reloc(Section *symtab, Section *s, unsigned long offset,
|
|
int type, int symbol)
|
|
{
|
|
put_elf_reloca(symtab, s, offset, type, symbol, 0);
|
|
}
|
|
|
|
/* Remove relocations for section S->reloc starting at oldrelocoffset
|
|
that are to the same place, retaining the last of them. As side effect
|
|
the relocations are sorted. Possibly reduces the number of relocs. */
|
|
ST_FUNC void squeeze_multi_relocs(Section *s, size_t oldrelocoffset)
|
|
{
|
|
Section *sr = s->reloc;
|
|
ElfW_Rel *r, *dest;
|
|
ssize_t a;
|
|
ElfW(Addr) addr;
|
|
|
|
if (oldrelocoffset + sizeof(*r) >= sr->data_offset)
|
|
return;
|
|
/* The relocs we're dealing with are the result of initializer parsing.
|
|
So they will be mostly in order and there aren't many of them.
|
|
Secondly we need a stable sort (which qsort isn't). We use
|
|
a simple insertion sort. */
|
|
for (a = oldrelocoffset + sizeof(*r); a < sr->data_offset; a += sizeof(*r)) {
|
|
ssize_t i = a - sizeof(*r);
|
|
addr = ((ElfW_Rel*)(sr->data + a))->r_offset;
|
|
for (; i >= (ssize_t)oldrelocoffset &&
|
|
((ElfW_Rel*)(sr->data + i))->r_offset > addr; i -= sizeof(*r)) {
|
|
ElfW_Rel tmp = *(ElfW_Rel*)(sr->data + a);
|
|
*(ElfW_Rel*)(sr->data + a) = *(ElfW_Rel*)(sr->data + i);
|
|
*(ElfW_Rel*)(sr->data + i) = tmp;
|
|
}
|
|
}
|
|
|
|
r = (ElfW_Rel*)(sr->data + oldrelocoffset);
|
|
dest = r;
|
|
for (; r < (ElfW_Rel*)(sr->data + sr->data_offset); r++) {
|
|
if (dest->r_offset != r->r_offset)
|
|
dest++;
|
|
*dest = *r;
|
|
}
|
|
sr->data_offset = (unsigned char*)dest - sr->data + sizeof(*r);
|
|
}
|
|
|
|
/* put stab debug information */
|
|
|
|
ST_FUNC void put_stabs(const char *str, int type, int other, int desc,
|
|
unsigned long value)
|
|
{
|
|
Stab_Sym *sym;
|
|
|
|
sym = section_ptr_add(stab_section, sizeof(Stab_Sym));
|
|
if (str) {
|
|
sym->n_strx = put_elf_str(stabstr_section, str);
|
|
} else {
|
|
sym->n_strx = 0;
|
|
}
|
|
sym->n_type = type;
|
|
sym->n_other = other;
|
|
sym->n_desc = desc;
|
|
sym->n_value = value;
|
|
}
|
|
|
|
ST_FUNC void put_stabs_r(const char *str, int type, int other, int desc,
|
|
unsigned long value, Section *sec, int sym_index)
|
|
{
|
|
put_stabs(str, type, other, desc, value);
|
|
put_elf_reloc(symtab_section, stab_section,
|
|
stab_section->data_offset - sizeof(unsigned int),
|
|
R_DATA_32, sym_index);
|
|
}
|
|
|
|
ST_FUNC void put_stabn(int type, int other, int desc, int value)
|
|
{
|
|
put_stabs(NULL, type, other, desc, value);
|
|
}
|
|
|
|
ST_FUNC void put_stabd(int type, int other, int desc)
|
|
{
|
|
put_stabs(NULL, type, other, desc, 0);
|
|
}
|
|
|
|
ST_FUNC struct sym_attr *get_sym_attr(TCCState *s1, int index, int alloc)
|
|
{
|
|
int n;
|
|
struct sym_attr *tab;
|
|
|
|
if (index >= s1->nb_sym_attrs) {
|
|
if (!alloc)
|
|
return s1->sym_attrs;
|
|
/* find immediately bigger power of 2 and reallocate array */
|
|
n = 1;
|
|
while (index >= n)
|
|
n *= 2;
|
|
tab = tcc_realloc(s1->sym_attrs, n * sizeof(*s1->sym_attrs));
|
|
s1->sym_attrs = tab;
|
|
memset(s1->sym_attrs + s1->nb_sym_attrs, 0,
|
|
(n - s1->nb_sym_attrs) * sizeof(*s1->sym_attrs));
|
|
s1->nb_sym_attrs = n;
|
|
}
|
|
return &s1->sym_attrs[index];
|
|
}
|
|
|
|
/* Browse each elem of type <type> in section <sec> starting at elem <startoff>
|
|
using variable <elem> */
|
|
#define for_each_elem(sec, startoff, elem, type) \
|
|
for (elem = (type *) sec->data + startoff; \
|
|
elem < (type *) (sec->data + sec->data_offset); elem++)
|
|
|
|
/* In an ELF file symbol table, the local symbols must appear below
|
|
the global and weak ones. Since TCC cannot sort it while generating
|
|
the code, we must do it after. All the relocation tables are also
|
|
modified to take into account the symbol table sorting */
|
|
static void sort_syms(TCCState *s1, Section *s)
|
|
{
|
|
int *old_to_new_syms;
|
|
ElfW(Sym) *new_syms;
|
|
int nb_syms, i;
|
|
ElfW(Sym) *p, *q;
|
|
ElfW_Rel *rel;
|
|
Section *sr;
|
|
int type, sym_index;
|
|
|
|
nb_syms = s->data_offset / sizeof(ElfW(Sym));
|
|
new_syms = tcc_malloc(nb_syms * sizeof(ElfW(Sym)));
|
|
old_to_new_syms = tcc_malloc(nb_syms * sizeof(int));
|
|
|
|
/* first pass for local symbols */
|
|
p = (ElfW(Sym) *)s->data;
|
|
q = new_syms;
|
|
for(i = 0; i < nb_syms; i++) {
|
|
if (ELFW(ST_BIND)(p->st_info) == STB_LOCAL) {
|
|
old_to_new_syms[i] = q - new_syms;
|
|
*q++ = *p;
|
|
}
|
|
p++;
|
|
}
|
|
/* save the number of local symbols in section header */
|
|
if( s->sh_size ) /* this 'if' makes IDA happy */
|
|
s->sh_info = q - new_syms;
|
|
|
|
/* then second pass for non local symbols */
|
|
p = (ElfW(Sym) *)s->data;
|
|
for(i = 0; i < nb_syms; i++) {
|
|
if (ELFW(ST_BIND)(p->st_info) != STB_LOCAL) {
|
|
old_to_new_syms[i] = q - new_syms;
|
|
*q++ = *p;
|
|
}
|
|
p++;
|
|
}
|
|
|
|
/* we copy the new symbols to the old */
|
|
memcpy(s->data, new_syms, nb_syms * sizeof(ElfW(Sym)));
|
|
tcc_free(new_syms);
|
|
|
|
/* now we modify all the relocations */
|
|
for(i = 1; i < s1->nb_sections; i++) {
|
|
sr = s1->sections[i];
|
|
if (sr->sh_type == SHT_RELX && sr->link == s) {
|
|
for_each_elem(sr, 0, rel, ElfW_Rel) {
|
|
sym_index = ELFW(R_SYM)(rel->r_info);
|
|
type = ELFW(R_TYPE)(rel->r_info);
|
|
sym_index = old_to_new_syms[sym_index];
|
|
rel->r_info = ELFW(R_INFO)(sym_index, type);
|
|
}
|
|
}
|
|
}
|
|
|
|
tcc_free(old_to_new_syms);
|
|
}
|
|
|
|
/* relocate symbol table, resolve undefined symbols if do_resolve is
|
|
true and output error if undefined symbol. */
|
|
ST_FUNC void relocate_syms(TCCState *s1, Section *symtab, int do_resolve)
|
|
{
|
|
ElfW(Sym) *sym;
|
|
int sym_bind, sh_num;
|
|
const char *name;
|
|
|
|
for_each_elem(symtab, 1, sym, ElfW(Sym)) {
|
|
sh_num = sym->st_shndx;
|
|
if (sh_num == SHN_UNDEF) {
|
|
name = (char *) s1->symtab->link->data + sym->st_name;
|
|
/* Use ld.so to resolve symbol for us (for tcc -run) */
|
|
if (do_resolve) {
|
|
#if defined TCC_IS_NATIVE && !defined TCC_TARGET_PE
|
|
void *addr = dlsym(RTLD_DEFAULT, name);
|
|
if (addr) {
|
|
sym->st_value = (addr_t) addr;
|
|
#ifdef DEBUG_RELOC
|
|
printf ("relocate_sym: %s -> 0x%lx\n", name, sym->st_value);
|
|
#endif
|
|
goto found;
|
|
}
|
|
#endif
|
|
/* if dynamic symbol exist, it will be used in relocate_section */
|
|
} else if (s1->dynsym && find_elf_sym(s1->dynsym, name))
|
|
goto found;
|
|
/* XXX: _fp_hw seems to be part of the ABI, so we ignore
|
|
it */
|
|
if (!strcmp(name, "_fp_hw"))
|
|
goto found;
|
|
/* only weak symbols are accepted to be undefined. Their
|
|
value is zero */
|
|
sym_bind = ELFW(ST_BIND)(sym->st_info);
|
|
if (sym_bind == STB_WEAK)
|
|
sym->st_value = 0;
|
|
else
|
|
tcc_error_noabort("undefined symbol '%s'", name);
|
|
} else if (sh_num < SHN_LORESERVE) {
|
|
/* add section base */
|
|
sym->st_value += s1->sections[sym->st_shndx]->sh_addr;
|
|
}
|
|
found: ;
|
|
}
|
|
}
|
|
|
|
/* relocate a given section (CPU dependent) by applying the relocations
|
|
in the associated relocation section */
|
|
ST_FUNC void relocate_section(TCCState *s1, Section *s)
|
|
{
|
|
Section *sr = s->reloc;
|
|
ElfW_Rel *rel;
|
|
ElfW(Sym) *sym;
|
|
int type, sym_index;
|
|
unsigned char *ptr;
|
|
addr_t tgt, addr;
|
|
|
|
relocate_init(sr);
|
|
|
|
for_each_elem(sr, 0, rel, ElfW_Rel) {
|
|
ptr = s->data + rel->r_offset;
|
|
sym_index = ELFW(R_SYM)(rel->r_info);
|
|
sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
|
|
type = ELFW(R_TYPE)(rel->r_info);
|
|
tgt = sym->st_value;
|
|
#if SHT_RELX == SHT_RELA
|
|
tgt += rel->r_addend;
|
|
#endif
|
|
addr = s->sh_addr + rel->r_offset;
|
|
relocate(s1, rel, type, ptr, addr, tgt);
|
|
}
|
|
/* if the relocation is allocated, we change its symbol table */
|
|
if (sr->sh_flags & SHF_ALLOC)
|
|
sr->link = s1->dynsym;
|
|
}
|
|
|
|
/* relocate relocation table in 'sr' */
|
|
static void relocate_rel(TCCState *s1, Section *sr)
|
|
{
|
|
Section *s;
|
|
ElfW_Rel *rel;
|
|
|
|
s = s1->sections[sr->sh_info];
|
|
for_each_elem(sr, 0, rel, ElfW_Rel)
|
|
rel->r_offset += s->sh_addr;
|
|
}
|
|
|
|
/* count the number of dynamic relocations so that we can reserve
|
|
their space */
|
|
static int prepare_dynamic_rel(TCCState *s1, Section *sr)
|
|
{
|
|
int count = 0;
|
|
#if defined(TCC_TARGET_I386) || defined(TCC_TARGET_X86_64)
|
|
ElfW_Rel *rel;
|
|
for_each_elem(sr, 0, rel, ElfW_Rel) {
|
|
int sym_index = ELFW(R_SYM)(rel->r_info);
|
|
int type = ELFW(R_TYPE)(rel->r_info);
|
|
switch(type) {
|
|
#if defined(TCC_TARGET_I386)
|
|
case R_386_32:
|
|
if (!get_sym_attr(s1, sym_index, 0)->dyn_index
|
|
&& ((ElfW(Sym)*)symtab_section->data + sym_index)->st_shndx == SHN_UNDEF) {
|
|
/* don't fixup unresolved (weak) symbols */
|
|
rel->r_info = ELFW(R_INFO)(sym_index, R_386_RELATIVE);
|
|
break;
|
|
}
|
|
#elif defined(TCC_TARGET_X86_64)
|
|
case R_X86_64_32:
|
|
case R_X86_64_32S:
|
|
case R_X86_64_64:
|
|
#endif
|
|
count++;
|
|
break;
|
|
#if defined(TCC_TARGET_I386)
|
|
case R_386_PC32:
|
|
#elif defined(TCC_TARGET_X86_64)
|
|
case R_X86_64_PC32:
|
|
#endif
|
|
if (get_sym_attr(s1, sym_index, 0)->dyn_index)
|
|
count++;
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
if (count) {
|
|
/* allocate the section */
|
|
sr->sh_flags |= SHF_ALLOC;
|
|
sr->sh_size = count * sizeof(ElfW_Rel);
|
|
}
|
|
#endif
|
|
return count;
|
|
}
|
|
|
|
static void build_got(TCCState *s1)
|
|
{
|
|
/* if no got, then create it */
|
|
s1->got = new_section(s1, ".got", SHT_PROGBITS, SHF_ALLOC | SHF_WRITE);
|
|
s1->got->sh_entsize = 4;
|
|
set_elf_sym(symtab_section, 0, 4, ELFW(ST_INFO)(STB_GLOBAL, STT_OBJECT),
|
|
0, s1->got->sh_num, "_GLOBAL_OFFSET_TABLE_");
|
|
/* keep space for _DYNAMIC pointer and two dummy got entries */
|
|
section_ptr_add(s1->got, 3 * PTR_SIZE);
|
|
}
|
|
|
|
/* Create a GOT and (for function call) a PLT entry corresponding to a symbol
|
|
in s1->symtab. When creating the dynamic symbol table entry for the GOT
|
|
relocation, use 'size' and 'info' for the corresponding symbol metadata.
|
|
Returns the offset of the GOT or (if any) PLT entry. */
|
|
static struct sym_attr * put_got_entry(TCCState *s1, int dyn_reloc_type,
|
|
int sym_index)
|
|
{
|
|
int need_plt_entry;
|
|
const char *name;
|
|
ElfW(Sym) *sym;
|
|
struct sym_attr *attr;
|
|
unsigned got_offset;
|
|
char plt_name[100];
|
|
int len;
|
|
|
|
need_plt_entry = (dyn_reloc_type == R_JMP_SLOT);
|
|
attr = get_sym_attr(s1, sym_index, 1);
|
|
|
|
/* In case a function is both called and its address taken 2 GOT entries
|
|
are created, one for taking the address (GOT) and the other for the PLT
|
|
entry (PLTGOT). */
|
|
if (need_plt_entry ? attr->plt_offset : attr->got_offset)
|
|
return attr;
|
|
|
|
/* create the GOT entry */
|
|
got_offset = s1->got->data_offset;
|
|
section_ptr_add(s1->got, PTR_SIZE);
|
|
|
|
/* Create the GOT relocation that will insert the address of the object or
|
|
function of interest in the GOT entry. This is a static relocation for
|
|
memory output (dlsym will give us the address of symbols) and dynamic
|
|
relocation otherwise (executable and DLLs). The relocation should be
|
|
done lazily for GOT entry with *_JUMP_SLOT relocation type (the one
|
|
associated to a PLT entry) but is currently done at load time for an
|
|
unknown reason. */
|
|
|
|
sym = &((ElfW(Sym) *) symtab_section->data)[sym_index];
|
|
name = (char *) symtab_section->link->data + sym->st_name;
|
|
|
|
if (s1->dynsym) {
|
|
if (ELFW(ST_BIND)(sym->st_info) == STB_LOCAL) {
|
|
/* Hack alarm. We don't want to emit dynamic symbols
|
|
and symbol based relocs for STB_LOCAL symbols, but rather
|
|
want to resolve them directly. At this point the symbol
|
|
values aren't final yet, so we must defer this. We will later
|
|
have to create a RELATIVE reloc anyway, so we misuse the
|
|
relocation slot to smuggle the symbol reference until
|
|
fill_local_got_entries. Not that the sym_index is
|
|
relative to symtab_section, not s1->dynsym! Nevertheless
|
|
we use s1->dyn_sym so that if this is the first call
|
|
that got->reloc is correctly created. Also note that
|
|
RELATIVE relocs are not normally created for the .got,
|
|
so the types serves as a marker for later (and is retained
|
|
also for the final output, which is okay because then the
|
|
got is just normal data). */
|
|
put_elf_reloc(s1->dynsym, s1->got, got_offset, R_RELATIVE,
|
|
sym_index);
|
|
} else {
|
|
if (0 == attr->dyn_index)
|
|
attr->dyn_index = set_elf_sym(s1->dynsym, sym->st_value,
|
|
sym->st_size, sym->st_info, 0,
|
|
sym->st_shndx, name);
|
|
put_elf_reloc(s1->dynsym, s1->got, got_offset, dyn_reloc_type,
|
|
attr->dyn_index);
|
|
}
|
|
} else {
|
|
put_elf_reloc(symtab_section, s1->got, got_offset, dyn_reloc_type,
|
|
sym_index);
|
|
}
|
|
|
|
if (need_plt_entry) {
|
|
if (!s1->plt) {
|
|
s1->plt = new_section(s1, ".plt", SHT_PROGBITS,
|
|
SHF_ALLOC | SHF_EXECINSTR);
|
|
s1->plt->sh_entsize = 4;
|
|
}
|
|
|
|
attr->plt_offset = create_plt_entry(s1, got_offset, attr);
|
|
|
|
/* create a symbol 'sym@plt' for the PLT jump vector */
|
|
len = strlen(name);
|
|
if (len > sizeof plt_name - 5)
|
|
len = sizeof plt_name - 5;
|
|
memcpy(plt_name, name, len);
|
|
strcpy(plt_name + len, "@plt");
|
|
attr->plt_sym = put_elf_sym(s1->symtab, attr->plt_offset, sym->st_size,
|
|
ELFW(ST_INFO)(STB_GLOBAL, STT_FUNC), 0, s1->plt->sh_num, plt_name);
|
|
|
|
} else {
|
|
attr->got_offset = got_offset;
|
|
}
|
|
|
|
return attr;
|
|
}
|
|
|
|
/* build GOT and PLT entries */
|
|
ST_FUNC void build_got_entries(TCCState *s1)
|
|
{
|
|
Section *s;
|
|
ElfW_Rel *rel;
|
|
ElfW(Sym) *sym;
|
|
int i, type, gotplt_entry, reloc_type, sym_index;
|
|
struct sym_attr *attr;
|
|
|
|
for(i = 1; i < s1->nb_sections; i++) {
|
|
s = s1->sections[i];
|
|
if (s->sh_type != SHT_RELX)
|
|
continue;
|
|
/* no need to handle got relocations */
|
|
if (s->link != symtab_section)
|
|
continue;
|
|
for_each_elem(s, 0, rel, ElfW_Rel) {
|
|
type = ELFW(R_TYPE)(rel->r_info);
|
|
gotplt_entry = gotplt_entry_type(type);
|
|
sym_index = ELFW(R_SYM)(rel->r_info);
|
|
sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
|
|
|
|
if (gotplt_entry == NO_GOTPLT_ENTRY) {
|
|
continue;
|
|
}
|
|
|
|
/* Automatically create PLT/GOT [entry] if it is an undefined
|
|
reference (resolved at runtime), or the symbol is absolute,
|
|
probably created by tcc_add_symbol, and thus on 64-bit
|
|
targets might be too far from application code. */
|
|
if (gotplt_entry == AUTO_GOTPLT_ENTRY) {
|
|
if (sym->st_shndx == SHN_UNDEF) {
|
|
ElfW(Sym) *esym;
|
|
int dynindex;
|
|
if (s1->output_type == TCC_OUTPUT_DLL && ! PCRELATIVE_DLLPLT)
|
|
continue;
|
|
/* Relocations for UNDEF symbols would normally need
|
|
to be transferred into the executable or shared object.
|
|
If that were done AUTO_GOTPLT_ENTRY wouldn't exist.
|
|
But TCC doesn't do that (at least for exes), so we
|
|
need to resolve all such relocs locally. And that
|
|
means PLT slots for functions in DLLs and COPY relocs for
|
|
data symbols. COPY relocs were generated in
|
|
bind_exe_dynsyms (and the symbol adjusted to be defined),
|
|
and for functions we were generated a dynamic symbol
|
|
of function type. */
|
|
if (s1->dynsym) {
|
|
/* dynsym isn't set for -run :-/ */
|
|
dynindex = get_sym_attr(s1, sym_index, 0)->dyn_index;
|
|
esym = (ElfW(Sym) *)s1->dynsym->data + dynindex;
|
|
if (dynindex
|
|
&& (ELFW(ST_TYPE)(esym->st_info) == STT_FUNC
|
|
|| (ELFW(ST_TYPE)(esym->st_info) == STT_NOTYPE
|
|
&& ELFW(ST_TYPE)(sym->st_info) == STT_FUNC)))
|
|
goto jmp_slot;
|
|
}
|
|
} else if (!(sym->st_shndx == SHN_ABS
|
|
#ifndef TCC_TARGET_ARM
|
|
&& PTR_SIZE == 8
|
|
#endif
|
|
))
|
|
continue;
|
|
}
|
|
|
|
#ifdef TCC_TARGET_X86_64
|
|
if ((type == R_X86_64_PLT32 || type == R_X86_64_PC32) &&
|
|
sym->st_shndx != SHN_UNDEF &&
|
|
(ELFW(ST_VISIBILITY)(sym->st_other) != STV_DEFAULT ||
|
|
ELFW(ST_BIND)(sym->st_info) == STB_LOCAL ||
|
|
s1->output_type == TCC_OUTPUT_EXE)) {
|
|
rel->r_info = ELFW(R_INFO)(sym_index, R_X86_64_PC32);
|
|
continue;
|
|
}
|
|
#endif
|
|
if (code_reloc(type)) {
|
|
jmp_slot:
|
|
reloc_type = R_JMP_SLOT;
|
|
} else
|
|
reloc_type = R_GLOB_DAT;
|
|
|
|
if (!s1->got)
|
|
build_got(s1);
|
|
|
|
if (gotplt_entry == BUILD_GOT_ONLY)
|
|
continue;
|
|
|
|
attr = put_got_entry(s1, reloc_type, sym_index);
|
|
|
|
if (reloc_type == R_JMP_SLOT)
|
|
rel->r_info = ELFW(R_INFO)(attr->plt_sym, type);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* put dynamic tag */
|
|
static void put_dt(Section *dynamic, int dt, addr_t val)
|
|
{
|
|
ElfW(Dyn) *dyn;
|
|
dyn = section_ptr_add(dynamic, sizeof(ElfW(Dyn)));
|
|
dyn->d_tag = dt;
|
|
dyn->d_un.d_val = val;
|
|
}
|
|
|
|
static void add_init_array_defines(TCCState *s1, const char *section_name)
|
|
{
|
|
Section *s;
|
|
long end_offset;
|
|
char sym_start[1024];
|
|
char sym_end[1024];
|
|
|
|
snprintf(sym_start, sizeof(sym_start), "__%s_start", section_name + 1);
|
|
snprintf(sym_end, sizeof(sym_end), "__%s_end", section_name + 1);
|
|
|
|
s = find_section(s1, section_name);
|
|
if (!s) {
|
|
end_offset = 0;
|
|
s = data_section;
|
|
} else {
|
|
end_offset = s->data_offset;
|
|
}
|
|
|
|
set_elf_sym(symtab_section,
|
|
0, 0,
|
|
ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
|
|
s->sh_num, sym_start);
|
|
set_elf_sym(symtab_section,
|
|
end_offset, 0,
|
|
ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
|
|
s->sh_num, sym_end);
|
|
}
|
|
|
|
#ifndef TCC_TARGET_PE
|
|
static int tcc_add_support(TCCState *s1, const char *filename)
|
|
{
|
|
char buf[1024];
|
|
snprintf(buf, sizeof(buf), "%s/%s", s1->tcc_lib_path, filename);
|
|
return tcc_add_file(s1, buf);
|
|
}
|
|
#endif
|
|
|
|
static void add_array (const char *section, TCCState *s1, Sym *sym)
|
|
{
|
|
Section *s;
|
|
unsigned char *ptr;
|
|
|
|
s = find_section(s1, section);
|
|
if (s) {
|
|
s->sh_flags |= SHF_WRITE;
|
|
ptr = section_ptr_add(s, PTR_SIZE);
|
|
memset (ptr, 0, PTR_SIZE);
|
|
put_elf_reloc (s1->symtab, s, ptr - s->data, R_DATA_PTR, sym->c);
|
|
}
|
|
}
|
|
|
|
ST_FUNC void add_init_array (TCCState *s1, Sym *sym)
|
|
{
|
|
add_array (".init_array", s1, sym);
|
|
}
|
|
|
|
ST_FUNC void add_fini_array (TCCState *s1, Sym *sym)
|
|
{
|
|
add_array (".fini_array", s1, sym);
|
|
}
|
|
|
|
ST_FUNC void tcc_add_bcheck(TCCState *s1)
|
|
{
|
|
#ifdef CONFIG_TCC_BCHECK
|
|
addr_t *ptr;
|
|
int sym_index;
|
|
|
|
if (0 == s1->do_bounds_check)
|
|
return;
|
|
/* XXX: add an object file to do that */
|
|
ptr = section_ptr_add(bounds_section, sizeof(*ptr));
|
|
*ptr = 0;
|
|
set_elf_sym(symtab_section, 0, 0,
|
|
ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
|
|
bounds_section->sh_num, "__bounds_start");
|
|
/* pull bcheck.o from libtcc1.a */
|
|
sym_index = set_elf_sym(symtab_section, 0, 0,
|
|
ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
|
|
SHN_UNDEF, "__bound_init");
|
|
if (s1->output_type != TCC_OUTPUT_MEMORY) {
|
|
/* add 'call __bound_init()' in .init section */
|
|
Section *init_section = find_section(s1, ".init");
|
|
unsigned char *pinit = section_ptr_add(init_section, 5);
|
|
pinit[0] = 0xe8;
|
|
write32le(pinit + 1, -4);
|
|
put_elf_reloc(symtab_section, init_section,
|
|
init_section->data_offset - 4, R_386_PC32, sym_index);
|
|
/* R_386_PC32 = R_X86_64_PC32 = 2 */
|
|
}
|
|
#endif
|
|
}
|
|
|
|
/* add tcc runtime libraries */
|
|
ST_FUNC void tcc_add_runtime(TCCState *s1)
|
|
{
|
|
s1->filetype = 0;
|
|
tcc_add_bcheck(s1);
|
|
tcc_add_pragma_libs(s1);
|
|
#ifndef TCC_TARGET_PE
|
|
/* add libc */
|
|
if (!s1->nostdlib) {
|
|
tcc_add_library_err(s1, "c");
|
|
#ifdef TCC_LIBGCC
|
|
if (!s1->static_link) {
|
|
if (TCC_LIBGCC[0] == '/')
|
|
tcc_add_file(s1, TCC_LIBGCC);
|
|
else
|
|
tcc_add_dll(s1, TCC_LIBGCC, 0);
|
|
}
|
|
#endif
|
|
tcc_add_support(s1, TCC_LIBTCC1);
|
|
/* add crt end if not memory output */
|
|
if (s1->output_type != TCC_OUTPUT_MEMORY)
|
|
tcc_add_crt(s1, "crtn.o");
|
|
}
|
|
#endif
|
|
}
|
|
|
|
/* add various standard linker symbols (must be done after the
|
|
sections are filled (for example after allocating common
|
|
symbols)) */
|
|
static void tcc_add_linker_symbols(TCCState *s1)
|
|
{
|
|
char buf[1024];
|
|
int i;
|
|
Section *s;
|
|
|
|
set_elf_sym(symtab_section,
|
|
text_section->data_offset, 0,
|
|
ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
|
|
text_section->sh_num, "_etext");
|
|
set_elf_sym(symtab_section,
|
|
data_section->data_offset, 0,
|
|
ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
|
|
data_section->sh_num, "_edata");
|
|
set_elf_sym(symtab_section,
|
|
bss_section->data_offset, 0,
|
|
ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
|
|
bss_section->sh_num, "_end");
|
|
#ifdef TCC_TARGET_RISCV64
|
|
/* XXX should be .sdata+0x800, not .data+0x800 */
|
|
set_elf_sym(symtab_section,
|
|
0x800, 0,
|
|
ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
|
|
data_section->sh_num, "__global_pointer$");
|
|
#endif
|
|
/* horrible new standard ldscript defines */
|
|
add_init_array_defines(s1, ".preinit_array");
|
|
add_init_array_defines(s1, ".init_array");
|
|
add_init_array_defines(s1, ".fini_array");
|
|
|
|
/* add start and stop symbols for sections whose name can be
|
|
expressed in C */
|
|
for(i = 1; i < s1->nb_sections; i++) {
|
|
s = s1->sections[i];
|
|
if (s->sh_type == SHT_PROGBITS &&
|
|
(s->sh_flags & SHF_ALLOC)) {
|
|
const char *p;
|
|
int ch;
|
|
|
|
/* check if section name can be expressed in C */
|
|
p = s->name;
|
|
for(;;) {
|
|
ch = *p;
|
|
if (!ch)
|
|
break;
|
|
if (!isid(ch) && !isnum(ch))
|
|
goto next_sec;
|
|
p++;
|
|
}
|
|
snprintf(buf, sizeof(buf), "__start_%s", s->name);
|
|
set_elf_sym(symtab_section,
|
|
0, 0,
|
|
ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
|
|
s->sh_num, buf);
|
|
snprintf(buf, sizeof(buf), "__stop_%s", s->name);
|
|
set_elf_sym(symtab_section,
|
|
s->data_offset, 0,
|
|
ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
|
|
s->sh_num, buf);
|
|
}
|
|
next_sec: ;
|
|
}
|
|
}
|
|
|
|
ST_FUNC void resolve_common_syms(TCCState *s1)
|
|
{
|
|
ElfW(Sym) *sym;
|
|
|
|
/* Allocate common symbols in BSS. */
|
|
for_each_elem(symtab_section, 1, sym, ElfW(Sym)) {
|
|
if (sym->st_shndx == SHN_COMMON) {
|
|
/* symbol alignment is in st_value for SHN_COMMONs */
|
|
sym->st_value = section_add(bss_section, sym->st_size,
|
|
sym->st_value);
|
|
sym->st_shndx = bss_section->sh_num;
|
|
}
|
|
}
|
|
|
|
/* Now assign linker provided symbols their value. */
|
|
tcc_add_linker_symbols(s1);
|
|
}
|
|
|
|
static void tcc_output_binary(TCCState *s1, FILE *f,
|
|
const int *sec_order)
|
|
{
|
|
Section *s;
|
|
int i, offset, size;
|
|
|
|
offset = 0;
|
|
for(i=1;i<s1->nb_sections;i++) {
|
|
s = s1->sections[sec_order[i]];
|
|
if (s->sh_type != SHT_NOBITS &&
|
|
(s->sh_flags & SHF_ALLOC)) {
|
|
while (offset < s->sh_offset) {
|
|
fputc(0, f);
|
|
offset++;
|
|
}
|
|
size = s->sh_size;
|
|
fwrite(s->data, 1, size, f);
|
|
offset += size;
|
|
}
|
|
}
|
|
}
|
|
|
|
ST_FUNC void fill_got_entry(TCCState *s1, ElfW_Rel *rel)
|
|
{
|
|
int sym_index = ELFW(R_SYM) (rel->r_info);
|
|
ElfW(Sym) *sym = &((ElfW(Sym) *) symtab_section->data)[sym_index];
|
|
struct sym_attr *attr = get_sym_attr(s1, sym_index, 0);
|
|
unsigned offset = attr->got_offset;
|
|
|
|
if (0 == offset)
|
|
return;
|
|
section_reserve(s1->got, offset + PTR_SIZE);
|
|
#ifdef TCC_TARGET_X86_64
|
|
write64le(s1->got->data + offset, sym->st_value);
|
|
#else
|
|
write32le(s1->got->data + offset, sym->st_value);
|
|
#endif
|
|
}
|
|
|
|
/* Perform relocation to GOT or PLT entries */
|
|
ST_FUNC void fill_got(TCCState *s1)
|
|
{
|
|
Section *s;
|
|
ElfW_Rel *rel;
|
|
int i;
|
|
|
|
for(i = 1; i < s1->nb_sections; i++) {
|
|
s = s1->sections[i];
|
|
if (s->sh_type != SHT_RELX)
|
|
continue;
|
|
/* no need to handle got relocations */
|
|
if (s->link != symtab_section)
|
|
continue;
|
|
for_each_elem(s, 0, rel, ElfW_Rel) {
|
|
switch (ELFW(R_TYPE) (rel->r_info)) {
|
|
case R_X86_64_GOT32:
|
|
case R_X86_64_GOTPCREL:
|
|
case R_X86_64_GOTPCRELX:
|
|
case R_X86_64_REX_GOTPCRELX:
|
|
case R_X86_64_PLT32:
|
|
fill_got_entry(s1, rel);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
/* See put_got_entry for a description. This is the second stage
|
|
where GOT references to local defined symbols are rewritten. */
|
|
static void fill_local_got_entries(TCCState *s1)
|
|
{
|
|
ElfW_Rel *rel;
|
|
if (!s1->got->reloc)
|
|
return;
|
|
for_each_elem(s1->got->reloc, 0, rel, ElfW_Rel) {
|
|
if (ELFW(R_TYPE)(rel->r_info) == R_RELATIVE) {
|
|
int sym_index = ELFW(R_SYM) (rel->r_info);
|
|
ElfW(Sym) *sym = &((ElfW(Sym) *) symtab_section->data)[sym_index];
|
|
struct sym_attr *attr = get_sym_attr(s1, sym_index, 0);
|
|
unsigned offset = attr->got_offset;
|
|
if (offset != rel->r_offset - s1->got->sh_addr)
|
|
tcc_error_noabort("huh");
|
|
rel->r_info = ELFW(R_INFO)(0, R_RELATIVE);
|
|
#if SHT_RELX == SHT_RELA
|
|
rel->r_addend = sym->st_value;
|
|
#else
|
|
/* All our REL architectures also happen to be 32bit LE. */
|
|
write32le(s1->got->data + offset, sym->st_value);
|
|
#endif
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Bind symbols of executable: resolve undefined symbols from exported symbols
|
|
in shared libraries and export non local defined symbols to shared libraries
|
|
if -rdynamic switch was given on command line */
|
|
static void bind_exe_dynsyms(TCCState *s1)
|
|
{
|
|
const char *name;
|
|
int sym_index, index;
|
|
ElfW(Sym) *sym, *esym;
|
|
int type;
|
|
|
|
/* Resolve undefined symbols from dynamic symbols. When there is a match:
|
|
- if STT_FUNC or STT_GNU_IFUNC symbol -> add it in PLT
|
|
- if STT_OBJECT symbol -> add it in .bss section with suitable reloc */
|
|
for_each_elem(symtab_section, 1, sym, ElfW(Sym)) {
|
|
if (sym->st_shndx == SHN_UNDEF) {
|
|
name = (char *) symtab_section->link->data + sym->st_name;
|
|
sym_index = find_elf_sym(s1->dynsymtab_section, name);
|
|
if (sym_index) {
|
|
esym = &((ElfW(Sym) *)s1->dynsymtab_section->data)[sym_index];
|
|
type = ELFW(ST_TYPE)(esym->st_info);
|
|
if ((type == STT_FUNC) || (type == STT_GNU_IFUNC)) {
|
|
/* Indirect functions shall have STT_FUNC type in executable
|
|
* dynsym section. Indeed, a dlsym call following a lazy
|
|
* resolution would pick the symbol value from the
|
|
* executable dynsym entry which would contain the address
|
|
* of the function wanted by the caller of dlsym instead of
|
|
* the address of the function that would return that
|
|
* address */
|
|
int dynindex
|
|
= put_elf_sym(s1->dynsym, 0, esym->st_size,
|
|
ELFW(ST_INFO)(STB_GLOBAL,STT_FUNC), 0, 0,
|
|
name);
|
|
int index = sym - (ElfW(Sym) *) symtab_section->data;
|
|
get_sym_attr(s1, index, 1)->dyn_index = dynindex;
|
|
} else if (type == STT_OBJECT) {
|
|
unsigned long offset;
|
|
ElfW(Sym) *dynsym;
|
|
offset = bss_section->data_offset;
|
|
/* XXX: which alignment ? */
|
|
offset = (offset + 16 - 1) & -16;
|
|
set_elf_sym (s1->symtab, offset, esym->st_size,
|
|
esym->st_info, 0, bss_section->sh_num, name);
|
|
index = put_elf_sym(s1->dynsym, offset, esym->st_size,
|
|
esym->st_info, 0, bss_section->sh_num,
|
|
name);
|
|
|
|
/* Ensure R_COPY works for weak symbol aliases */
|
|
if (ELFW(ST_BIND)(esym->st_info) == STB_WEAK) {
|
|
for_each_elem(s1->dynsymtab_section, 1, dynsym, ElfW(Sym)) {
|
|
if ((dynsym->st_value == esym->st_value)
|
|
&& (ELFW(ST_BIND)(dynsym->st_info) == STB_GLOBAL)) {
|
|
char *dynname = (char *) s1->dynsymtab_section->link->data
|
|
+ dynsym->st_name;
|
|
put_elf_sym(s1->dynsym, offset, dynsym->st_size,
|
|
dynsym->st_info, 0,
|
|
bss_section->sh_num, dynname);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
put_elf_reloc(s1->dynsym, bss_section,
|
|
offset, R_COPY, index);
|
|
offset += esym->st_size;
|
|
bss_section->data_offset = offset;
|
|
}
|
|
} else {
|
|
/* STB_WEAK undefined symbols are accepted */
|
|
/* XXX: _fp_hw seems to be part of the ABI, so we ignore it */
|
|
if (ELFW(ST_BIND)(sym->st_info) == STB_WEAK ||
|
|
!strcmp(name, "_fp_hw")) {
|
|
} else {
|
|
tcc_error_noabort("undefined symbol '%s'", name);
|
|
}
|
|
}
|
|
} else if (s1->rdynamic && ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
|
|
/* if -rdynamic option, then export all non local symbols */
|
|
name = (char *) symtab_section->link->data + sym->st_name;
|
|
set_elf_sym(s1->dynsym, sym->st_value, sym->st_size, sym->st_info,
|
|
0, sym->st_shndx, name);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Bind symbols of libraries: export all non local symbols of executable that
|
|
are referenced by shared libraries. The reason is that the dynamic loader
|
|
search symbol first in executable and then in libraries. Therefore a
|
|
reference to a symbol already defined by a library can still be resolved by
|
|
a symbol in the executable. */
|
|
static void bind_libs_dynsyms(TCCState *s1)
|
|
{
|
|
const char *name;
|
|
int sym_index;
|
|
ElfW(Sym) *sym, *esym;
|
|
|
|
for_each_elem(s1->dynsymtab_section, 1, esym, ElfW(Sym)) {
|
|
name = (char *) s1->dynsymtab_section->link->data + esym->st_name;
|
|
sym_index = find_elf_sym(symtab_section, name);
|
|
sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
|
|
if (sym_index && sym->st_shndx != SHN_UNDEF
|
|
&& ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
|
|
set_elf_sym(s1->dynsym, sym->st_value, sym->st_size,
|
|
sym->st_info, 0, sym->st_shndx, name);
|
|
} else if (esym->st_shndx == SHN_UNDEF) {
|
|
/* weak symbols can stay undefined */
|
|
if (ELFW(ST_BIND)(esym->st_info) != STB_WEAK)
|
|
tcc_warning("undefined dynamic symbol '%s'", name);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Export all non local symbols. This is used by shared libraries so that the
|
|
non local symbols they define can resolve a reference in another shared
|
|
library or in the executable. Correspondingly, it allows undefined local
|
|
symbols to be resolved by other shared libraries or by the executable. */
|
|
static void export_global_syms(TCCState *s1)
|
|
{
|
|
int dynindex, index;
|
|
const char *name;
|
|
ElfW(Sym) *sym;
|
|
|
|
for_each_elem(symtab_section, 1, sym, ElfW(Sym)) {
|
|
if (ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
|
|
name = (char *) symtab_section->link->data + sym->st_name;
|
|
dynindex = put_elf_sym(s1->dynsym, sym->st_value, sym->st_size,
|
|
sym->st_info, 0, sym->st_shndx, name);
|
|
index = sym - (ElfW(Sym) *) symtab_section->data;
|
|
get_sym_attr(s1, index, 1)->dyn_index = dynindex;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Allocate strings for section names and decide if an unallocated section
|
|
should be output.
|
|
NOTE: the strsec section comes last, so its size is also correct ! */
|
|
static int alloc_sec_names(TCCState *s1, int file_type, Section *strsec)
|
|
{
|
|
int i;
|
|
Section *s;
|
|
int textrel = 0;
|
|
|
|
/* Allocate strings for section names */
|
|
for(i = 1; i < s1->nb_sections; i++) {
|
|
s = s1->sections[i];
|
|
/* when generating a DLL, we include relocations but we may
|
|
patch them */
|
|
if (file_type == TCC_OUTPUT_DLL &&
|
|
s->sh_type == SHT_RELX &&
|
|
!(s->sh_flags & SHF_ALLOC) &&
|
|
(s1->sections[s->sh_info]->sh_flags & SHF_ALLOC) &&
|
|
prepare_dynamic_rel(s1, s)) {
|
|
if (s1->sections[s->sh_info]->sh_flags & SHF_EXECINSTR)
|
|
textrel = 1;
|
|
} else if ((s1->do_debug && s->sh_type != SHT_RELX) ||
|
|
file_type == TCC_OUTPUT_OBJ ||
|
|
(s->sh_flags & SHF_ALLOC) ||
|
|
i == (s1->nb_sections - 1)) {
|
|
/* we output all sections if debug or object file */
|
|
s->sh_size = s->data_offset;
|
|
}
|
|
if (s->sh_size || (s->sh_flags & SHF_ALLOC))
|
|
s->sh_name = put_elf_str(strsec, s->name);
|
|
}
|
|
strsec->sh_size = strsec->data_offset;
|
|
return textrel;
|
|
}
|
|
|
|
/* Info to be copied in dynamic section */
|
|
struct dyn_inf {
|
|
Section *dynamic;
|
|
Section *dynstr;
|
|
unsigned long data_offset;
|
|
addr_t rel_addr;
|
|
addr_t rel_size;
|
|
#if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
|
|
addr_t bss_addr;
|
|
addr_t bss_size;
|
|
#endif
|
|
};
|
|
|
|
/* Assign sections to segments and decide how are sections laid out when loaded
|
|
in memory. This function also fills corresponding program headers. */
|
|
static int layout_sections(TCCState *s1, ElfW(Phdr) *phdr, int phnum,
|
|
Section *interp, Section* strsec,
|
|
struct dyn_inf *dyninf, int *sec_order)
|
|
{
|
|
int i, j, k, file_type, sh_order_index, file_offset;
|
|
unsigned long s_align;
|
|
long long tmp;
|
|
addr_t addr;
|
|
ElfW(Phdr) *ph;
|
|
Section *s;
|
|
|
|
file_type = s1->output_type;
|
|
sh_order_index = 1;
|
|
file_offset = 0;
|
|
if (s1->output_format == TCC_OUTPUT_FORMAT_ELF)
|
|
file_offset = sizeof(ElfW(Ehdr)) + phnum * sizeof(ElfW(Phdr));
|
|
s_align = ELF_PAGE_SIZE;
|
|
if (s1->section_align)
|
|
s_align = s1->section_align;
|
|
|
|
if (phnum > 0) {
|
|
if (s1->has_text_addr) {
|
|
int a_offset, p_offset;
|
|
addr = s1->text_addr;
|
|
/* we ensure that (addr % ELF_PAGE_SIZE) == file_offset %
|
|
ELF_PAGE_SIZE */
|
|
a_offset = (int) (addr & (s_align - 1));
|
|
p_offset = file_offset & (s_align - 1);
|
|
if (a_offset < p_offset)
|
|
a_offset += s_align;
|
|
file_offset += (a_offset - p_offset);
|
|
} else {
|
|
if (file_type == TCC_OUTPUT_DLL)
|
|
addr = 0;
|
|
else
|
|
addr = ELF_START_ADDR;
|
|
/* compute address after headers */
|
|
addr += (file_offset & (s_align - 1));
|
|
}
|
|
|
|
ph = &phdr[0];
|
|
/* Leave one program headers for the program interpreter and one for
|
|
the program header table itself if needed. These are done later as
|
|
they require section layout to be done first. */
|
|
if (interp)
|
|
ph += 2;
|
|
|
|
/* dynamic relocation table information, for .dynamic section */
|
|
dyninf->rel_addr = dyninf->rel_size = 0;
|
|
#if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
|
|
dyninf->bss_addr = dyninf->bss_size = 0;
|
|
#endif
|
|
|
|
for(j = 0; j < 2; j++) {
|
|
ph->p_type = PT_LOAD;
|
|
if (j == 0)
|
|
ph->p_flags = PF_R | PF_X;
|
|
else
|
|
ph->p_flags = PF_R | PF_W;
|
|
ph->p_align = s_align;
|
|
|
|
/* Decide the layout of sections loaded in memory. This must
|
|
be done before program headers are filled since they contain
|
|
info about the layout. We do the following ordering: interp,
|
|
symbol tables, relocations, progbits, nobits */
|
|
/* XXX: do faster and simpler sorting */
|
|
for(k = 0; k < 5; k++) {
|
|
for(i = 1; i < s1->nb_sections; i++) {
|
|
s = s1->sections[i];
|
|
/* compute if section should be included */
|
|
if (j == 0) {
|
|
if ((s->sh_flags & (SHF_ALLOC | SHF_WRITE)) !=
|
|
SHF_ALLOC)
|
|
continue;
|
|
} else {
|
|
if ((s->sh_flags & (SHF_ALLOC | SHF_WRITE)) !=
|
|
(SHF_ALLOC | SHF_WRITE))
|
|
continue;
|
|
}
|
|
if (s == interp) {
|
|
if (k != 0)
|
|
continue;
|
|
} else if (s->sh_type == SHT_DYNSYM ||
|
|
s->sh_type == SHT_STRTAB ||
|
|
s->sh_type == SHT_HASH) {
|
|
if (k != 1)
|
|
continue;
|
|
} else if (s->sh_type == SHT_RELX) {
|
|
if (k != 2)
|
|
continue;
|
|
} else if (s->sh_type == SHT_NOBITS) {
|
|
if (k != 4)
|
|
continue;
|
|
} else {
|
|
if (k != 3)
|
|
continue;
|
|
}
|
|
sec_order[sh_order_index++] = i;
|
|
|
|
/* section matches: we align it and add its size */
|
|
tmp = addr;
|
|
addr = (addr + s->sh_addralign - 1) &
|
|
~(s->sh_addralign - 1);
|
|
file_offset += (int) ( addr - tmp );
|
|
s->sh_offset = file_offset;
|
|
s->sh_addr = addr;
|
|
|
|
/* update program header infos */
|
|
if (ph->p_offset == 0) {
|
|
ph->p_offset = file_offset;
|
|
ph->p_vaddr = addr;
|
|
ph->p_paddr = ph->p_vaddr;
|
|
}
|
|
/* update dynamic relocation infos */
|
|
if (s->sh_type == SHT_RELX) {
|
|
#if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
|
|
if (!strcmp(strsec->data + s->sh_name, ".rel.got")) {
|
|
dyninf->rel_addr = addr;
|
|
dyninf->rel_size += s->sh_size; /* XXX only first rel. */
|
|
}
|
|
if (!strcmp(strsec->data + s->sh_name, ".rel.bss")) {
|
|
dyninf->bss_addr = addr;
|
|
dyninf->bss_size = s->sh_size; /* XXX only first rel. */
|
|
}
|
|
#else
|
|
if (dyninf->rel_size == 0)
|
|
dyninf->rel_addr = addr;
|
|
dyninf->rel_size += s->sh_size;
|
|
#endif
|
|
}
|
|
addr += s->sh_size;
|
|
if (s->sh_type != SHT_NOBITS)
|
|
file_offset += s->sh_size;
|
|
}
|
|
}
|
|
if (j == 0) {
|
|
/* Make the first PT_LOAD segment include the program
|
|
headers itself (and the ELF header as well), it'll
|
|
come out with same memory use but will make various
|
|
tools like binutils strip work better. */
|
|
ph->p_offset &= ~(ph->p_align - 1);
|
|
ph->p_vaddr &= ~(ph->p_align - 1);
|
|
ph->p_paddr &= ~(ph->p_align - 1);
|
|
}
|
|
ph->p_filesz = file_offset - ph->p_offset;
|
|
ph->p_memsz = addr - ph->p_vaddr;
|
|
ph++;
|
|
if (j == 0) {
|
|
if (s1->output_format == TCC_OUTPUT_FORMAT_ELF) {
|
|
/* if in the middle of a page, we duplicate the page in
|
|
memory so that one copy is RX and the other is RW */
|
|
if ((addr & (s_align - 1)) != 0)
|
|
addr += s_align;
|
|
} else {
|
|
addr = (addr + s_align - 1) & ~(s_align - 1);
|
|
file_offset = (file_offset + s_align - 1) & ~(s_align - 1);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
/* all other sections come after */
|
|
for(i = 1; i < s1->nb_sections; i++) {
|
|
s = s1->sections[i];
|
|
if (phnum > 0 && (s->sh_flags & SHF_ALLOC))
|
|
continue;
|
|
sec_order[sh_order_index++] = i;
|
|
|
|
file_offset = (file_offset + s->sh_addralign - 1) &
|
|
~(s->sh_addralign - 1);
|
|
s->sh_offset = file_offset;
|
|
if (s->sh_type != SHT_NOBITS)
|
|
file_offset += s->sh_size;
|
|
}
|
|
|
|
return file_offset;
|
|
}
|
|
|
|
static void fill_unloadable_phdr(ElfW(Phdr) *phdr, int phnum, Section *interp,
|
|
Section *dynamic)
|
|
{
|
|
ElfW(Phdr) *ph;
|
|
|
|
/* if interpreter, then add corresponding program header */
|
|
if (interp) {
|
|
ph = &phdr[0];
|
|
|
|
ph->p_type = PT_PHDR;
|
|
ph->p_offset = sizeof(ElfW(Ehdr));
|
|
ph->p_filesz = ph->p_memsz = phnum * sizeof(ElfW(Phdr));
|
|
ph->p_vaddr = interp->sh_addr - ph->p_filesz;
|
|
ph->p_paddr = ph->p_vaddr;
|
|
ph->p_flags = PF_R | PF_X;
|
|
ph->p_align = 4; /* interp->sh_addralign; */
|
|
ph++;
|
|
|
|
ph->p_type = PT_INTERP;
|
|
ph->p_offset = interp->sh_offset;
|
|
ph->p_vaddr = interp->sh_addr;
|
|
ph->p_paddr = ph->p_vaddr;
|
|
ph->p_filesz = interp->sh_size;
|
|
ph->p_memsz = interp->sh_size;
|
|
ph->p_flags = PF_R;
|
|
ph->p_align = interp->sh_addralign;
|
|
}
|
|
|
|
/* if dynamic section, then add corresponding program header */
|
|
if (dynamic) {
|
|
ph = &phdr[phnum - 1];
|
|
|
|
ph->p_type = PT_DYNAMIC;
|
|
ph->p_offset = dynamic->sh_offset;
|
|
ph->p_vaddr = dynamic->sh_addr;
|
|
ph->p_paddr = ph->p_vaddr;
|
|
ph->p_filesz = dynamic->sh_size;
|
|
ph->p_memsz = dynamic->sh_size;
|
|
ph->p_flags = PF_R | PF_W;
|
|
ph->p_align = dynamic->sh_addralign;
|
|
}
|
|
}
|
|
|
|
/* Fill the dynamic section with tags describing the address and size of
|
|
sections */
|
|
static void fill_dynamic(TCCState *s1, struct dyn_inf *dyninf)
|
|
{
|
|
Section *dynamic = dyninf->dynamic;
|
|
Section *s;
|
|
|
|
/* put dynamic section entries */
|
|
put_dt(dynamic, DT_HASH, s1->dynsym->hash->sh_addr);
|
|
put_dt(dynamic, DT_STRTAB, dyninf->dynstr->sh_addr);
|
|
put_dt(dynamic, DT_SYMTAB, s1->dynsym->sh_addr);
|
|
put_dt(dynamic, DT_STRSZ, dyninf->dynstr->data_offset);
|
|
put_dt(dynamic, DT_SYMENT, sizeof(ElfW(Sym)));
|
|
#if PTR_SIZE == 8
|
|
put_dt(dynamic, DT_RELA, dyninf->rel_addr);
|
|
put_dt(dynamic, DT_RELASZ, dyninf->rel_size);
|
|
put_dt(dynamic, DT_RELAENT, sizeof(ElfW_Rel));
|
|
#else
|
|
#if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
|
|
put_dt(dynamic, DT_PLTGOT, s1->got->sh_addr);
|
|
put_dt(dynamic, DT_PLTRELSZ, dyninf->rel_size);
|
|
put_dt(dynamic, DT_JMPREL, dyninf->rel_addr);
|
|
put_dt(dynamic, DT_PLTREL, DT_REL);
|
|
put_dt(dynamic, DT_REL, dyninf->bss_addr);
|
|
put_dt(dynamic, DT_RELSZ, dyninf->bss_size);
|
|
#else
|
|
put_dt(dynamic, DT_REL, dyninf->rel_addr);
|
|
put_dt(dynamic, DT_RELSZ, dyninf->rel_size);
|
|
put_dt(dynamic, DT_RELENT, sizeof(ElfW_Rel));
|
|
#endif
|
|
#endif
|
|
put_dt(dynamic, DT_VERNEED, verneed_section->sh_addr);
|
|
put_dt(dynamic, DT_VERNEEDNUM, dt_verneednum);
|
|
put_dt(dynamic, DT_VERSYM, versym_section->sh_addr);
|
|
s = find_section_create (s1, ".preinit_array", 0);
|
|
if (s && s->data_offset) {
|
|
put_dt(dynamic, DT_PREINIT_ARRAY, s->sh_addr);
|
|
put_dt(dynamic, DT_PREINIT_ARRAYSZ, s->data_offset);
|
|
}
|
|
s = find_section_create (s1, ".init_array", 0);
|
|
if (s && s->data_offset) {
|
|
put_dt(dynamic, DT_INIT_ARRAY, s->sh_addr);
|
|
put_dt(dynamic, DT_INIT_ARRAYSZ, s->data_offset);
|
|
}
|
|
s = find_section_create (s1, ".fini_array", 0);
|
|
if (s && s->data_offset) {
|
|
put_dt(dynamic, DT_FINI_ARRAY, s->sh_addr);
|
|
put_dt(dynamic, DT_FINI_ARRAYSZ, s->data_offset);
|
|
}
|
|
s = find_section_create (s1, ".init", 0);
|
|
if (s && s->data_offset) {
|
|
put_dt(dynamic, DT_INIT, s->sh_addr);
|
|
}
|
|
s = find_section_create (s1, ".fini", 0);
|
|
if (s && s->data_offset) {
|
|
put_dt(dynamic, DT_FINI, s->sh_addr);
|
|
}
|
|
if (s1->do_debug)
|
|
put_dt(dynamic, DT_DEBUG, 0);
|
|
put_dt(dynamic, DT_NULL, 0);
|
|
}
|
|
|
|
/* Relocate remaining sections and symbols (that is those not related to
|
|
dynamic linking) */
|
|
static int final_sections_reloc(TCCState *s1)
|
|
{
|
|
int i;
|
|
Section *s;
|
|
|
|
relocate_syms(s1, s1->symtab, 0);
|
|
|
|
if (s1->nb_errors != 0)
|
|
return -1;
|
|
|
|
/* relocate sections */
|
|
/* XXX: ignore sections with allocated relocations ? */
|
|
for(i = 1; i < s1->nb_sections; i++) {
|
|
s = s1->sections[i];
|
|
if (s->reloc && (s != s1->got || s1->static_link))
|
|
relocate_section(s1, s);
|
|
}
|
|
|
|
/* relocate relocation entries if the relocation tables are
|
|
allocated in the executable */
|
|
for(i = 1; i < s1->nb_sections; i++) {
|
|
s = s1->sections[i];
|
|
if ((s->sh_flags & SHF_ALLOC) &&
|
|
s->sh_type == SHT_RELX) {
|
|
relocate_rel(s1, s);
|
|
}
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
/* Create an ELF file on disk.
|
|
This function handle ELF specific layout requirements */
|
|
static void tcc_output_elf(TCCState *s1, FILE *f, int phnum, ElfW(Phdr) *phdr,
|
|
int file_offset, int *sec_order)
|
|
{
|
|
int i, shnum, offset, size, file_type;
|
|
Section *s;
|
|
ElfW(Ehdr) ehdr;
|
|
ElfW(Shdr) shdr, *sh;
|
|
|
|
file_type = s1->output_type;
|
|
shnum = s1->nb_sections;
|
|
|
|
memset(&ehdr, 0, sizeof(ehdr));
|
|
|
|
if (phnum > 0) {
|
|
ehdr.e_phentsize = sizeof(ElfW(Phdr));
|
|
ehdr.e_phnum = phnum;
|
|
ehdr.e_phoff = sizeof(ElfW(Ehdr));
|
|
}
|
|
|
|
/* align to 4 */
|
|
file_offset = (file_offset + 3) & -4;
|
|
|
|
/* fill header */
|
|
ehdr.e_ident[0] = ELFMAG0;
|
|
ehdr.e_ident[1] = ELFMAG1;
|
|
ehdr.e_ident[2] = ELFMAG2;
|
|
ehdr.e_ident[3] = ELFMAG3;
|
|
ehdr.e_ident[4] = ELFCLASSW;
|
|
ehdr.e_ident[5] = ELFDATA2LSB;
|
|
ehdr.e_ident[6] = EV_CURRENT;
|
|
#if !defined(TCC_TARGET_PE) && (defined(__FreeBSD__) || defined(__FreeBSD_kernel__))
|
|
/* FIXME: should set only for freebsd _target_, but we exclude only PE target */
|
|
ehdr.e_ident[EI_OSABI] = ELFOSABI_FREEBSD;
|
|
#endif
|
|
#ifdef TCC_TARGET_ARM
|
|
#ifdef TCC_ARM_EABI
|
|
ehdr.e_ident[EI_OSABI] = 0;
|
|
ehdr.e_flags = EF_ARM_EABI_VER4;
|
|
if (file_type == TCC_OUTPUT_EXE || file_type == TCC_OUTPUT_DLL)
|
|
ehdr.e_flags |= EF_ARM_HASENTRY;
|
|
if (s1->float_abi == ARM_HARD_FLOAT)
|
|
ehdr.e_flags |= EF_ARM_VFP_FLOAT;
|
|
else
|
|
ehdr.e_flags |= EF_ARM_SOFT_FLOAT;
|
|
#else
|
|
ehdr.e_ident[EI_OSABI] = ELFOSABI_ARM;
|
|
#endif
|
|
#elif defined TCC_TARGET_RISCV64
|
|
ehdr.e_flags = EF_RISCV_FLOAT_ABI_DOUBLE;
|
|
#endif
|
|
switch(file_type) {
|
|
default:
|
|
case TCC_OUTPUT_EXE:
|
|
ehdr.e_type = ET_EXEC;
|
|
ehdr.e_entry = get_elf_sym_addr(s1, "_start", 1);
|
|
break;
|
|
case TCC_OUTPUT_DLL:
|
|
ehdr.e_type = ET_DYN;
|
|
ehdr.e_entry = text_section->sh_addr; /* XXX: is it correct ? */
|
|
break;
|
|
case TCC_OUTPUT_OBJ:
|
|
ehdr.e_type = ET_REL;
|
|
break;
|
|
}
|
|
ehdr.e_machine = EM_TCC_TARGET;
|
|
ehdr.e_version = EV_CURRENT;
|
|
ehdr.e_shoff = file_offset;
|
|
ehdr.e_ehsize = sizeof(ElfW(Ehdr));
|
|
ehdr.e_shentsize = sizeof(ElfW(Shdr));
|
|
ehdr.e_shnum = shnum;
|
|
ehdr.e_shstrndx = shnum - 1;
|
|
|
|
fwrite(&ehdr, 1, sizeof(ElfW(Ehdr)), f);
|
|
fwrite(phdr, 1, phnum * sizeof(ElfW(Phdr)), f);
|
|
offset = sizeof(ElfW(Ehdr)) + phnum * sizeof(ElfW(Phdr));
|
|
|
|
sort_syms(s1, symtab_section);
|
|
for(i = 1; i < s1->nb_sections; i++) {
|
|
s = s1->sections[sec_order[i]];
|
|
if (s->sh_type != SHT_NOBITS) {
|
|
while (offset < s->sh_offset) {
|
|
fputc(0, f);
|
|
offset++;
|
|
}
|
|
size = s->sh_size;
|
|
if (size)
|
|
fwrite(s->data, 1, size, f);
|
|
offset += size;
|
|
}
|
|
}
|
|
|
|
/* output section headers */
|
|
while (offset < ehdr.e_shoff) {
|
|
fputc(0, f);
|
|
offset++;
|
|
}
|
|
|
|
for(i = 0; i < s1->nb_sections; i++) {
|
|
sh = &shdr;
|
|
memset(sh, 0, sizeof(ElfW(Shdr)));
|
|
s = s1->sections[i];
|
|
if (s) {
|
|
sh->sh_name = s->sh_name;
|
|
sh->sh_type = s->sh_type;
|
|
sh->sh_flags = s->sh_flags;
|
|
sh->sh_entsize = s->sh_entsize;
|
|
sh->sh_info = s->sh_info;
|
|
if (s->link)
|
|
sh->sh_link = s->link->sh_num;
|
|
sh->sh_addralign = s->sh_addralign;
|
|
sh->sh_addr = s->sh_addr;
|
|
sh->sh_offset = s->sh_offset;
|
|
sh->sh_size = s->sh_size;
|
|
}
|
|
fwrite(sh, 1, sizeof(ElfW(Shdr)), f);
|
|
}
|
|
}
|
|
|
|
/* Write an elf, coff or "binary" file */
|
|
static int tcc_write_elf_file(TCCState *s1, const char *filename, int phnum,
|
|
ElfW(Phdr) *phdr, int file_offset, int *sec_order)
|
|
{
|
|
int fd, mode, file_type;
|
|
FILE *f;
|
|
|
|
file_type = s1->output_type;
|
|
if (file_type == TCC_OUTPUT_OBJ)
|
|
mode = 0666;
|
|
else
|
|
mode = 0777;
|
|
unlink(filename);
|
|
fd = open(filename, O_WRONLY | O_CREAT | O_TRUNC | O_BINARY, mode);
|
|
if (fd < 0) {
|
|
tcc_error_noabort("could not write '%s'", filename);
|
|
return -1;
|
|
}
|
|
f = fdopen(fd, "wb");
|
|
if (s1->verbose)
|
|
printf("<- %s\n", filename);
|
|
|
|
#ifdef TCC_TARGET_COFF
|
|
if (s1->output_format == TCC_OUTPUT_FORMAT_COFF)
|
|
tcc_output_coff(s1, f);
|
|
else
|
|
#endif
|
|
if (s1->output_format == TCC_OUTPUT_FORMAT_ELF)
|
|
tcc_output_elf(s1, f, phnum, phdr, file_offset, sec_order);
|
|
else
|
|
tcc_output_binary(s1, f, sec_order);
|
|
fclose(f);
|
|
|
|
return 0;
|
|
}
|
|
|
|
/* Sort section headers by assigned sh_addr, remove sections
|
|
that we aren't going to output. */
|
|
static void tidy_section_headers(TCCState *s1, int *sec_order)
|
|
{
|
|
int i, nnew, l, *backmap;
|
|
Section **snew, *s;
|
|
ElfW(Sym) *sym;
|
|
|
|
snew = tcc_malloc(s1->nb_sections * sizeof(snew[0]));
|
|
backmap = tcc_malloc(s1->nb_sections * sizeof(backmap[0]));
|
|
for (i = 0, nnew = 0, l = s1->nb_sections; i < s1->nb_sections; i++) {
|
|
s = s1->sections[sec_order[i]];
|
|
if (!i || s->sh_name) {
|
|
backmap[sec_order[i]] = nnew;
|
|
snew[nnew] = s;
|
|
++nnew;
|
|
} else {
|
|
backmap[sec_order[i]] = 0;
|
|
snew[--l] = s;
|
|
}
|
|
}
|
|
for (i = 0; i < nnew; i++) {
|
|
s = snew[i];
|
|
if (s) {
|
|
s->sh_num = i;
|
|
if (s->sh_type == SHT_RELX)
|
|
s->sh_info = backmap[s->sh_info];
|
|
}
|
|
}
|
|
|
|
for_each_elem(symtab_section, 1, sym, ElfW(Sym))
|
|
if (sym->st_shndx != SHN_UNDEF && sym->st_shndx < SHN_LORESERVE)
|
|
sym->st_shndx = backmap[sym->st_shndx];
|
|
if( !s1->static_link ) {
|
|
for_each_elem(s1->dynsym, 1, sym, ElfW(Sym))
|
|
if (sym->st_shndx != SHN_UNDEF && sym->st_shndx < SHN_LORESERVE)
|
|
sym->st_shndx = backmap[sym->st_shndx];
|
|
}
|
|
for (i = 0; i < s1->nb_sections; i++)
|
|
sec_order[i] = i;
|
|
tcc_free(s1->sections);
|
|
s1->sections = snew;
|
|
s1->nb_sections = nnew;
|
|
tcc_free(backmap);
|
|
}
|
|
|
|
/* Output an elf, coff or binary file */
|
|
/* XXX: suppress unneeded sections */
|
|
static int elf_output_file(TCCState *s1, const char *filename)
|
|
{
|
|
int i, ret, phnum, shnum, file_type, file_offset, *sec_order;
|
|
struct dyn_inf dyninf = {0};
|
|
ElfW(Phdr) *phdr;
|
|
ElfW(Sym) *sym;
|
|
Section *strsec, *interp, *dynamic, *dynstr;
|
|
int textrel;
|
|
|
|
file_type = s1->output_type;
|
|
s1->nb_errors = 0;
|
|
ret = -1;
|
|
phdr = NULL;
|
|
sec_order = NULL;
|
|
interp = dynamic = dynstr = NULL; /* avoid warning */
|
|
textrel = 0;
|
|
|
|
if (file_type != TCC_OUTPUT_OBJ) {
|
|
/* if linking, also link in runtime libraries (libc, libgcc, etc.) */
|
|
tcc_add_runtime(s1);
|
|
resolve_common_syms(s1);
|
|
|
|
if (!s1->static_link) {
|
|
if (file_type == TCC_OUTPUT_EXE) {
|
|
char *ptr;
|
|
/* allow override the dynamic loader */
|
|
const char *elfint = getenv("LD_SO");
|
|
if (elfint == NULL)
|
|
elfint = DEFAULT_ELFINTERP(s1);
|
|
/* add interpreter section only if executable */
|
|
interp = new_section(s1, ".interp", SHT_PROGBITS, SHF_ALLOC);
|
|
interp->sh_addralign = 1;
|
|
ptr = section_ptr_add(interp, 1 + strlen(elfint));
|
|
strcpy(ptr, elfint);
|
|
}
|
|
|
|
/* add dynamic symbol table */
|
|
s1->dynsym = new_symtab(s1, ".dynsym", SHT_DYNSYM, SHF_ALLOC,
|
|
".dynstr",
|
|
".hash", SHF_ALLOC);
|
|
dynstr = s1->dynsym->link;
|
|
versym_section->link = s1->dynsym;
|
|
verneed_section->link = dynstr;
|
|
|
|
/* add dynamic section */
|
|
dynamic = new_section(s1, ".dynamic", SHT_DYNAMIC,
|
|
SHF_ALLOC | SHF_WRITE);
|
|
dynamic->link = dynstr;
|
|
dynamic->sh_entsize = sizeof(ElfW(Dyn));
|
|
|
|
build_got(s1);
|
|
|
|
if (file_type == TCC_OUTPUT_EXE) {
|
|
bind_exe_dynsyms(s1);
|
|
if (s1->nb_errors)
|
|
goto the_end;
|
|
bind_libs_dynsyms(s1);
|
|
} else {
|
|
/* shared library case: simply export all global symbols */
|
|
export_global_syms(s1);
|
|
}
|
|
}
|
|
build_got_entries(s1);
|
|
version_add (s1);
|
|
}
|
|
|
|
/* we add a section for symbols */
|
|
strsec = new_section(s1, ".shstrtab", SHT_STRTAB, 0);
|
|
put_elf_str(strsec, "");
|
|
|
|
/* Allocate strings for section names */
|
|
textrel = alloc_sec_names(s1, file_type, strsec);
|
|
|
|
if (dynamic) {
|
|
/* add a list of needed dlls */
|
|
for(i = 0; i < s1->nb_loaded_dlls; i++) {
|
|
DLLReference *dllref = s1->loaded_dlls[i];
|
|
if (dllref->level == 0)
|
|
put_dt(dynamic, DT_NEEDED, put_elf_str(dynstr, dllref->name));
|
|
}
|
|
|
|
if (s1->rpath)
|
|
put_dt(dynamic, s1->enable_new_dtags ? DT_RUNPATH : DT_RPATH,
|
|
put_elf_str(dynstr, s1->rpath));
|
|
|
|
if (file_type == TCC_OUTPUT_DLL) {
|
|
if (s1->soname)
|
|
put_dt(dynamic, DT_SONAME, put_elf_str(dynstr, s1->soname));
|
|
/* XXX: currently, since we do not handle PIC code, we
|
|
must relocate the readonly segments */
|
|
if (textrel)
|
|
put_dt(dynamic, DT_TEXTREL, 0);
|
|
}
|
|
|
|
if (s1->symbolic)
|
|
put_dt(dynamic, DT_SYMBOLIC, 0);
|
|
|
|
dyninf.dynamic = dynamic;
|
|
dyninf.dynstr = dynstr;
|
|
/* remember offset and reserve space for 2nd call below */
|
|
dyninf.data_offset = dynamic->data_offset;
|
|
fill_dynamic(s1, &dyninf);
|
|
dynamic->sh_size = dynamic->data_offset;
|
|
dynstr->sh_size = dynstr->data_offset;
|
|
}
|
|
|
|
/* compute number of program headers */
|
|
if (file_type == TCC_OUTPUT_OBJ)
|
|
phnum = 0;
|
|
else if (file_type == TCC_OUTPUT_DLL)
|
|
phnum = 3;
|
|
else if (s1->static_link)
|
|
phnum = 2;
|
|
else
|
|
phnum = 5;
|
|
|
|
/* allocate program segment headers */
|
|
phdr = tcc_mallocz(phnum * sizeof(ElfW(Phdr)));
|
|
|
|
/* compute number of sections */
|
|
shnum = s1->nb_sections;
|
|
|
|
/* this array is used to reorder sections in the output file */
|
|
sec_order = tcc_malloc(sizeof(int) * shnum);
|
|
sec_order[0] = 0;
|
|
|
|
/* compute section to program header mapping */
|
|
file_offset = layout_sections(s1, phdr, phnum, interp, strsec, &dyninf,
|
|
sec_order);
|
|
|
|
/* Fill remaining program header and finalize relocation related to dynamic
|
|
linking. */
|
|
if (file_type != TCC_OUTPUT_OBJ) {
|
|
fill_unloadable_phdr(phdr, phnum, interp, dynamic);
|
|
if (dynamic) {
|
|
dynamic->data_offset = dyninf.data_offset;
|
|
fill_dynamic(s1, &dyninf);
|
|
|
|
/* put in GOT the dynamic section address and relocate PLT */
|
|
write32le(s1->got->data, dynamic->sh_addr);
|
|
if (file_type == TCC_OUTPUT_EXE
|
|
|| (RELOCATE_DLLPLT && file_type == TCC_OUTPUT_DLL))
|
|
relocate_plt(s1);
|
|
|
|
/* relocate symbols in .dynsym now that final addresses are known */
|
|
for_each_elem(s1->dynsym, 1, sym, ElfW(Sym)) {
|
|
if (sym->st_shndx != SHN_UNDEF && sym->st_shndx < SHN_LORESERVE) {
|
|
/* do symbol relocation */
|
|
sym->st_value += s1->sections[sym->st_shndx]->sh_addr;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* if building executable or DLL, then relocate each section
|
|
except the GOT which is already relocated */
|
|
ret = final_sections_reloc(s1);
|
|
if (ret)
|
|
goto the_end;
|
|
tidy_section_headers(s1, sec_order);
|
|
|
|
/* Perform relocation to GOT or PLT entries */
|
|
if (file_type == TCC_OUTPUT_EXE && s1->static_link)
|
|
fill_got(s1);
|
|
else if (s1->got)
|
|
fill_local_got_entries(s1);
|
|
}
|
|
|
|
/* Create the ELF file with name 'filename' */
|
|
ret = tcc_write_elf_file(s1, filename, phnum, phdr, file_offset, sec_order);
|
|
s1->nb_sections = shnum;
|
|
the_end:
|
|
tcc_free(sec_order);
|
|
tcc_free(phdr);
|
|
return ret;
|
|
}
|
|
|
|
LIBTCCAPI int tcc_output_file(TCCState *s, const char *filename)
|
|
{
|
|
int ret;
|
|
#ifdef TCC_TARGET_PE
|
|
if (s->output_type != TCC_OUTPUT_OBJ) {
|
|
ret = pe_output_file(s, filename);
|
|
} else
|
|
#endif
|
|
ret = elf_output_file(s, filename);
|
|
return ret;
|
|
}
|
|
|
|
ssize_t full_read(int fd, void *buf, size_t count) {
|
|
char *cbuf = buf;
|
|
size_t rnum = 0;
|
|
while (1) {
|
|
ssize_t num = read(fd, cbuf, count-rnum);
|
|
if (num < 0) return num;
|
|
if (num == 0) return rnum;
|
|
rnum += num;
|
|
cbuf += num;
|
|
}
|
|
}
|
|
|
|
static void *load_data(int fd, unsigned long file_offset, unsigned long size)
|
|
{
|
|
void *data;
|
|
|
|
data = tcc_malloc(size);
|
|
lseek(fd, file_offset, SEEK_SET);
|
|
full_read(fd, data, size);
|
|
return data;
|
|
}
|
|
|
|
typedef struct SectionMergeInfo {
|
|
Section *s; /* corresponding existing section */
|
|
unsigned long offset; /* offset of the new section in the existing section */
|
|
uint8_t new_section; /* true if section 's' was added */
|
|
uint8_t link_once; /* true if link once section */
|
|
} SectionMergeInfo;
|
|
|
|
ST_FUNC int tcc_object_type(int fd, ElfW(Ehdr) *h)
|
|
{
|
|
int size = full_read(fd, h, sizeof *h);
|
|
if (size == sizeof *h && 0 == memcmp(h, ELFMAG, 4)) {
|
|
if (h->e_type == ET_REL)
|
|
return AFF_BINTYPE_REL;
|
|
if (h->e_type == ET_DYN)
|
|
return AFF_BINTYPE_DYN;
|
|
} else if (size >= 8) {
|
|
if (0 == memcmp(h, ARMAG, 8))
|
|
return AFF_BINTYPE_AR;
|
|
#ifdef TCC_TARGET_COFF
|
|
if (((struct filehdr*)h)->f_magic == COFF_C67_MAGIC)
|
|
return AFF_BINTYPE_C67;
|
|
#endif
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
/* load an object file and merge it with current files */
|
|
/* XXX: handle correctly stab (debug) info */
|
|
ST_FUNC int tcc_load_object_file(TCCState *s1,
|
|
int fd, unsigned long file_offset)
|
|
{
|
|
ElfW(Ehdr) ehdr;
|
|
ElfW(Shdr) *shdr, *sh;
|
|
int size, i, j, offset, offseti, nb_syms, sym_index, ret, seencompressed;
|
|
char *strsec, *strtab;
|
|
int *old_to_new_syms;
|
|
char *sh_name, *name;
|
|
SectionMergeInfo *sm_table, *sm;
|
|
ElfW(Sym) *sym, *symtab;
|
|
ElfW_Rel *rel;
|
|
Section *s;
|
|
|
|
int stab_index;
|
|
int stabstr_index;
|
|
|
|
stab_index = stabstr_index = 0;
|
|
|
|
lseek(fd, file_offset, SEEK_SET);
|
|
if (tcc_object_type(fd, &ehdr) != AFF_BINTYPE_REL)
|
|
goto fail1;
|
|
/* test CPU specific stuff */
|
|
if (ehdr.e_ident[5] != ELFDATA2LSB ||
|
|
ehdr.e_machine != EM_TCC_TARGET) {
|
|
fail1:
|
|
tcc_error_noabort("invalid object file");
|
|
return -1;
|
|
}
|
|
/* read sections */
|
|
shdr = load_data(fd, file_offset + ehdr.e_shoff,
|
|
sizeof(ElfW(Shdr)) * ehdr.e_shnum);
|
|
sm_table = tcc_mallocz(sizeof(SectionMergeInfo) * ehdr.e_shnum);
|
|
|
|
/* load section names */
|
|
sh = &shdr[ehdr.e_shstrndx];
|
|
strsec = load_data(fd, file_offset + sh->sh_offset, sh->sh_size);
|
|
|
|
/* load symtab and strtab */
|
|
old_to_new_syms = NULL;
|
|
symtab = NULL;
|
|
strtab = NULL;
|
|
nb_syms = 0;
|
|
seencompressed = 0;
|
|
for(i = 1; i < ehdr.e_shnum; i++) {
|
|
sh = &shdr[i];
|
|
if (sh->sh_type == SHT_SYMTAB) {
|
|
if (symtab) {
|
|
tcc_error_noabort("object must contain only one symtab");
|
|
fail:
|
|
ret = -1;
|
|
goto the_end;
|
|
}
|
|
nb_syms = sh->sh_size / sizeof(ElfW(Sym));
|
|
symtab = load_data(fd, file_offset + sh->sh_offset, sh->sh_size);
|
|
sm_table[i].s = symtab_section;
|
|
|
|
/* now load strtab */
|
|
sh = &shdr[sh->sh_link];
|
|
strtab = load_data(fd, file_offset + sh->sh_offset, sh->sh_size);
|
|
}
|
|
if (sh->sh_flags & SHF_COMPRESSED)
|
|
seencompressed = 1;
|
|
}
|
|
|
|
/* now examine each section and try to merge its content with the
|
|
ones in memory */
|
|
for(i = 1; i < ehdr.e_shnum; i++) {
|
|
/* no need to examine section name strtab */
|
|
if (i == ehdr.e_shstrndx)
|
|
continue;
|
|
sh = &shdr[i];
|
|
if (sh->sh_type == SHT_RELX)
|
|
sh = &shdr[sh->sh_info];
|
|
/* ignore sections types we do not handle (plus relocs to those) */
|
|
if (sh->sh_type != SHT_PROGBITS &&
|
|
#ifdef TCC_ARM_EABI
|
|
sh->sh_type != SHT_ARM_EXIDX &&
|
|
#endif
|
|
sh->sh_type != SHT_NOBITS &&
|
|
sh->sh_type != SHT_PREINIT_ARRAY &&
|
|
sh->sh_type != SHT_INIT_ARRAY &&
|
|
sh->sh_type != SHT_FINI_ARRAY &&
|
|
strcmp(strsec + sh->sh_name, ".stabstr")
|
|
)
|
|
continue;
|
|
if (seencompressed
|
|
&& !strncmp(strsec + sh->sh_name, ".debug_", sizeof(".debug_")-1))
|
|
continue;
|
|
|
|
sh = &shdr[i];
|
|
sh_name = strsec + sh->sh_name;
|
|
if (sh->sh_addralign < 1)
|
|
sh->sh_addralign = 1;
|
|
/* find corresponding section, if any */
|
|
for(j = 1; j < s1->nb_sections;j++) {
|
|
s = s1->sections[j];
|
|
if (!strcmp(s->name, sh_name)) {
|
|
if (!strncmp(sh_name, ".gnu.linkonce",
|
|
sizeof(".gnu.linkonce") - 1)) {
|
|
/* if a 'linkonce' section is already present, we
|
|
do not add it again. It is a little tricky as
|
|
symbols can still be defined in
|
|
it. */
|
|
sm_table[i].link_once = 1;
|
|
goto next;
|
|
} else {
|
|
goto found;
|
|
}
|
|
}
|
|
}
|
|
/* not found: create new section */
|
|
s = new_section(s1, sh_name, sh->sh_type, sh->sh_flags & ~SHF_GROUP);
|
|
/* take as much info as possible from the section. sh_link and
|
|
sh_info will be updated later */
|
|
s->sh_addralign = sh->sh_addralign;
|
|
s->sh_entsize = sh->sh_entsize;
|
|
sm_table[i].new_section = 1;
|
|
found:
|
|
if (sh->sh_type != s->sh_type) {
|
|
tcc_error_noabort("invalid section type");
|
|
goto fail;
|
|
}
|
|
|
|
/* align start of section */
|
|
offset = s->data_offset;
|
|
|
|
if (0 == strcmp(sh_name, ".stab")) {
|
|
stab_index = i;
|
|
goto no_align;
|
|
}
|
|
if (0 == strcmp(sh_name, ".stabstr")) {
|
|
stabstr_index = i;
|
|
goto no_align;
|
|
}
|
|
|
|
size = sh->sh_addralign - 1;
|
|
offset = (offset + size) & ~size;
|
|
if (sh->sh_addralign > s->sh_addralign)
|
|
s->sh_addralign = sh->sh_addralign;
|
|
s->data_offset = offset;
|
|
no_align:
|
|
sm_table[i].offset = offset;
|
|
sm_table[i].s = s;
|
|
/* concatenate sections */
|
|
size = sh->sh_size;
|
|
if (sh->sh_type != SHT_NOBITS) {
|
|
unsigned char *ptr;
|
|
lseek(fd, file_offset + sh->sh_offset, SEEK_SET);
|
|
ptr = section_ptr_add(s, size);
|
|
full_read(fd, ptr, size);
|
|
} else {
|
|
s->data_offset += size;
|
|
}
|
|
next: ;
|
|
}
|
|
|
|
/* gr relocate stab strings */
|
|
if (stab_index && stabstr_index) {
|
|
Stab_Sym *a, *b;
|
|
unsigned o;
|
|
s = sm_table[stab_index].s;
|
|
a = (Stab_Sym *)(s->data + sm_table[stab_index].offset);
|
|
b = (Stab_Sym *)(s->data + s->data_offset);
|
|
o = sm_table[stabstr_index].offset;
|
|
while (a < b) {
|
|
if (a->n_strx)
|
|
a->n_strx += o;
|
|
a++;
|
|
}
|
|
}
|
|
|
|
/* second short pass to update sh_link and sh_info fields of new
|
|
sections */
|
|
for(i = 1; i < ehdr.e_shnum; i++) {
|
|
s = sm_table[i].s;
|
|
if (!s || !sm_table[i].new_section)
|
|
continue;
|
|
sh = &shdr[i];
|
|
if (sh->sh_link > 0)
|
|
s->link = sm_table[sh->sh_link].s;
|
|
if (sh->sh_type == SHT_RELX) {
|
|
s->sh_info = sm_table[sh->sh_info].s->sh_num;
|
|
/* update backward link */
|
|
s1->sections[s->sh_info]->reloc = s;
|
|
}
|
|
}
|
|
sm = sm_table;
|
|
|
|
/* resolve symbols */
|
|
old_to_new_syms = tcc_mallocz(nb_syms * sizeof(int));
|
|
|
|
sym = symtab + 1;
|
|
for(i = 1; i < nb_syms; i++, sym++) {
|
|
if (sym->st_shndx != SHN_UNDEF &&
|
|
sym->st_shndx < SHN_LORESERVE) {
|
|
sm = &sm_table[sym->st_shndx];
|
|
if (sm->link_once) {
|
|
/* if a symbol is in a link once section, we use the
|
|
already defined symbol. It is very important to get
|
|
correct relocations */
|
|
if (ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
|
|
name = strtab + sym->st_name;
|
|
sym_index = find_elf_sym(symtab_section, name);
|
|
if (sym_index)
|
|
old_to_new_syms[i] = sym_index;
|
|
}
|
|
continue;
|
|
}
|
|
/* if no corresponding section added, no need to add symbol */
|
|
if (!sm->s)
|
|
continue;
|
|
/* convert section number */
|
|
sym->st_shndx = sm->s->sh_num;
|
|
/* offset value */
|
|
sym->st_value += sm->offset;
|
|
}
|
|
/* add symbol */
|
|
name = strtab + sym->st_name;
|
|
sym_index = set_elf_sym(symtab_section, sym->st_value, sym->st_size,
|
|
sym->st_info, sym->st_other,
|
|
sym->st_shndx, name);
|
|
old_to_new_syms[i] = sym_index;
|
|
}
|
|
|
|
/* third pass to patch relocation entries */
|
|
for(i = 1; i < ehdr.e_shnum; i++) {
|
|
s = sm_table[i].s;
|
|
if (!s)
|
|
continue;
|
|
sh = &shdr[i];
|
|
offset = sm_table[i].offset;
|
|
switch(s->sh_type) {
|
|
case SHT_RELX:
|
|
/* take relocation offset information */
|
|
offseti = sm_table[sh->sh_info].offset;
|
|
for_each_elem(s, (offset / sizeof(*rel)), rel, ElfW_Rel) {
|
|
int type;
|
|
unsigned sym_index;
|
|
/* convert symbol index */
|
|
type = ELFW(R_TYPE)(rel->r_info);
|
|
sym_index = ELFW(R_SYM)(rel->r_info);
|
|
/* NOTE: only one symtab assumed */
|
|
if (sym_index >= nb_syms)
|
|
goto invalid_reloc;
|
|
sym_index = old_to_new_syms[sym_index];
|
|
/* ignore link_once in rel section. */
|
|
if (!sym_index && !sm->link_once
|
|
#ifdef TCC_TARGET_ARM
|
|
&& type != R_ARM_V4BX
|
|
#elif defined TCC_TARGET_RISCV64
|
|
&& type != R_RISCV_ALIGN
|
|
&& type != R_RISCV_RELAX
|
|
#endif
|
|
) {
|
|
invalid_reloc:
|
|
tcc_error_noabort("Invalid relocation entry [%2d] '%s' @ %.8x",
|
|
i, strsec + sh->sh_name, rel->r_offset);
|
|
goto fail;
|
|
}
|
|
rel->r_info = ELFW(R_INFO)(sym_index, type);
|
|
/* offset the relocation offset */
|
|
rel->r_offset += offseti;
|
|
#ifdef TCC_TARGET_ARM
|
|
/* Jumps and branches from a Thumb code to a PLT entry need
|
|
special handling since PLT entries are ARM code.
|
|
Unconditional bl instructions referencing PLT entries are
|
|
handled by converting these instructions into blx
|
|
instructions. Other case of instructions referencing a PLT
|
|
entry require to add a Thumb stub before the PLT entry to
|
|
switch to ARM mode. We set bit plt_thumb_stub of the
|
|
attribute of a symbol to indicate such a case. */
|
|
if (type == R_ARM_THM_JUMP24)
|
|
get_sym_attr(s1, sym_index, 1)->plt_thumb_stub = 1;
|
|
#endif
|
|
}
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
|
|
ret = 0;
|
|
the_end:
|
|
tcc_free(symtab);
|
|
tcc_free(strtab);
|
|
tcc_free(old_to_new_syms);
|
|
tcc_free(sm_table);
|
|
tcc_free(strsec);
|
|
tcc_free(shdr);
|
|
return ret;
|
|
}
|
|
|
|
typedef struct ArchiveHeader {
|
|
char ar_name[16]; /* name of this member */
|
|
char ar_date[12]; /* file mtime */
|
|
char ar_uid[6]; /* owner uid; printed as decimal */
|
|
char ar_gid[6]; /* owner gid; printed as decimal */
|
|
char ar_mode[8]; /* file mode, printed as octal */
|
|
char ar_size[10]; /* file size, printed as decimal */
|
|
char ar_fmag[2]; /* should contain ARFMAG */
|
|
} ArchiveHeader;
|
|
|
|
static int get_be32(const uint8_t *b)
|
|
{
|
|
return b[3] | (b[2] << 8) | (b[1] << 16) | (b[0] << 24);
|
|
}
|
|
|
|
static long get_be64(const uint8_t *b)
|
|
{
|
|
long long ret = get_be32(b);
|
|
ret = (ret << 32) | (unsigned)get_be32(b+4);
|
|
return (long)ret;
|
|
}
|
|
|
|
/* load only the objects which resolve undefined symbols */
|
|
static int tcc_load_alacarte(TCCState *s1, int fd, int size, int entrysize)
|
|
{
|
|
long i, bound, nsyms, sym_index, off, ret;
|
|
uint8_t *data;
|
|
const char *ar_names, *p;
|
|
const uint8_t *ar_index;
|
|
ElfW(Sym) *sym;
|
|
|
|
data = tcc_malloc(size);
|
|
if (full_read(fd, data, size) != size)
|
|
goto fail;
|
|
nsyms = entrysize == 4 ? get_be32(data) : get_be64(data);
|
|
ar_index = data + entrysize;
|
|
ar_names = (char *) ar_index + nsyms * entrysize;
|
|
|
|
do {
|
|
bound = 0;
|
|
for(p = ar_names, i = 0; i < nsyms; i++, p += strlen(p)+1) {
|
|
sym_index = find_elf_sym(symtab_section, p);
|
|
if(sym_index) {
|
|
sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
|
|
if(sym->st_shndx == SHN_UNDEF) {
|
|
off = (entrysize == 4
|
|
? get_be32(ar_index + i * 4)
|
|
: get_be64(ar_index + i * 8))
|
|
+ sizeof(ArchiveHeader);
|
|
++bound;
|
|
if(tcc_load_object_file(s1, fd, off) < 0) {
|
|
fail:
|
|
ret = -1;
|
|
goto the_end;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
} while(bound);
|
|
ret = 0;
|
|
the_end:
|
|
tcc_free(data);
|
|
return ret;
|
|
}
|
|
|
|
/* load a '.a' file */
|
|
ST_FUNC int tcc_load_archive(TCCState *s1, int fd, int alacarte)
|
|
{
|
|
ArchiveHeader hdr;
|
|
char ar_size[11];
|
|
char ar_name[17];
|
|
char magic[8];
|
|
int size, len, i;
|
|
unsigned long file_offset;
|
|
|
|
/* skip magic which was already checked */
|
|
full_read(fd, magic, sizeof(magic));
|
|
|
|
for(;;) {
|
|
len = full_read(fd, &hdr, sizeof(hdr));
|
|
if (len == 0)
|
|
break;
|
|
if (len != sizeof(hdr)) {
|
|
tcc_error_noabort("invalid archive");
|
|
return -1;
|
|
}
|
|
memcpy(ar_size, hdr.ar_size, sizeof(hdr.ar_size));
|
|
ar_size[sizeof(hdr.ar_size)] = '\0';
|
|
size = strtol(ar_size, NULL, 0);
|
|
memcpy(ar_name, hdr.ar_name, sizeof(hdr.ar_name));
|
|
for(i = sizeof(hdr.ar_name) - 1; i >= 0; i--) {
|
|
if (ar_name[i] != ' ')
|
|
break;
|
|
}
|
|
ar_name[i + 1] = '\0';
|
|
file_offset = lseek(fd, 0, SEEK_CUR);
|
|
/* align to even */
|
|
size = (size + 1) & ~1;
|
|
if (!strcmp(ar_name, "/")) {
|
|
/* coff symbol table : we handle it */
|
|
if (alacarte)
|
|
return tcc_load_alacarte(s1, fd, size, 4);
|
|
} else if (!strcmp(ar_name, "/SYM64/")) {
|
|
if (alacarte)
|
|
return tcc_load_alacarte(s1, fd, size, 8);
|
|
} else {
|
|
ElfW(Ehdr) ehdr;
|
|
if (tcc_object_type(fd, &ehdr) == AFF_BINTYPE_REL) {
|
|
if (tcc_load_object_file(s1, fd, file_offset) < 0)
|
|
return -1;
|
|
}
|
|
}
|
|
lseek(fd, file_offset + size, SEEK_SET);
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
#ifndef TCC_TARGET_PE
|
|
/* Set LV[I] to the global index of sym-version (LIB,VERSION). Maybe resizes
|
|
LV, maybe create a new entry for (LIB,VERSION). */
|
|
static void set_ver_to_ver(int *n, int **lv, int i, char *lib, char *version)
|
|
{
|
|
while (i >= *n) {
|
|
*lv = tcc_realloc(*lv, (*n + 1) * sizeof(**lv));
|
|
(*lv)[(*n)++] = -1;
|
|
}
|
|
if ((*lv)[i] == -1) {
|
|
int v, prev_same_lib = -1;
|
|
for (v = 0; v < nb_sym_versions; v++) {
|
|
if (strcmp(sym_versions[v].lib, lib))
|
|
continue;
|
|
prev_same_lib = v;
|
|
if (!strcmp(sym_versions[v].version, version))
|
|
break;
|
|
}
|
|
if (v == nb_sym_versions) {
|
|
sym_versions = tcc_realloc (sym_versions,
|
|
(v + 1) * sizeof(*sym_versions));
|
|
sym_versions[v].lib = tcc_strdup(lib);
|
|
sym_versions[v].version = tcc_strdup(version);
|
|
sym_versions[v].out_index = 0;
|
|
sym_versions[v].prev_same_lib = prev_same_lib;
|
|
nb_sym_versions++;
|
|
}
|
|
(*lv)[i] = v;
|
|
}
|
|
}
|
|
|
|
/* Associates symbol SYM_INDEX (in dynsymtab) with sym-version index
|
|
VERNDX. */
|
|
static void
|
|
set_sym_version(int sym_index, int verndx)
|
|
{
|
|
if (sym_index >= nb_sym_to_version) {
|
|
int newelems = sym_index ? sym_index * 2 : 1;
|
|
sym_to_version = tcc_realloc(sym_to_version,
|
|
newelems * sizeof(*sym_to_version));
|
|
memset(sym_to_version + nb_sym_to_version, -1,
|
|
(newelems - nb_sym_to_version) * sizeof(*sym_to_version));
|
|
nb_sym_to_version = newelems;
|
|
}
|
|
if (sym_to_version[sym_index] < 0)
|
|
sym_to_version[sym_index] = verndx;
|
|
}
|
|
|
|
/* load a DLL and all referenced DLLs. 'level = 0' means that the DLL
|
|
is referenced by the user (so it should be added as DT_NEEDED in
|
|
the generated ELF file) */
|
|
ST_FUNC int tcc_load_dll(TCCState *s1, int fd, const char *filename, int level)
|
|
{
|
|
ElfW(Ehdr) ehdr;
|
|
ElfW(Shdr) *shdr, *sh, *sh1;
|
|
int i, j, nb_syms, nb_dts, sym_bind, ret;
|
|
ElfW(Sym) *sym, *dynsym;
|
|
ElfW(Dyn) *dt, *dynamic;
|
|
int nb_versyms;
|
|
ElfW(Verdef) *verdef, *vdef;
|
|
ElfW(Verneed) *verneed, *vneed;
|
|
ElfW(Half) *versym, *vsym;
|
|
char *dynstr;
|
|
uint32_t next;
|
|
int sym_index;
|
|
char *lib, *version;
|
|
int nb_local_ver = 0, *local_ver = NULL;
|
|
const char *name, *soname;
|
|
DLLReference *dllref;
|
|
|
|
full_read(fd, &ehdr, sizeof(ehdr));
|
|
|
|
/* test CPU specific stuff */
|
|
if (ehdr.e_ident[5] != ELFDATA2LSB ||
|
|
ehdr.e_machine != EM_TCC_TARGET) {
|
|
tcc_error_noabort("bad architecture");
|
|
return -1;
|
|
}
|
|
|
|
/* read sections */
|
|
shdr = load_data(fd, ehdr.e_shoff, sizeof(ElfW(Shdr)) * ehdr.e_shnum);
|
|
|
|
/* load dynamic section and dynamic symbols */
|
|
nb_syms = 0;
|
|
nb_dts = 0;
|
|
dynamic = NULL;
|
|
dynsym = NULL; /* avoid warning */
|
|
dynstr = NULL; /* avoid warning */
|
|
nb_versyms = 0;
|
|
verdef = NULL;
|
|
verneed = NULL;
|
|
versym = NULL;
|
|
for(i = 0, sh = shdr; i < ehdr.e_shnum; i++, sh++) {
|
|
switch(sh->sh_type) {
|
|
case SHT_DYNAMIC:
|
|
nb_dts = sh->sh_size / sizeof(ElfW(Dyn));
|
|
dynamic = load_data(fd, sh->sh_offset, sh->sh_size);
|
|
break;
|
|
case SHT_DYNSYM:
|
|
nb_syms = sh->sh_size / sizeof(ElfW(Sym));
|
|
dynsym = load_data(fd, sh->sh_offset, sh->sh_size);
|
|
sh1 = &shdr[sh->sh_link];
|
|
dynstr = load_data(fd, sh1->sh_offset, sh1->sh_size);
|
|
break;
|
|
case SHT_GNU_verdef:
|
|
verdef = load_data(fd, sh->sh_offset, sh->sh_size);
|
|
break;
|
|
case SHT_GNU_verneed:
|
|
verneed = load_data(fd, sh->sh_offset, sh->sh_size);
|
|
break;
|
|
case SHT_GNU_versym:
|
|
nb_versyms = sh->sh_size / sizeof(ElfW(Half));
|
|
versym = load_data(fd, sh->sh_offset, sh->sh_size);
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
|
|
/* compute the real library name */
|
|
soname = tcc_basename(filename);
|
|
|
|
for(i = 0, dt = dynamic; i < nb_dts; i++, dt++) {
|
|
if (dt->d_tag == DT_SONAME) {
|
|
soname = dynstr + dt->d_un.d_val;
|
|
}
|
|
}
|
|
|
|
/* if the dll is already loaded, do not load it */
|
|
for(i = 0; i < s1->nb_loaded_dlls; i++) {
|
|
dllref = s1->loaded_dlls[i];
|
|
if (!strcmp(soname, dllref->name)) {
|
|
/* but update level if needed */
|
|
if (level < dllref->level)
|
|
dllref->level = level;
|
|
ret = 0;
|
|
goto the_end;
|
|
}
|
|
}
|
|
|
|
if (nb_versyms != nb_syms) {
|
|
tcc_free (versym);
|
|
versym = NULL;
|
|
}
|
|
|
|
#define DEBUG_VERSION 0
|
|
|
|
if (versym && verdef) {
|
|
lib = NULL;
|
|
vdef = verdef;
|
|
do {
|
|
ElfW(Verdaux) *verdaux =
|
|
(ElfW(Verdaux) *) (((char *) vdef) + vdef->vd_aux);
|
|
|
|
#if DEBUG_VERSION
|
|
printf ("verdef: version:%u flags:%u index:%u, hash:%u\n",
|
|
vdef->vd_version, vdef->vd_flags, vdef->vd_ndx,
|
|
vdef->vd_hash);
|
|
#endif
|
|
if (vdef->vd_cnt) {
|
|
version = dynstr + verdaux->vda_name;
|
|
|
|
if (lib == NULL)
|
|
lib = version;
|
|
else
|
|
set_ver_to_ver(&nb_local_ver, &local_ver, vdef->vd_ndx,
|
|
lib, version);
|
|
#if DEBUG_VERSION
|
|
printf (" verdaux(%u): %s\n", vdef->vd_ndx, version);
|
|
#endif
|
|
}
|
|
next = vdef->vd_next;
|
|
vdef = (ElfW(Verdef) *) (((char *) vdef) + next);
|
|
} while (next);
|
|
}
|
|
if (versym && verneed) {
|
|
vneed = verneed;
|
|
do {
|
|
ElfW(Vernaux) *vernaux =
|
|
(ElfW(Vernaux) *) (((char *) vneed) + vneed->vn_aux);
|
|
|
|
lib = dynstr + vneed->vn_file;
|
|
#if DEBUG_VERSION
|
|
printf ("verneed: %u %s\n", vneed->vn_version, lib);
|
|
#endif
|
|
for (i = 0; i < vneed->vn_cnt; i++) {
|
|
if ((vernaux->vna_other & 0x8000) == 0) { /* hidden */
|
|
version = dynstr + vernaux->vna_name;
|
|
set_ver_to_ver(&nb_local_ver, &local_ver, vernaux->vna_other,
|
|
lib, version);
|
|
#if DEBUG_VERSION
|
|
printf (" vernaux(%u): %u %u %s\n",
|
|
vernaux->vna_other, vernaux->vna_hash,
|
|
vernaux->vna_flags, version);
|
|
#endif
|
|
}
|
|
vernaux = (ElfW(Vernaux) *) (((char *) vernaux) + vernaux->vna_next);
|
|
}
|
|
next = vneed->vn_next;
|
|
vneed = (ElfW(Verneed) *) (((char *) vneed) + next);
|
|
} while (next);
|
|
}
|
|
|
|
#if DEBUG_VERSION
|
|
for (i = 0; i < nb_local_ver; i++) {
|
|
if (local_ver[i] > 0) {
|
|
printf ("%d: lib: %s, version %s\n",
|
|
i, sym_versions[local_ver[i]].lib,
|
|
sym_version[local_ver[i]].version);
|
|
}
|
|
}
|
|
#endif
|
|
|
|
/* add the dll and its level */
|
|
dllref = tcc_mallocz(sizeof(DLLReference) + strlen(soname));
|
|
dllref->level = level;
|
|
strcpy(dllref->name, soname);
|
|
dynarray_add(&s1->loaded_dlls, &s1->nb_loaded_dlls, dllref);
|
|
|
|
/* add dynamic symbols in dynsym_section */
|
|
for(i = 1, sym = dynsym + 1, vsym = versym + 1; i < nb_syms; i++, sym++, vsym++) {
|
|
sym_bind = ELFW(ST_BIND)(sym->st_info);
|
|
if (sym_bind == STB_LOCAL)
|
|
continue;
|
|
name = dynstr + sym->st_name;
|
|
sym_index = set_elf_sym(s1->dynsymtab_section, sym->st_value, sym->st_size,
|
|
sym->st_info, sym->st_other, sym->st_shndx, name);
|
|
if (versym && (*vsym & 0x8000) == 0 &&
|
|
*vsym > 0 && *vsym < nb_local_ver) {
|
|
set_sym_version(sym_index, local_ver[*vsym]);
|
|
}
|
|
}
|
|
|
|
/* load all referenced DLLs */
|
|
for(i = 0, dt = dynamic; i < nb_dts; i++, dt++) {
|
|
switch(dt->d_tag) {
|
|
case DT_NEEDED:
|
|
name = dynstr + dt->d_un.d_val;
|
|
for(j = 0; j < s1->nb_loaded_dlls; j++) {
|
|
dllref = s1->loaded_dlls[j];
|
|
if (!strcmp(name, dllref->name))
|
|
goto already_loaded;
|
|
}
|
|
if (tcc_add_dll(s1, name, AFF_REFERENCED_DLL) < 0) {
|
|
tcc_error_noabort("referenced dll '%s' not found", name);
|
|
ret = -1;
|
|
goto the_end;
|
|
}
|
|
already_loaded:
|
|
break;
|
|
}
|
|
}
|
|
ret = 0;
|
|
the_end:
|
|
tcc_free(local_ver);
|
|
tcc_free(dynstr);
|
|
tcc_free(dynsym);
|
|
tcc_free(dynamic);
|
|
tcc_free(verdef);
|
|
tcc_free(verneed);
|
|
tcc_free(versym);
|
|
tcc_free(shdr);
|
|
return ret;
|
|
}
|
|
|
|
#define LD_TOK_NAME 256
|
|
#define LD_TOK_EOF (-1)
|
|
|
|
/* return next ld script token */
|
|
static int ld_next(TCCState *s1, char *name, int name_size)
|
|
{
|
|
int c;
|
|
char *q;
|
|
|
|
redo:
|
|
switch(ch) {
|
|
case ' ':
|
|
case '\t':
|
|
case '\f':
|
|
case '\v':
|
|
case '\r':
|
|
case '\n':
|
|
inp();
|
|
goto redo;
|
|
case '/':
|
|
minp();
|
|
if (ch == '*') {
|
|
file->buf_ptr = parse_comment(file->buf_ptr);
|
|
ch = file->buf_ptr[0];
|
|
goto redo;
|
|
} else {
|
|
q = name;
|
|
*q++ = '/';
|
|
goto parse_name;
|
|
}
|
|
break;
|
|
case '\\':
|
|
ch = handle_eob();
|
|
if (ch != '\\')
|
|
goto redo;
|
|
/* fall through */
|
|
/* case 'a' ... 'z': */
|
|
case 'a':
|
|
case 'b':
|
|
case 'c':
|
|
case 'd':
|
|
case 'e':
|
|
case 'f':
|
|
case 'g':
|
|
case 'h':
|
|
case 'i':
|
|
case 'j':
|
|
case 'k':
|
|
case 'l':
|
|
case 'm':
|
|
case 'n':
|
|
case 'o':
|
|
case 'p':
|
|
case 'q':
|
|
case 'r':
|
|
case 's':
|
|
case 't':
|
|
case 'u':
|
|
case 'v':
|
|
case 'w':
|
|
case 'x':
|
|
case 'y':
|
|
case 'z':
|
|
/* case 'A' ... 'z': */
|
|
case 'A':
|
|
case 'B':
|
|
case 'C':
|
|
case 'D':
|
|
case 'E':
|
|
case 'F':
|
|
case 'G':
|
|
case 'H':
|
|
case 'I':
|
|
case 'J':
|
|
case 'K':
|
|
case 'L':
|
|
case 'M':
|
|
case 'N':
|
|
case 'O':
|
|
case 'P':
|
|
case 'Q':
|
|
case 'R':
|
|
case 'S':
|
|
case 'T':
|
|
case 'U':
|
|
case 'V':
|
|
case 'W':
|
|
case 'X':
|
|
case 'Y':
|
|
case 'Z':
|
|
case '_':
|
|
case '.':
|
|
case '$':
|
|
case '~':
|
|
q = name;
|
|
parse_name:
|
|
for(;;) {
|
|
if (!((ch >= 'a' && ch <= 'z') ||
|
|
(ch >= 'A' && ch <= 'Z') ||
|
|
(ch >= '0' && ch <= '9') ||
|
|
strchr("/.-_+=$:\\,~", ch)))
|
|
break;
|
|
if ((q - name) < name_size - 1) {
|
|
*q++ = ch;
|
|
}
|
|
minp();
|
|
}
|
|
*q = '\0';
|
|
c = LD_TOK_NAME;
|
|
break;
|
|
case CH_EOF:
|
|
c = LD_TOK_EOF;
|
|
break;
|
|
default:
|
|
c = ch;
|
|
inp();
|
|
break;
|
|
}
|
|
return c;
|
|
}
|
|
|
|
static int ld_add_file(TCCState *s1, const char filename[])
|
|
{
|
|
if (filename[0] == '/') {
|
|
if (CONFIG_SYSROOT[0] == '\0'
|
|
&& tcc_add_file_internal(s1, filename, AFF_TYPE_BIN) == 0)
|
|
return 0;
|
|
filename = tcc_basename(filename);
|
|
}
|
|
return tcc_add_dll(s1, filename, 0);
|
|
}
|
|
|
|
static inline int new_undef_syms(void)
|
|
{
|
|
int ret = 0;
|
|
ret = new_undef_sym;
|
|
new_undef_sym = 0;
|
|
return ret;
|
|
}
|
|
|
|
static int ld_add_file_list(TCCState *s1, const char *cmd, int as_needed)
|
|
{
|
|
char filename[1024], libname[1024];
|
|
int t, group, nblibs = 0, ret = 0;
|
|
char **libs = NULL;
|
|
|
|
group = !strcmp(cmd, "GROUP");
|
|
if (!as_needed)
|
|
new_undef_syms();
|
|
t = ld_next(s1, filename, sizeof(filename));
|
|
if (t != '(')
|
|
expect("(");
|
|
t = ld_next(s1, filename, sizeof(filename));
|
|
for(;;) {
|
|
libname[0] = '\0';
|
|
if (t == LD_TOK_EOF) {
|
|
tcc_error_noabort("unexpected end of file");
|
|
ret = -1;
|
|
goto lib_parse_error;
|
|
} else if (t == ')') {
|
|
break;
|
|
} else if (t == '-') {
|
|
t = ld_next(s1, filename, sizeof(filename));
|
|
if ((t != LD_TOK_NAME) || (filename[0] != 'l')) {
|
|
tcc_error_noabort("library name expected");
|
|
ret = -1;
|
|
goto lib_parse_error;
|
|
}
|
|
pstrcpy(libname, sizeof libname, &filename[1]);
|
|
if (s1->static_link) {
|
|
snprintf(filename, sizeof filename, "lib%s.a", libname);
|
|
} else {
|
|
snprintf(filename, sizeof filename, "lib%s.so", libname);
|
|
}
|
|
} else if (t != LD_TOK_NAME) {
|
|
tcc_error_noabort("filename expected");
|
|
ret = -1;
|
|
goto lib_parse_error;
|
|
}
|
|
if (!strcmp(filename, "AS_NEEDED")) {
|
|
ret = ld_add_file_list(s1, cmd, 1);
|
|
if (ret)
|
|
goto lib_parse_error;
|
|
} else {
|
|
/* TODO: Implement AS_NEEDED support. Ignore it for now */
|
|
if (!as_needed) {
|
|
ret = ld_add_file(s1, filename);
|
|
if (ret)
|
|
goto lib_parse_error;
|
|
if (group) {
|
|
/* Add the filename *and* the libname to avoid future conversions */
|
|
dynarray_add(&libs, &nblibs, tcc_strdup(filename));
|
|
if (libname[0] != '\0')
|
|
dynarray_add(&libs, &nblibs, tcc_strdup(libname));
|
|
}
|
|
}
|
|
}
|
|
t = ld_next(s1, filename, sizeof(filename));
|
|
if (t == ',') {
|
|
t = ld_next(s1, filename, sizeof(filename));
|
|
}
|
|
}
|
|
if (group && !as_needed) {
|
|
while (new_undef_syms()) {
|
|
int i;
|
|
|
|
for (i = 0; i < nblibs; i ++)
|
|
ld_add_file(s1, libs[i]);
|
|
}
|
|
}
|
|
lib_parse_error:
|
|
dynarray_reset(&libs, &nblibs);
|
|
return ret;
|
|
}
|
|
|
|
/* interpret a subset of GNU ldscripts to handle the dummy libc.so
|
|
files */
|
|
ST_FUNC int tcc_load_ldscript(TCCState *s1)
|
|
{
|
|
char cmd[64];
|
|
char filename[1024];
|
|
int t, ret;
|
|
|
|
ch = handle_eob();
|
|
for(;;) {
|
|
t = ld_next(s1, cmd, sizeof(cmd));
|
|
if (t == LD_TOK_EOF)
|
|
return 0;
|
|
else if (t != LD_TOK_NAME)
|
|
return -1;
|
|
if (!strcmp(cmd, "INPUT") ||
|
|
!strcmp(cmd, "GROUP")) {
|
|
ret = ld_add_file_list(s1, cmd, 0);
|
|
if (ret)
|
|
return ret;
|
|
} else if (!strcmp(cmd, "OUTPUT_FORMAT") ||
|
|
!strcmp(cmd, "TARGET")) {
|
|
/* ignore some commands */
|
|
t = ld_next(s1, cmd, sizeof(cmd));
|
|
if (t != '(')
|
|
expect("(");
|
|
for(;;) {
|
|
t = ld_next(s1, filename, sizeof(filename));
|
|
if (t == LD_TOK_EOF) {
|
|
tcc_error_noabort("unexpected end of file");
|
|
return -1;
|
|
} else if (t == ')') {
|
|
break;
|
|
}
|
|
}
|
|
} else {
|
|
return -1;
|
|
}
|
|
}
|
|
return 0;
|
|
}
|
|
#endif /* !TCC_TARGET_PE */
|