GNU libc.so 如何既是共享对象又是独立的可执行文件?

How is the GNU libc.so both a shared object and a standalone executable?

在Linux中,GNU标准C库(libc.so)的共享库不仅是共享库,还可以运行作为独立的可执行文件,这打印出版本信息:

[me@computer ~]$ /lib/libc.so.6 

GNU C Library stable release version 2.12, by Roland McGrath et al.
Copyright (C) 2010 Free Software Foundation, Inc.
This is free software; see the source for copying conditions.
There is NO warranty; not even for MERCHANTABILITY or FITNESS FOR A
PARTICULAR PURPOSE.
Compiled by GNU CC version 4.4.7 20120313 (Red Hat 4.4.7-11).
Compiled on a Linux 2.6.32 system on 2015-01-07.
Available extensions:
    The C stubs add-on version 2.1.2.
    crypt add-on version 2.1 by Michael Glad and others
    GNU Libidn by Simon Josefsson
    Native POSIX Threads Library by Ulrich Drepper et al
    BIND-8.2.3-T5B
    RT using linux kernel aio
libc ABIs: UNIQUE IFUNC
For bug reporting instructions, please see:
<http://www.gnu.org/software/libc/bugs.html>.

他们是怎么做到的?我尝试创建一个共享库,它也恰好有一个 main() 函数,但是当我尝试 运行 它时它出现了段错误。

我尝试了什么:

/* myso.c */
#include <stdlib.h>
#include <stdio.h>

static void foo(void) {
    printf("hello foo\n");
}

int main(int argc, char *argv[]) {
    printf("hello world\n");
    foo();
    return 0;
}

然后:

$ gcc -Wall -fPIC -shared -o myso.so myso.c
$ ./myso.so
Segmentation fault (core dumped)

注意:我真的不想出于任何实际目的这样做,我只是想知道 GNU 人(和女孩)是如何做到的。

glibc 的文件 Makerules 中:

# Give libc.so an entry point and make it directly runnable itself.
LDFLAGS-c.so += -e __libc_main

并且在csu/version.c

extern void __libc_print_version (void);
void
__libc_print_version (void)
{
  __write (STDOUT_FILENO, banner, sizeof banner - 1);
}

这是由 __libc_main() 调用的。

在文件elf/interp.c中,程序解释器被添加到共享对象。

这适用于我的 64 位 Linux:gcc -Wall -Wextra -fPIC -shared -o myso.so myso.c

//myso.c
#include <unistd.h>

char const __invoke_dynamic_linker__[] __attribute__ ((section (".interp")))
#ifdef __LP64__
  = "/lib64/ld-linux-x86-64.so.2";
#else
  = "/lib/ld-linux.so.2";
#endif

void _start(void)
{
    static char const msg[] = "Hello world!\n";

    write(STDOUT_FILENO, msg, sizeof msg - 1);          
    _exit(0);
}

__invoke_dynamic_linker__[] 行是必需的,因为没有它就无法动态链接 write_exit。这个变量的名字并不重要。 ld-dynamic-linker 有一个选项,它会做同样的事情,但它会被 -shared 忽略,但将该行放入源代码中是有效的。

这是一个没有动态链接的变体:

#include <unistd.h>
#include <sys/syscall.h>

__asm__(
#ifdef __LP64__
    "syscall: mov    %rdi,%rax;"
    "   mov    %rsi,%rdi;"
    "   mov    %rdx,%rsi;"
    "   mov    %rcx,%rdx;"
    "   mov    %r8,%r10;"
    "   mov    %r9,%r8;"
    "   mov    0x8(%rsp),%r9;"
    "   syscall;"
    "   cmp    [=13=]xfffffffffffff001,%rax;"
    "   jae    __syscall_error;"
    "   retq;   "
    "__syscall_error: neg    %rax;"
    "   mov    %eax,%fs:0xffffffffffffffd0;"
    "   or     [=13=]xffffffffffffffff,%rax;"
    "   retq;"   
#else
    "syscall:   push   %ebp;"
    "   push   %edi;"
    "   push   %esi;"
    "   push   %ebx;"
    "   mov    0x2c(%esp),%ebp;"
    "   mov    0x28(%esp),%edi;"
    "   mov    0x24(%esp),%esi;"
    "   mov    0x20(%esp),%edx;"
    "   mov    0x1c(%esp),%ecx;"
    "   mov    0x18(%esp),%ebx;"
    "   mov    0x14(%esp),%eax;"
    "   int    [=13=]x80;"
    "   pop    %ebx;"
    "   pop    %esi;"
    "   pop    %edi;"
    "   pop    %ebp;"
    "   cmp    [=13=]xfffff001,%eax;"
    "   jae    __syscall_error;"
    "   ret;"    
    "__syscall_error:   neg    %eax;"
    "   mov    %gs:0x0,%ecx;"
    "   mov    %eax,-0x18(%ecx);"
    "   mov    [=13=]xffffffff,%eax;"
    "   ret;"    
#endif
);

void _start(void)
{
    static char const msg[] = "Hello world!\n";

    syscall(SYS_write, STDOUT_FILENO, msg, sizeof msg - 1);
    syscall(SYS_exit, 0);
}