| /* http://www.muppetlabs.com/~breadbox/software/elfkickers.html */ |
| |
| /* sstrip: Copyright (C) 1999-2001 by Brian Raiter, under the GNU |
| * General Public License. No warranty. See COPYING for details. |
| * |
| * Aug 23, 2004 Hacked by Manuel Novoa III <mjn3@codepoet.org> to |
| * handle targets of different endianness and/or elf class, making |
| * it more useful in a cross-devel environment. |
| */ |
| |
| /* ============== original README =================== |
| * |
| * sstrip is a small utility that removes the contents at the end of an |
| * ELF file that are not part of the program's memory image. |
| * |
| * Most ELF executables are built with both a program header table and a |
| * section header table. However, only the former is required in order |
| * for the OS to load, link and execute a program. sstrip attempts to |
| * extract the ELF header, the program header table, and its contents, |
| * leaving everything else in the bit bucket. It can only remove parts of |
| * the file that occur at the end, after the parts to be saved. However, |
| * this almost always includes the section header table, and occasionally |
| * a few random sections that are not used when running a program. |
| * |
| * It should be noted that the GNU bfd library is (understandably) |
| * dependent on the section header table as an index to the file's |
| * contents. Thus, an executable file that has no section header table |
| * cannot be used with gdb, objdump, or any other program based upon the |
| * bfd library, at all. In fact, the program will not even recognize the |
| * file as a valid executable. (This limitation is noted in the source |
| * code comments for bfd, and is marked "FIXME", so this may change at |
| * some future date. However, I would imagine that it is a pretty |
| * low-priority item, as executables without a section header table are |
| * rare in the extreme.) This probably also explains why strip doesn't |
| * offer the option to do this. |
| * |
| * Shared library files may also have their section header table removed. |
| * Such a library will still function; however, it will no longer be |
| * possible for a compiler to link a new program against it. |
| * |
| * As an added bonus, sstrip also tries to remove trailing zero bytes |
| * from the end of the file. (This normally cannot be done with an |
| * executable that has a section header table.) |
| * |
| * sstrip is a very simplistic program. It depends upon the common |
| * practice of putting the parts of the file that contribute to the |
| * memory image at the front, and the remaining material at the end. This |
| * permits it to discard the latter material without affecting file |
| * offsets and memory addresses in what remains. Of course, the ELF |
| * standard permits files to be organized in almost any order, so if a |
| * pathological linker decided to put its section headers at the top, |
| * sstrip would be useless on such executables. |
| */ |
| |
| #include <stdio.h> |
| #include <stdlib.h> |
| #include <string.h> |
| #include <errno.h> |
| #include <unistd.h> |
| #include <fcntl.h> |
| #include <elf.h> |
| #include <endian.h> |
| #include <byteswap.h> |
| |
| #ifndef TRUE |
| #define TRUE 1 |
| #define FALSE 0 |
| #endif |
| |
| /* The name of the program. main() sets it from argv[0] before any |
| * file is processed, and err() uses it as the leading field of every |
| * diagnostic. |
| */ |
| static char const *progname; |
| |
| /* The name of the current file. main() points it at each command-line |
| * argument in turn, and err() prints it after the program name so that |
| * a diagnostic identifies the file it refers to. |
| */ |
| static char const *filename; |
| |
| |
| /* A simple error-handling function. FALSE is always returned for the |
| * convenience of the caller. |
| */ |
| static int err(char const *errmsg) |
| { |
| fprintf(stderr, "%s: %s: %s\n", progname, filename, errmsg); |
| return FALSE; |
| } |
| |
/* A flag to signal the need for endian reversal. readelfheaderident()
 * sets it to nonzero when the byte order recorded in the ELF file
 * differs from the byte order of the host.
 */
static int do_reverse_endian;

/* Get a value from the elf header, compensating for endianness.
 *
 * X is any 1-, 2-, 4- or 8-byte integer lvalue or expression. The
 * result is a uint64_t holding the value of X, byte-swapped according
 * to sizeof(X) when do_reverse_endian is set. X is evaluated exactly
 * once at run time (the sizeof operands are not evaluated). Any other
 * operand size is a programming error: a message is printed and the
 * program exits with EXIT_FAILURE.
 *
 * This relies on GNU statement expressions.
 */
#define EGET(X) \
    (__extension__ ({ \
        uint64_t eget_value_; \
        if (!do_reverse_endian || sizeof(X) == 1) { \
            eget_value_ = (X); \
        } else if (sizeof(X) == 2) { \
            eget_value_ = bswap_16((X)); \
        } else if (sizeof(X) == 4) { \
            eget_value_ = bswap_32((X)); \
        } else if (sizeof(X) == 8) { \
            eget_value_ = bswap_64((X)); \
        } else { \
            /* sizeof yields a size_t, which must be printed with %zu. */ \
            fprintf(stderr, "%s: %s: EGET failed for size %zu\n", \
                    progname, filename, sizeof(X)); \
            exit(EXIT_FAILURE); \
        } \
        eget_value_; \
    }))
| |
/* Set a value 'Y' in the elf header to 'X', compensating for endianness.
 *
 * Y is a 1-, 2-, 4- or 8-byte integer lvalue. X is converted to the
 * width of Y and, when do_reverse_endian is set, byte-swapped before
 * being stored. Any other size of Y is a programming error: a message
 * is printed and the program exits with EXIT_FAILURE.
 *
 * The expansion is a single statement wrapped in do { } while (0), so
 * it can be used anywhere a statement is allowed.
 */
#define ESET(Y,X) \
    do { \
        if (!do_reverse_endian || sizeof(Y) == 1) { \
            Y = (X); \
        } else if (sizeof(Y) == 2) { \
            Y = bswap_16((uint16_t)(X)); \
        } else if (sizeof(Y) == 4) { \
            Y = bswap_32((uint32_t)(X)); \
        } else if (sizeof(Y) == 8) { \
            Y = bswap_64((uint64_t)(X)); \
        } else { \
            /* sizeof yields a size_t, which must be printed with %zu. */ \
            fprintf(stderr, "%s: %s: ESET failed for size %zu\n", \
                    progname, filename, sizeof(Y)); \
            exit(EXIT_FAILURE); \
        } \
    } while (0)
| |
| |
/* Error reporting for failed I/O calls. When errno is nonzero the
 * system's description of that error (strerror) is passed to err();
 * otherwise the caller-supplied fallback message is used. Like err(),
 * the expression evaluates to FALSE.
 */
#define ferr(msg) (err(errno != 0 ? strerror(errno) : (msg)))
| |
| |
| |
/* HEADER_FUNCTIONS(CLASS) expands to the static routines that read,
 * measure, rewrite and commit the headers of one ELF class. CLASS (32
 * or 64) is pasted into the function names and into the
 * Elf<CLASS>_Ehdr / Elf<CLASS>_Phdr types they operate on. Every header
 * field is accessed through EGET()/ESET() so that files whose byte
 * order differs from the host are handled.
 *
 * Each generated function returns TRUE on success; on failure it
 * reports the problem through err()/ferr() and returns FALSE.
 */
#define HEADER_FUNCTIONS(CLASS) \
\
/* readelfheader<CLASS>() reads the part of the ELF header that follows \
 * e_ident into *ehdr (the e_ident bytes are expected to have been read \
 * already, leaving the file position just behind them), and checks to \
 * make sure that this is in fact a file that we should be munging. \
 */ \
static int readelfheader ## CLASS (int fd, Elf ## CLASS ## _Ehdr *ehdr) \
{ \
    size_t const rest = sizeof(*ehdr) - EI_NIDENT; \
\
    /* Clear errno first so that a short read is not reported by ferr() \
     * with a stale system error message. \
     */ \
    errno = 0; \
    if (read(fd, ((char *)ehdr) + EI_NIDENT, rest) != (ssize_t)rest) \
        return ferr("missing or incomplete ELF header."); \
\
    /* Verify the sizes of the ELF header and the program segment \
     * header table entries. \
     */ \
    if (EGET(ehdr->e_ehsize) != sizeof(Elf ## CLASS ## _Ehdr)) \
        return err("unrecognized ELF header size."); \
    if (EGET(ehdr->e_phentsize) != sizeof(Elf ## CLASS ## _Phdr)) \
        return err("unrecognized program segment header size."); \
\
    /* Finally, check the file type. \
     */ \
    if (EGET(ehdr->e_type) != ET_EXEC && EGET(ehdr->e_type) != ET_DYN) \
        return err("not an executable or shared-object library."); \
\
    return TRUE; \
} \
\
/* readphdrtable<CLASS>() loads the program segment header table into \
 * freshly allocated memory and stores its address in *phdrs. The \
 * table is read from the offset recorded in e_phoff, which is the same \
 * place commitchanges<CLASS>() later writes it back to. On success \
 * the caller owns the buffer and must free() it; on a seek/read \
 * failure the buffer is released here and *phdrs is set to NULL. \
 */ \
static int readphdrtable ## CLASS (int fd, Elf ## CLASS ## _Ehdr const *ehdr, \
                                   Elf ## CLASS ## _Phdr **phdrs) \
{ \
    size_t size; \
\
    if (!EGET(ehdr->e_phoff) || !EGET(ehdr->e_phnum)) \
        return err("ELF file has no program header table."); \
\
    size = EGET(ehdr->e_phnum) * sizeof **phdrs; \
    if (!(*phdrs = malloc(size))) \
        return err("Out of memory!"); \
\
    errno = 0; \
    if (lseek(fd, (off_t)EGET(ehdr->e_phoff), SEEK_SET) == (off_t)-1 \
        || read(fd, *phdrs, size) != (ssize_t)size) { \
        /* Report before free(), which is allowed to disturb errno. */ \
        ferr("missing or incomplete program segment header table."); \
        free(*phdrs); \
        *phdrs = NULL; \
        return FALSE; \
    } \
\
    return TRUE; \
} \
\
/* getmemorysize<CLASS>() determines the offset of the last byte of the \
 * file that is referenced by an entry in the program segment header \
 * table, and stores it in *newsize. (Anything in the file after that \
 * point is not used when the program is executing, and thus can be \
 * safely discarded.) \
 */ \
static int getmemorysize ## CLASS (Elf ## CLASS ## _Ehdr const *ehdr, \
                                   Elf ## CLASS ## _Phdr const *phdrs, \
                                   unsigned long *newsize) \
{ \
    unsigned long const count = EGET(ehdr->e_phnum); \
    unsigned long size, n, i; \
\
    /* Start by setting the size to include the ELF header and the \
     * complete program segment header table. \
     */ \
    size = EGET(ehdr->e_phoff) + count * sizeof *phdrs; \
    if (size < sizeof *ehdr) \
        size = sizeof *ehdr; \
\
    /* Then keep extending the size to include whatever data the \
     * program segment header table references. PT_NULL entries are \
     * unused and contribute nothing. \
     */ \
    for (i = 0 ; i < count ; ++i) { \
        if (EGET(phdrs[i].p_type) == PT_NULL) \
            continue; \
        n = EGET(phdrs[i].p_offset) + EGET(phdrs[i].p_filesz); \
        if (n > size) \
            size = n; \
    } \
\
    *newsize = size; \
    return TRUE; \
} \
\
/* modifyheaders<CLASS>() removes references to the section header \
 * table if it was stripped, and reduces program header table entries \
 * that included truncated bytes at the end of the file. Only the \
 * in-memory copies are changed here. \
 */ \
static int modifyheaders ## CLASS (Elf ## CLASS ## _Ehdr *ehdr, \
                                   Elf ## CLASS ## _Phdr *phdrs, \
                                   unsigned long newsize) \
{ \
    unsigned long const count = EGET(ehdr->e_phnum); \
    unsigned long i; \
\
    /* If the section header table is gone, then remove all references \
     * to it in the ELF header. \
     */ \
    if (EGET(ehdr->e_shoff) >= newsize) { \
        ESET(ehdr->e_shoff,0); \
        ESET(ehdr->e_shnum,0); \
        ESET(ehdr->e_shentsize,0); \
        ESET(ehdr->e_shstrndx,0); \
    } \
\
    /* Adjust the file size of any segment that was truncated. A \
     * segment that lies entirely beyond the new end of file is pinned \
     * to the new end with a file size of zero. \
     */ \
    for (i = 0 ; i < count ; ++i) { \
        Elf ## CLASS ## _Phdr *phdr = &phdrs[i]; \
\
        if (EGET(phdr->p_offset) >= newsize) { \
            ESET(phdr->p_offset,newsize); \
            ESET(phdr->p_filesz,0); \
        } else if (EGET(phdr->p_offset) + EGET(phdr->p_filesz) > newsize) { \
            ESET(phdr->p_filesz, newsize - EGET(phdr->p_offset)); \
        } \
    } \
\
    return TRUE; \
} \
\
/* commitchanges<CLASS>() writes the new headers back to the original \
 * file and sets the file to its new size. Once the ELF header has \
 * been rewritten, any later failure additionally warns that the file \
 * may have been corrupted. \
 */ \
static int commitchanges ## CLASS (int fd, Elf ## CLASS ## _Ehdr const *ehdr, \
                                   Elf ## CLASS ## _Phdr *phdrs, \
                                   unsigned long newsize) \
{ \
    size_t n; \
\
    /* Save the changes to the ELF header, if any. \
     */ \
    if (lseek(fd, 0, SEEK_SET)) \
        return ferr("could not rewind file"); \
    errno = 0; \
    if (write(fd, ehdr, sizeof *ehdr) != (ssize_t)sizeof *ehdr) \
        return ferr("could not modify file"); \
\
    /* Save the changes to the program segment header table, if any. \
     */ \
    if (lseek(fd, (off_t)EGET(ehdr->e_phoff), SEEK_SET) == (off_t)-1) { \
        err("could not seek in file."); \
        goto warning; \
    } \
    n = EGET(ehdr->e_phnum) * sizeof *phdrs; \
    if (write(fd, phdrs, n) != (ssize_t)n) { \
        err("could not write to file"); \
        goto warning; \
    } \
\
    /* Eleventh-hour sanity check: do not truncate before the end of \
     * the program segment header table. \
     */ \
    if (newsize < EGET(ehdr->e_phoff) + n) \
        newsize = EGET(ehdr->e_phoff) + n; \
\
    /* Chop off the end of the file. \
     */ \
    if (ftruncate(fd, newsize)) { \
        err("could not resize file"); \
        goto warning; \
    } \
\
    return TRUE; \
\
  warning: \
    return err("ELF file may have been corrupted!"); \
}
| |
| |
| /* First elements of Elf32_Ehdr and Elf64_Ehdr are common. |
| */ |
| static int readelfheaderident(int fd, Elf32_Ehdr *ehdr) |
| { |
| errno = 0; |
| if (read(fd, ehdr, EI_NIDENT) != EI_NIDENT) |
| return ferr("missing or incomplete ELF header."); |
| |
| /* Check the ELF signature. |
| */ |
| if (!(ehdr->e_ident[EI_MAG0] == ELFMAG0 && |
| ehdr->e_ident[EI_MAG1] == ELFMAG1 && |
| ehdr->e_ident[EI_MAG2] == ELFMAG2 && |
| ehdr->e_ident[EI_MAG3] == ELFMAG3)) |
| { |
| err("missing ELF signature."); |
| return -1; |
| } |
| |
| /* Compare the file's class and endianness with the program's. |
| */ |
| #if __BYTE_ORDER == __LITTLE_ENDIAN |
| if (ehdr->e_ident[EI_DATA] == ELFDATA2LSB) { |
| do_reverse_endian = 0; |
| } else if (ehdr->e_ident[EI_DATA] == ELFDATA2MSB) { |
| /* fprintf(stderr, "ELF file has different endianness.\n"); */ |
| do_reverse_endian = 1; |
| } |
| #elif __BYTE_ORDER == __BIG_ENDIAN |
| if (ehdr->e_ident[EI_DATA] == ELFDATA2LSB) { |
| /* fprintf(stderr, "ELF file has different endianness.\n"); */ |
| do_reverse_endian = 1; |
| } else if (ehdr->e_ident[EI_DATA] == ELFDATA2MSB) { |
| do_reverse_endian = 0; |
| } |
| #else |
| #error unkown endianness |
| #endif |
| else { |
| err("Unsupported endianness"); |
| return -1; |
| } |
| |
| /* Check the target architecture. |
| */ |
| /* if (EGET(ehdr->e_machine) != ELF_ARCH) { */ |
| /* /\* return err("ELF file created for different architecture."); *\/ */ |
| /* fprintf(stderr, "ELF file created for different architecture.\n"); */ |
| /* } */ |
| return ehdr->e_ident[EI_CLASS]; |
| } |
| |
| |
| HEADER_FUNCTIONS(32) |
| |
| HEADER_FUNCTIONS(64) |
| |
| /* truncatezeros() examines the bytes at the end of the file's |
| * size-to-be, and reduces the size to exclude any trailing zero |
| * bytes. |
| */ |
| static int truncatezeros(int fd, unsigned long *newsize) |
| { |
| unsigned char contents[1024]; |
| unsigned long size, n; |
| |
| size = *newsize; |
| do { |
| n = sizeof contents; |
| if (n > size) |
| n = size; |
| if (lseek(fd, size - n, SEEK_SET) == (off_t)-1) |
| return ferr("cannot seek in file."); |
| if (read(fd, contents, n) != (ssize_t)n) |
| return ferr("cannot read file contents"); |
| while (n && !contents[--n]) |
| --size; |
| } while (size && !n); |
| |
| /* Sanity check. |
| */ |
| if (!size) |
| return err("ELF file is completely blank!"); |
| |
| *newsize = size; |
| return TRUE; |
| } |
| |
| /* main() loops over the cmdline arguments, leaving all the real work |
| * to the other functions. |
| */ |
| int main(int argc, char *argv[]) |
| { |
| int fd; |
| union { |
| Elf32_Ehdr ehdr32; |
| Elf64_Ehdr ehdr64; |
| } e; |
| union { |
| Elf32_Phdr *phdrs32; |
| Elf64_Phdr *phdrs64; |
| } p; |
| unsigned long newsize; |
| char **arg; |
| int failures = 0; |
| |
| if (argc < 2 || argv[1][0] == '-') { |
| printf("Usage: sstrip FILE...\n" |
| "sstrip discards all nonessential bytes from an executable.\n\n" |
| "Version 2.0-X Copyright (C) 2000,2001 Brian Raiter.\n" |
| "Cross-devel hacks Copyright (C) 2004 Manuel Novoa III.\n" |
| "This program is free software, licensed under the GNU\n" |
| "General Public License. There is absolutely no warranty.\n"); |
| return EXIT_SUCCESS; |
| } |
| |
| progname = argv[0]; |
| |
| for (arg = argv + 1 ; *arg != NULL ; ++arg) { |
| filename = *arg; |
| |
| fd = open(*arg, O_RDWR); |
| if (fd < 0) { |
| ferr("can't open"); |
| ++failures; |
| continue; |
| } |
| |
| switch (readelfheaderident(fd, &e.ehdr32)) { |
| case ELFCLASS32: |
| if (!(readelfheader32(fd, &e.ehdr32) && |
| readphdrtable32(fd, &e.ehdr32, &p.phdrs32) && |
| getmemorysize32(&e.ehdr32, p.phdrs32, &newsize) && |
| truncatezeros(fd, &newsize) && |
| modifyheaders32(&e.ehdr32, p.phdrs32, newsize) && |
| commitchanges32(fd, &e.ehdr32, p.phdrs32, newsize))) |
| ++failures; |
| break; |
| case ELFCLASS64: |
| if (!(readelfheader64(fd, &e.ehdr64) && |
| readphdrtable64(fd, &e.ehdr64, &p.phdrs64) && |
| getmemorysize64(&e.ehdr64, p.phdrs64, &newsize) && |
| truncatezeros(fd, &newsize) && |
| modifyheaders64(&e.ehdr64, p.phdrs64, newsize) && |
| commitchanges64(fd, &e.ehdr64, p.phdrs64, newsize))) |
| ++failures; |
| break; |
| default: |
| ++failures; |
| break; |
| } |
| close(fd); |
| } |
| |
| return failures ? EXIT_FAILURE : EXIT_SUCCESS; |
| } |