/* http://www.muppetlabs.com/~breadbox/software/elfkickers.html */ /* sstrip: Copyright (C) 1999-2001 by Brian Raiter, under the GNU * General Public License. No warranty. See COPYING for details. * * Aug 23, 2004 Hacked by Manuel Novoa III <mjn3@codepoet.org> to * handle targets of different endianness and/or elf class, making * it more useful in a cross-devel environment. */ /* ============== original README =================== * * sstrip is a small utility that removes the contents at the end of an * ELF file that are not part of the program's memory image. * * Most ELF executables are built with both a program header table and a * section header table. However, only the former is required in order * for the OS to load, link and execute a program. sstrip attempts to * extract the ELF header, the program header table, and its contents, * leaving everything else in the bit bucket. It can only remove parts of * the file that occur at the end, after the parts to be saved. However, * this almost always includes the section header table, and occasionally * a few random sections that are not used when running a program. * * It should be noted that the GNU bfd library is (understandably) * dependent on the section header table as an index to the file's * contents. Thus, an executable file that has no section header table * cannot be used with gdb, objdump, or any other program based upon the * bfd library, at all. In fact, the program will not even recognize the * file as a valid executable. (This limitation is noted in the source * code comments for bfd, and is marked "FIXME", so this may change at * some future date. However, I would imagine that it is a pretty * low-priority item, as executables without a section header table are * rare in the extreme.) This probably also explains why strip doesn't * offer the option to do this. * * Shared library files may also have their section header table removed. * Such a library will still function; however, it will no longer be * possible for a compiler to link a new program against it. * * As an added bonus, sstrip also tries to removes trailing zero bytes * from the end of the file. (This normally cannot be done with an * executable that has a section header table.) * * sstrip is a very simplistic program. It depends upon the common * practice of putting the parts of the file that contribute to the * memory image at the front, and the remaining material at the end. This * permits it to discard the latter material without affecting file * offsets and memory addresses in what remains. Of course, the ELF * standard permits files to be organized in almost any order, so if a * pathological linker decided to put its section headers at the top, * sstrip would be useless on such executables. */ #include <stdio.h> #include <stdlib.h> #include <string.h> #include <errno.h> #include <unistd.h> #include <fcntl.h> #include <elf.h> #include <endian.h> #include <byteswap.h> #ifndef TRUE #define TRUE 1 #define FALSE 0 #endif /* The name of the program. */ static char const *progname; /* The name of the current file. */ static char const *filename; /* A simple error-handling function. FALSE is always returned for the * convenience of the caller. */ static int err(char const *errmsg) { fprintf(stderr, "%s: %s: %s\n", progname, filename, errmsg); return FALSE; } /* A flag to signal the need for endian reversal. */ static int do_reverse_endian; /* Get a value from the elf header, compensating for endianness. */ #define EGET(X) \ (__extension__ ({ \ uint64_t __res; \ if (!do_reverse_endian) { \ __res = (X); \ } else if (sizeof(X) == 1) { \ __res = (X); \ } else if (sizeof(X) == 2) { \ __res = bswap_16((X)); \ } else if (sizeof(X) == 4) { \ __res = bswap_32((X)); \ } else if (sizeof(X) == 8) { \ __res = bswap_64((X)); \ } else { \ fprintf(stderr, "%s: %s: EGET failed for size %d\n", \ progname, filename, sizeof(X)); \ exit(EXIT_FAILURE); \ } \ __res; \ })) /* Set a value 'Y' in the elf header to 'X', compensating for endianness. */ #define ESET(Y,X) \ do if (!do_reverse_endian) { \ Y = (X); \ } else if (sizeof(Y) == 1) { \ Y = (X); \ } else if (sizeof(Y) == 2) { \ Y = bswap_16((uint16_t)(X)); \ } else if (sizeof(Y) == 4) { \ Y = bswap_32((uint32_t)(X)); \ } else if (sizeof(Y) == 8) { \ Y = bswap_64((uint64_t)(X)); \ } else { \ fprintf(stderr, "%s: %s: ESET failed for size %d\n", \ progname, filename, sizeof(Y)); \ exit(EXIT_FAILURE); \ } while (0) /* A macro for I/O errors: The given error message is used only when * errno is not set. */ #define ferr(msg) (err(errno ? strerror(errno) : (msg))) #define HEADER_FUNCTIONS(CLASS) \ \ /* readelfheader() reads the ELF header into our global variable, and \ * checks to make sure that this is in fact a file that we should be \ * munging. \ */ \ static int readelfheader ## CLASS (int fd, Elf ## CLASS ## _Ehdr *ehdr) \ { \ if (read(fd, ((char *)ehdr)+EI_NIDENT, sizeof(*ehdr) - EI_NIDENT) \ != sizeof(*ehdr) - EI_NIDENT) \ return ferr("missing or incomplete ELF header."); \ \ /* Verify the sizes of the ELF header and the program segment \ * header table entries. \ */ \ if (EGET(ehdr->e_ehsize) != sizeof(Elf ## CLASS ## _Ehdr)) \ return err("unrecognized ELF header size."); \ if (EGET(ehdr->e_phentsize) != sizeof(Elf ## CLASS ## _Phdr)) \ return err("unrecognized program segment header size."); \ \ /* Finally, check the file type. \ */ \ if (EGET(ehdr->e_type) != ET_EXEC && EGET(ehdr->e_type) != ET_DYN) \ return err("not an executable or shared-object library."); \ \ return TRUE; \ } \ \ /* readphdrtable() loads the program segment header table into memory. \ */ \ static int readphdrtable ## CLASS (int fd, Elf ## CLASS ## _Ehdr const *ehdr, \ Elf ## CLASS ## _Phdr **phdrs) \ { \ size_t size; \ \ if (!EGET(ehdr->e_phoff) || !EGET(ehdr->e_phnum) \ ) return err("ELF file has no program header table."); \ \ size = EGET(ehdr->e_phnum) * sizeof **phdrs; \ if (!(*phdrs = malloc(size))) \ return err("Out of memory!"); \ \ errno = 0; \ if (read(fd, *phdrs, size) != (ssize_t)size) \ return ferr("missing or incomplete program segment header table."); \ \ return TRUE; \ } \ \ /* getmemorysize() determines the offset of the last byte of the file \ * that is referenced by an entry in the program segment header table. \ * (Anything in the file after that point is not used when the program \ * is executing, and thus can be safely discarded.) \ */ \ static int getmemorysize ## CLASS (Elf ## CLASS ## _Ehdr const *ehdr, \ Elf ## CLASS ## _Phdr const *phdrs, \ unsigned long *newsize) \ { \ Elf ## CLASS ## _Phdr const *phdr; \ unsigned long size, n; \ int i; \ \ /* Start by setting the size to include the ELF header and the \ * complete program segment header table. \ */ \ size = EGET(ehdr->e_phoff) + EGET(ehdr->e_phnum) * sizeof *phdrs; \ if (size < sizeof *ehdr) \ size = sizeof *ehdr; \ \ /* Then keep extending the size to include whatever data the \ * program segment header table references. \ */ \ for (i = 0, phdr = phdrs ; i < EGET(ehdr->e_phnum) ; ++i, ++phdr) { \ if (EGET(phdr->p_type) != PT_NULL) { \ n = EGET(phdr->p_offset) + EGET(phdr->p_filesz); \ if (n > size) \ size = n; \ } \ } \ \ *newsize = size; \ return TRUE; \ } \ \ /* modifyheaders() removes references to the section header table if \ * it was stripped, and reduces program header table entries that \ * included truncated bytes at the end of the file. \ */ \ static int modifyheaders ## CLASS (Elf ## CLASS ## _Ehdr *ehdr, \ Elf ## CLASS ## _Phdr *phdrs, \ unsigned long newsize) \ { \ Elf ## CLASS ## _Phdr *phdr; \ int i; \ \ /* If the section header table is gone, then remove all references \ * to it in the ELF header. \ */ \ if (EGET(ehdr->e_shoff) >= newsize) { \ ESET(ehdr->e_shoff,0); \ ESET(ehdr->e_shnum,0); \ ESET(ehdr->e_shentsize,0); \ ESET(ehdr->e_shstrndx,0); \ } \ \ /* The program adjusts the file size of any segment that was \ * truncated. The case of a segment being completely stripped out \ * is handled separately. \ */ \ for (i = 0, phdr = phdrs ; i < EGET(ehdr->e_phnum) ; ++i, ++phdr) { \ if (EGET(phdr->p_offset) >= newsize) { \ ESET(phdr->p_offset,newsize); \ ESET(phdr->p_filesz,0); \ } else if (EGET(phdr->p_offset) + EGET(phdr->p_filesz) > newsize) { \ ESET(phdr->p_filesz, newsize - EGET(phdr->p_offset)); \ } \ } \ \ return TRUE; \ } \ \ /* commitchanges() writes the new headers back to the original file \ * and sets the file to its new size. \ */ \ static int commitchanges ## CLASS (int fd, Elf ## CLASS ## _Ehdr const *ehdr, \ Elf ## CLASS ## _Phdr *phdrs, \ unsigned long newsize) \ { \ size_t n; \ \ /* Save the changes to the ELF header, if any. \ */ \ if (lseek(fd, 0, SEEK_SET)) \ return ferr("could not rewind file"); \ errno = 0; \ if (write(fd, ehdr, sizeof *ehdr) != sizeof *ehdr) \ return err("could not modify file"); \ \ /* Save the changes to the program segment header table, if any. \ */ \ if (lseek(fd, EGET(ehdr->e_phoff), SEEK_SET) == (off_t)-1) { \ err("could not seek in file."); \ goto warning; \ } \ n = EGET(ehdr->e_phnum) * sizeof *phdrs; \ if (write(fd, phdrs, n) != (ssize_t)n) { \ err("could not write to file"); \ goto warning; \ } \ \ /* Eleventh-hour sanity check: don't truncate before the end of \ * the program segment header table. \ */ \ if (newsize < EGET(ehdr->e_phoff) + n) \ newsize = EGET(ehdr->e_phoff) + n; \ \ /* Chop off the end of the file. \ */ \ if (ftruncate(fd, newsize)) { \ err("could not resize file"); \ goto warning; \ } \ \ return TRUE; \ \ warning: \ return err("ELF file may have been corrupted!"); \ } /* First elements of Elf32_Ehdr and Elf64_Ehdr are common. */ static int readelfheaderident(int fd, Elf32_Ehdr *ehdr) { errno = 0; if (read(fd, ehdr, EI_NIDENT) != EI_NIDENT) return ferr("missing or incomplete ELF header."); /* Check the ELF signature. */ if (!(ehdr->e_ident[EI_MAG0] == ELFMAG0 && ehdr->e_ident[EI_MAG1] == ELFMAG1 && ehdr->e_ident[EI_MAG2] == ELFMAG2 && ehdr->e_ident[EI_MAG3] == ELFMAG3)) { err("missing ELF signature."); return -1; } /* Compare the file's class and endianness with the program's. */ #if __BYTE_ORDER == __LITTLE_ENDIAN if (ehdr->e_ident[EI_DATA] == ELFDATA2LSB) { do_reverse_endian = 0; } else if (ehdr->e_ident[EI_DATA] == ELFDATA2MSB) { /* fprintf(stderr, "ELF file has different endianness.\n"); */ do_reverse_endian = 1; } #elif __BYTE_ORDER == __BIG_ENDIAN if (ehdr->e_ident[EI_DATA] == ELFDATA2LSB) { /* fprintf(stderr, "ELF file has different endianness.\n"); */ do_reverse_endian = 1; } else if (ehdr->e_ident[EI_DATA] == ELFDATA2MSB) { do_reverse_endian = 0; } #else #error unkown endianness #endif else { err("Unsupported endianness"); return -1; } /* Check the target architecture. */ /* if (EGET(ehdr->e_machine) != ELF_ARCH) { */ /* /\* return err("ELF file created for different architecture."); *\/ */ /* fprintf(stderr, "ELF file created for different architecture.\n"); */ /* } */ return ehdr->e_ident[EI_CLASS]; } HEADER_FUNCTIONS(32) HEADER_FUNCTIONS(64) /* truncatezeros() examines the bytes at the end of the file's * size-to-be, and reduces the size to exclude any trailing zero * bytes. */ static int truncatezeros(int fd, unsigned long *newsize) { unsigned char contents[1024]; unsigned long size, n; size = *newsize; do { n = sizeof contents; if (n > size) n = size; if (lseek(fd, size - n, SEEK_SET) == (off_t)-1) return ferr("cannot seek in file."); if (read(fd, contents, n) != (ssize_t)n) return ferr("cannot read file contents"); while (n && !contents[--n]) --size; } while (size && !n); /* Sanity check. */ if (!size) return err("ELF file is completely blank!"); *newsize = size; return TRUE; } /* main() loops over the cmdline arguments, leaving all the real work * to the other functions. */ int main(int argc, char *argv[]) { int fd; union { Elf32_Ehdr ehdr32; Elf64_Ehdr ehdr64; } e; union { Elf32_Phdr *phdrs32; Elf64_Phdr *phdrs64; } p; unsigned long newsize; char **arg; int failures = 0; if (argc < 2 || argv[1][0] == '-') { printf("Usage: sstrip FILE...\n" "sstrip discards all nonessential bytes from an executable.\n\n" "Version 2.0-X Copyright (C) 2000,2001 Brian Raiter.\n" "Cross-devel hacks Copyright (C) 2004 Manuel Novoa III.\n" "This program is free software, licensed under the GNU\n" "General Public License. There is absolutely no warranty.\n"); return EXIT_SUCCESS; } progname = argv[0]; for (arg = argv + 1 ; *arg != NULL ; ++arg) { filename = *arg; fd = open(*arg, O_RDWR); if (fd < 0) { ferr("can't open"); ++failures; continue; } switch (readelfheaderident(fd, &e.ehdr32)) { case ELFCLASS32: if (!(readelfheader32(fd, &e.ehdr32) && readphdrtable32(fd, &e.ehdr32, &p.phdrs32) && getmemorysize32(&e.ehdr32, p.phdrs32, &newsize) && truncatezeros(fd, &newsize) && modifyheaders32(&e.ehdr32, p.phdrs32, newsize) && commitchanges32(fd, &e.ehdr32, p.phdrs32, newsize))) ++failures; break; case ELFCLASS64: if (!(readelfheader64(fd, &e.ehdr64) && readphdrtable64(fd, &e.ehdr64, &p.phdrs64) && getmemorysize64(&e.ehdr64, p.phdrs64, &newsize) && truncatezeros(fd, &newsize) && modifyheaders64(&e.ehdr64, p.phdrs64, newsize) && commitchanges64(fd, &e.ehdr64, p.phdrs64, newsize))) ++failures; break; default: ++failures; break; } close(fd); } return failures ? EXIT_FAILURE : EXIT_SUCCESS; }