/* * CDDL HEADER START * * The contents of this file are subject to the terms of the * Common Development and Distribution License (the "License"). * You may not use this file except in compliance with the License. * * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE * or http://www.opensolaris.org/os/licensing. * See the License for the specific language governing permissions * and limitations under the License. * * When distributing Covered Code, include this CDDL HEADER in each * file and include the License file at usr/src/OPENSOLARIS.LICENSE. * If applicable, add the following below this CDDL HEADER, with the * fields enclosed by brackets "[]" replaced with your own identifying * information: Portions Copyright [yyyy] [name of copyright owner] * * CDDL HEADER END */ /* * Copyright 2009 Sun Microsystems, Inc. All rights reserved. * Use is subject to license terms. */ #include #include #include #include /* * Little Endian Base 128 (LEB128) numbers. * ---------------------------------------- * * LEB128 is a scheme for encoding integers densely that exploits the * assumption that most integers are small in magnitude. (This encoding * is equally suitable whether the target machine architecture represents * data in big-endian or little- endian * * Unsigned LEB128 numbers are encoded as follows: start at the low order * end of an unsigned integer and chop it into 7-bit chunks. Place each * chunk into the low order 7 bits of a byte. Typically, several of the * high order bytes will be zero; discard them. Emit the remaining bytes in * a stream, starting with the low order byte; set the high order bit on * each byte except the last emitted byte. The high bit of zero on the last * byte indicates to the decoder that it has encountered the last byte. * The integer zero is a special case, consisting of a single zero byte. * * Signed, 2s complement LEB128 numbers are encoded in a similar except * that the criterion for discarding high order bytes is not whether they * are zero, but whether they consist entirely of sign extension bits. * Consider the 32-bit integer -2. The three high level bytes of the number * are sign extension, thus LEB128 would represent it as a single byte * containing the low order 7 bits, with the high order bit cleared to * indicate the end of the byte stream. * * Note that there is nothing within the LEB128 representation that * indicates whether an encoded number is signed or unsigned. The decoder * must know what type of number to expect. * * DWARF Exception Header Encoding * ------------------------------- * * The DWARF Exception Header Encoding is used to describe the type of data * used in the .eh_frame_hdr section. The upper 4 bits indicate how the * value is to be applied. The lower 4 bits indicate the format of the data. * * DWARF Exception Header value format * * Name Value Meaning * DW_EH_PE_omit 0xff No value is present. * DW_EH_PE_absptr 0x00 Value is a void* * DW_EH_PE_uleb128 0x01 Unsigned value is encoded using the * Little Endian Base 128 (LEB128) * DW_EH_PE_udata2 0x02 A 2 bytes unsigned value. * DW_EH_PE_udata4 0x03 A 4 bytes unsigned value. * DW_EH_PE_udata8 0x04 An 8 bytes unsigned value. * DW_EH_PE_signed 0x08 bit on for all signed encodings * DW_EH_PE_sleb128 0x09 Signed value is encoded using the * Little Endian Base 128 (LEB128) * DW_EH_PE_sdata2 0x0A A 2 bytes signed value. * DW_EH_PE_sdata4 0x0B A 4 bytes signed value. * DW_EH_PE_sdata8 0x0C An 8 bytes signed value. * * DWARF Exception Header application * * Name Value Meaning * DW_EH_PE_absptr 0x00 Value is used with no modification. * DW_EH_PE_pcrel 0x10 Value is reletive to the location of itself * DW_EH_PE_textrel 0x20 * DW_EH_PE_datarel 0x30 Value is reletive to the beginning of the * eh_frame_hdr segment ( segment type * PT_GNU_EH_FRAME ) * DW_EH_PE_funcrel 0x40 * DW_EH_PE_aligned 0x50 value is an aligned void* * DW_EH_PE_indirect 0x80 bit to signal indirection after relocation * DW_EH_PE_omit 0xff No value is present. * */ dwarf_error_t uleb_extract(unsigned char *data, uint64_t *dotp, size_t len, uint64_t *ret) { uint64_t dot = *dotp; uint64_t res = 0; int more = 1; int shift = 0; int val; data += dot; while (more) { if (dot > len) return (DW_OVERFLOW); /* * Pull off lower 7 bits */ val = (*data) & 0x7f; /* * Add prepend value to head of number. */ res = res | (val << shift); /* * Increment shift & dot pointer */ shift += 7; dot++; /* * Check to see if hi bit is set - if not, this * is the last byte. */ more = ((*data++) & 0x80) >> 7; } *dotp = dot; *ret = res; return (DW_SUCCESS); } dwarf_error_t sleb_extract(unsigned char *data, uint64_t *dotp, size_t len, int64_t *ret) { uint64_t dot = *dotp; int64_t res = 0; int more = 1; int shift = 0; int val; data += dot; while (more) { if (dot > len) return (DW_OVERFLOW); /* * Pull off lower 7 bits */ val = (*data) & 0x7f; /* * Add prepend value to head of number. */ res = res | (val << shift); /* * Increment shift & dot pointer */ shift += 7; dot++; /* * Check to see if hi bit is set - if not, this * is the last byte. */ more = ((*data++) & 0x80) >> 7; } *dotp = dot; /* * Make sure value is properly sign extended. */ res = (res << (64 - shift)) >> (64 - shift); *ret = res; return (DW_SUCCESS); } /* * Extract a DWARF encoded datum * * entry: * data - Base of data buffer containing encoded bytes * dotp - Address of variable containing index within data * at which the desired datum starts. * ehe_flags - DWARF encoding * eident - ELF header e_ident[] array for object being processed * frame_hdr - Boolean, true if we're extracting from .eh_frame_hdr * sh_base - Base address of ELF section containing desired datum * sh_offset - Offset relative to sh_base of desired datum. * dbase - The base address to which DW_EH_PE_datarel is relative * (if frame_hdr is false) */ dwarf_error_t dwarf_ehe_extract(unsigned char *data, size_t len, uint64_t *dotp, uint64_t *ret, uint_t ehe_flags, unsigned char *eident, boolean_t frame_hdr, uint64_t sh_base, uint64_t sh_offset, uint64_t dbase) { uint64_t dot = *dotp; uint_t lsb; uint_t wordsize; uint_t fsize; uint64_t result; if (eident[EI_DATA] == ELFDATA2LSB) lsb = 1; else lsb = 0; if (eident[EI_CLASS] == ELFCLASS64) wordsize = 8; else wordsize = 4; switch (ehe_flags & 0x0f) { case DW_EH_PE_omit: *ret = 0; return (DW_SUCCESS); case DW_EH_PE_absptr: fsize = wordsize; break; case DW_EH_PE_udata8: case DW_EH_PE_sdata8: fsize = 8; break; case DW_EH_PE_udata4: case DW_EH_PE_sdata4: fsize = 4; break; case DW_EH_PE_udata2: case DW_EH_PE_sdata2: fsize = 2; break; case DW_EH_PE_uleb128: return (uleb_extract(data, dotp, len, ret)); case DW_EH_PE_sleb128: return (sleb_extract(data, dotp, len, (int64_t *)ret)); default: *ret = 0; return (DW_BAD_ENCODING); } if (lsb) { /* * Extract unaligned LSB formated data */ uint_t cnt; result = 0; for (cnt = 0; cnt < fsize; cnt++, dot++) { uint64_t val; if (dot > len) return (DW_OVERFLOW); val = data[dot]; result |= val << (cnt * 8); } } else { /* * Extract unaligned MSB formated data */ uint_t cnt; result = 0; for (cnt = 0; cnt < fsize; cnt++, dot++) { uint64_t val; if (dot > len) return (DW_OVERFLOW); val = data[dot]; result |= val << ((fsize - cnt - 1) * 8); } } /* * perform sign extension */ if ((ehe_flags & DW_EH_PE_signed) && (fsize < sizeof (uint64_t))) { int64_t sresult; uint_t bitshift; sresult = result; bitshift = (sizeof (uint64_t) - fsize) * 8; sresult = (sresult << bitshift) >> bitshift; result = sresult; } /* * If value is relative to a base address, adjust it */ switch (ehe_flags & 0xf0) { case DW_EH_PE_pcrel: result += sh_base + sh_offset; break; /* * datarel is relative to .eh_frame_hdr if within .eh_frame, * but GOT if not. */ case DW_EH_PE_datarel: if (frame_hdr) result += sh_base; else result += dbase; break; } /* Truncate the result to its specified size */ result = (result << ((sizeof (uint64_t) - fsize) * 8)) >> ((sizeof (uint64_t) - fsize) * 8); *dotp = dot; *ret = result; return (DW_SUCCESS); }