blob: 45561a8bef473614f72ffafe761e2e8d96e21c6d [file] [log] [blame]
/*
* Copyright 2017, Data61
* Commonwealth Scientific and Industrial Research Organisation (CSIRO)
* ABN 41 687 119 230.
*
* This software may be distributed and modified according to the terms of
* the BSD 2-Clause license. Note that NO WARRANTY is provided.
* See "LICENSE_BSD2.txt" for details.
*
* @TAG(DATA61_BSD)
*/
/* This file contains functionality for debugging heap corruption issues. It is
* styled after Electric Fence [0], but we can't check as thoroughly as eFence
* can because we don't have support for mapping/unmapping/mprotecting regions.
* The basic concept is that we stick a 'canary' value before and after
* allocated memory. During free, we check that these canaries haven't been
* overwritten, which would imply buffer underflow or overflow. This checking
* is limited in that we don't catch heap corruption until memory is actually
* freed.
*
* Essentially any allocated region actually looks like this:
* p q r
* ↓ ↓ ↓
* |canary|size|memory...|canary|
*
* Internally we deal in 'unboxed' pointers, like p. Externally the caller is
* given 'boxed' pointers, like q. We effectively play the same tricks malloc
* does to store some book keeping information surrounding the malloced memory.
* The 'size' stored is the size the user requested, not the size including
* the canaries etc. We need to track this in order to calculate the pointer r
* on free.
*
* In addition to checking for corruption within the heap, this functionality
* also tracks pointers that have been allocated. If you try and free (or
* realloc) a pointer that was never allocated, it will be detected.
*
* To use this, you will need to instruct the linker to wrap your calls to
* allocation functions. You will need to append something like the following
* to your LD_FALGS:
* -Wl,--wrap=malloc -Wl,--wrap=free -Wl,--wrap=realloc -Wl,--wrap=calloc
*
* Ensure you do not call any functions that malloc or free memory within this
* file or you will infinitely recurse.
*/
#include <assert.h>
#include <autoconf.h>
#include <sel4debug/gen_config.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h> /* for size_t */
#include <string.h>
/* Maximum alignment of a data type. The malloc spec requires that returned
* pointers are aligned to this.
*/
#define MAX_ALIGNMENT (sizeof(void*) * 2) /* bytes */
/* Random bits to OR into the pre- and post-canary values so we're not storing
* an exact pointer value. Note that these should be less than MAX_ALIGNMENT so
* that we're ORing into known 0 bits. Preserving the pointer is not actually
* necessary so nothing will break if you change these values to any random
* word-sized value.
*/
#define PRE_EXTRA_BITS 0x7
#define POST_EXTRA_BITS 0x3
/* Algorithms for calculating a canary value to use before and after the
* allocated region. The actual algorithm used here is more or less irrelevant
* as long as it is deterministic.
*/
static uintptr_t pre_canary(void *ptr)
{
return ((uintptr_t)ptr) | PRE_EXTRA_BITS;
}
static uintptr_t post_canary(void *ptr)
{
return ((uintptr_t)ptr) | POST_EXTRA_BITS;
}
typedef struct {
uintptr_t canary;
size_t size;
} __attribute__((aligned(MAX_ALIGNMENT))) metadata_t;
/* A `uintptr_t` that is not naturally aligned. It is necessary to explicitly
* tag unaligned pointers because, e.g., on ARM the compiler is free to
* transform `memcpy` calls into a variant that assumes its inputs are aligned
* and performs word-sized accesses. See the following for more information:
* http://infocenter.arm.com/help/index.jsp?topic=/com.arm.doc.faqs/4972.html
*/
typedef uintptr_t unaligned_uintptr_t __attribute__((aligned(1)));
/* Whether we've already encountered heap corruption. See uses of this below,
* where we abandon all instrumentation if we've hit an error. The reasoning
* behind this is that error reporting functions may call malloc.
*/
static int err = 0;
/* Adjust a size that is about to be passed to the real allocation functions in
* order to account for our instrumentation.
*/
static size_t adjust_size(size_t size)
{
return size + sizeof(metadata_t) + sizeof(uintptr_t);
}
/* Wrap a (just-allocated) region with canary values. */
static void *box(void *ptr, size_t size)
{
if (ptr == NULL) {
return ptr;
}
metadata_t *pre = (metadata_t*)ptr;
ptr += sizeof(*pre);
unaligned_uintptr_t *post = ptr + size;
/* Write the leading canary. */
pre->canary = pre_canary(ptr);
pre->size = size;
/* Use memcpy for the trailing canary so we don't need to care about
* alignment.
*/
uintptr_t canary = post_canary(ptr);
memcpy(post, &canary, sizeof(canary));
return ptr;
}
/* Throw an error resulting from a bad user invocation. */
#define error(args...) do { \
assert(!err); /* We should not already be handling an error. */ \
err = 1; \
fprintf(stderr, args); \
abort(); \
} while (0)
/* Unwrap a canary-endowed region into the original allocated pointer. */
static void *unbox(void *ptr, void *ret_addr)
{
if (ptr == NULL) {
return ptr;
}
metadata_t *pre = (metadata_t*)(ptr - sizeof(*pre));
unaligned_uintptr_t *post = ptr + pre->size;
/* Check the leading canary (underflow). */
if (pre->canary != pre_canary(ptr)) {
error("Leading corruption in heap memory pointed to by %p (called "
"prior to %p)\n", ptr, ret_addr);
}
/* Check the trailing canary with memcmp so we don't need to care about
* alignment. If the memcmp VM faults here, it's likely that you underran
* your buffer and overwrote the 'size' metadata, causing this function to
* derive an incorrect 'post' pointer.
*/
uintptr_t canary = post_canary(ptr);
if (memcmp(post, &canary, sizeof(canary)) != 0) {
error("Buffer overflow in heap memory pointed to by %p (called prior "
"to %p)\n", ptr, ret_addr);
}
return (void*)pre;
}
/* Buffer for tracking currently live heap pointers. This is used to detect
* when the user attempts to free an invalid pointer. Note that we always track
* *boxed* pointers as these are the ones seen by the user.
*/
#ifndef CONFIG_LIBSEL4DEBUG_ALLOC_BUFFER_ENTRIES
#define CONFIG_LIBSEL4DEBUG_ALLOC_BUFFER_ENTRIES 128
#endif
static uintptr_t alloced[CONFIG_LIBSEL4DEBUG_ALLOC_BUFFER_ENTRIES];
/* Track the given heap pointer as currently live. */
static void track(void *ptr)
{
if (sizeof(alloced) == 0 || ptr == NULL) {
/* Disable tracking if we have no buffer and never track NULL. */
return;
}
for (unsigned int i = 0; i < sizeof(alloced) / sizeof(uintptr_t); i++) {
if (alloced[i] == 0) {
/* Found a free slot. */
alloced[i] = (uintptr_t)ptr;
return;
}
}
/* Failed to find a free slot. */
error("Exhausted pointer tracking buffer; try increasing "
"CONFIG_LIBSEL4DEBUG_ALLOC_BUFFER_ENTRIES value\n");
}
/* Stop tracking the given pointer (mark it as dead). */
static void untrack(void *ptr, void *ret_addr)
{
if (sizeof(alloced) == 0 || ptr == NULL) {
/* Ignore tracking if we have no buffer or are freeing NULL. */
return;
}
for (unsigned int i = 0; i < sizeof(alloced) / sizeof(uintptr_t); i++) {
if (alloced[i] == (uintptr_t)ptr) {
/* Found it. */
alloced[i] = 0;
return;
}
}
/* Failed to find it. */
error("Attempt to free pointer %p that was never malloced (called prior "
"to %p)\n", ptr, ret_addr);
}
/* Wrapped functions that will be exported to us from libmuslc. */
void *__real_malloc(size_t size);
void __real_free(void *ptr);
void *__real_calloc(size_t num, size_t size);
void *__real_realloc(void *ptr, size_t size);
/* Actual allocation wrappers follow. */
void *__wrap_malloc(size_t size)
{
if (err) {
return __real_malloc(size);
}
size_t new_size = adjust_size(size);
void *ptr = __real_malloc(new_size);
ptr = box(ptr, size);
track(ptr);
return ptr;
}
void __wrap_free(void *ptr)
{
if (err) {
__real_free(ptr);
return;
}
void *ret = __builtin_extract_return_addr(__builtin_return_address(0));
untrack(ptr, ret);
/* Write garbage all over the region we were handed back to try to expose
* use-after-free bugs. If we fault while doing this, it probably means the
* user underran their buffer and overwrote the 'size' metadata.
*/
metadata_t *pre = (metadata_t*)(ptr - sizeof(*pre));
for (unsigned int i = 0; i < pre->size; i++) {
((char*)ptr)[i] ^= (char)~i;
}
ptr = unbox(ptr, ret);
__real_free(ptr);
}
void *__wrap_calloc(size_t num, size_t size)
{
if (err) {
return __real_calloc(num, size);
}
size_t sz = adjust_size(num * size);
size_t new_num = sz / size;
if (sz % size != 0) {
new_num++;
}
void *ptr = __real_calloc(new_num, size);
ptr = box(ptr, num * size);
track(ptr);
return ptr;
}
void *__wrap_realloc(void *ptr, size_t size)
{
if (err) {
return __real_realloc(ptr, size);
}
void *ret = __builtin_extract_return_addr(__builtin_return_address(0));
untrack(ptr, ret);
ptr = unbox(ptr, ret);
size_t new_size = adjust_size(size);
ptr = __real_realloc(ptr, new_size);
ptr = box(ptr, size);
track(ptr);
return ptr;
}