#include <zone_debug.h>
#include <mach/mach_types.h>
#include <mach/vm_param.h>
#include <mach/kern_return.h>
#include <mach/mach_host_server.h>
#include <mach/task_server.h>
#include <mach/machine/vm_types.h>
#include <mach_debug/zone_info.h>
#include <mach/vm_map.h>
#include <kern/kern_types.h>
#include <kern/assert.h>
#include <kern/backtrace.h>
#include <kern/host.h>
#include <kern/macro_help.h>
#include <kern/sched.h>
#include <kern/locks.h>
#include <kern/sched_prim.h>
#include <kern/misc_protos.h>
#include <kern/thread_call.h>
#include <kern/zalloc.h>
#include <kern/kalloc.h>
#include <vm/pmap.h>
#include <vm/vm_map.h>
#include <vm/vm_kern.h>
#include <vm/vm_page.h>
#include <pexpert/pexpert.h>
#include <machine/machparam.h>
#include <machine/machine_routines.h>
#include <libkern/OSDebug.h>
#include <libkern/OSAtomic.h>
#include <sys/kdebug.h>
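/*
 * TRUE if [addr, addr + size) lies entirely within the zone map.
 * Memory outside this range is "foreign" and is only legal in zones
 * that have allows_foreign set.
 */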
#define from_zone_map(addr, size) \
	((vm_offset_t)(addr) >= zone_map_min_address && \
	 ((vm_offset_t)(addr) + (size) - 1) < zone_map_max_address)
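/*
 * Lock-free sampling counter: atomically increments *count_p modulo
 * factor and returns TRUE on every factor'th call, when the counter
 * rolls over. Used to sample a fraction of allocation/free events.
 */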
static inline boolean_t
sample_counter(volatile uint32_t * count_p, uint32_t factor)
{
uint32_t old_count, new_count;
boolean_t rolled_over;
do {
new_count = old_count = *count_p;
if (++new_count >= factor) {
rolled_over = TRUE;
new_count = 0;
} else {
rolled_over = FALSE;
}
} while (!OSCompareAndSwap(old_count, new_count, count_p));
return rolled_over;
}
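/*
 * Zone element poisoning
 *
 * On (sampled) free, the element body is filled with ZP_POISON; on the
 * next allocation the fill is verified to catch use-after-free writes.
 * The freelist next pointer is stored twice, at the start (primary) and
 * end (backup) of the element, each XOR'd with a per-boot cookie so a
 * stray write is detectable; the backup's cookie also records whether
 * the element was poisoned. zp_factor and zp_scale control the sampling
 * rate and can be overridden with the zp-factor/zp-scale boot-args;
 * -zp poisons every free and -no-zp disables poisoning entirely.
 */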
#if defined(__LP64__)
#define ZP_POISON 0xdeadbeefdeadbeef
#else
#define ZP_POISON 0xdeadbeef
#endif
#define ZP_DEFAULT_SAMPLING_FACTOR 16
#define ZP_DEFAULT_SCALE_FACTOR 4
uint32_t zp_factor = 0;
uint32_t zp_scale = 0;
vm_size_t zp_tiny_zone_limit = 0;
uintptr_t zp_poisoned_cookie = 0;
uintptr_t zp_nopoison_cookie = 0;
static inline void
zp_init(void)
{
char temp_buf[16];
zp_poisoned_cookie = (uintptr_t) early_random();
ml_cpu_info_t cpu_info;
ml_cpu_get_info(&cpu_info);
zp_tiny_zone_limit = (vm_size_t) cpu_info.cache_line_size;
zp_factor = ZP_DEFAULT_SAMPLING_FACTOR;
zp_scale = ZP_DEFAULT_SCALE_FACTOR;
if (zp_factor != 0) {
uint32_t rand_bits = early_random() & 0x3;
if (rand_bits == 0x1)
zp_factor += 1;
else if (rand_bits == 0x2)
zp_factor -= 1;
}
if (PE_parse_boot_argn("-zp", temp_buf, sizeof(temp_buf))) {
zp_factor = 1;
}
if (PE_parse_boot_argn("-no-zp", temp_buf, sizeof(temp_buf))) {
zp_factor = 0;
zp_tiny_zone_limit = 0;
printf("Zone poisoning disabled\n");
}
if (PE_parse_boot_argn("zp-factor", &zp_factor, sizeof(zp_factor))) {
printf("Zone poisoning factor override: %u\n", zp_factor);
}
if (PE_parse_boot_argn("zp-scale", &zp_scale, sizeof(zp_scale))) {
printf("Zone poisoning scale factor override: %u\n", zp_scale);
}
zp_nopoison_cookie = (uintptr_t) early_random();
#if MACH_ASSERT
if (zp_poisoned_cookie == zp_nopoison_cookie)
panic("early_random() is broken: %p and %p are not random\n",
(void *) zp_poisoned_cookie, (void *) zp_nopoison_cookie);
#endif
	/* The low bit of the backup pointer records whether the element was poisoned */
	zp_poisoned_cookie |= (uintptr_t)0x1ULL;
	zp_nopoison_cookie &= ~((uintptr_t)0x1ULL);
#if defined(__LP64__)
	/*
	 * Make the cookies visually distinct in a debugger: XORing a kernel
	 * pointer (top bits 0xFFFFFF...) with these values tags poisoned
	 * backup pointers with 0xFACADE... and unpoisoned ones with 0xC0FFEE...
	 */
	zp_poisoned_cookie &= 0x000000FFFFFFFFFF;
	zp_poisoned_cookie |= 0x0535210000000000; /* 0xFFFFFF ^ 0x053521 == 0xFACADE */
	zp_nopoison_cookie &= 0x000000FFFFFFFFFF;
	zp_nopoison_cookie |= 0x3f00110000000000; /* 0xFFFFFF ^ 0x3f0011 == 0xC0FFEE */
#endif
}
#define ZONE_PAGE_COUNT_INCR(z, count) \
{ \
	OSAddAtomic64((count), &((z)->page_count)); \
}
#define ZONE_PAGE_COUNT_DECR(z, count) \
{ \
	OSAddAtomic64(-(count), &((z)->page_count)); \
}
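/*
 * All zone memory comes from the zone map, a suballocation of
 * kernel_map created in zone_init(). Its bounds are kept in globals so
 * from_zone_map() can be evaluated without taking any lock.
 */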
vm_map_t zone_map = VM_MAP_NULL;
vm_offset_t zone_map_min_address = 0;
vm_offset_t zone_map_max_address = 0;
#define MAX_ENTROPY_PER_ZCRAM 4
#define RANDOM_BOOL_GEN_SEED_COUNT 4
static unsigned int bool_gen_seed[RANDOM_BOOL_GEN_SEED_COUNT];
static unsigned int bool_gen_global = 0;
decl_simple_lock_data(, bool_gen_lock)
vm_offset_t zone_metadata_region_min = 0;
vm_offset_t zone_metadata_region_max = 0;
decl_lck_mtx_data(static ,zone_metadata_region_lck)
lck_attr_t zone_metadata_lock_attr;
lck_mtx_ext_t zone_metadata_region_lck_ext;
struct zone_free_element {
struct zone_free_element *next;
};
decl_simple_lock_data(, all_zones_lock)
unsigned int num_zones;
#define MAX_ZONES 256
struct zone zone_array[MAX_ZONES];
static int zone_array_index = 0;
#define MULTIPAGE_METADATA_MAGIC (0xff)
#define PAGE_METADATA_GET_ZINDEX(page_meta) \
(page_meta->zindex)
#define PAGE_METADATA_GET_ZONE(page_meta) \
(&(zone_array[page_meta->zindex]))
#define PAGE_METADATA_SET_ZINDEX(page_meta, index) \
page_meta->zindex = (index);
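/*
 * Each page in the zone map has a struct zone_page_metadata, kept in a
 * parallel VA-only region (zone_metadata_region_min/max) indexed by
 * page number. The first page of a multi-page chunk carries the real
 * metadata; trailing pages have zindex set to MULTIPAGE_METADATA_MAGIC
 * and store the backward offset to the real metadata instead of a
 * freelist. For foreign (out-of-map) pages the metadata lives at the
 * start of the page itself.
 */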
struct zone_page_metadata {
queue_chain_t pages;
union {
uint32_t freelist_offset;
uint32_t real_metadata_offset;
};
uint16_t free_count;
uint8_t zindex;
uint8_t page_count;
};
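/*
 * Translate between elements, zone map page indices, pages, and their
 * metadata entries. The freelist head is stored as a byte offset from
 * the start of the page; PAGE_METADATA_EMPTY_FREELIST marks an empty list.
 */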
#define PAGE_INDEX_FOR_ELEMENT(element) \
(((vm_offset_t)trunc_page(element) - zone_map_min_address) / PAGE_SIZE)
#define PAGE_METADATA_FOR_PAGE_INDEX(index) \
(zone_metadata_region_min + ((index) * sizeof(struct zone_page_metadata)))
#define PAGE_INDEX_FOR_METADATA(page_meta) \
(((vm_offset_t)page_meta - zone_metadata_region_min) / sizeof(struct zone_page_metadata))
#define PAGE_FOR_PAGE_INDEX(index) \
(zone_map_min_address + (PAGE_SIZE * (index)))
#define PAGE_METADATA_FOR_ELEMENT(element) \
(struct zone_page_metadata *)(PAGE_METADATA_FOR_PAGE_INDEX(PAGE_INDEX_FOR_ELEMENT(element)))
#define PAGE_METADATA_EMPTY_FREELIST ((uint32_t)(~0))
static inline void *
page_metadata_get_freelist(struct zone_page_metadata *page_meta)
{
assert(PAGE_METADATA_GET_ZINDEX(page_meta) != MULTIPAGE_METADATA_MAGIC);
if (page_meta->freelist_offset == PAGE_METADATA_EMPTY_FREELIST)
return NULL;
else {
if (from_zone_map(page_meta, sizeof(struct zone_page_metadata)))
return (void *)(PAGE_FOR_PAGE_INDEX(PAGE_INDEX_FOR_METADATA(page_meta)) + page_meta->freelist_offset);
else
return (void *)((vm_offset_t)page_meta + page_meta->freelist_offset);
}
}
static inline void
page_metadata_set_freelist(struct zone_page_metadata *page_meta, void *addr)
{
assert(PAGE_METADATA_GET_ZINDEX(page_meta) != MULTIPAGE_METADATA_MAGIC);
if (addr == NULL)
page_meta->freelist_offset = PAGE_METADATA_EMPTY_FREELIST;
else {
if (from_zone_map(page_meta, sizeof(struct zone_page_metadata)))
page_meta->freelist_offset = (uint32_t)((vm_offset_t)(addr) - PAGE_FOR_PAGE_INDEX(PAGE_INDEX_FOR_METADATA(page_meta)));
else
page_meta->freelist_offset = (uint32_t)((vm_offset_t)(addr) - (vm_offset_t)page_meta);
}
}
static inline struct zone_page_metadata *
page_metadata_get_realmeta(struct zone_page_metadata *page_meta)
{
assert(PAGE_METADATA_GET_ZINDEX(page_meta) == MULTIPAGE_METADATA_MAGIC);
return (struct zone_page_metadata *)((vm_offset_t)page_meta - page_meta->real_metadata_offset);
}
static inline void
page_metadata_set_realmeta(struct zone_page_metadata *page_meta, struct zone_page_metadata *real_meta)
{
assert(PAGE_METADATA_GET_ZINDEX(page_meta) == MULTIPAGE_METADATA_MAGIC);
assert(PAGE_METADATA_GET_ZINDEX(real_meta) != MULTIPAGE_METADATA_MAGIC);
assert((vm_offset_t)page_meta > (vm_offset_t)real_meta);
vm_offset_t offset = (vm_offset_t)page_meta - (vm_offset_t)real_meta;
assert(offset <= UINT32_MAX);
page_meta->real_metadata_offset = (uint32_t)offset;
}
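/*
 * The backup copy of the freelist next pointer occupies the last
 * pointer-sized slot of a free element (the primary copy is at offset 0).
 */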
static inline vm_offset_t *
get_backup_ptr(vm_size_t elem_size,
vm_offset_t *element)
{
return (vm_offset_t *) ((vm_offset_t)element + elem_size - sizeof(vm_offset_t));
}
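/*
 * The metadata region is reserved VA-only; fault in the page(s) backing
 * this metadata entry on first use. The pmap check is done twice so the
 * common already-populated case avoids taking the mutex.
 */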
static inline void
zone_populate_metadata_page(struct zone_page_metadata *page_meta)
{
	vm_offset_t page_metadata_begin = trunc_page((vm_offset_t)page_meta);
	/* -1 so metadata ending exactly on a page boundary doesn't touch an extra page */
	vm_offset_t page_metadata_end = trunc_page((vm_offset_t)page_meta + sizeof(struct zone_page_metadata) - 1);
	for (; page_metadata_begin <= page_metadata_end; page_metadata_begin += PAGE_SIZE) {
if (pmap_find_phys(kernel_pmap, (vm_map_address_t)page_metadata_begin))
continue;
lck_mtx_lock(&zone_metadata_region_lck);
if (0 == pmap_find_phys(kernel_pmap, (vm_map_address_t)page_metadata_begin)) {
kernel_memory_populate(zone_map,
page_metadata_begin,
PAGE_SIZE,
KMA_KOBJECT,
VM_KERN_MEMORY_OSFMK);
}
lck_mtx_unlock(&zone_metadata_region_lck);
}
return;
}
static inline uint16_t
get_metadata_alloc_count(struct zone_page_metadata *page_meta)
{
assert(PAGE_METADATA_GET_ZINDEX(page_meta) != MULTIPAGE_METADATA_MAGIC);
struct zone *z = PAGE_METADATA_GET_ZONE(page_meta);
return ((page_meta->page_count * PAGE_SIZE) / z->elem_size);
}
static inline struct zone_page_metadata *
get_zone_page_metadata(struct zone_free_element *element, boolean_t init)
{
struct zone_page_metadata *page_meta = 0;
if (from_zone_map(element, sizeof(struct zone_free_element))) {
page_meta = (struct zone_page_metadata *)(PAGE_METADATA_FOR_ELEMENT(element));
if (init)
zone_populate_metadata_page(page_meta);
} else {
page_meta = (struct zone_page_metadata *)(trunc_page((vm_offset_t)element));
}
if (init)
bzero((char *)page_meta, sizeof(struct zone_page_metadata));
return ((PAGE_METADATA_GET_ZINDEX(page_meta) != MULTIPAGE_METADATA_MAGIC) ? page_meta : page_metadata_get_realmeta(page_meta));
}
static inline vm_offset_t
get_zone_page(struct zone_page_metadata *page_meta)
{
if (from_zone_map(page_meta, sizeof(struct zone_page_metadata)))
return (vm_offset_t)(PAGE_FOR_PAGE_INDEX(PAGE_INDEX_FOR_METADATA(page_meta)));
else
return (vm_offset_t)(trunc_page(page_meta));
}
vm_size_t
zone_element_size(void *addr, zone_t *z)
{
struct zone *src_zone;
if (from_zone_map(addr, sizeof(void *))) {
struct zone_page_metadata *page_meta = get_zone_page_metadata((struct zone_free_element *)addr, FALSE);
src_zone = PAGE_METADATA_GET_ZONE(page_meta);
if (z) {
*z = src_zone;
}
return (src_zone->elem_size);
} else {
#if CONFIG_GZALLOC
vm_size_t gzsize;
if (gzalloc_element_size(addr, z, &gzsize)) {
return gzsize;
}
#endif
return 0;
}
}
static inline boolean_t
is_sane_zone_ptr(zone_t zone,
vm_offset_t addr,
size_t obj_size)
{
if (__improbable((addr & (sizeof(vm_offset_t) - 1)) != 0))
return FALSE;
if (__improbable(!pmap_kernel_va(addr)))
return FALSE;
if (zone->collectable && !zone->allows_foreign) {
if (addr >= zone_map_min_address &&
(addr + obj_size - 1) < zone_map_max_address )
return TRUE;
return FALSE;
}
return TRUE;
}
static inline boolean_t
is_sane_zone_page_metadata(zone_t zone,
vm_offset_t page_meta)
{
if (page_meta == 0)
return FALSE;
return is_sane_zone_ptr(zone, page_meta, sizeof(struct zone_page_metadata));
}
static inline boolean_t
is_sane_zone_element(zone_t zone,
vm_offset_t addr)
{
if (addr == 0)
return TRUE;
return is_sane_zone_ptr(zone, addr, zone->elem_size);
}
static inline void
zone_element_was_modified_panic(zone_t zone,
vm_offset_t element,
vm_offset_t found,
vm_offset_t expected,
vm_offset_t offset)
{
panic("a freed zone element has been modified in zone %s: expected %p but found %p, bits changed %p, at offset %d of %d in element %p, cookies %p %p",
zone->zone_name,
(void *) expected,
(void *) found,
(void *) (expected ^ found),
(uint32_t) offset,
(uint32_t) zone->elem_size,
(void *) element,
(void *) zp_nopoison_cookie,
(void *) zp_poisoned_cookie);
}
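/*
 * The primary and backup freelist pointers disagree. Try to work out,
 * from the poison bit and the LP64 tag bits, which copy was corrupted,
 * then panic with the most plausible diagnosis.
 */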
static void
backup_ptr_mismatch_panic(zone_t zone,
vm_offset_t element,
vm_offset_t primary,
vm_offset_t backup)
{
vm_offset_t likely_backup;
vm_offset_t likely_primary;
likely_primary = primary ^ zp_nopoison_cookie;
boolean_t sane_backup;
boolean_t sane_primary = is_sane_zone_element(zone, likely_primary);
boolean_t element_was_poisoned = (backup & 0x1) ? TRUE : FALSE;
#if defined(__LP64__)
if ((backup & 0xFFFFFF0000000000) == 0xFACADE0000000000)
element_was_poisoned = TRUE;
else if ((backup & 0xFFFFFF0000000000) == 0xC0FFEE0000000000)
element_was_poisoned = FALSE;
#endif
if (element_was_poisoned) {
likely_backup = backup ^ zp_poisoned_cookie;
sane_backup = is_sane_zone_element(zone, likely_backup);
} else {
likely_backup = backup ^ zp_nopoison_cookie;
sane_backup = is_sane_zone_element(zone, likely_backup);
}
	/* The primary pointer is definitely the corrupted one */
	if (!sane_primary && sane_backup)
		zone_element_was_modified_panic(zone, element, primary, (likely_backup ^ zp_nopoison_cookie), 0);
	/* The backup pointer is definitely the corrupted one */
	if (sane_primary && !sane_backup)
		zone_element_was_modified_panic(zone, element, backup,
		    (primary ^ (element_was_poisoned ? zp_poisoned_cookie : zp_nopoison_cookie)),
		    zone->elem_size - sizeof(vm_offset_t));
	/*
	 * Both look sane, so we can't tell which was overwritten; guess that
	 * the primary was clobbered with a sane-looking but wrong address.
	 */
	if (sane_primary && sane_backup)
		zone_element_was_modified_panic(zone, element, primary, likely_backup, 0);
	/* Neither is sane; the panic above doesn't return, so just guess here too. */
	zone_element_was_modified_panic(zone, element, primary, likely_backup, 0);
}
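/*
 * Push an element onto its page's freelist, storing the old head in
 * both the primary and backup slots (XOR'd with the appropriate
 * cookies), and requeue the page between the all_used / intermediate /
 * all_free / any_free_foreign queues as its free count changes.
 * Called with the zone locked.
 */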
static inline void
free_to_zone(zone_t zone,
vm_offset_t element,
boolean_t poison)
{
vm_offset_t old_head;
struct zone_page_metadata *page_meta;
vm_offset_t *primary = (vm_offset_t *) element;
vm_offset_t *backup = get_backup_ptr(zone->elem_size, primary);
page_meta = get_zone_page_metadata((struct zone_free_element *)element, FALSE);
assert(PAGE_METADATA_GET_ZONE(page_meta) == zone);
old_head = (vm_offset_t)page_metadata_get_freelist(page_meta);
#if MACH_ASSERT
if (__improbable(!is_sane_zone_element(zone, old_head)))
panic("zfree: invalid head pointer %p for freelist of zone %s\n",
(void *) old_head, zone->zone_name);
#endif
if (__improbable(!is_sane_zone_element(zone, element)))
panic("zfree: freeing invalid pointer %p to zone %s\n",
(void *) element, zone->zone_name);
*backup = old_head ^ (poison ? zp_poisoned_cookie : zp_nopoison_cookie);
*primary = old_head ^ zp_nopoison_cookie;
page_metadata_set_freelist(page_meta, (struct zone_free_element *)element);
page_meta->free_count++;
	if (zone->allows_foreign && !from_zone_map(element, zone->elem_size)) {
		if (page_meta->free_count == 1) {
			/* first foreign element freed on this page: move it off all_used */
			re_queue_tail(&zone->pages.any_free_foreign, &(page_meta->pages));
		}
	} else if (page_meta->free_count == get_metadata_alloc_count(page_meta)) {
		/* whole chunk is now free: move it to all_free */
		re_queue_tail(&zone->pages.all_free, &(page_meta->pages));
		zone->count_all_free_pages += page_meta->page_count;
	} else if (page_meta->free_count == 1) {
		/* first free element in the chunk: move it from all_used to intermediate */
		re_queue_tail(&zone->pages.intermediate, &(page_meta->pages));
	}
zone->count--;
zone->countfree++;
}
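/*
 * Pop an element from the zone, preferring foreign pages, then
 * partially-full (intermediate) pages, then all-free chunks. Validates
 * the freelist head and its backup pointer; if the two disagree in a
 * way consistent with poisoning, *check_poison is set so the caller
 * verifies the poison fill. Returns 0 if the zone is empty.
 * Called with the zone locked.
 */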
static inline vm_offset_t
try_alloc_from_zone(zone_t zone,
boolean_t* check_poison)
{
vm_offset_t element;
struct zone_page_metadata *page_meta;
*check_poison = FALSE;
if (zone->allows_foreign && !queue_empty(&zone->pages.any_free_foreign))
page_meta = (struct zone_page_metadata *)queue_first(&zone->pages.any_free_foreign);
else if (!queue_empty(&zone->pages.intermediate))
page_meta = (struct zone_page_metadata *)queue_first(&zone->pages.intermediate);
else if (!queue_empty(&zone->pages.all_free)) {
page_meta = (struct zone_page_metadata *)queue_first(&zone->pages.all_free);
assert(zone->count_all_free_pages >= page_meta->page_count);
zone->count_all_free_pages -= page_meta->page_count;
} else {
return 0;
}
if (__improbable(!is_sane_zone_page_metadata(zone, (vm_offset_t)page_meta)))
panic("zalloc: invalid metadata structure %p for freelist of zone %s\n",
(void *) page_meta, zone->zone_name);
assert(PAGE_METADATA_GET_ZONE(page_meta) == zone);
element = (vm_offset_t)page_metadata_get_freelist(page_meta);
if (__improbable(!is_sane_zone_ptr(zone, element, zone->elem_size)))
panic("zfree: invalid head pointer %p for freelist of zone %s\n",
(void *) element, zone->zone_name);
vm_offset_t *primary = (vm_offset_t *) element;
vm_offset_t *backup = get_backup_ptr(zone->elem_size, primary);
vm_offset_t next_element = *primary ^ zp_nopoison_cookie;
vm_offset_t next_element_primary = *primary;
vm_offset_t next_element_backup = *backup;
if (__improbable(!is_sane_zone_element(zone, next_element)))
backup_ptr_mismatch_panic(zone, element, next_element_primary, next_element_backup);
if (__improbable(next_element != (next_element_backup ^ zp_nopoison_cookie))) {
if (__improbable(next_element != (next_element_backup ^ zp_poisoned_cookie)))
backup_ptr_mismatch_panic(zone, element, next_element_primary, next_element_backup);
*check_poison = TRUE;
}
if (__improbable(page_meta != get_zone_page_metadata((struct zone_free_element *)element, FALSE)))
panic("zalloc: Incorrect metadata %p found in zone %s page queue. Expected metadata: %p\n",
page_meta, zone->zone_name, get_zone_page_metadata((struct zone_free_element *)element, FALSE));
if (next_element) {
if (__improbable(page_meta != get_zone_page_metadata((struct zone_free_element *)next_element, FALSE)))
panic("zalloc: next element pointer %p for element %p points to invalid element for zone %s\n",
(void *)next_element, (void *)element, zone->zone_name);
}
page_metadata_set_freelist(page_meta, (struct zone_free_element *)next_element);
page_meta->free_count--;
if (page_meta->free_count == 0) {
re_queue_tail(&zone->pages.all_used, &(page_meta->pages));
} else {
if (!zone->allows_foreign || from_zone_map(element, zone->elem_size)) {
if (get_metadata_alloc_count(page_meta) == page_meta->free_count + 1) {
re_queue_tail(&zone->pages.intermediate, &(page_meta->pages));
}
}
}
zone->countfree--;
zone->count++;
zone->sum_count++;
return element;
}
#define ZINFO_SLOTS MAX_ZONES
void zone_display_zprint(void);
zone_t zone_find_largest(void);
void zalloc_async(
thread_call_param_t p0,
thread_call_param_t p1);
static thread_call_data_t call_async_alloc;
#define ZONE_ELEMENT_ALIGNMENT 32
#define zone_wakeup(zone) thread_wakeup((event_t)(zone))
#define zone_sleep(zone) \
(void) lck_mtx_sleep(&(zone)->lock, LCK_SLEEP_SPIN, (event_t)(zone), THREAD_UNINT);
lck_grp_t zone_locks_grp;
lck_grp_attr_t zone_locks_grp_attr;
#define lock_zone_init(zone) \
MACRO_BEGIN \
lck_attr_setdefault(&(zone)->lock_attr); \
lck_mtx_init_ext(&(zone)->lock, &(zone)->lock_ext, \
&zone_locks_grp, &(zone)->lock_attr); \
MACRO_END
#define lock_try_zone(zone) lck_mtx_try_lock_spin(&zone->lock)
decl_lck_mtx_data(, zone_gc_lock)
lck_attr_t zone_gc_lck_attr;
lck_grp_t zone_gc_lck_grp;
lck_grp_attr_t zone_gc_lck_grp_attr;
lck_mtx_ext_t zone_gc_lck_ext;
boolean_t zone_gc_allowed = TRUE;
boolean_t panic_include_zprint = FALSE;
vm_offset_t panic_kext_memory_info = 0;
vm_size_t panic_kext_memory_size = 0;
#define ZALLOC_DEBUG_ZONEGC 0x00000001
#define ZALLOC_DEBUG_ZCRAM 0x00000002
uint32_t zalloc_debug = 0;
static boolean_t log_records_init = FALSE;
static int log_records;
#define MAX_NUM_ZONES_ALLOWED_LOGGING 5
static int max_num_zones_to_log = MAX_NUM_ZONES_ALLOWED_LOGGING;
static int num_zones_logged = 0;
#define MAX_ZONE_NAME 32
static char zone_name_to_log[MAX_ZONE_NAME] = "";
boolean_t corruption_debug_flag = FALSE;
#if DEBUG || DEVELOPMENT
boolean_t leak_scan_debug_flag = FALSE;
#endif
#if defined(__LP64__)
#define ZRECORDS_MAX 2560
#else
#define ZRECORDS_MAX 1536
#endif
#define ZRECORDS_DEFAULT 1024
#define ZOP_ALLOC 1
#define ZOP_FREE 0
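/*
 * Compare a zone name against the zlog boot-arg value. Zone names may
 * contain spaces, which can't appear in boot-args, so a '.' in the
 * log name matches a ' ' in the zone name.
 */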
static int
log_this_zone(const char *zonename, const char *logname)
{
int len;
const char *zc = zonename;
const char *lc = logname;
for (len = 1; len <= MAX_ZONE_NAME; zc++, lc++, len++) {
if (*zc != *lc && !(*zc == ' ' && *lc == '.'))
break;
if (*zc == '\0')
return TRUE;
}
return FALSE;
}
#define DO_LOGGING(z) ((z)->zone_logging == TRUE && (z)->zlog_btlog)
extern boolean_t kmem_alloc_ready;
#if CONFIG_ZLEAKS
#pragma mark -
#pragma mark Zone Leak Detection
#define ZLEAK_STATE_ENABLED 0x01
#define ZLEAK_STATE_ACTIVE 0x02
#define ZLEAK_STATE_ACTIVATING 0x04
#define ZLEAK_STATE_FAILED 0x08
uint32_t zleak_state = 0;
boolean_t panic_include_ztrace = FALSE;
vm_size_t zleak_global_tracking_threshold;
vm_size_t zleak_per_zone_tracking_threshold;
unsigned int zleak_sample_factor = 1000;
unsigned int z_alloc_collisions = 0;
unsigned int z_trace_collisions = 0;
unsigned int z_alloc_overwrites = 0;
unsigned int z_trace_overwrites = 0;
unsigned int z_alloc_recorded = 0;
unsigned int z_trace_recorded = 0;
unsigned int z_total_conflicts = 0;
#pragma mark struct zallocation
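/*
 * Zone leak detection keeps two open-addressed hash tables: zallocations,
 * keyed by element address, and ztraces, keyed by backtrace hash. Each
 * live sampled allocation points at its trace; zt_size accumulates the
 * outstanding bytes per trace so the top offender can be reported.
 */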
struct zallocation {
uintptr_t za_element;
vm_size_t za_size;
uint32_t za_trace_index;
uint32_t za_hit_count;
};
uint32_t zleak_alloc_buckets = CONFIG_ZLEAK_ALLOCATION_MAP_NUM;
uint32_t zleak_trace_buckets = CONFIG_ZLEAK_TRACE_MAP_NUM;
vm_size_t zleak_max_zonemap_size;
static struct zallocation* zallocations;
static struct ztrace* ztraces;
struct ztrace* top_ztrace;
static lck_spin_t zleak_lock;
static lck_attr_t zleak_lock_attr;
static lck_grp_t zleak_lock_grp;
static lck_grp_attr_t zleak_lock_grp_attr;
static void
zleak_init(vm_size_t max_zonemap_size)
{
char scratch_buf[16];
boolean_t zleak_enable_flag = FALSE;
zleak_max_zonemap_size = max_zonemap_size;
zleak_global_tracking_threshold = max_zonemap_size / 2;
zleak_per_zone_tracking_threshold = zleak_global_tracking_threshold / 8;
if (PE_parse_boot_argn("-zleakoff", scratch_buf, sizeof(scratch_buf))) {
zleak_enable_flag = FALSE;
printf("zone leak detection disabled\n");
} else {
zleak_enable_flag = TRUE;
printf("zone leak detection enabled\n");
}
if (PE_parse_boot_argn("zfactor", &zleak_sample_factor, sizeof(zleak_sample_factor))) {
printf("Zone leak factor override: %u\n", zleak_sample_factor);
}
if (PE_parse_boot_argn("zleak-allocs", &zleak_alloc_buckets, sizeof(zleak_alloc_buckets))) {
printf("Zone leak alloc buckets override: %u\n", zleak_alloc_buckets);
if (zleak_alloc_buckets == 0 || (zleak_alloc_buckets & (zleak_alloc_buckets-1))) {
printf("Override isn't a power of two, bad things might happen!\n");
}
}
if (PE_parse_boot_argn("zleak-traces", &zleak_trace_buckets, sizeof(zleak_trace_buckets))) {
printf("Zone leak trace buckets override: %u\n", zleak_trace_buckets);
if (zleak_trace_buckets == 0 || (zleak_trace_buckets & (zleak_trace_buckets-1))) {
printf("Override isn't a power of two, bad things might happen!\n");
}
}
lck_grp_attr_setdefault(&zleak_lock_grp_attr);
lck_grp_init(&zleak_lock_grp, "zleak_lock", &zleak_lock_grp_attr);
lck_attr_setdefault(&zleak_lock_attr);
lck_spin_init(&zleak_lock, &zleak_lock_grp, &zleak_lock_attr);
if (zleak_enable_flag) {
zleak_state = ZLEAK_STATE_ENABLED;
}
}
int
get_zleak_state(void)
{
if (zleak_state & ZLEAK_STATE_FAILED)
return (-1);
if (zleak_state & ZLEAK_STATE_ACTIVE)
return (1);
return (0);
}
kern_return_t
zleak_activate(void)
{
kern_return_t retval;
vm_size_t z_alloc_size = zleak_alloc_buckets * sizeof(struct zallocation);
vm_size_t z_trace_size = zleak_trace_buckets * sizeof(struct ztrace);
void *allocations_ptr = NULL;
void *traces_ptr = NULL;
if (zleak_state & (ZLEAK_STATE_ACTIVE | ZLEAK_STATE_ACTIVATING | ZLEAK_STATE_FAILED)) {
return KERN_SUCCESS;
}
lck_spin_lock(&zleak_lock);
if (zleak_state & (ZLEAK_STATE_ACTIVE | ZLEAK_STATE_ACTIVATING | ZLEAK_STATE_FAILED)) {
lck_spin_unlock(&zleak_lock);
return KERN_SUCCESS;
}
zleak_state |= ZLEAK_STATE_ACTIVATING;
lck_spin_unlock(&zleak_lock);
retval = kmem_alloc_kobject(kernel_map, (vm_offset_t*)&allocations_ptr, z_alloc_size, VM_KERN_MEMORY_OSFMK);
if (retval != KERN_SUCCESS) {
goto fail;
}
retval = kmem_alloc_kobject(kernel_map, (vm_offset_t*)&traces_ptr, z_trace_size, VM_KERN_MEMORY_OSFMK);
if (retval != KERN_SUCCESS) {
goto fail;
}
bzero(allocations_ptr, z_alloc_size);
bzero(traces_ptr, z_trace_size);
zallocations = allocations_ptr;
ztraces = traces_ptr;
top_ztrace = &ztraces[0];
lck_spin_lock(&zleak_lock);
zleak_state |= ZLEAK_STATE_ACTIVE;
zleak_state &= ~ZLEAK_STATE_ACTIVATING;
lck_spin_unlock(&zleak_lock);
	return KERN_SUCCESS;
fail:
lck_spin_lock(&zleak_lock);
zleak_state |= ZLEAK_STATE_FAILED;
zleak_state &= ~ZLEAK_STATE_ACTIVATING;
lck_spin_unlock(&zleak_lock);
if (allocations_ptr != NULL) {
kmem_free(kernel_map, (vm_offset_t)allocations_ptr, z_alloc_size);
}
if (traces_ptr != NULL) {
kmem_free(kernel_map, (vm_offset_t)traces_ptr, z_trace_size);
}
return retval;
}
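/*
 * Record a sampled allocation and its backtrace. Uses try-lock so the
 * allocation path never spins on the zleak lock; hash collisions skip
 * or evict rather than chain. Returns FALSE only when the lock was
 * busy, so the caller can rearm sampling for this zone.
 */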
static boolean_t
zleak_log(uintptr_t* bt,
uintptr_t addr,
uint32_t depth,
vm_size_t allocation_size)
{
if (!lck_spin_try_lock(&zleak_lock)) {
z_total_conflicts++;
return FALSE;
}
struct zallocation* allocation = &zallocations[hashaddr(addr, zleak_alloc_buckets)];
uint32_t trace_index = hashbacktrace(bt, depth, zleak_trace_buckets);
struct ztrace* trace = &ztraces[trace_index];
allocation->za_hit_count++;
trace->zt_hit_count++;
if (allocation->za_element != (uintptr_t) 0 && trace_index == allocation->za_trace_index) {
z_alloc_collisions++;
lck_spin_unlock(&zleak_lock);
return TRUE;
}
if (trace->zt_size > 0 && bcmp(trace->zt_stack, bt, (depth * sizeof(uintptr_t))) != 0 ) {
trace->zt_collisions++;
z_trace_collisions++;
lck_spin_unlock(&zleak_lock);
return TRUE;
} else if (trace->zt_size > 0) {
trace->zt_size += allocation_size;
} else {
if (trace->zt_depth != 0)
z_trace_overwrites++;
z_trace_recorded++;
trace->zt_size = allocation_size;
memcpy(trace->zt_stack, bt, (depth * sizeof(uintptr_t)) );
trace->zt_depth = depth;
trace->zt_collisions = 0;
}
if (allocation->za_element != (uintptr_t) 0) {
z_alloc_collisions++;
struct ztrace* associated_trace = &ztraces[allocation->za_trace_index];
associated_trace->zt_size -= allocation->za_size;
} else if (allocation->za_trace_index != 0) {
z_alloc_overwrites++;
}
allocation->za_element = addr;
allocation->za_trace_index = trace_index;
allocation->za_size = allocation_size;
z_alloc_recorded++;
if (top_ztrace->zt_size < trace->zt_size)
top_ztrace = trace;
lck_spin_unlock(&zleak_lock);
return TRUE;
}
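/*
 * If this address was being tracked, credit the outstanding bytes back
 * to its trace and release the allocation record. The unlocked
 * pre-check keeps the common (untracked) free path fast.
 */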
static void
zleak_free(uintptr_t addr,
vm_size_t allocation_size)
{
if (addr == (uintptr_t) 0)
return;
struct zallocation* allocation = &zallocations[hashaddr(addr, zleak_alloc_buckets)];
if (allocation->za_element == addr && allocation->za_trace_index < zleak_trace_buckets) {
lck_spin_lock(&zleak_lock);
if (allocation->za_element == addr && allocation->za_trace_index < zleak_trace_buckets) {
struct ztrace *trace;
if (allocation->za_size != allocation_size) {
panic("Freeing as size %lu memory that was allocated with size %lu\n",
(uintptr_t)allocation_size, (uintptr_t)allocation->za_size);
}
trace = &ztraces[allocation->za_trace_index];
if (trace->zt_size > 0) {
trace->zt_size -= allocation_size;
}
allocation->za_element = 0;
}
lck_spin_unlock(&zleak_lock);
}
}
#endif
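/*
 * Invertible integer bit-mix (a Wang/Jenkins-style hash), used by
 * hashaddr() and hashbacktrace() to spread addresses and summed
 * backtraces over the power-of-two table sizes.
 */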
uintptr_t
hash_mix(uintptr_t x)
{
#ifndef __LP64__
x += ~(x << 15);
x ^= (x >> 10);
x += (x << 3 );
x ^= (x >> 6 );
x += ~(x << 11);
x ^= (x >> 16);
#else
x += ~(x << 32);
x ^= (x >> 22);
x += ~(x << 13);
x ^= (x >> 8 );
x += (x << 3 );
x ^= (x >> 15);
x += ~(x << 27);
x ^= (x >> 31);
#endif
return x;
}
uint32_t
hashbacktrace(uintptr_t* bt, uint32_t depth, uint32_t max_size)
{
uintptr_t hash = 0;
uintptr_t mask = max_size - 1;
while (depth) {
hash += bt[--depth];
}
hash = hash_mix(hash) & mask;
assert(hash < max_size);
return (uint32_t) hash;
}
uint32_t
hashaddr(uintptr_t pt, uint32_t max_size)
{
uintptr_t hash = 0;
uintptr_t mask = max_size - 1;
hash = hash_mix(pt) & mask;
assert(hash < max_size);
return (uint32_t) hash;
}
#pragma mark -
#define ZONE_MAX_ALLOC_SIZE (32 * 1024)
#define ZONE_ALLOC_FRAG_PERCENT(alloc_size, ele_size) ((((alloc_size) % (ele_size)) * 100) / (alloc_size))
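/*
 * zinit: create a zone of elements of `size` bytes, growable up to
 * `max` bytes, grabbing memory `alloc` bytes at a time. Note that the
 * requested alloc size is discarded in favor of the multi-page chunk
 * size (up to ZONE_MAX_ALLOC_SIZE) that wastes the smallest fraction
 * of each chunk for this element size.
 */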
zone_t
zinit(
vm_size_t size,
vm_size_t max,
vm_size_t alloc,
const char *name)
{
zone_t z;
simple_lock(&all_zones_lock);
z = &(zone_array[zone_array_index]);
zone_array_index++;
assert(zone_array_index != MAX_ZONES);
simple_unlock(&all_zones_lock);
vm_size_t minimum_element_size = sizeof(vm_offset_t) * 2;
if (size < minimum_element_size)
size = minimum_element_size;
size = ((size-1) + sizeof(vm_offset_t)) -
((size-1) % sizeof(vm_offset_t));
if (alloc == 0)
alloc = PAGE_SIZE;
alloc = round_page(alloc);
max = round_page(max);
vm_size_t best_alloc = PAGE_SIZE;
vm_size_t alloc_size;
for (alloc_size = (2 * PAGE_SIZE); alloc_size <= ZONE_MAX_ALLOC_SIZE; alloc_size += PAGE_SIZE) {
if (ZONE_ALLOC_FRAG_PERCENT(alloc_size, size) < ZONE_ALLOC_FRAG_PERCENT(best_alloc, size)) {
best_alloc = alloc_size;
}
}
alloc = best_alloc;
if (max && (max < alloc))
max = alloc;
z->free_elements = NULL;
queue_init(&z->pages.any_free_foreign);
queue_init(&z->pages.all_free);
queue_init(&z->pages.intermediate);
queue_init(&z->pages.all_used);
z->cur_size = 0;
z->page_count = 0;
z->max_size = max;
z->elem_size = size;
z->alloc_size = alloc;
z->zone_name = name;
z->count = 0;
z->countfree = 0;
z->count_all_free_pages = 0;
z->sum_count = 0LL;
z->doing_alloc_without_vm_priv = FALSE;
z->doing_alloc_with_vm_priv = FALSE;
z->exhaustible = FALSE;
z->collectable = TRUE;
z->allows_foreign = FALSE;
z->expandable = TRUE;
z->waiting = FALSE;
z->async_pending = FALSE;
z->caller_acct = TRUE;
z->noencrypt = FALSE;
z->no_callout = FALSE;
z->async_prio_refill = FALSE;
z->gzalloc_exempt = FALSE;
z->alignment_required = FALSE;
z->zone_replenishing = FALSE;
z->prio_refill_watermark = 0;
z->zone_replenish_thread = NULL;
z->zp_count = 0;
#if CONFIG_ZLEAKS
z->zleak_capture = 0;
z->zleak_on = FALSE;
#endif
lock_zone_init(z);
simple_lock(&all_zones_lock);
z->index = num_zones;
num_zones++;
simple_unlock(&all_zones_lock);
if (num_zones_logged < max_num_zones_to_log) {
int i = 1;
boolean_t zone_logging_enabled = FALSE;
char zlog_name[MAX_ZONE_NAME] = "";
while (i <= max_num_zones_to_log) {
snprintf(zlog_name, MAX_ZONE_NAME, "zlog%d", i);
if (PE_parse_boot_argn(zlog_name, zone_name_to_log, sizeof(zone_name_to_log)) == TRUE) {
if (log_this_zone(z->zone_name, zone_name_to_log)) {
z->zone_logging = TRUE;
zone_logging_enabled = TRUE;
num_zones_logged++;
break;
}
}
i++;
}
if (zone_logging_enabled == FALSE) {
if (PE_parse_boot_argn("zlog", zone_name_to_log, sizeof(zone_name_to_log)) == TRUE) {
if (log_this_zone(z->zone_name, zone_name_to_log)) {
z->zone_logging = TRUE;
zone_logging_enabled = TRUE;
num_zones_logged++;
}
}
}
if (log_records_init == FALSE && zone_logging_enabled == TRUE) {
if (PE_parse_boot_argn("zrecs", &log_records, sizeof(log_records)) == TRUE) {
log_records = MIN(ZRECORDS_MAX, log_records);
log_records_init = TRUE;
} else {
log_records = ZRECORDS_DEFAULT;
log_records_init = TRUE;
}
}
if (kmem_alloc_ready) {
zone_t curr_zone = NULL;
unsigned int max_zones = 0, zone_idx = 0;
simple_lock(&all_zones_lock);
max_zones = num_zones;
simple_unlock(&all_zones_lock);
for (zone_idx = 0; zone_idx < max_zones; zone_idx++) {
curr_zone = &(zone_array[zone_idx]);
if (curr_zone->zone_logging && curr_zone->zlog_btlog == NULL) {
curr_zone->zlog_btlog = btlog_create(log_records, MAX_ZTRACE_DEPTH, (corruption_debug_flag == FALSE) );
if (curr_zone->zlog_btlog) {
printf("zone: logging started for zone %s\n", curr_zone->zone_name);
} else {
printf("zone: couldn't allocate memory for zrecords, turning off zleak logging\n");
curr_zone->zone_logging = FALSE;
}
}
}
}
}
#if CONFIG_GZALLOC
gzalloc_zone_init(z);
#endif
return(z);
}
unsigned zone_replenish_loops, zone_replenish_wakeups, zone_replenish_wakeups_initiated, zone_replenish_throttle_count;
static void zone_replenish_thread(zone_t);
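/*
 * One replenish thread per async_prio_refill zone: sleeps until woken
 * by zalloc, then crams memory into the zone until the free count is
 * back above the refill watermark. Runs with TH_OPT_VMPRIV so it can
 * dip into reserved pages, and falls back to kernel_map if the zone
 * map is exhausted.
 */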
__attribute__((noreturn))
static void
zone_replenish_thread(zone_t z)
{
vm_size_t free_size;
current_thread()->options |= TH_OPT_VMPRIV;
for (;;) {
lock_zone(z);
z->zone_replenishing = TRUE;
assert(z->prio_refill_watermark != 0);
while ((free_size = (z->cur_size - (z->count * z->elem_size))) < (z->prio_refill_watermark * z->elem_size)) {
assert(z->doing_alloc_without_vm_priv == FALSE);
assert(z->doing_alloc_with_vm_priv == FALSE);
assert(z->async_prio_refill == TRUE);
unlock_zone(z);
int zflags = KMA_KOBJECT|KMA_NOPAGEWAIT;
vm_offset_t space, alloc_size;
kern_return_t kr;
if (vm_pool_low())
alloc_size = round_page(z->elem_size);
else
alloc_size = z->alloc_size;
if (z->noencrypt)
zflags |= KMA_NOENCRYPT;
kr = kernel_memory_allocate(zone_map, &space, alloc_size, 0, zflags, VM_KERN_MEMORY_ZONE);
if (kr == KERN_SUCCESS) {
zcram(z, space, alloc_size);
} else if (kr == KERN_RESOURCE_SHORTAGE) {
VM_PAGE_WAIT();
} else if (kr == KERN_NO_SPACE) {
kr = kernel_memory_allocate(kernel_map, &space, alloc_size, 0, zflags, VM_KERN_MEMORY_ZONE);
if (kr == KERN_SUCCESS) {
zcram(z, space, alloc_size);
} else {
assert_wait_timeout(&z->zone_replenish_thread, THREAD_UNINT, 1, 100 * NSEC_PER_USEC);
thread_block(THREAD_CONTINUE_NULL);
}
}
lock_zone(z);
zone_replenish_loops++;
}
z->zone_replenishing = FALSE;
thread_wakeup(z);
assert_wait(&z->zone_replenish_thread, THREAD_UNINT);
unlock_zone(z);
thread_block(THREAD_CONTINUE_NULL);
zone_replenish_wakeups++;
}
}
void
zone_prio_refill_configure(zone_t z, vm_size_t low_water_mark) {
z->prio_refill_watermark = low_water_mark;
z->async_prio_refill = TRUE;
OSMemoryBarrier();
kern_return_t tres = kernel_thread_start_priority((thread_continue_t)zone_replenish_thread, z, MAXPRI_KERNEL, &z->zone_replenish_thread);
if (tres != KERN_SUCCESS) {
panic("zone_prio_refill_configure, thread create: 0x%x", tres);
}
thread_deallocate(z->zone_replenish_thread);
}
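/*
 * Mark the trailing pages of a multi-page chunk: each gets
 * MULTIPAGE_METADATA_MAGIC and an offset back to the first page's
 * (real) metadata.
 */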
static inline void
zcram_metadata_init(vm_offset_t newmem, vm_size_t size, struct zone_page_metadata *chunk_metadata)
{
struct zone_page_metadata *page_metadata;
size -= PAGE_SIZE;
newmem += PAGE_SIZE;
for (; size > 0; newmem += PAGE_SIZE, size -= PAGE_SIZE) {
page_metadata = get_zone_page_metadata((struct zone_free_element *)newmem, TRUE);
assert(page_metadata != chunk_metadata);
PAGE_METADATA_SET_ZINDEX(page_metadata, MULTIPAGE_METADATA_MAGIC);
page_metadata_set_realmeta(page_metadata, chunk_metadata);
page_metadata->free_count = 0;
}
return;
}
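/*
 * Small KISS-style pseudo-random generator (xorshift + add-with-carry +
 * linear congruential), seeded from early_random(); fills a buffer of
 * bits used to randomize freelist order in zcram(). Not cryptographic,
 * just cheap shuffling entropy.
 */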
static void random_bool_gen_entropy(
int *buffer,
int count)
{
int i, t;
simple_lock(&bool_gen_lock);
for (i = 0; i < count; i++) {
		/* xorshift step */
		bool_gen_seed[1] ^= (bool_gen_seed[1] << 5);
		bool_gen_seed[1] ^= (bool_gen_seed[1] >> 7);
		bool_gen_seed[1] ^= (bool_gen_seed[1] << 22);
		/* add-with-carry step; the carry bit lives in bool_gen_global */
		t = bool_gen_seed[2] + bool_gen_seed[3] + bool_gen_global;
		bool_gen_seed[2] = bool_gen_seed[3];
		bool_gen_global = t < 0;
		bool_gen_seed[3] = t & 2147483647;
		/* linear congruential step */
		bool_gen_seed[0] += 1411392427;
		buffer[i] = (bool_gen_seed[0] + bool_gen_seed[1] + bool_gen_seed[3]);
}
simple_unlock(&bool_gen_lock);
}
static boolean_t random_bool_gen(
int *buffer,
int index,
int bufsize)
{
int valindex, bitpos;
valindex = (index / (8 * sizeof(int))) % bufsize;
bitpos = index % (8 * sizeof(int));
return (boolean_t)(buffer[valindex] & (1 << bitpos));
}
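/*
 * Free a run of new elements to the zone, taking each element from
 * either end of the range based on the entropy bits so the initial
 * freelist order is randomized. An element whose address coincides
 * with the zone structure itself is skipped (the count++ elsewhere
 * compensates for free_to_zone's decrement).
 */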
static void
random_free_to_zone(
zone_t zone,
vm_offset_t newmem,
vm_offset_t first_element_offset,
int element_count,
int *entropy_buffer)
{
vm_offset_t last_element_offset;
vm_offset_t element_addr;
vm_size_t elem_size;
int index;
elem_size = zone->elem_size;
last_element_offset = first_element_offset + ((element_count * elem_size) - elem_size);
for (index = 0; index < element_count; index++) {
assert(first_element_offset <= last_element_offset);
if (
#if DEBUG || DEVELOPMENT
leak_scan_debug_flag ||
#endif
random_bool_gen(entropy_buffer, index, MAX_ENTROPY_PER_ZCRAM)) {
element_addr = newmem + first_element_offset;
first_element_offset += elem_size;
} else {
element_addr = newmem + last_element_offset;
last_element_offset -= elem_size;
}
if (element_addr != (vm_offset_t)zone) {
zone->count++;
free_to_zone(zone, element_addr, FALSE);
}
zone->cur_size += elem_size;
}
}
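/*
 * zcram: add newly allocated memory to a zone. Sets up the chunk
 * metadata, then frees the contained elements in random order. Foreign
 * memory (outside the zone map) keeps its metadata in the first bytes
 * of each page, so its elements start after an aligned metadata header.
 */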
void
zcram(
zone_t zone,
vm_offset_t newmem,
vm_size_t size)
{
vm_size_t elem_size;
boolean_t from_zm = FALSE;
int element_count;
int entropy_buffer[MAX_ENTROPY_PER_ZCRAM];
assert(zone != ZONE_NULL && newmem != (vm_offset_t)0);
assert(!zone->collectable || zone->allows_foreign
|| (from_zone_map(newmem, size)));
elem_size = zone->elem_size;
KERNEL_DEBUG_CONSTANT(MACHDBG_CODE(DBG_MACH_ZALLOC, ZALLOC_ZCRAM) | DBG_FUNC_START, VM_KERNEL_ADDRPERM(zone), size, 0, 0, 0);
if (from_zone_map(newmem, size))
from_zm = TRUE;
if (!from_zm) {
assert((zone->allows_foreign == TRUE) && (zone->elem_size <= (PAGE_SIZE - sizeof(struct zone_page_metadata))));
}
if (zalloc_debug & ZALLOC_DEBUG_ZCRAM)
kprintf("zcram(%p[%s], 0x%lx%s, 0x%lx)\n", zone, zone->zone_name,
(unsigned long)newmem, from_zm ? "" : "[F]", (unsigned long)size);
ZONE_PAGE_COUNT_INCR(zone, (size / PAGE_SIZE));
random_bool_gen_entropy(entropy_buffer, MAX_ENTROPY_PER_ZCRAM);
struct zone_page_metadata *chunk_metadata;
size_t zone_page_metadata_size = sizeof(struct zone_page_metadata);
assert((newmem & PAGE_MASK) == 0);
assert((size & PAGE_MASK) == 0);
chunk_metadata = get_zone_page_metadata((struct zone_free_element *)newmem, TRUE);
chunk_metadata->pages.next = NULL;
chunk_metadata->pages.prev = NULL;
page_metadata_set_freelist(chunk_metadata, 0);
PAGE_METADATA_SET_ZINDEX(chunk_metadata, zone->index);
chunk_metadata->free_count = 0;
chunk_metadata->page_count = (size / PAGE_SIZE);
zcram_metadata_init(newmem, size, chunk_metadata);
lock_zone(zone);
enqueue_tail(&zone->pages.all_used, &(chunk_metadata->pages));
if (!from_zm) {
for (; size > 0; newmem += PAGE_SIZE, size -= PAGE_SIZE) {
vm_offset_t first_element_offset = 0;
if (zone_page_metadata_size % ZONE_ELEMENT_ALIGNMENT == 0){
first_element_offset = zone_page_metadata_size;
} else {
first_element_offset = zone_page_metadata_size + (ZONE_ELEMENT_ALIGNMENT - (zone_page_metadata_size % ZONE_ELEMENT_ALIGNMENT));
}
element_count = (int)((PAGE_SIZE - first_element_offset) / elem_size);
random_free_to_zone(zone, newmem, first_element_offset, element_count, entropy_buffer);
}
} else {
element_count = (int)(size / elem_size);
random_free_to_zone(zone, newmem, 0, element_count, entropy_buffer);
}
unlock_zone(zone);
KERNEL_DEBUG_CONSTANT(MACHDBG_CODE(DBG_MACH_ZALLOC, ZALLOC_ZCRAM) | DBG_FUNC_END, VM_KERNEL_ADDRPERM(zone), 0, 0, 0, 0);
}
int
zfill(
zone_t zone,
int nelem)
{
kern_return_t kr;
vm_size_t size;
vm_offset_t memory;
int nalloc;
assert(nelem > 0);
if (nelem <= 0)
return 0;
size = nelem * zone->elem_size;
size = round_page(size);
kr = kmem_alloc_kobject(kernel_map, &memory, size, VM_KERN_MEMORY_ZONE);
if (kr != KERN_SUCCESS)
return 0;
zone_change(zone, Z_FOREIGN, TRUE);
zcram(zone, memory, size);
nalloc = (int)(size / zone->elem_size);
assert(nalloc >= nelem);
return nalloc;
}
void
zone_bootstrap(void)
{
char temp_buf[16];
unsigned int i;
if (!PE_parse_boot_argn("zalloc_debug", &zalloc_debug, sizeof(zalloc_debug)))
zalloc_debug = 0;
zp_init();
for (i = 0; i < RANDOM_BOOL_GEN_SEED_COUNT; i++) {
bool_gen_seed[i] = (unsigned int)early_random();
}
simple_lock_init(&bool_gen_lock, 0);
if (PE_parse_boot_argn("-zc", temp_buf, sizeof(temp_buf))) {
corruption_debug_flag = TRUE;
}
#if DEBUG || DEVELOPMENT
if (PE_parse_boot_argn("-zl", temp_buf, sizeof(temp_buf))) {
leak_scan_debug_flag = TRUE;
}
#endif
simple_lock_init(&all_zones_lock, 0);
num_zones = 0;
thread_call_setup(&call_async_alloc, zalloc_async, NULL);
lck_grp_attr_setdefault(&zone_locks_grp_attr);
lck_grp_init(&zone_locks_grp, "zone_locks", &zone_locks_grp_attr);
lck_attr_setdefault(&zone_metadata_lock_attr);
lck_mtx_init_ext(&zone_metadata_region_lck, &zone_metadata_region_lck_ext, &zone_locks_grp, &zone_metadata_lock_attr);
}
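/*
 * Second-stage initialization: carve the zone map out of kernel_map and
 * reserve (VA-only) the parallel page metadata region, which is then
 * populated lazily by zone_populate_metadata_page().
 */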
void
zone_init(
vm_size_t max_zonemap_size)
{
kern_return_t retval;
vm_offset_t zone_min;
vm_offset_t zone_max;
vm_offset_t zone_metadata_space;
unsigned int zone_pages;
retval = kmem_suballoc(kernel_map, &zone_min, max_zonemap_size,
FALSE, VM_FLAGS_ANYWHERE | VM_FLAGS_PERMANENT | VM_MAKE_TAG(VM_KERN_MEMORY_ZONE),
&zone_map);
if (retval != KERN_SUCCESS)
panic("zone_init: kmem_suballoc failed");
zone_max = zone_min + round_page(max_zonemap_size);
#if CONFIG_GZALLOC
gzalloc_init(max_zonemap_size);
#endif
zone_map_min_address = zone_min;
zone_map_max_address = zone_max;
zone_pages = (unsigned int)atop_kernel(zone_max - zone_min);
zone_metadata_space = round_page(zone_pages * sizeof(struct zone_page_metadata));
retval = kernel_memory_allocate(zone_map, &zone_metadata_region_min, zone_metadata_space,
0, KMA_KOBJECT | KMA_VAONLY | KMA_PERMANENT, VM_KERN_MEMORY_OSFMK);
if (retval != KERN_SUCCESS)
panic("zone_init: zone_metadata_region initialization failed!");
zone_metadata_region_max = zone_metadata_region_min + zone_metadata_space;
#if defined(__LP64__)
if ((vm_page_t)(VM_PAGE_UNPACK_PTR(VM_PAGE_PACK_PTR(zone_metadata_region_max))) != (vm_page_t)zone_metadata_region_max)
panic("VM_PAGE_PACK_PTR failed on zone_metadata_region_max - %p", (void *)zone_metadata_region_max);
if ((vm_page_t)(VM_PAGE_UNPACK_PTR(VM_PAGE_PACK_PTR(zone_map_max_address))) != (vm_page_t)zone_map_max_address)
panic("VM_PAGE_PACK_PTR failed on zone_map_max_address - %p", (void *)zone_map_max_address);
#endif
lck_grp_attr_setdefault(&zone_gc_lck_grp_attr);
lck_grp_init(&zone_gc_lck_grp, "zone_gc", &zone_gc_lck_grp_attr);
lck_attr_setdefault(&zone_gc_lck_attr);
lck_mtx_init_ext(&zone_gc_lock, &zone_gc_lck_ext, &zone_gc_lck_grp, &zone_gc_lck_attr);
#if CONFIG_ZLEAKS
zleak_init(max_zonemap_size);
#endif
}
extern volatile SInt32 kfree_nop_count;
#pragma mark -
#pragma mark zalloc_canblock
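/*
 * Core allocation path. Handles gzalloc interception, allocation
 * logging and leak sampling, priority-refill throttling, growing the
 * zone (with expansion serialized via the doing_alloc_* flags),
 * poison verification, and scrubbing the freelist pointer slots of the
 * returned element with ZP_POISON.
 */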
static void *
zalloc_internal(
zone_t zone,
boolean_t canblock,
boolean_t nopagewait)
{
vm_offset_t addr = 0;
kern_return_t retval;
uintptr_t zbt[MAX_ZTRACE_DEPTH];
int numsaved = 0;
boolean_t zone_replenish_wakeup = FALSE, zone_alloc_throttle = FALSE;
#if CONFIG_GZALLOC
boolean_t did_gzalloc = FALSE;
#endif
thread_t thr = current_thread();
boolean_t check_poison = FALSE;
boolean_t set_doing_alloc_with_vm_priv = FALSE;
#if CONFIG_ZLEAKS
uint32_t zleak_tracedepth = 0;
#endif
assert(zone != ZONE_NULL);
#if CONFIG_GZALLOC
addr = gzalloc_alloc(zone, canblock);
did_gzalloc = (addr != 0);
#endif
if (__improbable(DO_LOGGING(zone)))
numsaved = OSBacktrace((void*) zbt, MAX_ZTRACE_DEPTH);
#if CONFIG_ZLEAKS
if (__improbable(zone->zleak_on && sample_counter(&zone->zleak_capture, zleak_sample_factor) == TRUE)) {
if (numsaved == 0)
zleak_tracedepth = backtrace(zbt, MAX_ZTRACE_DEPTH);
else
zleak_tracedepth = numsaved;
}
#endif
lock_zone(zone);
if (zone->async_prio_refill && zone->zone_replenish_thread) {
do {
vm_size_t zfreec = (zone->cur_size - (zone->count * zone->elem_size));
vm_size_t zrefillwm = zone->prio_refill_watermark * zone->elem_size;
zone_replenish_wakeup = (zfreec < zrefillwm);
zone_alloc_throttle = (zfreec < (zrefillwm / 2)) && ((thr->options & TH_OPT_VMPRIV) == 0);
if (zone_replenish_wakeup) {
zone_replenish_wakeups_initiated++;
thread_wakeup(&zone->zone_replenish_thread);
unlock_zone(zone);
if (zone_alloc_throttle) {
zone_replenish_throttle_count++;
assert_wait_timeout(zone, THREAD_UNINT, 1, NSEC_PER_MSEC);
thread_block(THREAD_CONTINUE_NULL);
}
lock_zone(zone);
}
} while (zone_alloc_throttle == TRUE);
}
if (__probable(addr == 0))
addr = try_alloc_from_zone(zone, &check_poison);
while ((addr == 0) && canblock) {
if ((zone->doing_alloc_without_vm_priv || zone->doing_alloc_with_vm_priv) &&
(((thr->options & TH_OPT_VMPRIV) == 0) || zone->doing_alloc_with_vm_priv)) {
zone->waiting = TRUE;
zone_sleep(zone);
} else {
vm_offset_t space;
vm_size_t alloc_size;
int retry = 0;
if ((zone->cur_size + zone->elem_size) >
zone->max_size) {
if (zone->exhaustible)
break;
if (zone->expandable) {
zone->max_size += (zone->max_size >> 1);
} else {
unlock_zone(zone);
panic_include_zprint = TRUE;
#if CONFIG_ZLEAKS
if (zleak_state & ZLEAK_STATE_ACTIVE)
panic_include_ztrace = TRUE;
#endif
panic("zalloc: zone \"%s\" empty.", zone->zone_name);
}
}
set_thread_rwlock_boost();
if ((thr->options & TH_OPT_VMPRIV)) {
zone->doing_alloc_with_vm_priv = TRUE;
set_doing_alloc_with_vm_priv = TRUE;
} else {
zone->doing_alloc_without_vm_priv = TRUE;
}
unlock_zone(zone);
for (;;) {
int zflags = KMA_KOBJECT|KMA_NOPAGEWAIT;
if (vm_pool_low() || retry >= 1)
alloc_size =
round_page(zone->elem_size);
else
alloc_size = zone->alloc_size;
if (zone->noencrypt)
zflags |= KMA_NOENCRYPT;
retval = kernel_memory_allocate(zone_map, &space, alloc_size, 0, zflags, VM_KERN_MEMORY_ZONE);
if (retval == KERN_SUCCESS) {
#if CONFIG_ZLEAKS
if ((zleak_state & (ZLEAK_STATE_ENABLED | ZLEAK_STATE_ACTIVE)) == ZLEAK_STATE_ENABLED) {
if (zone_map->size >= zleak_global_tracking_threshold) {
kern_return_t kr;
kr = zleak_activate();
if (kr != KERN_SUCCESS) {
printf("Failed to activate live zone leak debugging (%d).\n", kr);
}
}
}
if ((zleak_state & ZLEAK_STATE_ACTIVE) && !(zone->zleak_on)) {
if (zone->cur_size > zleak_per_zone_tracking_threshold) {
zone->zleak_on = TRUE;
}
}
#endif
zcram(zone, space, alloc_size);
break;
} else if (retval != KERN_RESOURCE_SHORTAGE) {
retry++;
if (retry == 2) {
zone_gc();
printf("zalloc did gc\n");
zone_display_zprint();
}
if (retry == 3) {
panic_include_zprint = TRUE;
#if CONFIG_ZLEAKS
if ((zleak_state & ZLEAK_STATE_ACTIVE)) {
panic_include_ztrace = TRUE;
}
#endif
if (retval == KERN_NO_SPACE) {
zone_t zone_largest = zone_find_largest();
panic("zalloc: zone map exhausted while allocating from zone %s, likely due to memory leak in zone %s (%lu total bytes, %d elements allocated)",
zone->zone_name, zone_largest->zone_name,
(unsigned long)zone_largest->cur_size, zone_largest->count);
}
panic("zalloc: \"%s\" (%d elements) retry fail %d, kfree_nop_count: %d", zone->zone_name, zone->count, retval, (int)kfree_nop_count);
}
} else {
break;
}
}
lock_zone(zone);
if (set_doing_alloc_with_vm_priv == TRUE)
zone->doing_alloc_with_vm_priv = FALSE;
else
zone->doing_alloc_without_vm_priv = FALSE;
if (zone->waiting) {
zone->waiting = FALSE;
zone_wakeup(zone);
}
clear_thread_rwlock_boost();
addr = try_alloc_from_zone(zone, &check_poison);
if (addr == 0 &&
retval == KERN_RESOURCE_SHORTAGE) {
if (nopagewait == TRUE)
break;
unlock_zone(zone);
VM_PAGE_WAIT();
lock_zone(zone);
}
}
if (addr == 0)
addr = try_alloc_from_zone(zone, &check_poison);
}
#if CONFIG_ZLEAKS
if (addr && zleak_tracedepth > 0) {
if (!zleak_log(zbt, addr, zleak_tracedepth, zone->elem_size)) {
zone->zleak_capture = zleak_sample_factor;
}
}
#endif
if ((addr == 0) && (!canblock || nopagewait) && (zone->async_pending == FALSE) && (zone->no_callout == FALSE) && (zone->exhaustible == FALSE) && (!vm_pool_low())) {
zone->async_pending = TRUE;
unlock_zone(zone);
thread_call_enter(&call_async_alloc);
lock_zone(zone);
addr = try_alloc_from_zone(zone, &check_poison);
}
vm_offset_t inner_size = zone->elem_size;
unlock_zone(zone);
if (__improbable(DO_LOGGING(zone) && addr)) {
btlog_add_entry(zone->zlog_btlog, (void *)addr, ZOP_ALLOC, (void **)zbt, numsaved);
}
if (__improbable(check_poison && addr)) {
vm_offset_t *element_cursor = ((vm_offset_t *) addr) + 1;
vm_offset_t *backup = get_backup_ptr(inner_size, (vm_offset_t *) addr);
for ( ; element_cursor < backup ; element_cursor++)
if (__improbable(*element_cursor != ZP_POISON))
zone_element_was_modified_panic(zone,
addr,
*element_cursor,
ZP_POISON,
((vm_offset_t)element_cursor) - addr);
}
if (addr) {
vm_offset_t *primary = (vm_offset_t *) addr;
vm_offset_t *backup = get_backup_ptr(inner_size, primary);
*primary = ZP_POISON;
*backup = ZP_POISON;
#if DEBUG || DEVELOPMENT
if (__improbable(leak_scan_debug_flag && !(zone->elem_size & (sizeof(uintptr_t) - 1)))) {
int count, idx;
if (numsaved == 0) numsaved = backtrace(zbt, MAX_ZTRACE_DEPTH);
count = (int) (zone->elem_size / sizeof(uintptr_t));
if (count >= numsaved) count = numsaved - 1;
for (idx = 0; idx < count; idx++) ((uintptr_t *)addr)[count - 1 - idx] = zbt[idx + 1];
}
#endif
}
TRACE_MACHLEAKS(ZALLOC_CODE, ZALLOC_CODE_2, zone->elem_size, addr);
return((void *)addr);
}
void *
zalloc(zone_t zone)
{
return (zalloc_internal(zone, TRUE, FALSE));
}
void *
zalloc_noblock(zone_t zone)
{
return (zalloc_internal(zone, FALSE, FALSE));
}
void *
zalloc_nopagewait(zone_t zone)
{
return (zalloc_internal(zone, TRUE, TRUE));
}
void *
zalloc_canblock(zone_t zone, boolean_t canblock)
{
return (zalloc_internal(zone, canblock, FALSE));
}
void
zalloc_async(
__unused thread_call_param_t p0,
__unused thread_call_param_t p1)
{
zone_t current_z = NULL;
unsigned int max_zones, i;
void *elt = NULL;
boolean_t pending = FALSE;
simple_lock(&all_zones_lock);
max_zones = num_zones;
simple_unlock(&all_zones_lock);
for (i = 0; i < max_zones; i++) {
current_z = &(zone_array[i]);
lock_zone(current_z);
if (current_z->async_pending == TRUE) {
current_z->async_pending = FALSE;
pending = TRUE;
}
unlock_zone(current_z);
if (pending == TRUE) {
elt = zalloc_canblock(current_z, TRUE);
zfree(current_z, elt);
pending = FALSE;
}
}
}
void *
zget(
zone_t zone)
{
return zalloc_internal(zone, FALSE, TRUE);
}
boolean_t zone_check = FALSE;
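/*
 * Debug aid (enabled via the zone_check global): walk every freelist in
 * the zone and panic if an element is insane or already present, to
 * catch double frees before they corrupt the lists.
 */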
static void zone_check_freelist(zone_t zone, vm_offset_t elem)
{
struct zone_free_element *this;
struct zone_page_metadata *thispage;
if (zone->allows_foreign) {
for (thispage = (struct zone_page_metadata *)queue_first(&zone->pages.any_free_foreign);
!queue_end(&zone->pages.any_free_foreign, &(thispage->pages));
thispage = (struct zone_page_metadata *)queue_next(&(thispage->pages))) {
for (this = page_metadata_get_freelist(thispage);
this != NULL;
this = this->next) {
if (!is_sane_zone_element(zone, (vm_address_t)this) || (vm_address_t)this == elem)
panic("zone_check_freelist");
}
}
}
for (thispage = (struct zone_page_metadata *)queue_first(&zone->pages.all_free);
!queue_end(&zone->pages.all_free, &(thispage->pages));
thispage = (struct zone_page_metadata *)queue_next(&(thispage->pages))) {
for (this = page_metadata_get_freelist(thispage);
this != NULL;
this = this->next) {
if (!is_sane_zone_element(zone, (vm_address_t)this) || (vm_address_t)this == elem)
panic("zone_check_freelist");
}
}
for (thispage = (struct zone_page_metadata *)queue_first(&zone->pages.intermediate);
!queue_end(&zone->pages.intermediate, &(thispage->pages));
thispage = (struct zone_page_metadata *)queue_next(&(thispage->pages))) {
for (this = page_metadata_get_freelist(thispage);
this != NULL;
this = this->next) {
if (!is_sane_zone_element(zone, (vm_address_t)this) || (vm_address_t)this == elem)
panic("zone_check_freelist");
}
}
}
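/*
 * Free an element back to its zone: verify via page metadata that it
 * belongs to this zone, optionally poison the body (always for tiny
 * elements, sampled otherwise), log or unlog the address, and push it
 * onto the freelist.
 */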
void
zfree(
zone_t zone,
void *addr)
{
vm_offset_t elem = (vm_offset_t) addr;
uintptr_t zbt[MAX_ZTRACE_DEPTH];
int numsaved = 0;
boolean_t gzfreed = FALSE;
boolean_t poison = FALSE;
assert(zone != ZONE_NULL);
if (__improbable(DO_LOGGING(zone) && corruption_debug_flag))
numsaved = OSBacktrace((void *)zbt, MAX_ZTRACE_DEPTH);
#if MACH_ASSERT
if (zone == ZONE_NULL || elem == (vm_offset_t)0)
panic("zfree: NULL");
#endif
#if CONFIG_GZALLOC
gzfreed = gzalloc_free(zone, addr);
#endif
if (!gzfreed) {
struct zone_page_metadata *page_meta = get_zone_page_metadata((struct zone_free_element *)addr, FALSE);
if (zone != PAGE_METADATA_GET_ZONE(page_meta)) {
panic("Element %p from zone %s caught being freed to wrong zone %s\n", addr, PAGE_METADATA_GET_ZONE(page_meta)->zone_name, zone->zone_name);
}
}
TRACE_MACHLEAKS(ZFREE_CODE, ZFREE_CODE_2, zone->elem_size, (uintptr_t)addr);
if (__improbable(!gzfreed && zone->collectable && !zone->allows_foreign &&
!from_zone_map(elem, zone->elem_size))) {
panic("zfree: non-allocated memory in collectable zone!");
}
if ((zp_factor != 0 || zp_tiny_zone_limit != 0) && !gzfreed) {
vm_offset_t inner_size = zone->elem_size;
uint32_t sample_factor = zp_factor + (((uint32_t)inner_size) >> zp_scale);
if (inner_size <= zp_tiny_zone_limit)
poison = TRUE;
else if (zp_factor != 0 && sample_counter(&zone->zp_count, sample_factor) == TRUE)
poison = TRUE;
if (__improbable(poison)) {
vm_offset_t *element_cursor = ((vm_offset_t *) elem) + 1;
vm_offset_t *backup = get_backup_ptr(inner_size, (vm_offset_t *)elem);
for ( ; element_cursor < backup; element_cursor++)
*element_cursor = ZP_POISON;
}
}
if (__improbable(DO_LOGGING(zone))) {
if (corruption_debug_flag) {
btlog_add_entry(zone->zlog_btlog, (void *)addr, ZOP_FREE, (void **)zbt, numsaved);
} else {
btlog_remove_entries_for_element(zone->zlog_btlog, (void *)addr);
}
}
lock_zone(zone);
if (zone_check) {
zone_check_freelist(zone, elem);
}
if (__probable(!gzfreed))
free_to_zone(zone, elem, poison);
#if MACH_ASSERT
if (zone->count < 0)
panic("zfree: zone count underflow in zone %s while freeing element %p, possible cause: double frees or freeing memory that did not come from this zone",
zone->zone_name, addr);
#endif
#if CONFIG_ZLEAKS
if (zone->zleak_on) {
zleak_free(elem, zone->elem_size);
}
#endif
unlock_zone(zone);
}
void
zone_change(
zone_t zone,
unsigned int item,
boolean_t value)
{
assert( zone != ZONE_NULL );
assert( value == TRUE || value == FALSE );
switch(item){
case Z_NOENCRYPT:
zone->noencrypt = value;
break;
case Z_EXHAUST:
zone->exhaustible = value;
break;
case Z_COLLECT:
zone->collectable = value;
break;
case Z_EXPAND:
zone->expandable = value;
break;
case Z_FOREIGN:
zone->allows_foreign = value;
break;
case Z_CALLERACCT:
zone->caller_acct = value;
break;
case Z_NOCALLOUT:
zone->no_callout = value;
break;
case Z_GZALLOC_EXEMPT:
zone->gzalloc_exempt = value;
#if CONFIG_GZALLOC
gzalloc_reconfigure(zone);
#endif
break;
case Z_ALIGNMENT_REQUIRED:
zone->alignment_required = value;
#if CONFIG_GZALLOC
gzalloc_reconfigure(zone);
#endif
break;
default:
panic("Zone_change: Wrong Item Type!");
}
}
integer_t
zone_free_count(zone_t zone)
{
integer_t free_count;
lock_zone(zone);
free_count = zone->countfree;
unlock_zone(zone);
assert(free_count >= 0);
return(free_count);
}
extern zone_t vm_map_entry_reserved_zone;
uint64_t zone_gc_bailed = 0;
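/*
 * Reclaim the all-free chunks of every collectable zone back to the VM.
 * Bails out (restoring the queues) if the reserved VM map entry zone
 * starts replenishing, since kmem_free() itself may need map entries.
 */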
void
zone_gc(void)
{
unsigned int max_zones;
zone_t z;
unsigned int i;
zone_t zres = vm_map_entry_reserved_zone;
lck_mtx_lock(&zone_gc_lock);
simple_lock(&all_zones_lock);
max_zones = num_zones;
simple_unlock(&all_zones_lock);
if (zalloc_debug & ZALLOC_DEBUG_ZONEGC)
kprintf("zone_gc() starting...\n");
for (i = 0; i < max_zones; i++) {
z = &(zone_array[i]);
vm_size_t elt_size, size_freed;
int total_freed_pages = 0;
struct zone_page_metadata *page_meta;
queue_head_t page_meta_head;
assert(z != ZONE_NULL);
if (!z->collectable)
continue;
if (queue_empty(&z->pages.all_free)) {
continue;
}
if (zres->zone_replenishing) {
zone_gc_bailed++;
break;
}
lock_zone(z);
elt_size = z->elem_size;
if (queue_empty(&z->pages.all_free)) {
unlock_zone(z);
continue;
}
uint64_t old_all_free_count = z->count_all_free_pages;
queue_new_head(&z->pages.all_free, &page_meta_head, struct zone_page_metadata *, pages);
queue_init(&z->pages.all_free);
z->count_all_free_pages = 0;
unlock_zone(z);
size_freed = 0;
queue_iterate(&page_meta_head, page_meta, struct zone_page_metadata *, pages) {
assert(from_zone_map((vm_address_t)page_meta, sizeof(*page_meta)));
size_freed += elt_size * page_meta->free_count;
}
lock_zone(z);
z->cur_size -= size_freed;
z->countfree -= size_freed/elt_size;
unlock_zone(z);
while ((page_meta = (struct zone_page_metadata *)dequeue_head(&page_meta_head)) != NULL) {
vm_address_t free_page_address;
if (zres->zone_replenishing)
break;
free_page_address = get_zone_page(page_meta);
ZONE_PAGE_COUNT_DECR(z, page_meta->page_count);
total_freed_pages += page_meta->page_count;
old_all_free_count -= page_meta->page_count;
size_freed -= (elt_size * page_meta->free_count);
kmem_free(zone_map, free_page_address, (page_meta->page_count * PAGE_SIZE));
thread_yield_to_preemption();
}
if (page_meta != NULL) {
queue_entry_t qe;
enqueue_head(&page_meta_head, &(page_meta->pages));
zone_gc_bailed++;
lock_zone(z);
qe_foreach_safe(qe, &page_meta_head) {
re_queue_tail(&z->pages.all_free, qe);
}
z->count_all_free_pages += (int)old_all_free_count;
z->cur_size += size_freed;
z->countfree += size_freed/elt_size;
unlock_zone(z);
if (zalloc_debug & ZALLOC_DEBUG_ZONEGC)
kprintf("zone_gc() bailed due to VM entry zone replenishing (zone_gc_bailed: %lld)\n", zone_gc_bailed);
break;
}
assert(old_all_free_count == 0);
if (zalloc_debug & ZALLOC_DEBUG_ZONEGC)
kprintf("zone_gc() of zone %s freed %lu elements, %d pages\n", z->zone_name, (unsigned long)size_freed/elt_size, total_freed_pages);
}
lck_mtx_unlock(&zone_gc_lock);
}
extern vm_offset_t kmapoff_kaddr;
extern unsigned int kmapoff_pgcnt;
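/*
 * On the first GC, also release the kernel map offset (kmapoff) pages
 * that were set aside at boot, then run zone_gc() if allowed.
 */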
void
consider_zone_gc(void)
{
if (kmapoff_kaddr != 0) {
(void) vm_deallocate(kernel_map,
kmapoff_kaddr, kmapoff_pgcnt * PAGE_SIZE_64);
kmapoff_kaddr = 0;
}
if (zone_gc_allowed)
zone_gc();
}
kern_return_t
task_zone_info(
__unused task_t task,
__unused mach_zone_name_array_t *namesp,
__unused mach_msg_type_number_t *namesCntp,
__unused task_zone_info_array_t *infop,
__unused mach_msg_type_number_t *infoCntp)
{
return KERN_FAILURE;
}
kern_return_t
mach_zone_info(
host_priv_t host,
mach_zone_name_array_t *namesp,
mach_msg_type_number_t *namesCntp,
mach_zone_info_array_t *infop,
mach_msg_type_number_t *infoCntp)
{
return (mach_memory_info(host, namesp, namesCntp, infop, infoCntp, NULL, NULL));
}
kern_return_t
host_zone_info(
host_priv_t host,
zone_name_array_t *namesp,
mach_msg_type_number_t *namesCntp,
zone_info_array_t *infop,
mach_msg_type_number_t *infoCntp)
{
return (mach_memory_info(host, (mach_zone_name_array_t *)namesp, namesCntp, (mach_zone_info_array_t *)infop, infoCntp, NULL, NULL));
}
kern_return_t
mach_memory_info(
host_priv_t host,
mach_zone_name_array_t *namesp,
mach_msg_type_number_t *namesCntp,
mach_zone_info_array_t *infop,
mach_msg_type_number_t *infoCntp,
mach_memory_info_array_t *memoryInfop,
mach_msg_type_number_t *memoryInfoCntp)
{
mach_zone_name_t *names;
vm_offset_t names_addr;
vm_size_t names_size;
mach_zone_info_t *info;
vm_offset_t info_addr;
vm_size_t info_size;
mach_memory_info_t *memory_info;
vm_offset_t memory_info_addr;
vm_size_t memory_info_size;
vm_size_t memory_info_vmsize;
unsigned int num_sites;
unsigned int max_zones, i;
zone_t z;
mach_zone_name_t *zn;
mach_zone_info_t *zi;
kern_return_t kr;
vm_size_t used;
vm_map_copy_t copy;
uint64_t zones_collectable_bytes = 0;
if (host == HOST_NULL)
return KERN_INVALID_HOST;
#if CONFIG_DEBUGGER_FOR_ZONE_INFO
if (!PE_i_can_has_debugger(NULL))
return KERN_INVALID_HOST;
#endif
simple_lock(&all_zones_lock);
max_zones = (unsigned int)(num_zones);
simple_unlock(&all_zones_lock);
names_size = round_page(max_zones * sizeof *names);
kr = kmem_alloc_pageable(ipc_kernel_map,
&names_addr, names_size, VM_KERN_MEMORY_IPC);
if (kr != KERN_SUCCESS)
return kr;
names = (mach_zone_name_t *) names_addr;
info_size = round_page(max_zones * sizeof *info);
kr = kmem_alloc_pageable(ipc_kernel_map,
&info_addr, info_size, VM_KERN_MEMORY_IPC);
if (kr != KERN_SUCCESS) {
kmem_free(ipc_kernel_map,
names_addr, names_size);
return kr;
}
info = (mach_zone_info_t *) info_addr;
zn = &names[0];
zi = &info[0];
for (i = 0; i < max_zones; i++) {
struct zone zcopy;
z = &(zone_array[i]);
assert(z != ZONE_NULL);
lock_zone(z);
zcopy = *z;
unlock_zone(z);
/* strncpy() does not NUL-terminate on truncation; do it explicitly */
(void) strncpy(zn->mzn_name, zcopy.zone_name,
sizeof zn->mzn_name);
zn->mzn_name[sizeof zn->mzn_name - 1] = '\0';
zi->mzi_count = (uint64_t)zcopy.count;
zi->mzi_cur_size = ptoa_64(zcopy.page_count);
zi->mzi_max_size = (uint64_t)zcopy.max_size;
zi->mzi_elem_size = (uint64_t)zcopy.elem_size;
zi->mzi_alloc_size = (uint64_t)zcopy.alloc_size;
zi->mzi_sum_size = zcopy.sum_count * zcopy.elem_size;
zi->mzi_exhaustible = (uint64_t)zcopy.exhaustible;
zi->mzi_collectable = (uint64_t)zcopy.collectable;
zones_collectable_bytes += ((uint64_t)zcopy.count_all_free_pages * PAGE_SIZE);
zn++;
zi++;
}
used = max_zones * sizeof *names;
if (used != names_size)
bzero((char *) (names_addr + used), names_size - used);
kr = vm_map_copyin(ipc_kernel_map, (vm_map_address_t)names_addr,
(vm_map_size_t)used, TRUE, &copy);
assert(kr == KERN_SUCCESS);
*namesp = (mach_zone_name_t *) copy;
*namesCntp = max_zones;
used = max_zones * sizeof *info;
if (used != info_size)
bzero((char *) (info_addr + used), info_size - used);
kr = vm_map_copyin(ipc_kernel_map, (vm_map_address_t)info_addr,
(vm_map_size_t)used, TRUE, &copy);
assert(kr == KERN_SUCCESS);
*infop = (mach_zone_info_t *) copy;
*infoCntp = max_zones;
num_sites = 0;
memory_info_addr = 0;
if (memoryInfop && memoryInfoCntp)
{
num_sites = VM_KERN_MEMORY_COUNT + VM_KERN_COUNTER_COUNT;
/* size the buffer by the type actually stored: mach_memory_info_t, not mach_zone_info_t */
memory_info_size = num_sites * sizeof(*memory_info);
memory_info_vmsize = round_page(memory_info_size);
kr = kmem_alloc_pageable(ipc_kernel_map,
&memory_info_addr, memory_info_vmsize, VM_KERN_MEMORY_IPC);
if (kr != KERN_SUCCESS) {
kmem_free(ipc_kernel_map,
names_addr, names_size);
kmem_free(ipc_kernel_map,
info_addr, info_size);
return kr;
}
/* wire the buffer so vm_page_diagnose() can fill it without faulting */
kr = vm_map_wire(ipc_kernel_map, memory_info_addr, memory_info_addr + memory_info_vmsize,
VM_PROT_READ|VM_PROT_WRITE|VM_PROT_MEMORY_TAG_MAKE(VM_KERN_MEMORY_IPC), FALSE);
assert(kr == KERN_SUCCESS);
memory_info = (mach_memory_info_t *) memory_info_addr;
vm_page_diagnose(memory_info, num_sites, zones_collectable_bytes);
kr = vm_map_unwire(ipc_kernel_map, memory_info_addr, memory_info_addr + memory_info_vmsize, FALSE);
assert(kr == KERN_SUCCESS);
kr = vm_map_copyin(ipc_kernel_map, (vm_map_address_t)memory_info_addr,
(vm_map_size_t)memory_info_size, TRUE, &copy);
assert(kr == KERN_SUCCESS);
*memoryInfop = (mach_memory_info_t *) copy;
*memoryInfoCntp = num_sites;
}
return KERN_SUCCESS;
}
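/*
 *	mach_zone_force_gc:
 *
 *	Privileged trigger for an immediate zone garbage collection.
 *	Example (user space) -- a minimal sketch, assuming the caller can
 *	obtain the host port:
 *
 *		kern_return_t kr = mach_zone_force_gc(mach_host_self());
 */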
kern_return_t
mach_zone_force_gc(
host_t host)
{
if (host == HOST_NULL)
return KERN_INVALID_HOST;
consider_zone_gc();
return (KERN_SUCCESS);
}
extern unsigned int stack_total;
extern unsigned long long stack_allocs;
#if defined(__i386__) || defined(__x86_64__)
extern unsigned int inuse_ptepages_count;
extern long long alloc_ptepages_count;
#endif
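/*
 *	zone_display_zprint:
 *
 *	Console summary of the biggest kernel memory consumers: every zone
 *	over 1MB, plus kernel stacks, page tables (x86), and large kalloc
 *	allocations.
 */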
void
zone_display_zprint(void)
{
unsigned int i;
zone_t the_zone;
for (i = 0; i < num_zones; i++) {
the_zone = &(zone_array[i]);
if (the_zone->cur_size > (1024 * 1024)) {
printf("%.20s:\t%lu\n", the_zone->zone_name, (uintptr_t)the_zone->cur_size);
}
}
printf("Kernel Stacks:\t%lu\n",(uintptr_t)(kernel_stack_size * stack_total));
#if defined(__i386__) || defined (__x86_64__)
printf("PageTables:\t%lu\n",(uintptr_t)(PAGE_SIZE * inuse_ptepages_count));
#endif
printf("Kalloc.Large:\t%lu\n",(uintptr_t)kalloc_large_total);
}
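/*
 *	zone_find_largest:
 *
 *	Returns the zone with the largest cur_size.  The scan is unlocked,
 *	so the answer is advisory (e.g. for naming a culprit when the zone
 *	map is exhausted).
 */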
zone_t
zone_find_largest(void)
{
unsigned int i;
unsigned int max_zones;
zone_t the_zone;
zone_t zone_largest;
simple_lock(&all_zones_lock);
max_zones = num_zones;
simple_unlock(&all_zones_lock);
zone_largest = &(zone_array[0]);
for (i = 0; i < max_zones; i++) {
the_zone = &(zone_array[i]);
if (the_zone->cur_size > zone_largest->cur_size) {
zone_largest = the_zone;
}
}
return zone_largest;
}
#if ZONE_DEBUG
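/* a zone is "in use" if it holds any elements or any backing pages */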
#define zone_in_use(z) ( z->count || z->free_elements \
|| !queue_empty(&z->pages.all_free) \
|| !queue_empty(&z->pages.intermediate) \
|| (z->allows_foreign && !queue_empty(&z->pages.any_free_foreign)))
#endif
#if DEBUG || DEVELOPMENT
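/*
 *	zone_copy_all_allocations_inqueue:
 *
 *	Appends the (obfuscated) address of every element backed by the
 *	given page queue to elems[], then deletes the entries that sit on
 *	each chunk's freelist, leaving only live allocations.  Returns the
 *	new tail of the array.  Caller holds the zone lock.
 */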
static uintptr_t *
zone_copy_all_allocations_inqueue(zone_t z, queue_head_t * queue, uintptr_t * elems)
{
struct zone_page_metadata *page_meta;
vm_offset_t free, elements;
vm_offset_t idx, numElements, freeCount, bytesAvail, metaSize;
queue_iterate(queue, page_meta, struct zone_page_metadata *, pages)
{
elements = get_zone_page(page_meta);
bytesAvail = ptoa(page_meta->page_count);
freeCount = 0;
if (z->allows_foreign && !from_zone_map(elements, z->elem_size))
{
/* foreign pages keep their zone_page_metadata inline; skip past it */
metaSize = (sizeof(struct zone_page_metadata) + ZONE_ELEMENT_ALIGNMENT - 1) & ~(ZONE_ELEMENT_ALIGNMENT - 1);
bytesAvail -= metaSize;
elements += metaSize;
}
numElements = bytesAvail / z->elem_size;
for (idx = 0; idx < numElements; idx++)
{
elems[idx] = INSTANCE_PUT(elements + idx * z->elem_size);
}
/*
 * Walk the chunk's freelist and squeeze each free element out of
 * elems[], leaving only live allocations.  The freelist next pointer
 * is obfuscated with zp_nopoison_cookie.
 */
free = (vm_offset_t)page_metadata_get_freelist(page_meta);
while (free)
{
for (idx = 0; (idx < numElements) && (elems[idx] != INSTANCE_PUT(free)); idx++) {}
assert(idx < numElements);
bcopy(&elems[idx + 1], &elems[idx], (numElements - (idx + 1)) * sizeof(elems[0]));
numElements--;
freeCount++;
vm_offset_t *primary = (vm_offset_t *) free;
free = *primary ^ zp_nopoison_cookie;
}
elems += numElements;
}
return (elems);
}
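/*
 *	zone_leaks:
 *
 *	Leak report for the named zone: snapshot all live elements, let
 *	zone_leaks_scan() conservatively mark every element that some other
 *	kernel memory still points at, then report the unreferenced ones
 *	through 'proc' -- from the zone's btlog when leak logging is on,
 *	otherwise from a heuristic scan of the element contents.
 */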
kern_return_t
zone_leaks(const char * zoneName, uint32_t nameLen, leak_site_proc proc, void * refCon)
{
uintptr_t zbt[MAX_ZTRACE_DEPTH];
zone_t zone;
uintptr_t * array;
uintptr_t * next;
uintptr_t element, bt;
uint32_t idx, count, found;
uint32_t btidx, btcount, nobtcount, btfound;
uint32_t elemSize;
uint64_t maxElems;
kern_return_t kr;
for (idx = 0; idx < num_zones; idx++)
{
if (!strncmp(zoneName, zone_array[idx].zone_name, nameLen)) break;
}
if (idx >= num_zones) return (KERN_INVALID_NAME);
zone = &zone_array[idx];
elemSize = (uint32_t) zone->elem_size;
maxElems = ptoa(zone->page_count) / elemSize;
/* elements must tile each allocation evenly, or the element walk misindexes */
if ((zone->alloc_size % elemSize)
&& !leak_scan_debug_flag) return (KERN_INVALID_CAPABILITY);
kr = kmem_alloc_kobject(kernel_map, (vm_offset_t *) &array,
maxElems * sizeof(uintptr_t), VM_KERN_MEMORY_DIAG);
if (KERN_SUCCESS != kr) return (kr);
lock_zone(zone);
next = array;
next = zone_copy_all_allocations_inqueue(zone, &zone->pages.any_free_foreign, next);
next = zone_copy_all_allocations_inqueue(zone, &zone->pages.intermediate, next);
next = zone_copy_all_allocations_inqueue(zone, &zone->pages.all_used, next);
count = (uint32_t)(next - array);
unlock_zone(zone);
zone_leaks_scan(array, count, (uint32_t)zone->elem_size, &found);
assert(found <= count);
for (idx = 0; idx < count; idx++)
{
element = array[idx];
if (kInstanceFlagReferenced & element) continue;
element = INSTANCE_PUT(element) & ~kInstanceFlags;
}
if (zone->zlog_btlog && !corruption_debug_flag)
{
btlog_copy_backtraces_for_elements(zone->zlog_btlog, array, &count, elemSize, proc, refCon);
}
for (nobtcount = idx = 0; idx < count; idx++)
{
element = array[idx];
if (!element) continue;
if (kInstanceFlagReferenced & element) continue;
element = INSTANCE_PUT(element) & ~kInstanceFlags;
btcount = (typeof(btcount)) (zone->elem_size / sizeof(uintptr_t));
if (btcount >= MAX_ZTRACE_DEPTH) btcount = MAX_ZTRACE_DEPTH - 1;
for (btfound = btidx = 0; btidx < btcount; btidx++)
{
bt = ((uintptr_t *)element)[btcount - 1 - btidx];
if (!VM_KERNEL_IS_SLID(bt)) break;
zbt[btfound++] = bt;
}
if (btfound) (*proc)(refCon, 1, elemSize, &zbt[0], btfound);
else nobtcount++;
}
if (nobtcount)
{
zbt[0] = (uintptr_t) &zalloc;
(*proc)(refCon, nobtcount, elemSize, &zbt[0], 1);
}
kmem_free(kernel_map, (vm_offset_t) array, maxElems * sizeof(uintptr_t));
return (KERN_SUCCESS);
}
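/*
 *	kern_wired_diagnose:
 *
 *	Debug-only sanity dump comparing the wired-memory total reported by
 *	vm_page_diagnose() against the sum of zone pages and per-site wired
 *	allocations.
 */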
void
kern_wired_diagnose(void)
{
unsigned int count = VM_KERN_MEMORY_COUNT + VM_KERN_COUNTER_COUNT;
mach_memory_info_t info[count];
unsigned int idx;
uint64_t total_zone, total_wired, top_wired, osfmk_wired;
if (KERN_SUCCESS != vm_page_diagnose(info, count, 0)) return;
total_zone = total_wired = top_wired = osfmk_wired = 0;
for (idx = 0; idx < num_zones; idx++)
{
total_zone += ptoa_64(zone_array[idx].page_count);
}
total_wired = total_zone;
for (idx = 0; idx < count; idx++)
{
if (VM_KERN_COUNT_WIRED == info[idx].site) top_wired = info[idx].size;
if (VM_KERN_MEMORY_OSFMK == info[idx].site) osfmk_wired = info[idx].size;
if (VM_KERN_SITE_HIDE & info[idx].flags) continue;
if (!(VM_KERN_SITE_WIRED & info[idx].flags)) continue;
total_wired += info[idx].size;
}
printf("top 0x%qx, total 0x%qx, zone 0x%qx, osfmk 0x%qx\n",
top_wired, total_wired, total_zone, osfmk_wired);
}
#endif