#include <zone_debug.h>
#include <zone_alias_addr.h>
#include <mach/mach_types.h>
#include <mach/vm_param.h>
#include <mach/kern_return.h>
#include <mach/mach_host_server.h>
#include <mach/task_server.h>
#include <mach/machine/vm_types.h>
#include <mach_debug/zone_info.h>
#include <mach/vm_map.h>
#include <kern/kern_types.h>
#include <kern/assert.h>
#include <kern/host.h>
#include <kern/macro_help.h>
#include <kern/sched.h>
#include <kern/locks.h>
#include <kern/sched_prim.h>
#include <kern/misc_protos.h>
#include <kern/thread_call.h>
#include <kern/zalloc.h>
#include <kern/kalloc.h>
#include <kern/btlog.h>
#include <vm/pmap.h>
#include <vm/vm_map.h>
#include <vm/vm_kern.h>
#include <vm/vm_page.h>
#include <pexpert/pexpert.h>
#include <machine/machparam.h>
#include <machine/machine_routines.h>
#include <libkern/OSDebug.h>
#include <libkern/OSAtomic.h>
#include <sys/kdebug.h>
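/*
 * from_zone_map(addr, size): TRUE if [addr, addr + size) lies entirely
 * within the zone submap.  With ZONE_ALIAS_ADDR the address is first
 * translated back to its canonical virtual address.
 */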
#if !ZONE_ALIAS_ADDR
#define from_zone_map(addr, size) \
((vm_offset_t)(addr) >= zone_map_min_address && \
((vm_offset_t)(addr) + size - 1) < zone_map_max_address )
#else
#define from_zone_map(addr, size) \
((vm_offset_t)(zone_virtual_addr((vm_map_address_t)(uintptr_t)addr)) >= zone_map_min_address && \
((vm_offset_t)(zone_virtual_addr((vm_map_address_t)(uintptr_t)addr)) + size -1) < zone_map_max_address )
#endif
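/*
 * sample_counter: atomically increments *count_p modulo "factor" and
 * returns TRUE once per "factor" calls (when the counter wraps to zero).
 * The compare-and-swap loop keeps this correct under concurrent callers.
 */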
static inline boolean_t
sample_counter(volatile uint32_t * count_p, uint32_t factor)
{
uint32_t old_count, new_count;
boolean_t rolled_over;
do {
new_count = old_count = *count_p;
if (++new_count >= factor) {
rolled_over = TRUE;
new_count = 0;
} else {
rolled_over = FALSE;
}
} while (!OSCompareAndSwap(old_count, new_count, count_p));
return rolled_over;
}
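/* Fill pattern written over the body of a freed element when it is poisoned. */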
#if defined(__LP64__)
#define ZP_POISON 0xdeadbeefdeadbeef
#else
#define ZP_POISON 0xdeadbeef
#endif
#define ZP_DEFAULT_SAMPLING_FACTOR 16
#define ZP_DEFAULT_SCALE_FACTOR 4
uint32_t zp_factor = 0;
uint32_t zp_scale = 0;
vm_size_t zp_tiny_zone_limit = 0;
uintptr_t zp_poisoned_cookie = 0;
uintptr_t zp_nopoison_cookie = 0;
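/*
 * zp_init: set up zone element poisoning.  By default roughly every
 * zp_factor-th free is poisoned (the sampling period grows with element
 * size via >> zp_scale), and elements no larger than a cache line
 * (zp_tiny_zone_limit) are always poisoned.  Boot-args: -zp poisons every
 * free, -no-zp disables poisoning entirely, and zp-factor=N / zp-scale=N
 * override the defaults.  Called before any zones exist, so only
 * early_random() is available for the cookies.
 */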
static inline void
zp_init(void)
{
char temp_buf[16];
zp_poisoned_cookie = (uintptr_t) early_random();
ml_cpu_info_t cpu_info;
ml_cpu_get_info(&cpu_info);
zp_tiny_zone_limit = (vm_size_t) cpu_info.cache_line_size;
zp_factor = ZP_DEFAULT_SAMPLING_FACTOR;
zp_scale = ZP_DEFAULT_SCALE_FACTOR;
if (zp_factor != 0) {
uint32_t rand_bits = early_random() & 0x3;
if (rand_bits == 0x1)
zp_factor += 1;
else if (rand_bits == 0x2)
zp_factor -= 1;
}
if (PE_parse_boot_argn("-zp", temp_buf, sizeof(temp_buf))) {
zp_factor = 1;
}
if (PE_parse_boot_argn("-no-zp", temp_buf, sizeof(temp_buf))) {
zp_factor = 0;
zp_tiny_zone_limit = 0;
printf("Zone poisoning disabled\n");
}
if (PE_parse_boot_argn("zp-factor", &zp_factor, sizeof(zp_factor))) {
printf("Zone poisoning factor override: %u\n", zp_factor);
}
if (PE_parse_boot_argn("zp-scale", &zp_scale, sizeof(zp_scale))) {
printf("Zone poisoning scale factor override: %u\n", zp_scale);
}
zp_nopoison_cookie = (uintptr_t) early_random();
#if MACH_ASSERT
if (zp_poisoned_cookie == zp_nopoison_cookie)
panic("early_random() is broken: %p and %p are not random\n",
(void *) zp_poisoned_cookie, (void *) zp_nopoison_cookie);
#endif
zp_poisoned_cookie |= (uintptr_t)0x1ULL;
zp_nopoison_cookie &= ~((uintptr_t)0x1ULL);
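/*
 * On LP64, brand the cookies' top 24 bits so that a backup pointer
 * (a 0xFFFFFF... kernel address XORed with a cookie) is recognizable
 * in a panic: 0xFFFFFF ^ 0x053521 = 0xFACADE (poisoned) and
 * 0xFFFFFF ^ 0x3f0011 = 0xC0FFEE (not poisoned).  The low 40 bits
 * stay random.
 */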
#if defined(__LP64__)
zp_poisoned_cookie &= 0x000000FFFFFFFFFF;
zp_poisoned_cookie |= 0x0535210000000000;
zp_nopoison_cookie &= 0x000000FFFFFFFFFF;
zp_nopoison_cookie |= 0x3f00110000000000;
#endif
}
uint64_t zone_map_table_page_count = 0;
#define ZONE_PAGE_COUNT_INCR(z, count) \
{ \
OSAddAtomic64(count, &(z->page_count)); \
}
#define ZONE_PAGE_COUNT_DECR(z, count) \
{ \
OSAddAtomic64(-count, &(z->page_count)); \
}
vm_offset_t zone_map_min_address = 0;
vm_offset_t zone_map_max_address = 0;
struct zone_free_element {
struct zone_free_element *next;
};
struct zone_page_metadata {
queue_chain_t pages;
struct zone_free_element *elements;
zone_t zone;
uint16_t alloc_count;
uint16_t free_count;
};
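/*
 * Each free element carries its freelist "next" pointer twice: once in
 * its first word (the primary) and once, XORed with a cookie, in its last
 * pointer-sized word (the backup).  get_backup_ptr returns the backup's
 * location within the element.
 */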
static inline vm_offset_t *
get_backup_ptr(vm_size_t elem_size,
vm_offset_t *element)
{
return (vm_offset_t *) ((vm_offset_t)element + elem_size - sizeof(vm_offset_t));
}
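/*
 * For zones with use_page_list, the struct zone_page_metadata sits at the
 * start of each page, so the metadata for any element is found by simply
 * truncating its address to a page boundary.
 */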
static inline struct zone_page_metadata *
get_zone_page_metadata(struct zone_free_element *element)
{
return (struct zone_page_metadata *)(trunc_page((vm_offset_t)element));
}
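/*
 * is_sane_zone_ptr: plausibility check for a pointer claimed to be a zone
 * element: it must be pointer-aligned, a kernel virtual address, and (for
 * collectable zones that don't accept foreign memory) inside the zone map.
 */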
static inline boolean_t
is_sane_zone_ptr(zone_t zone,
vm_offset_t addr,
size_t obj_size)
{
if (__improbable((addr & (sizeof(vm_offset_t) - 1)) != 0))
return FALSE;
if (__improbable(!pmap_kernel_va(addr)))
return FALSE;
if (zone->collectable && !zone->allows_foreign) {
#if ZONE_ALIAS_ADDR
if ((addr - gVirtBase) < gPhysSize)
return TRUE;
#endif
if (addr >= zone_map_min_address &&
(addr + obj_size - 1) < zone_map_max_address )
return TRUE;
return FALSE;
}
return TRUE;
}
static inline boolean_t
is_sane_zone_page_metadata(zone_t zone,
vm_offset_t page_meta)
{
if (page_meta == 0)
return FALSE;
return is_sane_zone_ptr(zone, page_meta, sizeof(struct zone_page_metadata));
}
static inline boolean_t
is_sane_zone_element(zone_t zone,
vm_offset_t addr)
{
if (addr == 0)
return TRUE;
return is_sane_zone_ptr(zone, addr, zone->elem_size);
}
static inline void
zone_element_was_modified_panic(zone_t zone,
vm_offset_t element,
vm_offset_t found,
vm_offset_t expected,
vm_offset_t offset)
{
panic("a freed zone element has been modified in zone %s: expected %p but found %p, bits changed %p, at offset %d of %d in element %p, cookies %p %p",
zone->zone_name,
(void *) expected,
(void *) found,
(void *) (expected ^ found),
(uint32_t) offset,
(uint32_t) zone->elem_size,
(void *) element,
(void *) zp_nopoison_cookie,
(void *) zp_poisoned_cookie);
}
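/*
 * Called when an element's primary freelist pointer and its backup
 * disagree.  Uses the LP64 0xFACADE/0xC0FFEE branding (see zp_init) plus
 * sanity checks to decide which copy was corrupted, then panics with the
 * best available diagnosis.  This function never returns.
 */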
static void
backup_ptr_mismatch_panic(zone_t zone,
vm_offset_t element,
vm_offset_t primary,
vm_offset_t backup)
{
vm_offset_t likely_backup;
boolean_t sane_backup;
boolean_t sane_primary = is_sane_zone_element(zone, primary);
boolean_t element_was_poisoned = (backup & 0x1) ? TRUE : FALSE;
#if defined(__LP64__)
if ((backup & 0xFFFFFF0000000000) == 0xFACADE0000000000)
element_was_poisoned = TRUE;
else if ((backup & 0xFFFFFF0000000000) == 0xC0FFEE0000000000)
element_was_poisoned = FALSE;
#endif
if (element_was_poisoned) {
likely_backup = backup ^ zp_poisoned_cookie;
sane_backup = is_sane_zone_element(zone, likely_backup);
} else {
likely_backup = backup ^ zp_nopoison_cookie;
sane_backup = is_sane_zone_element(zone, likely_backup);
}
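/* The primary pointer is definitely the corrupted one: report it against the recovered backup. */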
if (!sane_primary && sane_backup)
zone_element_was_modified_panic(zone, element, primary, likely_backup, 0);
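/* The backup pointer is definitely the corrupted one. */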
if (sane_primary && !sane_backup)
zone_element_was_modified_panic(zone, element, backup,
(primary ^ (element_was_poisoned ? zp_poisoned_cookie : zp_nopoison_cookie)),
zone->elem_size - sizeof(vm_offset_t));
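/* Both copies look sane: it is more likely that the primary was overwritten with a different but sane address, so report the primary. */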
if (sane_primary && sane_backup)
zone_element_was_modified_panic(zone, element, primary, likely_backup, 0);
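/* Neither copy is sane: just guess that the primary was the one clobbered. */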
zone_element_was_modified_panic(zone, element, primary, likely_backup, 0);
}
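/*
 * append_zone_element: make "elem" the successor of "tail", updating both
 * tail's primary next pointer and its XOR-cookied backup.  Panics if the
 * backup does not match the primary under either cookie.
 */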
static inline void
append_zone_element(zone_t zone,
struct zone_free_element *tail,
struct zone_free_element *elem)
{
vm_offset_t *backup = get_backup_ptr(zone->elem_size, (vm_offset_t *) tail);
vm_offset_t old_backup = *backup;
vm_offset_t old_next = (vm_offset_t) tail->next;
vm_offset_t new_next = (vm_offset_t) elem;
if (old_next == (old_backup ^ zp_nopoison_cookie))
*backup = new_next ^ zp_nopoison_cookie;
else if (old_next == (old_backup ^ zp_poisoned_cookie))
*backup = new_next ^ zp_poisoned_cookie;
else
backup_ptr_mismatch_panic(zone,
(vm_offset_t) tail,
old_next,
old_backup);
tail->next = elem;
}
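/*
 * add_list_to_zone: splice a pre-built chain of elements (head..tail) onto
 * the front of the zone's free list.  Not valid for use_page_list zones.
 */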
static inline void
add_list_to_zone(zone_t zone,
struct zone_free_element *head,
struct zone_free_element *tail)
{
assert(tail->next == NULL);
assert(!zone->use_page_list);
append_zone_element(zone, tail, zone->free_elements);
zone->free_elements = head;
}
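/*
 * free_to_zone: push one element onto the zone's free list (or onto its
 * page's free list for use_page_list zones), writing both the primary and
 * backup next pointers; the backup is XORed with the poisoned cookie when
 * the element body was poisoned.  For use_page_list zones the page's
 * metadata migrates between the all_used/intermediate/all_free (or
 * any_free_foreign) queues as its free_count changes.  Caller holds the
 * zone lock.
 */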
static inline void
free_to_zone(zone_t zone,
vm_offset_t element,
boolean_t poison)
{
vm_offset_t old_head;
struct zone_page_metadata *page_meta;
vm_offset_t *primary = (vm_offset_t *) element;
vm_offset_t *backup = get_backup_ptr(zone->elem_size, primary);
if (zone->use_page_list) {
page_meta = get_zone_page_metadata((struct zone_free_element *)element);
assert(page_meta->zone == zone);
old_head = (vm_offset_t)page_meta->elements;
} else {
old_head = (vm_offset_t)zone->free_elements;
}
#if MACH_ASSERT
if (__improbable(!is_sane_zone_element(zone, old_head)))
panic("zfree: invalid head pointer %p for freelist of zone %s\n",
(void *) old_head, zone->zone_name);
#endif
if (__improbable(!is_sane_zone_element(zone, element)))
panic("zfree: freeing invalid pointer %p to zone %s\n",
(void *) element, zone->zone_name);
*backup = old_head ^ (poison ? zp_poisoned_cookie : zp_nopoison_cookie);
*primary = old_head;
if (zone->use_page_list) {
page_meta->elements = (struct zone_free_element *)element;
page_meta->free_count++;
if (zone->allows_foreign && !from_zone_map(element, zone->elem_size)) {
if (page_meta->free_count == 1) {
remqueue((queue_entry_t)page_meta);
enqueue_tail(&zone->pages.any_free_foreign, (queue_entry_t)page_meta);
} else {
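/* already on the any_free_foreign queue; no queue change needed */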
}
} else if (page_meta->free_count == page_meta->alloc_count) {
remqueue((queue_entry_t)page_meta);
enqueue_tail(&zone->pages.all_free, (queue_entry_t)page_meta);
} else if (page_meta->free_count == 1) {
remqueue((queue_entry_t)page_meta);
enqueue_tail(&zone->pages.intermediate, (queue_entry_t)page_meta);
}
} else {
zone->free_elements = (struct zone_free_element *)element;
}
zone->count--;
zone->countfree++;
}
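/*
 * try_alloc_from_zone: pop the head element from the zone's free list (or
 * from the most suitable page queue for use_page_list zones).  Verifies
 * the primary next pointer against its backup: a mismatch consistent with
 * the poisoned cookie sets *check_poison so the caller can verify the
 * poison fill; anything else panics.  Returns 0 if the zone is empty.
 * Caller holds the zone lock.
 */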
static inline vm_offset_t
try_alloc_from_zone(zone_t zone,
boolean_t* check_poison)
{
vm_offset_t element;
struct zone_page_metadata *page_meta;
*check_poison = FALSE;
if (zone->use_page_list) {
if (zone->allows_foreign && !queue_empty(&zone->pages.any_free_foreign))
page_meta = (struct zone_page_metadata *)queue_first(&zone->pages.any_free_foreign);
else if (!queue_empty(&zone->pages.intermediate))
page_meta = (struct zone_page_metadata *)queue_first(&zone->pages.intermediate);
else if (!queue_empty(&zone->pages.all_free))
page_meta = (struct zone_page_metadata *)queue_first(&zone->pages.all_free);
else {
return 0;
}
if (__improbable(!is_sane_zone_page_metadata(zone, (vm_offset_t)page_meta)))
panic("zalloc: invalid metadata structure %p for freelist of zone %s\n",
(void *) page_meta, zone->zone_name);
assert(page_meta->zone == zone);
element = (vm_offset_t)page_meta->elements;
} else {
if (zone->free_elements == NULL)
return 0;
element = (vm_offset_t)zone->free_elements;
}
#if MACH_ASSERT
if (__improbable(!is_sane_zone_element(zone, element)))
panic("zalloc: invalid head pointer %p for freelist of zone %s\n",
(void *) element, zone->zone_name);
#endif
vm_offset_t *primary = (vm_offset_t *) element;
vm_offset_t *backup = get_backup_ptr(zone->elem_size, primary);
vm_offset_t next_element = *primary;
vm_offset_t next_element_backup = *backup;
if (__improbable(!is_sane_zone_element(zone, next_element)))
backup_ptr_mismatch_panic(zone, element, next_element, next_element_backup);
if (__improbable(next_element != (next_element_backup ^ zp_nopoison_cookie))) {
if (__improbable(next_element != (next_element_backup ^ zp_poisoned_cookie)))
backup_ptr_mismatch_panic(zone, element, next_element, next_element_backup);
*check_poison = TRUE;
}
if (zone->use_page_list) {
if (__improbable(page_meta != get_zone_page_metadata((struct zone_free_element *)element)))
panic("zalloc: metadata located at incorrect location on page of zone %s\n",
zone->zone_name);
if (next_element) {
if (__improbable(page_meta != get_zone_page_metadata((struct zone_free_element *)next_element)))
panic("zalloc: next element pointer %p for element %p points to invalid element for zone %s\n",
(void *)next_element, (void *)element, zone->zone_name);
}
}
if (zone->use_page_list) {
page_meta->elements = (struct zone_free_element *)next_element;
page_meta->free_count--;
if (zone->allows_foreign && !from_zone_map(element, zone->elem_size)) {
if (page_meta->free_count == 0) {
remqueue((queue_entry_t)page_meta);
enqueue_tail(&zone->pages.all_used, (queue_entry_t)page_meta);
} else {
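/* partially free foreign pages stay on the any_free_foreign queue */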
}
} else if (page_meta->free_count == 0) {
remqueue((queue_entry_t)page_meta);
enqueue_tail(&zone->pages.all_used, (queue_entry_t)page_meta);
} else if (page_meta->alloc_count == page_meta->free_count + 1) {
remqueue((queue_entry_t)page_meta);
enqueue_tail(&zone->pages.intermediate, (queue_entry_t)page_meta);
}
} else {
zone->free_elements = (struct zone_free_element *)next_element;
}
zone->countfree--;
zone->count++;
zone->sum_count++;
return element;
}
struct fake_zone_info {
const char* name;
void (*init)(int);
void (*query)(int *,
vm_size_t *, vm_size_t *, vm_size_t *, vm_size_t *,
uint64_t *, int *, int *, int *);
};
static const struct fake_zone_info fake_zones[] = {
};
static const unsigned int num_fake_zones =
sizeof (fake_zones) / sizeof (fake_zones[0]);
boolean_t zinfo_per_task = FALSE;
#define ZINFO_SLOTS 200
#define ZONES_MAX (ZINFO_SLOTS - num_fake_zones - 1)
typedef uint32_t zone_page_index_t;
#define ZONE_PAGE_INDEX_INVALID ((zone_page_index_t)0xFFFFFFFFU)
struct zone_page_table_entry {
volatile uint16_t alloc_count;
volatile uint16_t collect_count;
};
#define ZONE_PAGE_USED 0
#define ZONE_PAGE_UNUSED 0xffff
void zone_page_init(
vm_offset_t addr,
vm_size_t size);
void zone_page_alloc(
vm_offset_t addr,
vm_size_t size);
void zone_page_free_element(
zone_page_index_t *free_page_head,
zone_page_index_t *free_page_tail,
vm_offset_t addr,
vm_size_t size);
void zone_page_collect(
vm_offset_t addr,
vm_size_t size);
boolean_t zone_page_collectable(
vm_offset_t addr,
vm_size_t size);
void zone_page_keep(
vm_offset_t addr,
vm_size_t size);
void zone_display_zprint(void);
zone_t zone_find_largest(void);
void zalloc_async(
thread_call_param_t p0,
thread_call_param_t p1);
static thread_call_data_t call_async_alloc;
vm_map_t zone_map = VM_MAP_NULL;
zone_t zone_zone = ZONE_NULL;
zone_t zinfo_zone = ZONE_NULL;
vm_offset_t zdata;
vm_size_t zdata_size;
#define ZONE_ELEMENT_ALIGNMENT 32
#define zone_wakeup(zone) thread_wakeup((event_t)(zone))
#define zone_sleep(zone) \
(void) lck_mtx_sleep(&(zone)->lock, LCK_SLEEP_SPIN, (event_t)(zone), THREAD_UNINT);
lck_grp_t zone_locks_grp;
lck_grp_attr_t zone_locks_grp_attr;
#define lock_zone_init(zone) \
MACRO_BEGIN \
lck_attr_setdefault(&(zone)->lock_attr); \
lck_mtx_init_ext(&(zone)->lock, &(zone)->lock_ext, \
&zone_locks_grp, &(zone)->lock_attr); \
MACRO_END
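/*
 * lock_zone()/unlock_zone() are used throughout this file but are not
 * defined above; these are the standard forms (assumed here): a
 * spin-variant mutex acquire paired with a full mutex release.
 */
#define lock_zone(zone) \
MACRO_BEGIN \
lck_mtx_lock_spin(&(zone)->lock); \
MACRO_END
#define unlock_zone(zone) \
MACRO_BEGIN \
lck_mtx_unlock(&(zone)->lock); \
MACRO_END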
#define lock_try_zone(zone) lck_mtx_try_lock_spin(&zone->lock)
#define ZONE_PAGE_TABLE_FIRST_LEVEL_SIZE (32)
struct zone_page_table_entry * volatile zone_page_table[ZONE_PAGE_TABLE_FIRST_LEVEL_SIZE];
vm_size_t zone_page_table_used_size;
unsigned int zone_pages;
unsigned int zone_page_table_second_level_size;
unsigned int zone_page_table_second_level_shift_amount;
#define zone_page_table_first_level_slot(x) ((x) >> zone_page_table_second_level_shift_amount)
#define zone_page_table_second_level_slot(x) ((x) & (zone_page_table_second_level_size - 1))
void zone_page_table_expand(zone_page_index_t pindex);
struct zone_page_table_entry *zone_page_table_lookup(zone_page_index_t pindex);
decl_lck_mtx_data(, zone_gc_lock)
lck_attr_t zone_gc_lck_attr;
lck_grp_t zone_gc_lck_grp;
lck_grp_attr_t zone_gc_lck_grp_attr;
lck_mtx_ext_t zone_gc_lck_ext;
decl_simple_lock_data(, all_zones_lock)
zone_t first_zone;
zone_t *last_zone;
unsigned int num_zones;
boolean_t zone_gc_allowed = TRUE;
boolean_t zone_gc_forced = FALSE;
boolean_t panic_include_zprint = FALSE;
boolean_t zone_gc_allowed_by_time_throttle = TRUE;
vm_offset_t panic_kext_memory_info = 0;
vm_size_t panic_kext_memory_size = 0;
#define ZALLOC_DEBUG_ZONEGC 0x00000001
#define ZALLOC_DEBUG_ZCRAM 0x00000002
uint32_t zalloc_debug = 0;
static int log_records;
#define MAX_ZONE_NAME 32
static char zone_name_to_log[MAX_ZONE_NAME] = "";
boolean_t corruption_debug_flag = FALSE;
#if defined(__LP64__)
#define ZRECORDS_MAX 128000
#else
#define ZRECORDS_MAX 8000
#endif
#define ZRECORDS_DEFAULT 4000
#define ZOP_ALLOC 1
#define ZOP_FREE 0
static btlog_t *zlog_btlog;
static zone_t zone_of_interest = NULL;
static int
log_this_zone(const char *zonename, const char *logname)
{
int len;
const char *zc = zonename;
const char *lc = logname;
for (len = 1; len <= MAX_ZONE_NAME; zc++, lc++, len++) {
if (*zc != *lc && !(*zc == ' ' && *lc == '.'))
break;
if (*zc == '\0')
return TRUE;
}
return FALSE;
}
#define DO_LOGGING(z) (zlog_btlog && (z) == zone_of_interest)
extern boolean_t kmem_alloc_ready;
#if CONFIG_ZLEAKS
#pragma mark -
#pragma mark Zone Leak Detection
#define ZLEAK_STATE_ENABLED 0x01
#define ZLEAK_STATE_ACTIVE 0x02
#define ZLEAK_STATE_ACTIVATING 0x04
#define ZLEAK_STATE_FAILED 0x08
uint32_t zleak_state = 0;
boolean_t panic_include_ztrace = FALSE;
vm_size_t zleak_global_tracking_threshold;
vm_size_t zleak_per_zone_tracking_threshold;
unsigned int zleak_sample_factor = 1000;
unsigned int z_alloc_collisions = 0;
unsigned int z_trace_collisions = 0;
unsigned int z_alloc_overwrites = 0;
unsigned int z_trace_overwrites = 0;
unsigned int z_alloc_recorded = 0;
unsigned int z_trace_recorded = 0;
unsigned int z_total_conflicts = 0;
#pragma mark struct zallocation
struct zallocation {
uintptr_t za_element;
vm_size_t za_size;
uint32_t za_trace_index;
uint32_t za_hit_count;
};
uint32_t zleak_alloc_buckets = CONFIG_ZLEAK_ALLOCATION_MAP_NUM;
uint32_t zleak_trace_buckets = CONFIG_ZLEAK_TRACE_MAP_NUM;
vm_size_t zleak_max_zonemap_size;
static struct zallocation* zallocations;
static struct ztrace* ztraces;
struct ztrace* top_ztrace;
static lck_spin_t zleak_lock;
static lck_attr_t zleak_lock_attr;
static lck_grp_t zleak_lock_grp;
static lck_grp_attr_t zleak_lock_grp_attr;
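/*
 * zleak_init: called from zone_init.  Computes the tracking thresholds
 * (half the zone map for global tracking, an eighth of that per zone) and
 * honors the -zleakoff, zfactor, zleak-allocs and zleak-traces boot-args.
 * Only marks the feature ENABLED; activation is deferred until the zone
 * map actually crosses zleak_global_tracking_threshold.
 */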
static void
zleak_init(vm_size_t max_zonemap_size)
{
char scratch_buf[16];
boolean_t zleak_enable_flag = FALSE;
zleak_max_zonemap_size = max_zonemap_size;
zleak_global_tracking_threshold = max_zonemap_size / 2;
zleak_per_zone_tracking_threshold = zleak_global_tracking_threshold / 8;
if (PE_parse_boot_argn("-zleakoff", scratch_buf, sizeof(scratch_buf))) {
zleak_enable_flag = FALSE;
printf("zone leak detection disabled\n");
} else {
zleak_enable_flag = TRUE;
printf("zone leak detection enabled\n");
}
if (PE_parse_boot_argn("zfactor", &zleak_sample_factor, sizeof(zleak_sample_factor))) {
printf("Zone leak factor override: %u\n", zleak_sample_factor);
}
if (PE_parse_boot_argn("zleak-allocs", &zleak_alloc_buckets, sizeof(zleak_alloc_buckets))) {
printf("Zone leak alloc buckets override: %u\n", zleak_alloc_buckets);
if (zleak_alloc_buckets == 0 || (zleak_alloc_buckets & (zleak_alloc_buckets-1))) {
printf("Override isn't a power of two, bad things might happen!\n");
}
}
if (PE_parse_boot_argn("zleak-traces", &zleak_trace_buckets, sizeof(zleak_trace_buckets))) {
printf("Zone leak trace buckets override: %u\n", zleak_trace_buckets);
if (zleak_trace_buckets == 0 || (zleak_trace_buckets & (zleak_trace_buckets-1))) {
printf("Override isn't a power of two, bad things might happen!\n");
}
}
lck_grp_attr_setdefault(&zleak_lock_grp_attr);
lck_grp_init(&zleak_lock_grp, "zleak_lock", &zleak_lock_grp_attr);
lck_attr_setdefault(&zleak_lock_attr);
lck_spin_init(&zleak_lock, &zleak_lock_grp, &zleak_lock_attr);
if (zleak_enable_flag) {
zleak_state = ZLEAK_STATE_ENABLED;
}
}
#if CONFIG_ZLEAKS
int
get_zleak_state(void)
{
if (zleak_state & ZLEAK_STATE_FAILED)
return (-1);
if (zleak_state & ZLEAK_STATE_ACTIVE)
return (1);
return (0);
}
#endif
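/*
 * zleak_activate: allocate the zallocations and ztraces hash tables and
 * flip the state to ACTIVE.  The transient ACTIVATING state keeps two
 * threads from racing to allocate; the tables are only ever set up once.
 */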
kern_return_t
zleak_activate(void)
{
kern_return_t retval;
vm_size_t z_alloc_size = zleak_alloc_buckets * sizeof(struct zallocation);
vm_size_t z_trace_size = zleak_trace_buckets * sizeof(struct ztrace);
void *allocations_ptr = NULL;
void *traces_ptr = NULL;
if (zleak_state & (ZLEAK_STATE_ACTIVE | ZLEAK_STATE_ACTIVATING | ZLEAK_STATE_FAILED)) {
return KERN_SUCCESS;
}
lck_spin_lock(&zleak_lock);
if (zleak_state & (ZLEAK_STATE_ACTIVE | ZLEAK_STATE_ACTIVATING | ZLEAK_STATE_FAILED)) {
lck_spin_unlock(&zleak_lock);
return KERN_SUCCESS;
}
zleak_state |= ZLEAK_STATE_ACTIVATING;
lck_spin_unlock(&zleak_lock);
retval = kmem_alloc_kobject(kernel_map, (vm_offset_t*)&allocations_ptr, z_alloc_size, VM_KERN_MEMORY_OSFMK);
if (retval != KERN_SUCCESS) {
goto fail;
}
retval = kmem_alloc_kobject(kernel_map, (vm_offset_t*)&traces_ptr, z_trace_size, VM_KERN_MEMORY_OSFMK);
if (retval != KERN_SUCCESS) {
goto fail;
}
bzero(allocations_ptr, z_alloc_size);
bzero(traces_ptr, z_trace_size);
zallocations = allocations_ptr;
ztraces = traces_ptr;
top_ztrace = &ztraces[0];
lck_spin_lock(&zleak_lock);
zleak_state |= ZLEAK_STATE_ACTIVE;
zleak_state &= ~ZLEAK_STATE_ACTIVATING;
lck_spin_unlock(&zleak_lock);
return 0;
fail:
lck_spin_lock(&zleak_lock);
zleak_state |= ZLEAK_STATE_FAILED;
zleak_state &= ~ZLEAK_STATE_ACTIVATING;
lck_spin_unlock(&zleak_lock);
if (allocations_ptr != NULL) {
kmem_free(kernel_map, (vm_offset_t)allocations_ptr, z_alloc_size);
}
if (traces_ptr != NULL) {
kmem_free(kernel_map, (vm_offset_t)traces_ptr, z_trace_size);
}
return retval;
}
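/*
 * zleak_log: record one sampled allocation.  The address hashes into the
 * zallocations table and the backtrace into the ztraces table; hash
 * collisions are counted and tolerated rather than chained.  Returns
 * FALSE only when the zleak lock could not be taken, so the caller may
 * re-arm its sample counter.
 */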
static boolean_t
zleak_log(uintptr_t* bt,
uintptr_t addr,
uint32_t depth,
vm_size_t allocation_size)
{
if (!lck_spin_try_lock(&zleak_lock)) {
z_total_conflicts++;
return FALSE;
}
struct zallocation* allocation = &zallocations[hashaddr(addr, zleak_alloc_buckets)];
uint32_t trace_index = hashbacktrace(bt, depth, zleak_trace_buckets);
struct ztrace* trace = &ztraces[trace_index];
allocation->za_hit_count++;
trace->zt_hit_count++;
if (allocation->za_element != (uintptr_t) 0 && trace_index == allocation->za_trace_index) {
z_alloc_collisions++;
lck_spin_unlock(&zleak_lock);
return TRUE;
}
if (trace->zt_size > 0 && bcmp(trace->zt_stack, bt, (depth * sizeof(uintptr_t))) != 0 ) {
trace->zt_collisions++;
z_trace_collisions++;
lck_spin_unlock(&zleak_lock);
return TRUE;
} else if (trace->zt_size > 0) {
trace->zt_size += allocation_size;
} else {
if (trace->zt_depth != 0)
z_trace_overwrites++;
z_trace_recorded++;
trace->zt_size = allocation_size;
memcpy(trace->zt_stack, bt, (depth * sizeof(uintptr_t)) );
trace->zt_depth = depth;
trace->zt_collisions = 0;
}
if (allocation->za_element != (uintptr_t) 0) {
z_alloc_collisions++;
struct ztrace* associated_trace = &ztraces[allocation->za_trace_index];
associated_trace->zt_size -= allocation->za_size;
} else if (allocation->za_trace_index != 0) {
z_alloc_overwrites++;
}
allocation->za_element = addr;
allocation->za_trace_index = trace_index;
allocation->za_size = allocation_size;
z_alloc_recorded++;
if (top_ztrace->zt_size < trace->zt_size)
top_ztrace = trace;
lck_spin_unlock(&zleak_lock);
return TRUE;
}
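/*
 * zleak_free: if this address is currently tracked, subtract the
 * allocation from its trace's outstanding size and release the slot.  The
 * unlocked pre-check keeps the common (untracked) case cheap; the test is
 * repeated under the lock before anything is modified.
 */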
static void
zleak_free(uintptr_t addr,
vm_size_t allocation_size)
{
if (addr == (uintptr_t) 0)
return;
struct zallocation* allocation = &zallocations[hashaddr(addr, zleak_alloc_buckets)];
if (allocation->za_element == addr && allocation->za_trace_index < zleak_trace_buckets) {
lck_spin_lock(&zleak_lock);
if (allocation->za_element == addr && allocation->za_trace_index < zleak_trace_buckets) {
struct ztrace *trace;
if (allocation->za_size != allocation_size) {
panic("Freeing as size %lu memory that was allocated with size %lu\n",
(uintptr_t)allocation_size, (uintptr_t)allocation->za_size);
}
trace = &ztraces[allocation->za_trace_index];
if (trace->zt_size > 0) {
trace->zt_size -= allocation_size;
}
allocation->za_element = 0;
}
lck_spin_unlock(&zleak_lock);
}
}
#endif
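/*
 * fastbacktrace: walk saved frame pointers on the current kernel stack,
 * storing up to max_frames return addresses into bt[] and zero-filling
 * the remainder.  Bails out as soon as a frame pointer leaves the stack
 * bounds.  Returns the number of real frames captured.
 */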
uint32_t
fastbacktrace(uintptr_t* bt, uint32_t max_frames)
{
uintptr_t* frameptr = NULL, *frameptr_next = NULL;
uintptr_t retaddr = 0;
uint32_t frame_index = 0, frames = 0;
uintptr_t kstackb, kstackt;
thread_t cthread = current_thread();
if (__improbable(cthread == NULL))
return 0;
kstackb = cthread->kernel_stack;
kstackt = kstackb + kernel_stack_size;
frameptr = __builtin_frame_address(0);
if (((uintptr_t)frameptr > kstackt) || ((uintptr_t)frameptr < kstackb))
frameptr = NULL;
while (frameptr != NULL && frame_index < max_frames ) {
frameptr_next = (uintptr_t*) *frameptr;
if (frameptr_next == NULL)
break;
if (((uintptr_t)frameptr_next > kstackt) || ((uintptr_t)frameptr_next < kstackb))
break;
retaddr = *(frameptr + 1);
bt[frame_index++] = retaddr;
frameptr = frameptr_next;
}
frames = frame_index;
while (frame_index < max_frames)
bt[frame_index++] = 0;
return frames;
}
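/*
 * hash_mix: avalanche the bits of x (an integer mix in the style of the
 * Thomas Wang / Bob Jenkins hashes); raw addresses alone hash poorly.
 */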
uintptr_t
hash_mix(uintptr_t x)
{
#ifndef __LP64__
x += ~(x << 15);
x ^= (x >> 10);
x += (x << 3 );
x ^= (x >> 6 );
x += ~(x << 11);
x ^= (x >> 16);
#else
x += ~(x << 32);
x ^= (x >> 22);
x += ~(x << 13);
x ^= (x >> 8 );
x += (x << 3 );
x ^= (x >> 15);
x += ~(x << 27);
x ^= (x >> 31);
#endif
return x;
}
uint32_t
hashbacktrace(uintptr_t* bt, uint32_t depth, uint32_t max_size)
{
uintptr_t hash = 0;
uintptr_t mask = max_size - 1;
while (depth) {
hash += bt[--depth];
}
hash = hash_mix(hash) & mask;
assert(hash < max_size);
return (uint32_t) hash;
}
uint32_t
hashaddr(uintptr_t pt, uint32_t max_size)
{
uintptr_t hash = 0;
uintptr_t mask = max_size - 1;
hash = hash_mix(pt) & mask;
assert(hash < max_size);
return (uint32_t) hash;
}
#pragma mark -
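/*
 * zinit: create a zone holding elements of "size" bytes, limited to "max"
 * bytes in total and grown "alloc" bytes at a time.  Rounds size up to
 * pointer alignment (leaving room for the freelist pointer and its
 * backup), picks an allocation granule of one to five pages that wastes
 * at most ~1% of each chunk, and decides whether per-page free lists
 * (use_page_list) are worthwhile.  The very first zone, the zone of
 * zones, is carved from the stolen zdata region.
 */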
zone_t
zinit(
vm_size_t size,
vm_size_t max,
vm_size_t alloc,
const char *name)
{
zone_t z;
boolean_t use_page_list = FALSE;
if (zone_zone == ZONE_NULL) {
z = (struct zone *)zdata;
} else
z = (zone_t) zalloc(zone_zone);
if (z == ZONE_NULL)
return(ZONE_NULL);
vm_size_t minimum_element_size = sizeof(vm_offset_t) * 2;
if (size < minimum_element_size)
size = minimum_element_size;
size = ((size-1) + sizeof(vm_offset_t)) -
((size-1) % sizeof(vm_offset_t));
if (alloc == 0)
alloc = PAGE_SIZE;
alloc = round_page(alloc);
max = round_page(max);
#if ZONE_ALIAS_ADDR
if ((size < PAGE_SIZE) && (PAGE_SIZE % size <= PAGE_SIZE / 10))
alloc = PAGE_SIZE;
else
#endif
#if defined(__LP64__)
if (((alloc % size) != 0) || (alloc > PAGE_SIZE * 8))
#endif
{
vm_size_t best, waste; unsigned int i;
best = PAGE_SIZE;
waste = best % size;
for (i = 1; i <= 5; i++) {
vm_size_t tsize, twaste;
tsize = i * PAGE_SIZE;
if ((tsize % size) < (tsize / 100)) {
alloc = tsize;
goto use_this_allocation;
}
twaste = tsize % size;
if (twaste < waste)
best = tsize, waste = twaste;
}
if (alloc <= best || (alloc % size >= waste))
alloc = best;
}
use_this_allocation:
if (max && (max < alloc))
max = alloc;
if (alloc == PAGE_SIZE && zone_zone != ZONE_NULL) {
vm_offset_t first_element_offset;
size_t zone_page_metadata_size = sizeof(struct zone_page_metadata);
if (zone_page_metadata_size % ZONE_ELEMENT_ALIGNMENT == 0) {
first_element_offset = zone_page_metadata_size;
} else {
first_element_offset = zone_page_metadata_size + (ZONE_ELEMENT_ALIGNMENT - (zone_page_metadata_size % ZONE_ELEMENT_ALIGNMENT));
}
if (((PAGE_SIZE - first_element_offset) % size) <= PAGE_SIZE / 100) {
use_page_list = TRUE;
}
}
z->free_elements = NULL;
queue_init(&z->pages.any_free_foreign);
queue_init(&z->pages.all_free);
queue_init(&z->pages.intermediate);
queue_init(&z->pages.all_used);
z->cur_size = 0;
z->page_count = 0;
z->max_size = max;
z->elem_size = size;
z->alloc_size = alloc;
z->zone_name = name;
z->count = 0;
z->countfree = 0;
z->sum_count = 0LL;
z->doing_alloc_without_vm_priv = FALSE;
z->doing_alloc_with_vm_priv = FALSE;
z->doing_gc = FALSE;
z->exhaustible = FALSE;
z->collectable = TRUE;
z->allows_foreign = FALSE;
z->expandable = TRUE;
z->waiting = FALSE;
z->async_pending = FALSE;
z->caller_acct = TRUE;
z->noencrypt = FALSE;
z->no_callout = FALSE;
z->async_prio_refill = FALSE;
z->gzalloc_exempt = FALSE;
z->alignment_required = FALSE;
z->use_page_list = use_page_list;
z->prio_refill_watermark = 0;
z->zone_replenish_thread = NULL;
z->zp_count = 0;
#if CONFIG_ZLEAKS
z->zleak_capture = 0;
z->zleak_on = FALSE;
#endif
#if ZONE_DEBUG
z->active_zones.next = z->active_zones.prev = NULL;
zone_debug_enable(z);
#endif
lock_zone_init(z);
z->next_zone = ZONE_NULL;
simple_lock(&all_zones_lock);
*last_zone = z;
last_zone = &z->next_zone;
z->index = num_zones;
if (zinfo_per_task) {
if (num_zones > ZONES_MAX)
z->index = ZONES_MAX;
}
num_zones++;
simple_unlock(&all_zones_lock);
if (log_this_zone(z->zone_name, zone_name_to_log)) {
zone_of_interest = z;
}
if (zone_of_interest != NULL && zlog_btlog == NULL && kmem_alloc_ready) {
zlog_btlog = btlog_create(log_records, MAX_ZTRACE_DEPTH, NULL, NULL, NULL);
if (zlog_btlog) {
printf("zone: logging started for zone %s\n", zone_of_interest->zone_name);
} else {
printf("zone: couldn't allocate memory for zrecords, turning off zlog logging\n");
zone_of_interest = NULL;
}
}
#if CONFIG_GZALLOC
gzalloc_zone_init(z);
#endif
return(z);
}
unsigned zone_replenish_loops, zone_replenish_wakeups, zone_replenish_wakeups_initiated, zone_replenish_throttle_count;
static void zone_replenish_thread(zone_t);
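/*
 * zone_replenish_thread: one dedicated, VM-privileged thread per
 * async_prio_refill zone.  It sleeps until woken from zalloc and then
 * grows the zone until its free space is back above
 * prio_refill_watermark elements, falling back to the kernel map if the
 * zone map is exhausted and waiting for pages on resource shortage.
 */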
static void zone_replenish_thread(zone_t z) {
vm_size_t free_size;
current_thread()->options |= TH_OPT_VMPRIV;
for (;;) {
lock_zone(z);
assert(z->prio_refill_watermark != 0);
while ((free_size = (z->cur_size - (z->count * z->elem_size))) < (z->prio_refill_watermark * z->elem_size)) {
assert(z->doing_alloc_without_vm_priv == FALSE);
assert(z->doing_alloc_with_vm_priv == FALSE);
assert(z->async_prio_refill == TRUE);
unlock_zone(z);
int zflags = KMA_KOBJECT|KMA_NOPAGEWAIT;
vm_offset_t space, alloc_size;
kern_return_t kr;
if (vm_pool_low())
alloc_size = round_page(z->elem_size);
else
alloc_size = z->alloc_size;
if (z->noencrypt)
zflags |= KMA_NOENCRYPT;
kr = kernel_memory_allocate(zone_map, &space, alloc_size, 0, zflags, VM_KERN_MEMORY_ZONE);
if (kr == KERN_SUCCESS) {
#if ZONE_ALIAS_ADDR
if (alloc_size == PAGE_SIZE)
space = zone_alias_addr(space);
#endif
zcram(z, space, alloc_size);
} else if (kr == KERN_RESOURCE_SHORTAGE) {
VM_PAGE_WAIT();
} else if (kr == KERN_NO_SPACE) {
kr = kernel_memory_allocate(kernel_map, &space, alloc_size, 0, zflags, VM_KERN_MEMORY_ZONE);
if (kr == KERN_SUCCESS) {
#if ZONE_ALIAS_ADDR
if (alloc_size == PAGE_SIZE)
space = zone_alias_addr(space);
#endif
zcram(z, space, alloc_size);
} else {
assert_wait_timeout(&z->zone_replenish_thread, THREAD_UNINT, 1, 100 * NSEC_PER_USEC);
thread_block(THREAD_CONTINUE_NULL);
}
}
lock_zone(z);
zone_replenish_loops++;
}
unlock_zone(z);
thread_wakeup(z);
assert_wait(&z->zone_replenish_thread, THREAD_UNINT);
thread_block(THREAD_CONTINUE_NULL);
zone_replenish_wakeups++;
}
}
void
zone_prio_refill_configure(zone_t z, vm_size_t low_water_mark) {
z->prio_refill_watermark = low_water_mark;
z->async_prio_refill = TRUE;
OSMemoryBarrier();
kern_return_t tres = kernel_thread_start_priority((thread_continue_t)zone_replenish_thread, z, MAXPRI_KERNEL, &z->zone_replenish_thread);
if (tres != KERN_SUCCESS) {
panic("zone_prio_refill_configure, thread create: 0x%x", tres);
}
thread_deallocate(z->zone_replenish_thread);
}
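/*
 * zcram: carve the memory [newmem, newmem + size) into elements and add
 * them to the zone.  For use_page_list zones each page gets a
 * zone_page_metadata header first, with elements packed after it at
 * ZONE_ELEMENT_ALIGNMENT.  Memory from outside the zone map is only
 * legal for zones that accept foreign memory.
 */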
void
zcram(
zone_t zone,
vm_offset_t newmem,
vm_size_t size)
{
vm_size_t elem_size;
boolean_t from_zm = FALSE;
assert(zone != ZONE_NULL && newmem != (vm_offset_t)0);
assert(!zone->collectable || zone->allows_foreign
|| (from_zone_map(newmem, size)));
elem_size = zone->elem_size;
if (from_zone_map(newmem, size))
from_zm = TRUE;
if (zalloc_debug & ZALLOC_DEBUG_ZCRAM)
kprintf("zcram(%p[%s], 0x%lx%s, 0x%lx)\n", zone, zone->zone_name,
(unsigned long)newmem, from_zm ? "" : "[F]", (unsigned long)size);
if (from_zm && !zone->use_page_list)
zone_page_init(newmem, size);
ZONE_PAGE_COUNT_INCR(zone, (size / PAGE_SIZE));
lock_zone(zone);
if (zone->use_page_list) {
struct zone_page_metadata *page_metadata;
size_t zone_page_metadata_size = sizeof(struct zone_page_metadata);
assert((newmem & PAGE_MASK) == 0);
assert((size & PAGE_MASK) == 0);
for (; size > 0; newmem += PAGE_SIZE, size -= PAGE_SIZE) {
vm_size_t pos_in_page;
page_metadata = (struct zone_page_metadata *)(newmem);
page_metadata->pages.next = NULL;
page_metadata->pages.prev = NULL;
page_metadata->elements = NULL;
page_metadata->zone = zone;
page_metadata->alloc_count = 0;
page_metadata->free_count = 0;
enqueue_tail(&zone->pages.all_used, (queue_entry_t)page_metadata);
vm_offset_t first_element_offset;
if (zone_page_metadata_size % ZONE_ELEMENT_ALIGNMENT == 0){
first_element_offset = zone_page_metadata_size;
} else {
first_element_offset = zone_page_metadata_size + (ZONE_ELEMENT_ALIGNMENT - (zone_page_metadata_size % ZONE_ELEMENT_ALIGNMENT));
}
for (pos_in_page = first_element_offset; (newmem + pos_in_page + elem_size) <= (vm_offset_t)(newmem + PAGE_SIZE); pos_in_page += elem_size) { /* an element ending exactly at the page boundary still fits */
page_metadata->alloc_count++;
zone->count++;
free_to_zone(zone, newmem + pos_in_page, FALSE);
zone->cur_size += elem_size;
}
}
} else {
while (size >= elem_size) {
zone->count++;
if (newmem == (vm_offset_t)zone) {
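/* skip the element occupied by the zone structure itself (zone_zone lives at the start of zdata) */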
} else {
free_to_zone(zone, newmem, FALSE);
}
if (from_zm)
zone_page_alloc(newmem, elem_size);
size -= elem_size;
newmem += elem_size;
zone->cur_size += elem_size;
}
}
unlock_zone(zone);
}
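/*
 * zone_steal_memory: grab enough early (pmap-stolen) memory to hold the
 * first dozen zone structures, before the VM system can allocate.
 */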
void
zone_steal_memory(void)
{
#if CONFIG_GZALLOC
gzalloc_configure();
#endif
zdata_size = 12 * sizeof(struct zone);
zdata_size = round_page(zdata_size);
zdata = (vm_offset_t)pmap_steal_memory(zdata_size);
}
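/*
 * zfill: pre-populate a zone with at least "nelem" elements using memory
 * from the kernel map (marking the zone as accepting foreign memory).
 * Returns the number of elements actually added, or 0 on failure.
 */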
int
zfill(
zone_t zone,
int nelem)
{
kern_return_t kr;
vm_size_t size;
vm_offset_t memory;
int nalloc;
assert(nelem > 0);
if (nelem <= 0)
return 0;
size = nelem * zone->elem_size;
size = round_page(size);
kr = kmem_alloc_kobject(kernel_map, &memory, size, VM_KERN_MEMORY_ZONE);
if (kr != KERN_SUCCESS)
return 0;
zone_change(zone, Z_FOREIGN, TRUE);
zcram(zone, memory, size);
nalloc = (int)(size / zone->elem_size);
assert(nalloc >= nelem);
return nalloc;
}
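/*
 * zone_bootstrap: parse the zone-related boot-args, initialize poisoning
 * and logging state, and bring up the zone of zones from the stolen
 * zdata region so that zinit can allocate zone structures thereafter.
 */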
void
zone_bootstrap(void)
{
char temp_buf[16];
if (PE_parse_boot_argn("-zinfop", temp_buf, sizeof(temp_buf))) {
zinfo_per_task = TRUE;
}
if (!PE_parse_boot_argn("zalloc_debug", &zalloc_debug, sizeof(zalloc_debug)))
zalloc_debug = 0;
zp_init();
if (PE_parse_boot_argn("-zc", temp_buf, sizeof(temp_buf))) {
corruption_debug_flag = TRUE;
}
if (PE_parse_boot_argn("zlog", zone_name_to_log, sizeof(zone_name_to_log)) == TRUE) {
if (PE_parse_boot_argn("zrecs", &log_records, sizeof(log_records)) == TRUE) {
log_records = MIN(ZRECORDS_MAX, log_records);
} else {
log_records = ZRECORDS_DEFAULT;
}
}
simple_lock_init(&all_zones_lock, 0);
first_zone = ZONE_NULL;
last_zone = &first_zone;
num_zones = 0;
thread_call_setup(&call_async_alloc, zalloc_async, NULL);
assert(zone_zone == ZONE_NULL);
lck_grp_attr_setdefault(&zone_locks_grp_attr);
lck_grp_init(&zone_locks_grp, "zone_locks", &zone_locks_grp_attr);
zone_zone = zinit(sizeof(struct zone), 128 * sizeof(struct zone),
sizeof(struct zone), "zones");
zone_change(zone_zone, Z_COLLECT, FALSE);
zone_change(zone_zone, Z_CALLERACCT, FALSE);
zone_change(zone_zone, Z_NOENCRYPT, TRUE);
zcram(zone_zone, zdata, zdata_size);
VM_PAGE_MOVE_STOLEN(atop_64(zdata_size));
if (zinfo_per_task) {
vm_size_t zisize = sizeof(zinfo_usage_store_t) * ZINFO_SLOTS;
unsigned int i;
for (i = 0; i < num_fake_zones; i++)
fake_zones[i].init(ZINFO_SLOTS - num_fake_zones + i);
zinfo_zone = zinit(zisize, zisize * CONFIG_TASK_MAX,
zisize, "per task zinfo");
zone_change(zinfo_zone, Z_CALLERACCT, FALSE);
}
}
void
zinfo_task_init(task_t task)
{
if (zinfo_per_task) {
task->tkm_zinfo = zalloc(zinfo_zone);
memset(task->tkm_zinfo, 0, sizeof(zinfo_usage_store_t) * ZINFO_SLOTS);
} else {
task->tkm_zinfo = NULL;
}
}
void
zinfo_task_free(task_t task)
{
assert(task != kernel_task);
if (task->tkm_zinfo != NULL) {
zfree(zinfo_zone, task->tkm_zinfo);
task->tkm_zinfo = NULL;
}
}
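/*
 * zone_init: create the zone submap of the kernel map and size the
 * two-level zone page table to cover it; also initializes the GC lock
 * and, when configured, gzalloc and zone-leak detection.
 */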
void
zone_init(
vm_size_t max_zonemap_size)
{
kern_return_t retval;
vm_offset_t zone_min;
vm_offset_t zone_max;
retval = kmem_suballoc(kernel_map, &zone_min, max_zonemap_size,
FALSE, VM_FLAGS_ANYWHERE | VM_FLAGS_PERMANENT | VM_MAKE_TAG(VM_KERN_MEMORY_ZONE),
&zone_map);
if (retval != KERN_SUCCESS)
panic("zone_init: kmem_suballoc failed");
zone_max = zone_min + round_page(max_zonemap_size);
#if CONFIG_GZALLOC
gzalloc_init(max_zonemap_size);
#endif
zone_map_min_address = zone_min;
zone_map_max_address = zone_max;
#if defined(__LP64__)
if (VM_PAGE_UNPACK_PTR(VM_PAGE_PACK_PTR(zone_map_min_address)) != (vm_page_t)zone_map_min_address)
panic("VM_PAGE_PACK_PTR failed on zone_map_min_address - %p", (void *)zone_map_min_address);
if (VM_PAGE_UNPACK_PTR(VM_PAGE_PACK_PTR(zone_map_max_address)) != (vm_page_t)zone_map_max_address)
panic("VM_PAGE_PACK_PTR failed on zone_map_max_address - %p", (void *)zone_map_max_address);
#endif
zone_pages = (unsigned int)atop_kernel(zone_max - zone_min);
zone_page_table_used_size = sizeof(zone_page_table);
zone_page_table_second_level_size = 1;
zone_page_table_second_level_shift_amount = 0;
while ((zone_page_table_first_level_slot(zone_pages-1)) >= ZONE_PAGE_TABLE_FIRST_LEVEL_SIZE) {
zone_page_table_second_level_size <<= 1;
zone_page_table_second_level_shift_amount++;
}
lck_grp_attr_setdefault(&zone_gc_lck_grp_attr);
lck_grp_init(&zone_gc_lck_grp, "zone_gc", &zone_gc_lck_grp_attr);
lck_attr_setdefault(&zone_gc_lck_attr);
lck_mtx_init_ext(&zone_gc_lock, &zone_gc_lck_ext, &zone_gc_lck_grp, &zone_gc_lck_attr);
#if CONFIG_ZLEAKS
zleak_init(max_zonemap_size);
#endif
}
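/*
 * zone_page_table_expand: ensure the second-level array covering pindex
 * exists.  Losing the compare-and-swap race simply frees the redundant
 * array, so no lock is required.
 */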
void
zone_page_table_expand(zone_page_index_t pindex)
{
unsigned int first_index;
struct zone_page_table_entry * volatile * first_level_ptr;
assert(pindex < zone_pages);
first_index = zone_page_table_first_level_slot(pindex);
first_level_ptr = &zone_page_table[first_index];
if (*first_level_ptr == NULL) {
vm_offset_t second_level_array = 0;
vm_size_t second_level_size = round_page(zone_page_table_second_level_size * sizeof(struct zone_page_table_entry));
zone_page_index_t i;
struct zone_page_table_entry *entry_array;
if (kmem_alloc_kobject(zone_map, &second_level_array,
second_level_size, VM_KERN_MEMORY_OSFMK) != KERN_SUCCESS) {
panic("zone_page_table_expand");
}
zone_map_table_page_count += (second_level_size / PAGE_SIZE);
entry_array = (struct zone_page_table_entry *)second_level_array;
for (i=0; i < zone_page_table_second_level_size; i++) {
entry_array[i].alloc_count = ZONE_PAGE_UNUSED;
entry_array[i].collect_count = 0;
}
if (OSCompareAndSwapPtr(NULL, entry_array, first_level_ptr)) {
OSAddAtomicLong(second_level_size, &zone_page_table_used_size);
} else {
kmem_free(zone_map, second_level_array, second_level_size);
zone_map_table_page_count -= (second_level_size / PAGE_SIZE);
}
} else {
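/* slot already populated by another thread; nothing to do */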
}
}
struct zone_page_table_entry *
zone_page_table_lookup(zone_page_index_t pindex)
{
unsigned int first_index = zone_page_table_first_level_slot(pindex);
struct zone_page_table_entry *second_level = zone_page_table[first_index];
if (second_level) {
return &second_level[zone_page_table_second_level_slot(pindex)];
}
return NULL;
}
extern volatile SInt32 kfree_nop_count;
#pragma mark -
#pragma mark zalloc_canblock
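/*
 * zalloc_internal: the common allocation path behind zalloc,
 * zalloc_noblock and zalloc_nopagewait.  In order: try gzalloc, sample
 * for zone-leak logging, throttle against the replenish thread for
 * async_prio_refill zones, pop an element, and if the zone is empty (and
 * the caller may block) grow it with kernel_memory_allocate, retrying
 * and eventually forcing a GC or panicking.  On success the element's
 * poison fill is verified if it was poisoned on free, and the
 * primary/backup freelist words are overwritten with ZP_POISON.
 */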
static void *
zalloc_internal(
zone_t zone,
boolean_t canblock,
boolean_t nopagewait)
{
vm_offset_t addr = 0;
kern_return_t retval;
uintptr_t zbt[MAX_ZTRACE_DEPTH];
int numsaved = 0;
boolean_t zone_replenish_wakeup = FALSE, zone_alloc_throttle = FALSE;
#if CONFIG_GZALLOC || ZONE_DEBUG
boolean_t did_gzalloc = FALSE;
#endif
thread_t thr = current_thread();
boolean_t check_poison = FALSE;
boolean_t set_doing_alloc_with_vm_priv = FALSE;
#if CONFIG_ZLEAKS
uint32_t zleak_tracedepth = 0;
#endif
assert(zone != ZONE_NULL);
#if CONFIG_GZALLOC
addr = gzalloc_alloc(zone, canblock);
did_gzalloc = (addr != 0);
#endif
if (__improbable(DO_LOGGING(zone)))
numsaved = OSBacktrace((void*) zbt, MAX_ZTRACE_DEPTH);
#if CONFIG_ZLEAKS
if (__improbable(zone->zleak_on && sample_counter(&zone->zleak_capture, zleak_sample_factor) == TRUE)) {
if (numsaved == 0)
zleak_tracedepth = fastbacktrace(zbt, MAX_ZTRACE_DEPTH);
else
zleak_tracedepth = numsaved;
}
#endif
lock_zone(zone);
if (zone->async_prio_refill && zone->zone_replenish_thread) {
do {
vm_size_t zfreec = (zone->cur_size - (zone->count * zone->elem_size));
vm_size_t zrefillwm = zone->prio_refill_watermark * zone->elem_size;
zone_replenish_wakeup = (zfreec < zrefillwm);
zone_alloc_throttle = (zfreec < (zrefillwm / 2)) && ((thr->options & TH_OPT_VMPRIV) == 0);
if (zone_replenish_wakeup) {
zone_replenish_wakeups_initiated++;
unlock_zone(zone);
thread_wakeup(&zone->zone_replenish_thread);
if (zone_alloc_throttle) {
zone_replenish_throttle_count++;
assert_wait_timeout(zone, THREAD_UNINT, 1, NSEC_PER_MSEC);
thread_block(THREAD_CONTINUE_NULL);
}
lock_zone(zone);
}
} while (zone_alloc_throttle == TRUE);
}
if (__probable(addr == 0))
addr = try_alloc_from_zone(zone, &check_poison);
while ((addr == 0) && canblock) {
if ((zone->doing_alloc_without_vm_priv || zone->doing_alloc_with_vm_priv) &&
(((thr->options & TH_OPT_VMPRIV) == 0) || zone->doing_alloc_with_vm_priv)) {
zone->waiting = TRUE;
zone_sleep(zone);
} else if (zone->doing_gc) {
zone->waiting = TRUE;
zone_sleep(zone);
} else {
vm_offset_t space;
vm_size_t alloc_size;
int retry = 0;
if ((zone->cur_size + zone->elem_size) >
zone->max_size) {
if (zone->exhaustible)
break;
if (zone->expandable) {
zone->max_size += (zone->max_size >> 1);
} else {
unlock_zone(zone);
panic_include_zprint = TRUE;
#if CONFIG_ZLEAKS
if (zleak_state & ZLEAK_STATE_ACTIVE)
panic_include_ztrace = TRUE;
#endif
panic("zalloc: zone \"%s\" empty.", zone->zone_name);
}
}
if ((thr->options & TH_OPT_VMPRIV)) {
zone->doing_alloc_with_vm_priv = TRUE;
set_doing_alloc_with_vm_priv = TRUE;
} else {
zone->doing_alloc_without_vm_priv = TRUE;
}
unlock_zone(zone);
for (;;) {
int zflags = KMA_KOBJECT|KMA_NOPAGEWAIT;
if (vm_pool_low() || retry >= 1)
alloc_size =
round_page(zone->elem_size);
else
alloc_size = zone->alloc_size;
if (zone->noencrypt)
zflags |= KMA_NOENCRYPT;
retval = kernel_memory_allocate(zone_map, &space, alloc_size, 0, zflags, VM_KERN_MEMORY_ZONE);
if (retval == KERN_SUCCESS) {
#if ZONE_ALIAS_ADDR
if (alloc_size == PAGE_SIZE)
space = zone_alias_addr(space);
#endif
#if CONFIG_ZLEAKS
if ((zleak_state & (ZLEAK_STATE_ENABLED | ZLEAK_STATE_ACTIVE)) == ZLEAK_STATE_ENABLED) {
if (zone_map->size >= zleak_global_tracking_threshold) {
kern_return_t kr;
kr = zleak_activate();
if (kr != KERN_SUCCESS) {
printf("Failed to activate live zone leak debugging (%d).\n", kr);
}
}
}
if ((zleak_state & ZLEAK_STATE_ACTIVE) && !(zone->zleak_on)) {
if (zone->cur_size > zleak_per_zone_tracking_threshold) {
zone->zleak_on = TRUE;
}
}
#endif
zcram(zone, space, alloc_size);
break;
} else if (retval != KERN_RESOURCE_SHORTAGE) {
retry++;
if (retry == 2) {
zone_gc(TRUE);
printf("zalloc did gc\n");
zone_display_zprint();
}
if (retry == 3) {
panic_include_zprint = TRUE;
#if CONFIG_ZLEAKS
if ((zleak_state & ZLEAK_STATE_ACTIVE)) {
panic_include_ztrace = TRUE;
}
#endif
if (retval == KERN_NO_SPACE) {
zone_t zone_largest = zone_find_largest();
panic("zalloc: zone map exhausted while allocating from zone %s, likely due to memory leak in zone %s (%lu total bytes, %d elements allocated)",
zone->zone_name, zone_largest->zone_name,
(unsigned long)zone_largest->cur_size, zone_largest->count);
}
panic("zalloc: \"%s\" (%d elements) retry fail %d, kfree_nop_count: %d", zone->zone_name, zone->count, retval, (int)kfree_nop_count);
}
} else {
break;
}
}
lock_zone(zone);
if (set_doing_alloc_with_vm_priv == TRUE)
zone->doing_alloc_with_vm_priv = FALSE;
else
zone->doing_alloc_without_vm_priv = FALSE;
if (zone->waiting) {
zone->waiting = FALSE;
zone_wakeup(zone);
}
addr = try_alloc_from_zone(zone, &check_poison);
if (addr == 0 &&
retval == KERN_RESOURCE_SHORTAGE) {
if (nopagewait == TRUE)
break;
unlock_zone(zone);
VM_PAGE_WAIT();
lock_zone(zone);
}
}
if (addr == 0)
addr = try_alloc_from_zone(zone, &check_poison);
}
#if CONFIG_ZLEAKS
if (addr && zleak_tracedepth > 0) {
if (!zleak_log(zbt, addr, zleak_tracedepth, zone->elem_size)) {
zone->zleak_capture = zleak_sample_factor;
}
}
#endif
if ((addr == 0) && (!canblock || nopagewait) && (zone->async_pending == FALSE) && (zone->no_callout == FALSE) && (zone->exhaustible == FALSE) && (!vm_pool_low())) {
zone->async_pending = TRUE;
unlock_zone(zone);
thread_call_enter(&call_async_alloc);
lock_zone(zone);
addr = try_alloc_from_zone(zone, &check_poison);
}
if (__improbable(DO_LOGGING(zone) && addr)) {
btlog_add_entry(zlog_btlog, (void *)addr, ZOP_ALLOC, (void **)zbt, numsaved);
}
vm_offset_t inner_size = zone->elem_size;
#if ZONE_DEBUG
if (!did_gzalloc && addr && zone_debug_enabled(zone)) {
enqueue_tail(&zone->active_zones, (queue_entry_t)addr);
addr += ZONE_DEBUG_OFFSET;
inner_size -= ZONE_DEBUG_OFFSET;
}
#endif
unlock_zone(zone);
if (__improbable(check_poison && addr)) {
vm_offset_t *element_cursor = ((vm_offset_t *) addr) + 1;
vm_offset_t *backup = get_backup_ptr(inner_size, (vm_offset_t *) addr);
for ( ; element_cursor < backup ; element_cursor++)
if (__improbable(*element_cursor != ZP_POISON))
zone_element_was_modified_panic(zone,
addr,
*element_cursor,
ZP_POISON,
((vm_offset_t)element_cursor) - addr);
}
if (addr) {
vm_offset_t *primary = (vm_offset_t *) addr;
vm_offset_t *backup = get_backup_ptr(inner_size, primary);
*primary = ZP_POISON;
*backup = ZP_POISON;
}
TRACE_MACHLEAKS(ZALLOC_CODE, ZALLOC_CODE_2, zone->elem_size, addr);
if (addr) {
task_t task;
zinfo_usage_t zinfo;
vm_size_t sz = zone->elem_size;
if (zone->caller_acct)
ledger_credit(thr->t_ledger, task_ledgers.tkm_private, sz);
else
ledger_credit(thr->t_ledger, task_ledgers.tkm_shared, sz);
if ((task = thr->task) != NULL && (zinfo = task->tkm_zinfo) != NULL)
OSAddAtomic64(sz, (int64_t *)&zinfo[zone->index].alloc);
}
return((void *)addr);
}
void *
zalloc(zone_t zone)
{
return (zalloc_internal(zone, TRUE, FALSE));
}
void *
zalloc_noblock(zone_t zone)
{
return (zalloc_internal(zone, FALSE, FALSE));
}
void *
zalloc_nopagewait(zone_t zone)
{
return (zalloc_internal(zone, TRUE, TRUE));
}
void *
zalloc_canblock(zone_t zone, boolean_t canblock)
{
return (zalloc_internal(zone, canblock, FALSE));
}
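/*
 * zalloc_async: thread call that services zones which reported an
 * allocation failure with async_pending set, doing one blocking
 * alloc/free pair per zone to prime each free list.
 */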
void
zalloc_async(
__unused thread_call_param_t p0,
__unused thread_call_param_t p1)
{
zone_t current_z = NULL, head_z;
unsigned int max_zones, i;
void *elt = NULL;
boolean_t pending = FALSE;
simple_lock(&all_zones_lock);
head_z = first_zone;
max_zones = num_zones;
simple_unlock(&all_zones_lock);
current_z = head_z;
for (i = 0; i < max_zones; i++) {
lock_zone(current_z);
if (current_z->async_pending == TRUE) {
current_z->async_pending = FALSE;
pending = TRUE;
}
unlock_zone(current_z);
if (pending == TRUE) {
elt = zalloc_canblock(current_z, TRUE);
zfree(current_z, elt);
pending = FALSE;
}
current_z = current_z->next_zone;
}
}
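/*
 * zget: non-blocking allocation attempt, safe while holding locks or at
 * interrupt context: it only try-locks the zone and never expands it.
 * Returns NULL if the lock is unavailable or the zone is empty.
 */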
void *
zget(
register zone_t zone)
{
vm_offset_t addr;
boolean_t check_poison = FALSE;
#if CONFIG_ZLEAKS
uintptr_t zbt[MAX_ZTRACE_DEPTH];
uint32_t zleak_tracedepth = 0;
#endif
assert( zone != ZONE_NULL );
#if CONFIG_ZLEAKS
if (__improbable(zone->zleak_on && sample_counter(&zone->zleak_capture, zleak_sample_factor) == TRUE)) {
zleak_tracedepth = fastbacktrace(zbt, MAX_ZTRACE_DEPTH);
}
#endif
if (!lock_try_zone(zone))
return NULL;
addr = try_alloc_from_zone(zone, &check_poison);
vm_offset_t inner_size = zone->elem_size;
#if ZONE_DEBUG
if (addr && zone_debug_enabled(zone)) {
enqueue_tail(&zone->active_zones, (queue_entry_t)addr);
addr += ZONE_DEBUG_OFFSET;
inner_size -= ZONE_DEBUG_OFFSET;
}
#endif
#if CONFIG_ZLEAKS
if (zone->zleak_on && zleak_tracedepth > 0 && addr) {
if (!zleak_log(zbt, addr, zleak_tracedepth, zone->elem_size)) {
zone->zleak_capture = zleak_sample_factor;
}
}
#endif
unlock_zone(zone);
if (__improbable(check_poison && addr)) {
vm_offset_t *element_cursor = ((vm_offset_t *) addr) + 1;
vm_offset_t *backup = get_backup_ptr(inner_size, (vm_offset_t *) addr);
for ( ; element_cursor < backup ; element_cursor++)
if (__improbable(*element_cursor != ZP_POISON))
zone_element_was_modified_panic(zone,
addr,
*element_cursor,
ZP_POISON,
((vm_offset_t)element_cursor) - addr);
}
if (addr) {
vm_offset_t *primary = (vm_offset_t *) addr;
vm_offset_t *backup = get_backup_ptr(inner_size, primary);
*primary = ZP_POISON;
*backup = ZP_POISON;
}
return((void *) addr);
}
boolean_t zone_check = FALSE;
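/*
 * zone_check_freelist: debugging aid (enabled via zone_check) that walks
 * every free list in the zone and panics if it finds an insane element or
 * the element currently being freed (i.e. a double free).
 */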
static void zone_check_freelist(zone_t zone, vm_offset_t elem)
{
struct zone_free_element *this;
struct zone_page_metadata *thispage;
if (zone->use_page_list) {
if (zone->allows_foreign) {
for (thispage = (struct zone_page_metadata *)queue_first(&zone->pages.any_free_foreign);
!queue_end(&zone->pages.any_free_foreign, (queue_entry_t)thispage);
thispage = (struct zone_page_metadata *)queue_next((queue_chain_t *)thispage)) {
for (this = thispage->elements;
this != NULL;
this = this->next) {
if (!is_sane_zone_element(zone, (vm_address_t)this) || (vm_address_t)this == elem)
panic("zone_check_freelist");
}
}
}
for (thispage = (struct zone_page_metadata *)queue_first(&zone->pages.all_free);
!queue_end(&zone->pages.all_free, (queue_entry_t)thispage);
thispage = (struct zone_page_metadata *)queue_next((queue_chain_t *)thispage)) {
for (this = thispage->elements;
this != NULL;
this = this->next) {
if (!is_sane_zone_element(zone, (vm_address_t)this) || (vm_address_t)this == elem)
panic("zone_check_freelist");
}
}
for (thispage = (struct zone_page_metadata *)queue_first(&zone->pages.intermediate);
!queue_end(&zone->pages.intermediate, (queue_entry_t)thispage);
thispage = (struct zone_page_metadata *)queue_next((queue_chain_t *)thispage)) {
for (this = thispage->elements;
this != NULL;
this = this->next) {
if (!is_sane_zone_element(zone, (vm_address_t)this) || (vm_address_t)this == elem)
panic("zone_check_freelist");
}
}
} else {
for (this = zone->free_elements;
this != NULL;
this = this->next) {
if (!is_sane_zone_element(zone, (vm_address_t)this) || (vm_address_t)this == elem)
panic("zone_check_freelist");
}
}
}
static zone_t zone_last_bogus_zone = ZONE_NULL;
static vm_offset_t zone_last_bogus_elem = 0;
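/*
 * zfree: return an element to its zone.  Optionally repairs a wrong-zone
 * free for use_page_list zones, logs or unlogs the address for zlog,
 * poisons the element body when sampling says so, and pushes the element
 * back onto the free list.  Foreign pointers freed to non-foreign
 * collectable zones are rejected (and panic under MACH_ASSERT).
 */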
void
zfree(
register zone_t zone,
void *addr)
{
vm_offset_t elem = (vm_offset_t) addr;
uintptr_t zbt[MAX_ZTRACE_DEPTH];
int numsaved = 0;
boolean_t gzfreed = FALSE;
boolean_t poison = FALSE;
assert(zone != ZONE_NULL);
#if 1
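/*
 * Defensive repair: if the caller passed the wrong zone_t for a
 * use_page_list element, recover the true zone from the page metadata,
 * but only if that zone also uses page lists (otherwise page_meta->zone
 * may be garbage).  The zone list is enumerated to validate the match.
 */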
if (zone->use_page_list) {
struct zone_page_metadata *page_meta = get_zone_page_metadata((struct zone_free_element *)addr);
if (zone != page_meta->zone) {
zone_t fixed_zone = NULL;
int fixed_i, max_zones;
simple_lock(&all_zones_lock);
max_zones = num_zones;
fixed_zone = first_zone;
simple_unlock(&all_zones_lock);
for (fixed_i=0; fixed_i < max_zones; fixed_i++, fixed_zone = fixed_zone->next_zone) {
if (fixed_zone == page_meta->zone && fixed_zone->use_page_list) {
printf("Fixing incorrect zfree from zone %s to zone %s\n", zone->zone_name, fixed_zone->zone_name);
zone = fixed_zone;
break;
}
}
}
}
#endif
if (__improbable(DO_LOGGING(zone) && corruption_debug_flag))
numsaved = OSBacktrace((void *)zbt, MAX_ZTRACE_DEPTH);
#if MACH_ASSERT
if (zone == ZONE_NULL || elem == (vm_offset_t)0)
panic("zfree: NULL");
if (zone == zone_zone)
panic("zfree: freeing to zone_zone breaks zone_gc!");
#endif
#if CONFIG_GZALLOC
gzfreed = gzalloc_free(zone, addr);
#endif
TRACE_MACHLEAKS(ZFREE_CODE, ZFREE_CODE_2, zone->elem_size, (uintptr_t)addr);
if (__improbable(!gzfreed && zone->collectable && !zone->allows_foreign &&
!from_zone_map(elem, zone->elem_size))) {
#if MACH_ASSERT
panic("zfree: non-allocated memory in collectable zone!");
#endif
zone_last_bogus_zone = zone;
zone_last_bogus_elem = elem;
return;
}
if ((zp_factor != 0 || zp_tiny_zone_limit != 0) && !gzfreed) {
vm_offset_t inner_size = zone->elem_size;
#if ZONE_DEBUG
if (!gzfreed && zone_debug_enabled(zone)) {
inner_size -= ZONE_DEBUG_OFFSET;
}
#endif
uint32_t sample_factor = zp_factor + (((uint32_t)inner_size) >> zp_scale);
if (inner_size <= zp_tiny_zone_limit)
poison = TRUE;
else if (zp_factor != 0 && sample_counter(&zone->zp_count, sample_factor) == TRUE)
poison = TRUE;
if (__improbable(poison)) {
vm_offset_t *element_cursor = ((vm_offset_t *) elem) + 1;
vm_offset_t *backup = get_backup_ptr(inner_size, (vm_offset_t *)elem);
for ( ; element_cursor < backup; element_cursor++)
*element_cursor = ZP_POISON;
}
}
lock_zone(zone);
if (__improbable(DO_LOGGING(zone))) {
if (corruption_debug_flag) {
btlog_add_entry(zlog_btlog, (void *)addr, ZOP_FREE, (void **)zbt, numsaved);
} else {
btlog_remove_entries_for_element(zlog_btlog, (void *)addr);
}
}
#if ZONE_DEBUG
if (!gzfreed && zone_debug_enabled(zone)) {
queue_t tmp_elem;
elem -= ZONE_DEBUG_OFFSET;
if (zone_check) {
for (tmp_elem = queue_first(&zone->active_zones);
!queue_end(tmp_elem, &zone->active_zones);
tmp_elem = queue_next(tmp_elem))
if (elem == (vm_offset_t)tmp_elem)
break;
if (elem != (vm_offset_t)tmp_elem)
panic("zfree()ing element from wrong zone");
}
remqueue((queue_t) elem);
}
#endif
if (zone_check) {
zone_check_freelist(zone, elem);
}
if (__probable(!gzfreed))
free_to_zone(zone, elem, poison);
#if MACH_ASSERT
if (zone->count < 0)
panic("zfree: zone count underflow in zone %s while freeing element %p, possible cause: double frees or freeing memory that did not come from this zone",
zone->zone_name, addr);
#endif
#if CONFIG_ZLEAKS
if (zone->zleak_on) {
zleak_free(elem, zone->elem_size);
}
#endif
if (zone->elem_size >= PAGE_SIZE &&
vm_pool_low()){
zone_gc_forced = TRUE;
}
unlock_zone(zone);
{
thread_t thr = current_thread();
task_t task;
zinfo_usage_t zinfo;
vm_size_t sz = zone->elem_size;
if (zone->caller_acct)
ledger_debit(thr->t_ledger, task_ledgers.tkm_private, sz);
else
ledger_debit(thr->t_ledger, task_ledgers.tkm_shared, sz);
if ((task = thr->task) != NULL && (zinfo = task->tkm_zinfo) != NULL)
OSAddAtomic64(sz, (int64_t *)&zinfo[zone->index].free);
}
}
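/*
 * zone_change: set one boolean attribute of a zone (Z_NOENCRYPT,
 * Z_EXHAUST, Z_COLLECT, Z_EXPAND, Z_FOREIGN, Z_CALLERACCT, Z_NOCALLOUT,
 * Z_GZALLOC_EXEMPT, Z_ALIGNMENT_REQUIRED).
 */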
void
zone_change(
zone_t zone,
unsigned int item,
boolean_t value)
{
assert( zone != ZONE_NULL );
assert( value == TRUE || value == FALSE );
switch(item){
case Z_NOENCRYPT:
zone->noencrypt = value;
break;
case Z_EXHAUST:
zone->exhaustible = value;
break;
case Z_COLLECT:
zone->collectable = value;
break;
case Z_EXPAND:
zone->expandable = value;
break;
case Z_FOREIGN:
zone->allows_foreign = value;
break;
case Z_CALLERACCT:
zone->caller_acct = value;
break;
case Z_NOCALLOUT:
zone->no_callout = value;
break;
case Z_GZALLOC_EXEMPT:
zone->gzalloc_exempt = value;
#if CONFIG_GZALLOC
gzalloc_reconfigure(zone);
#endif
break;
case Z_ALIGNMENT_REQUIRED:
zone->alignment_required = value;
zone->use_page_list = FALSE;
#if ZONE_DEBUG
zone_debug_disable(zone);
#endif
#if CONFIG_GZALLOC
gzalloc_reconfigure(zone);
#endif
break;
default:
panic("Zone_change: Wrong Item Type!");
}
}
integer_t
zone_free_count(zone_t zone)
{
integer_t free_count;
lock_zone(zone);
free_count = zone->countfree;
unlock_zone(zone);
assert(free_count >= 0);
return(free_count);
}
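/*
 * The zone_page_* routines below maintain per-page alloc_count and
 * collect_count in the two-level zone page table; zone_gc uses them to
 * find pages whose every resident element is free (collectable) and to
 * protect pages that must be kept.
 */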
boolean_t
zone_page_collectable(
vm_offset_t addr,
vm_size_t size)
{
struct zone_page_table_entry *zp;
zone_page_index_t i, j;
#if ZONE_ALIAS_ADDR
addr = zone_virtual_addr(addr);
#endif
#if MACH_ASSERT
if (!from_zone_map(addr, size))
panic("zone_page_collectable");
#endif
i = (zone_page_index_t)atop_kernel(addr-zone_map_min_address);
j = (zone_page_index_t)atop_kernel((addr+size-1) - zone_map_min_address);
for (; i <= j; i++) {
zp = zone_page_table_lookup(i);
if (zp->collect_count == zp->alloc_count)
return (TRUE);
}
return (FALSE);
}
void
zone_page_keep(
vm_offset_t addr,
vm_size_t size)
{
struct zone_page_table_entry *zp;
zone_page_index_t i, j;
#if ZONE_ALIAS_ADDR
addr = zone_virtual_addr(addr);
#endif
#if MACH_ASSERT
if (!from_zone_map(addr, size))
panic("zone_page_keep");
#endif
i = (zone_page_index_t)atop_kernel(addr-zone_map_min_address);
j = (zone_page_index_t)atop_kernel((addr+size-1) - zone_map_min_address);
for (; i <= j; i++) {
zp = zone_page_table_lookup(i);
zp->collect_count = 0;
}
}
void
zone_page_collect(
vm_offset_t addr,
vm_size_t size)
{
struct zone_page_table_entry *zp;
zone_page_index_t i, j;
#if ZONE_ALIAS_ADDR
addr = zone_virtual_addr(addr);
#endif
#if MACH_ASSERT
if (!from_zone_map(addr, size))
panic("zone_page_collect");
#endif
i = (zone_page_index_t)atop_kernel(addr-zone_map_min_address);
j = (zone_page_index_t)atop_kernel((addr+size-1) - zone_map_min_address);
for (; i <= j; i++) {
zp = zone_page_table_lookup(i);
++zp->collect_count;
}
}
void
zone_page_init(
vm_offset_t addr,
vm_size_t size)
{
struct zone_page_table_entry *zp;
zone_page_index_t i, j;
#if ZONE_ALIAS_ADDR
addr = zone_virtual_addr(addr);
#endif
#if MACH_ASSERT
if (!from_zone_map(addr, size))
panic("zone_page_init");
#endif
i = (zone_page_index_t)atop_kernel(addr-zone_map_min_address);
j = (zone_page_index_t)atop_kernel((addr+size-1) - zone_map_min_address);
for (; i <= j; i++) {
zone_page_table_expand(i);
zp = zone_page_table_lookup(i);
assert(zp);
zp->alloc_count = ZONE_PAGE_UNUSED;
zp->collect_count = 0;
}
}
void
zone_page_alloc(
vm_offset_t addr,
vm_size_t size)
{
struct zone_page_table_entry *zp;
zone_page_index_t i, j;
#if ZONE_ALIAS_ADDR
addr = zone_virtual_addr(addr);
#endif
#if MACH_ASSERT
if (!from_zone_map(addr, size))
panic("zone_page_alloc");
#endif
i = (zone_page_index_t)atop_kernel(addr-zone_map_min_address);
j = (zone_page_index_t)atop_kernel((addr+size-1) - zone_map_min_address);
for (; i <= j; i++) {
zp = zone_page_table_lookup(i);
assert(zp);
if (zp->alloc_count == ZONE_PAGE_UNUSED)
zp->alloc_count = ZONE_PAGE_USED;
++zp->alloc_count;
}
}
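/*
 * zone_page_free_element: retire one element's worth of accounting; when
 * a page's alloc_count drops to zero, it is chained onto a free-page list
 * threaded through the now-empty pages themselves, recorded as page
 * indices rather than pointers.
 */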
void
zone_page_free_element(
zone_page_index_t *free_page_head,
zone_page_index_t *free_page_tail,
vm_offset_t addr,
vm_size_t size)
{
struct zone_page_table_entry *zp;
zone_page_index_t i, j;
#if ZONE_ALIAS_ADDR
addr = zone_virtual_addr(addr);
#endif
#if MACH_ASSERT
if (!from_zone_map(addr, size))
panic("zone_page_free_element");
#endif
vm_offset_t *primary = (vm_offset_t *) addr;
vm_offset_t *backup = get_backup_ptr(size, primary);
*primary = ZP_POISON;
*backup = ZP_POISON;
i = (zone_page_index_t)atop_kernel(addr-zone_map_min_address);
j = (zone_page_index_t)atop_kernel((addr+size-1) - zone_map_min_address);
for (; i <= j; i++) {
zp = zone_page_table_lookup(i);
if (zp->collect_count > 0)
--zp->collect_count;
if (--zp->alloc_count == 0) {
vm_address_t free_page_address;
vm_address_t prev_free_page_address;
zp->alloc_count = ZONE_PAGE_UNUSED;
zp->collect_count = 0;
free_page_address = zone_map_min_address + PAGE_SIZE * ((vm_size_t)i);
*(zone_page_index_t *)free_page_address = ZONE_PAGE_INDEX_INVALID;
if (*free_page_head == ZONE_PAGE_INDEX_INVALID) {
*free_page_head = i;
*free_page_tail = i;
} else {
prev_free_page_address = zone_map_min_address + PAGE_SIZE * ((vm_size_t)(*free_page_tail));
*(zone_page_index_t *)prev_free_page_address = i;
*free_page_tail = i;
}
}
}
}
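/*
 * Zones whose elements are smaller than ZONEGC_SMALL_ELEMENT_SIZE are
 * only collected on a full (all_zones) pass. zgc_stats accumulates
 * collection statistics across all zone_gc invocations.
 */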
#define ZONEGC_SMALL_ELEMENT_SIZE 4096
struct {
uint64_t zgc_invoked;
uint64_t zgc_bailed;
uint32_t pgs_freed;
uint32_t elems_collected,
elems_freed,
elems_kept;
} zgc_stats;
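/*
 * zone_gc: walk every collectable zone, detach its free list (or, for
 * use_page_list zones, its queue of all-free pages), identify pages on
 * which every element is free, and return those pages to the VM with
 * kmem_free. Runs of virtually contiguous free pages are coalesced
 * into a single kmem_free call, and the thread yields every 32 frees
 * so a long collection does not hold off preemption.
 */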
void
zone_gc(boolean_t all_zones)
{
unsigned int max_zones;
zone_t z;
unsigned int i;
uint32_t old_pgs_freed;
zone_page_index_t zone_free_page_head;
zone_page_index_t zone_free_page_tail;
thread_t mythread = current_thread();
lck_mtx_lock(&zone_gc_lock);
zgc_stats.zgc_invoked++;
old_pgs_freed = zgc_stats.pgs_freed;
simple_lock(&all_zones_lock);
max_zones = num_zones;
z = first_zone;
simple_unlock(&all_zones_lock);
if (zalloc_debug & ZALLOC_DEBUG_ZONEGC)
kprintf("zone_gc(all_zones=%s) starting...\n", all_zones ? "TRUE" : "FALSE");
thread_set_eager_preempt(mythread);
#if MACH_ASSERT
for (i = 0; i < zone_pages; i++) {
struct zone_page_table_entry *zp;
zp = zone_page_table_lookup(i);
assert(!zp || (zp->collect_count == 0));
}
#endif
for (i = 0; i < max_zones; i++, z = z->next_zone) {
unsigned int n, m;
vm_size_t elt_size, size_freed;
struct zone_free_element *elt, *base_elt, *base_prev, *prev, *scan, *keep, *tail;
int kmem_frees = 0, total_freed_pages = 0;
struct zone_page_metadata *page_meta;
queue_head_t page_meta_head;
assert(z != ZONE_NULL);
if (!z->collectable)
continue;
if (all_zones == FALSE && z->elem_size < ZONEGC_SMALL_ELEMENT_SIZE && !z->use_page_list)
continue;
lock_zone(z);
elt_size = z->elem_size;
if ((elt_size & PAGE_MASK) &&
!z->use_page_list &&
(((z->cur_size - z->count * elt_size) <= (2 * z->alloc_size)) ||
((z->cur_size - z->count * elt_size) <= (z->cur_size / 10)))) {
unlock_zone(z);
continue;
}
z->doing_gc = TRUE;
if (z->use_page_list) {
queue_new_head(&z->pages.all_free, &page_meta_head, struct zone_page_metadata *, pages);
queue_init(&z->pages.all_free);
} else {
scan = (void *)z->free_elements;
z->free_elements = 0;
}
unlock_zone(z);
if (z->use_page_list) {
size_freed = 0;
queue_iterate(&page_meta_head, page_meta, struct zone_page_metadata *, pages) {
assert(from_zone_map((vm_address_t)page_meta, sizeof(*page_meta)));
zgc_stats.elems_freed += page_meta->free_count;
size_freed += elt_size * page_meta->free_count;
zgc_stats.elems_collected += page_meta->free_count;
}
lock_zone(z);
if (size_freed > 0) {
z->cur_size -= size_freed;
z->countfree -= size_freed/elt_size;
}
z->doing_gc = FALSE;
if (z->waiting) {
z->waiting = FALSE;
zone_wakeup(z);
}
unlock_zone(z);
if (queue_empty(&page_meta_head))
continue;
thread_clear_eager_preempt(mythread);
while ((page_meta = (struct zone_page_metadata *)dequeue_head(&page_meta_head)) != NULL) {
vm_address_t free_page_address;
free_page_address = trunc_page((vm_address_t)page_meta);
#if ZONE_ALIAS_ADDR
free_page_address = zone_virtual_addr(free_page_address);
#endif
kmem_free(zone_map, free_page_address, PAGE_SIZE);
ZONE_PAGE_COUNT_DECR(z, 1);
total_freed_pages++;
zgc_stats.pgs_freed += 1;
if (++kmem_frees == 32) {
thread_yield_internal(1);
kmem_frees = 0;
}
}
if (zalloc_debug & ZALLOC_DEBUG_ZONEGC)
kprintf("zone_gc() of zone %s freed %lu elements, %d pages\n", z->zone_name, (unsigned long)(size_freed/elt_size), total_freed_pages);
thread_set_eager_preempt(mythread);
continue;
}
prev = (void *)&scan;
elt = scan;
n = 0; tail = keep = NULL;
zone_free_page_head = ZONE_PAGE_INDEX_INVALID;
zone_free_page_tail = ZONE_PAGE_INDEX_INVALID;
while (elt != NULL) {
if (from_zone_map(elt, elt_size)) {
zone_page_collect((vm_offset_t)elt, elt_size);
prev = elt;
elt = elt->next;
++zgc_stats.elems_collected;
}
else {
if (keep == NULL)
keep = tail = elt;
else {
append_zone_element(z, tail, elt);
tail = elt;
}
append_zone_element(z, prev, elt->next);
elt = elt->next;
append_zone_element(z, tail, NULL);
}
if (++n >= 50) {
if (z->waiting == TRUE) {
lock_zone(z);
if (keep != NULL) {
add_list_to_zone(z, keep, tail);
tail = keep = NULL;
} else {
m = 0;
base_elt = elt;
base_prev = prev;
while ((elt != NULL) && (++m < 50)) {
prev = elt;
elt = elt->next;
}
if (m != 0) {
append_zone_element(z, prev, NULL);
add_list_to_zone(z, base_elt, prev);
append_zone_element(z, base_prev, elt);
prev = base_prev;
}
}
if (z->waiting) {
z->waiting = FALSE;
zone_wakeup(z);
}
unlock_zone(z);
}
n = 0;
}
}
if (keep != NULL) {
lock_zone(z);
add_list_to_zone(z, keep, tail);
if (z->waiting) {
z->waiting = FALSE;
zone_wakeup(z);
}
unlock_zone(z);
}
size_freed = 0;
elt = scan;
n = 0; tail = keep = NULL;
while (elt != NULL) {
if (zone_page_collectable((vm_offset_t)elt, elt_size)) {
struct zone_free_element *next_elt = elt->next;
size_freed += elt_size;
zone_page_free_element(&zone_free_page_head, &zone_free_page_tail, (vm_offset_t)elt, elt_size);
elt = next_elt;
++zgc_stats.elems_freed;
}
else {
zone_page_keep((vm_offset_t)elt, elt_size);
if (keep == NULL)
keep = tail = elt;
else {
append_zone_element(z, tail, elt);
tail = elt;
}
elt = elt->next;
append_zone_element(z, tail, NULL);
++zgc_stats.elems_kept;
}
if (++n >= 50) {
lock_zone(z);
z->cur_size -= size_freed;
z->countfree -= size_freed/elt_size;
size_freed = 0;
if (keep != NULL) {
add_list_to_zone(z, keep, tail);
}
if (z->waiting) {
z->waiting = FALSE;
zone_wakeup(z);
}
unlock_zone(z);
n = 0; tail = keep = NULL;
}
}
lock_zone(z);
if (size_freed > 0 || keep != NULL) {
z->cur_size -= size_freed;
z->countfree -= size_freed/elt_size;
if (keep != NULL) {
add_list_to_zone(z, keep, tail);
}
}
z->doing_gc = FALSE;
if (z->waiting) {
z->waiting = FALSE;
zone_wakeup(z);
}
unlock_zone(z);
if (zone_free_page_head == ZONE_PAGE_INDEX_INVALID)
continue;
thread_clear_eager_preempt(mythread);
uint32_t pages_to_free_count = 0;
vm_address_t fpa;
zone_page_index_t index;
for (index = zone_free_page_head; index != ZONE_PAGE_INDEX_INVALID;) {
pages_to_free_count++;
fpa = zone_map_min_address + PAGE_SIZE * ((vm_size_t)index);
index = *(zone_page_index_t *)fpa;
}
while (zone_free_page_head != ZONE_PAGE_INDEX_INVALID) {
zone_page_index_t zind = zone_free_page_head;
vm_address_t free_page_address;
int page_count;
free_page_address = zone_map_min_address + PAGE_SIZE * ((vm_size_t)zind);
zone_free_page_head = *(zone_page_index_t *)free_page_address;
page_count = 1;
total_freed_pages++;
while (zone_free_page_head != ZONE_PAGE_INDEX_INVALID) {
zone_page_index_t next_zind = zone_free_page_head;
vm_address_t next_free_page_address;
next_free_page_address = zone_map_min_address + PAGE_SIZE * ((vm_size_t)next_zind);
if (next_free_page_address == (free_page_address - PAGE_SIZE)) {
free_page_address = next_free_page_address;
} else if (next_free_page_address != (free_page_address + (PAGE_SIZE * page_count)))
break;
zone_free_page_head = *(zone_page_index_t *)next_free_page_address;
page_count++;
total_freed_pages++;
}
kmem_free(zone_map, free_page_address, page_count * PAGE_SIZE);
ZONE_PAGE_COUNT_DECR(z, page_count);
zgc_stats.pgs_freed += page_count;
pages_to_free_count -= page_count;
if (++kmem_frees == 32) {
thread_yield_internal(1);
kmem_frees = 0;
}
}
assert(pages_to_free_count == 0);
if (zalloc_debug & ZALLOC_DEBUG_ZONEGC)
kprintf("zone_gc() of zone %s freed %lu elements, %d pages\n", z->zone_name, (unsigned long)(size_freed/elt_size), total_freed_pages);
thread_set_eager_preempt(mythread);
}
if (old_pgs_freed == zgc_stats.pgs_freed)
zgc_stats.zgc_bailed++;
thread_clear_eager_preempt(mythread);
lck_mtx_unlock(&zone_gc_lock);
}
extern vm_offset_t kmapoff_kaddr;
extern unsigned int kmapoff_pgcnt;
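/*
 * consider_zone_gc: run the collector if collection is allowed and
 * either forced or permitted by the time throttle; a throttle-driven
 * pass collects all zones. The one-time kmapoff padding pages are
 * also released here if they are still mapped.
 */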
void
consider_zone_gc(boolean_t force)
{
boolean_t all_zones = FALSE;
if (kmapoff_kaddr != 0) {
(void) vm_deallocate(kernel_map,
kmapoff_kaddr, kmapoff_pgcnt * PAGE_SIZE_64);
kmapoff_kaddr = 0;
}
if (zone_gc_allowed &&
(zone_gc_allowed_by_time_throttle ||
zone_gc_forced ||
force)) {
if (zone_gc_allowed_by_time_throttle == TRUE) {
zone_gc_allowed_by_time_throttle = FALSE;
all_zones = TRUE;
}
zone_gc_forced = FALSE;
zone_gc(all_zones);
}
}
void
compute_zone_gc_throttle(void *arg __unused)
{
zone_gc_allowed_by_time_throttle = TRUE;
}
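/*
 * task_zone_info: report per-zone statistics plus the per-task
 * allocation counters kept in task->tkm_zinfo. The name and info
 * arrays are built in pageable ipc_kernel_map memory and handed to
 * the caller as vm_map_copy_t objects.
 */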
#if CONFIG_TASK_ZONE_INFO
kern_return_t
task_zone_info(
task_t task,
mach_zone_name_array_t *namesp,
mach_msg_type_number_t *namesCntp,
task_zone_info_array_t *infop,
mach_msg_type_number_t *infoCntp)
{
mach_zone_name_t *names;
vm_offset_t names_addr;
vm_size_t names_size;
task_zone_info_t *info;
vm_offset_t info_addr;
vm_size_t info_size;
unsigned int max_zones, i;
zone_t z;
mach_zone_name_t *zn;
task_zone_info_t *zi;
kern_return_t kr;
vm_size_t used;
vm_map_copy_t copy;
if (task == TASK_NULL)
return KERN_INVALID_TASK;
simple_lock(&all_zones_lock);
max_zones = (unsigned int)(num_zones + num_fake_zones);
z = first_zone;
simple_unlock(&all_zones_lock);
names_size = round_page(max_zones * sizeof *names);
kr = kmem_alloc_pageable(ipc_kernel_map,
&names_addr, names_size, VM_KERN_MEMORY_IPC);
if (kr != KERN_SUCCESS)
return kr;
names = (mach_zone_name_t *) names_addr;
info_size = round_page(max_zones * sizeof *info);
kr = kmem_alloc_pageable(ipc_kernel_map,
&info_addr, info_size, VM_KERN_MEMORY_IPC);
if (kr != KERN_SUCCESS) {
kmem_free(ipc_kernel_map,
names_addr, names_size);
return kr;
}
info = (task_zone_info_t *) info_addr;
zn = &names[0];
zi = &info[0];
for (i = 0; i < max_zones - num_fake_zones; i++) {
struct zone zcopy;
assert(z != ZONE_NULL);
lock_zone(z);
zcopy = *z;
unlock_zone(z);
simple_lock(&all_zones_lock);
z = z->next_zone;
simple_unlock(&all_zones_lock);
(void) strncpy(zn->mzn_name, zcopy.zone_name,
sizeof zn->mzn_name);
zn->mzn_name[sizeof zn->mzn_name - 1] = '\0';
zi->tzi_count = (uint64_t)zcopy.count;
zi->tzi_cur_size = ptoa_64(zcopy.page_count);
zi->tzi_max_size = (uint64_t)zcopy.max_size;
zi->tzi_elem_size = (uint64_t)zcopy.elem_size;
zi->tzi_alloc_size = (uint64_t)zcopy.alloc_size;
zi->tzi_sum_size = zcopy.sum_count * zcopy.elem_size;
zi->tzi_exhaustible = (uint64_t)zcopy.exhaustible;
zi->tzi_collectable = (uint64_t)zcopy.collectable;
zi->tzi_caller_acct = (uint64_t)zcopy.caller_acct;
if (task->tkm_zinfo != NULL) {
zi->tzi_task_alloc = task->tkm_zinfo[zcopy.index].alloc;
zi->tzi_task_free = task->tkm_zinfo[zcopy.index].free;
} else {
zi->tzi_task_alloc = 0;
zi->tzi_task_free = 0;
}
zn++;
zi++;
}
for (i = 0; i < num_fake_zones; i++) {
int count, collectable, exhaustible, caller_acct, index;
vm_size_t cur_size, max_size, elem_size, alloc_size;
uint64_t sum_size;
strncpy(zn->mzn_name, fake_zones[i].name, sizeof zn->mzn_name);
zn->mzn_name[sizeof zn->mzn_name - 1] = '\0';
fake_zones[i].query(&count, &cur_size,
&max_size, &elem_size,
&alloc_size, &sum_size,
&collectable, &exhaustible, &caller_acct);
zi->tzi_count = (uint64_t)count;
zi->tzi_cur_size = (uint64_t)cur_size;
zi->tzi_max_size = (uint64_t)max_size;
zi->tzi_elem_size = (uint64_t)elem_size;
zi->tzi_alloc_size = (uint64_t)alloc_size;
zi->tzi_sum_size = sum_size;
zi->tzi_collectable = (uint64_t)collectable;
zi->tzi_exhaustible = (uint64_t)exhaustible;
zi->tzi_caller_acct = (uint64_t)caller_acct;
if (task->tkm_zinfo != NULL) {
index = ZINFO_SLOTS - num_fake_zones + i;
zi->tzi_task_alloc = task->tkm_zinfo[index].alloc;
zi->tzi_task_free = task->tkm_zinfo[index].free;
} else {
zi->tzi_task_alloc = 0;
zi->tzi_task_free = 0;
}
zn++;
zi++;
}
used = max_zones * sizeof *names;
if (used != names_size)
bzero((char *) (names_addr + used), names_size - used);
kr = vm_map_copyin(ipc_kernel_map, (vm_map_address_t)names_addr,
(vm_map_size_t)used, TRUE, &copy);
assert(kr == KERN_SUCCESS);
*namesp = (mach_zone_name_t *) copy;
*namesCntp = max_zones;
used = max_zones * sizeof *info;
if (used != info_size)
bzero((char *) (info_addr + used), info_size - used);
kr = vm_map_copyin(ipc_kernel_map, (vm_map_address_t)info_addr,
(vm_map_size_t)used, TRUE, &copy);
assert(kr == KERN_SUCCESS);
*infop = (task_zone_info_t *) copy;
*infoCntp = max_zones;
return KERN_SUCCESS;
}
#else
kern_return_t
task_zone_info(
__unused task_t task,
__unused mach_zone_name_array_t *namesp,
__unused mach_msg_type_number_t *namesCntp,
__unused task_zone_info_array_t *infop,
__unused mach_msg_type_number_t *infoCntp)
{
return KERN_FAILURE;
}
#endif
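/*
 * mach_zone_info: thin wrapper that forwards to mach_memory_info with
 * the memory-info out-parameters suppressed.
 */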
kern_return_t
mach_zone_info(
host_priv_t host,
mach_zone_name_array_t *namesp,
mach_msg_type_number_t *namesCntp,
mach_zone_info_array_t *infop,
mach_msg_type_number_t *infoCntp)
{
return (mach_memory_info(host, namesp, namesCntp, infop, infoCntp, NULL, NULL));
}
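/*
 * mach_memory_info: report per-zone name and info arrays and, when the
 * caller supplies the extra out-parameters, a vm_page_diagnose summary
 * of kernel memory by allocation-site tag. The diagnose buffer is
 * wired while it is filled, presumably so vm_page_diagnose never
 * faults on it, and unwired again before being copied out.
 */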
kern_return_t
mach_memory_info(
host_priv_t host,
mach_zone_name_array_t *namesp,
mach_msg_type_number_t *namesCntp,
mach_zone_info_array_t *infop,
mach_msg_type_number_t *infoCntp,
mach_memory_info_array_t *memoryInfop,
mach_msg_type_number_t *memoryInfoCntp)
{
mach_zone_name_t *names;
vm_offset_t names_addr;
vm_size_t names_size;
mach_zone_info_t *info;
vm_offset_t info_addr;
vm_size_t info_size;
mach_memory_info_t *memory_info;
vm_offset_t memory_info_addr;
vm_size_t memory_info_size;
vm_size_t memory_info_vmsize;
unsigned int num_sites;
unsigned int max_zones, i;
zone_t z;
mach_zone_name_t *zn;
mach_zone_info_t *zi;
kern_return_t kr;
vm_size_t used;
vm_map_copy_t copy;
if (host == HOST_NULL)
return KERN_INVALID_HOST;
#if CONFIG_DEBUGGER_FOR_ZONE_INFO
if (!PE_i_can_has_debugger(NULL))
return KERN_INVALID_HOST;
#endif
simple_lock(&all_zones_lock);
max_zones = (unsigned int)(num_zones + num_fake_zones);
z = first_zone;
simple_unlock(&all_zones_lock);
names_size = round_page(max_zones * sizeof *names);
kr = kmem_alloc_pageable(ipc_kernel_map,
&names_addr, names_size, VM_KERN_MEMORY_IPC);
if (kr != KERN_SUCCESS)
return kr;
names = (mach_zone_name_t *) names_addr;
info_size = round_page(max_zones * sizeof *info);
kr = kmem_alloc_pageable(ipc_kernel_map,
&info_addr, info_size, VM_KERN_MEMORY_IPC);
if (kr != KERN_SUCCESS) {
kmem_free(ipc_kernel_map,
names_addr, names_size);
return kr;
}
info = (mach_zone_info_t *) info_addr;
num_sites = 0;
memory_info_addr = 0;
if (memoryInfop && memoryInfoCntp)
{
num_sites = VM_KERN_MEMORY_COUNT + VM_KERN_COUNTER_COUNT;
memory_info_size = num_sites * sizeof(*memory_info);
memory_info_vmsize = round_page(memory_info_size);
kr = kmem_alloc_pageable(ipc_kernel_map,
&memory_info_addr, memory_info_vmsize, VM_KERN_MEMORY_IPC);
if (kr != KERN_SUCCESS) {
kmem_free(ipc_kernel_map,
names_addr, names_size);
kmem_free(ipc_kernel_map,
info_addr, info_size);
return kr;
}
kr = vm_map_wire(ipc_kernel_map, memory_info_addr, memory_info_addr + memory_info_vmsize,
VM_PROT_READ|VM_PROT_WRITE|VM_PROT_MEMORY_TAG_MAKE(VM_KERN_MEMORY_IPC), FALSE);
assert(kr == KERN_SUCCESS);
memory_info = (mach_memory_info_t *) memory_info_addr;
vm_page_diagnose(memory_info, num_sites);
kr = vm_map_unwire(ipc_kernel_map, memory_info_addr, memory_info_addr + memory_info_vmsize, FALSE);
assert(kr == KERN_SUCCESS);
}
zn = &names[0];
zi = &info[0];
for (i = 0; i < max_zones - num_fake_zones; i++) {
struct zone zcopy;
assert(z != ZONE_NULL);
lock_zone(z);
zcopy = *z;
unlock_zone(z);
simple_lock(&all_zones_lock);
z = z->next_zone;
simple_unlock(&all_zones_lock);
(void) strncpy(zn->mzn_name, zcopy.zone_name,
sizeof zn->mzn_name);
zn->mzn_name[sizeof zn->mzn_name - 1] = '\0';
zi->mzi_count = (uint64_t)zcopy.count;
zi->mzi_cur_size = ptoa_64(zcopy.page_count);
zi->mzi_max_size = (uint64_t)zcopy.max_size;
zi->mzi_elem_size = (uint64_t)zcopy.elem_size;
zi->mzi_alloc_size = (uint64_t)zcopy.alloc_size;
zi->mzi_sum_size = zcopy.sum_count * zcopy.elem_size;
zi->mzi_exhaustible = (uint64_t)zcopy.exhaustible;
zi->mzi_collectable = (uint64_t)zcopy.collectable;
zn++;
zi++;
}
for (i = 0; i < num_fake_zones; i++) {
int count, collectable, exhaustible, caller_acct;
vm_size_t cur_size, max_size, elem_size, alloc_size;
uint64_t sum_size;
strncpy(zn->mzn_name, fake_zones[i].name, sizeof zn->mzn_name);
zn->mzn_name[sizeof zn->mzn_name - 1] = '\0';
fake_zones[i].query(&count, &cur_size,
&max_size, &elem_size,
&alloc_size, &sum_size,
&collectable, &exhaustible, &caller_acct);
zi->mzi_count = (uint64_t)count;
zi->mzi_cur_size = (uint64_t)cur_size;
zi->mzi_max_size = (uint64_t)max_size;
zi->mzi_elem_size = (uint64_t)elem_size;
zi->mzi_alloc_size = (uint64_t)alloc_size;
zi->mzi_sum_size = sum_size;
zi->mzi_collectable = (uint64_t)collectable;
zi->mzi_exhaustible = (uint64_t)exhaustible;
zn++;
zi++;
}
used = max_zones * sizeof *names;
if (used != names_size)
bzero((char *) (names_addr + used), names_size - used);
kr = vm_map_copyin(ipc_kernel_map, (vm_map_address_t)names_addr,
(vm_map_size_t)used, TRUE, &copy);
assert(kr == KERN_SUCCESS);
*namesp = (mach_zone_name_t *) copy;
*namesCntp = max_zones;
used = max_zones * sizeof *info;
if (used != info_size)
bzero((char *) (info_addr + used), info_size - used);
kr = vm_map_copyin(ipc_kernel_map, (vm_map_address_t)info_addr,
(vm_map_size_t)used, TRUE, &copy);
assert(kr == KERN_SUCCESS);
*infop = (mach_zone_info_t *) copy;
*infoCntp = max_zones;
if (memoryInfop && memoryInfoCntp)
{
kr = vm_map_copyin(ipc_kernel_map, (vm_map_address_t)memory_info_addr,
(vm_map_size_t)memory_info_size, TRUE, &copy);
assert(kr == KERN_SUCCESS);
*memoryInfop = (mach_memory_info_t *) copy;
*memoryInfoCntp = num_sites;
}
return KERN_SUCCESS;
}
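/*
 * host_zone_info: legacy interface. zone_info_t carries natural-width
 * fields, so the caller's word size must match the kernel's; hence
 * the thread_is_64bit check below.
 */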
kern_return_t
host_zone_info(
host_priv_t host,
zone_name_array_t *namesp,
mach_msg_type_number_t *namesCntp,
zone_info_array_t *infop,
mach_msg_type_number_t *infoCntp)
{
zone_name_t *names;
vm_offset_t names_addr;
vm_size_t names_size;
zone_info_t *info;
vm_offset_t info_addr;
vm_size_t info_size;
unsigned int max_zones, i;
zone_t z;
zone_name_t *zn;
zone_info_t *zi;
kern_return_t kr;
vm_size_t used;
vm_map_copy_t copy;
if (host == HOST_NULL)
return KERN_INVALID_HOST;
#if CONFIG_DEBUGGER_FOR_ZONE_INFO
if (!PE_i_can_has_debugger(NULL))
return KERN_INVALID_HOST;
#endif
#if defined(__LP64__)
if (!thread_is_64bit(current_thread()))
return KERN_NOT_SUPPORTED;
#else
if (thread_is_64bit(current_thread()))
return KERN_NOT_SUPPORTED;
#endif
simple_lock(&all_zones_lock);
max_zones = (unsigned int)(num_zones + num_fake_zones);
z = first_zone;
simple_unlock(&all_zones_lock);
names_size = round_page(max_zones * sizeof *names);
kr = kmem_alloc_pageable(ipc_kernel_map,
&names_addr, names_size, VM_KERN_MEMORY_IPC);
if (kr != KERN_SUCCESS)
return kr;
names = (zone_name_t *) names_addr;
info_size = round_page(max_zones * sizeof *info);
kr = kmem_alloc_pageable(ipc_kernel_map,
&info_addr, info_size, VM_KERN_MEMORY_IPC);
if (kr != KERN_SUCCESS) {
kmem_free(ipc_kernel_map,
names_addr, names_size);
return kr;
}
info = (zone_info_t *) info_addr;
zn = &names[0];
zi = &info[0];
for (i = 0; i < max_zones - num_fake_zones; i++) {
struct zone zcopy;
assert(z != ZONE_NULL);
lock_zone(z);
zcopy = *z;
unlock_zone(z);
simple_lock(&all_zones_lock);
z = z->next_zone;
simple_unlock(&all_zones_lock);
(void) strncpy(zn->zn_name, zcopy.zone_name,
sizeof zn->zn_name);
zn->zn_name[sizeof zn->zn_name - 1] = '\0';
zi->zi_count = zcopy.count;
zi->zi_cur_size = ptoa(zcopy.page_count);
zi->zi_max_size = zcopy.max_size;
zi->zi_elem_size = zcopy.elem_size;
zi->zi_alloc_size = zcopy.alloc_size;
zi->zi_exhaustible = zcopy.exhaustible;
zi->zi_collectable = zcopy.collectable;
zn++;
zi++;
}
for (i = 0; i < num_fake_zones; i++) {
int caller_acct;
uint64_t sum_space;
strncpy(zn->zn_name, fake_zones[i].name, sizeof zn->zn_name);
zn->zn_name[sizeof zn->zn_name - 1] = '\0';
fake_zones[i].query(&zi->zi_count, &zi->zi_cur_size,
&zi->zi_max_size, &zi->zi_elem_size,
&zi->zi_alloc_size, &sum_space,
&zi->zi_collectable, &zi->zi_exhaustible, &caller_acct);
zn++;
zi++;
}
used = max_zones * sizeof *names;
if (used != names_size)
bzero((char *) (names_addr + used), names_size - used);
kr = vm_map_copyin(ipc_kernel_map, (vm_map_address_t)names_addr,
(vm_map_size_t)used, TRUE, &copy);
assert(kr == KERN_SUCCESS);
*namesp = (zone_name_t *) copy;
*namesCntp = max_zones;
used = max_zones * sizeof *info;
if (used != info_size)
bzero((char *) (info_addr + used), info_size - used);
kr = vm_map_copyin(ipc_kernel_map, (vm_map_address_t)info_addr,
(vm_map_size_t)used, TRUE, &copy);
assert(kr == KERN_SUCCESS);
*infop = (zone_info_t *) copy;
*infoCntp = max_zones;
return KERN_SUCCESS;
}
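/*
 * mach_zone_force_gc: allow a user-space client holding a host port to
 * trigger an immediate, full zone collection. A minimal caller sketch,
 * assuming the standard mach_host MIG interface (not part of this
 * file):
 *
 *	#include <mach/mach.h>
 *	#include <mach/mach_error.h>
 *
 *	kern_return_t kr = mach_zone_force_gc(mach_host_self());
 *	if (kr != KERN_SUCCESS)
 *		printf("mach_zone_force_gc: %s\n", mach_error_string(kr));
 */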
kern_return_t
mach_zone_force_gc(
host_t host)
{
if (host == HOST_NULL)
return KERN_INVALID_HOST;
consider_zone_gc(TRUE);
return (KERN_SUCCESS);
}
extern unsigned int stack_total;
extern unsigned long long stack_allocs;
#if defined(__i386__) || defined(__x86_64__)
extern unsigned int inuse_ptepages_count;
extern long long alloc_ptepages_count;
#endif
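/*
 * zone_display_zprint: print every zone whose current size exceeds
 * 1MB, followed by the kernel stack, page-table and kalloc-large
 * totals; handy when triaging memory usage from the debugger.
 */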
void zone_display_zprint(void)
{
unsigned int i;
zone_t the_zone;
if (first_zone != NULL) {
the_zone = first_zone;
for (i = 0; i < num_zones; i++) {
if (the_zone->cur_size > (1024 * 1024)) {
printf("%.20s:\t%lu\n", the_zone->zone_name, (uintptr_t)the_zone->cur_size);
}
if (the_zone->next_zone == NULL) {
break;
}
the_zone = the_zone->next_zone;
}
}
}
printf("Kernel Stacks:\t%lu\n", (uintptr_t)(kernel_stack_size * stack_total));
#if defined(__i386__) || defined(__x86_64__)
printf("PageTables:\t%lu\n", (uintptr_t)(PAGE_SIZE * inuse_ptepages_count));
#endif
printf("Kalloc.Large:\t%lu\n", (uintptr_t)kalloc_large_total);
}
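/*
 * zone_find_largest: return the zone with the greatest cur_size. Only
 * the list head and count are sampled under the all_zones lock, so
 * the answer is advisory.
 */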
zone_t
zone_find_largest(void)
{
unsigned int i;
unsigned int max_zones;
zone_t the_zone;
zone_t zone_largest;
simple_lock(&all_zones_lock);
the_zone = first_zone;
max_zones = num_zones;
simple_unlock(&all_zones_lock);
zone_largest = the_zone;
for (i = 0; i < max_zones; i++) {
if (the_zone->cur_size > zone_largest->cur_size) {
zone_largest = the_zone;
}
if (the_zone->next_zone == NULL) {
break;
}
the_zone = the_zone->next_zone;
}
return zone_largest;
}
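/*
 * With ZONE_DEBUG, every element is grown by ZONE_DEBUG_OFFSET bytes
 * to hold an active-element queue linkage. Enabling or disabling
 * debug mode is only legal while the zone is empty, i.e. while
 * zone_in_use(z) is FALSE.
 */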
#if ZONE_DEBUG
#define zone_in_use(z) ( z->count || z->free_elements \
|| !queue_empty(&z->pages.all_free) \
|| !queue_empty(&z->pages.intermediate) \
|| (z->allows_foreign && !queue_empty(&z->pages.any_free_foreign)))
void
zone_debug_enable(
zone_t z)
{
if (zone_debug_enabled(z) || zone_in_use(z) ||
z->alloc_size < (z->elem_size + ZONE_DEBUG_OFFSET))
return;
queue_init(&z->active_zones);
z->elem_size += ZONE_DEBUG_OFFSET;
}
void
zone_debug_disable(
zone_t z)
{
if (!zone_debug_enabled(z) || zone_in_use(z))
return;
z->elem_size -= ZONE_DEBUG_OFFSET;
z->active_zones.next = z->active_zones.prev = NULL;
}
#endif