/*
 * Copyright (c) 1999, 2006, 2008 Apple Inc. All rights reserved.
 *
 * @APPLE_LICENSE_HEADER_START@
 *
 * This file contains Original Code and/or Modifications of Original Code
 * as defined in and that are subject to the Apple Public Source License
 * Version 2.0 (the 'License'). You may not use this file except in
 * compliance with the License. Please obtain a copy of the License at
 * http://www.opensource.apple.com/apsl/ and read it before using this
 * file.
 *
 * The Original Code and all software distributed under the License are
 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
 * Please see the License for the specific language governing rights and
 * limitations under the License.
 *
 * @APPLE_LICENSE_HEADER_END@
 */

/* Author: Bertrand Serlet, August 1999 */

/*
 * Multithread enhancements for "tiny" allocations introduced February 2008.
 * These are in the spirit of "Hoard". See:
 * Emery D. Berger, Kathryn S. McKinley, Robert D. Blumofe, and Paul R. Wilson. 2000.
 * Hoard: a scalable memory allocator for multithreaded applications.
 * In Proceedings of the ninth international conference on Architectural support for
 * programming languages and operating systems (ASPLOS IX).
 * ACM, New York, NY, USA, 117-128.
 * DOI: https://doi.org/10.1145/378993.379232
 * Retrieved on 2008-02-22.
 */

#include "internal.h"

#if DEBUG_MALLOC
#define LOG(szone, ptr) (szone->log_address && (((uintptr_t)szone->log_address == -1) || (szone->log_address == (void *)(ptr))))
#else
#define LOG(szone, ptr) 0
#endif
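
// When DEBUG_MALLOC is set, LOG(szone, ptr) is true either for every pointer
// (szone->log_address cast to uintptr_t equals -1, i.e. all ones; see
// szone_log() below) or only for the single address stored in
// szone->log_address. Otherwise it compiles to a constant 0.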

// Maximum number of magazines, set from the number of logical CPUs and
// possibly limited by the MallocMaxMagazines environment variable.
int max_magazines;

// Control whether medium is enabled at all when creating new magazine zones
bool magazine_medium_enabled = true;

// Control the DRAM limit at which medium kicks in.
uint64_t magazine_medium_active_threshold = MEDIUM_ACTIVATION_THRESHOLD;

// Control the DRAM limit at which the expanded large cache kicks in.
uint64_t magazine_large_expanded_cache_threshold = LARGE_CACHE_EXPANDED_THRESHOLD;

// <rdar://problem/47353961> Maximum number of magazines that the medium
// allocator will use. This addresses a 32-bit load-offset range issue found
// in some apps when introducing medium.
int max_medium_magazines;

// Number of regions to retain in a recirc depot.
#if CONFIG_RECIRC_DEPOT
int recirc_retained_regions = DEFAULT_RECIRC_RETAINED_REGIONS;
#endif // CONFIG_RECIRC_DEPOT

/*********************	Zone call backs	************************/
/*
 * Mark these MALLOC_NOINLINE to avoid bloating the purgeable zone call backs
 */
void
szone_free(szone_t *szone, void *ptr)
{
	region_t tiny_region;
	region_t small_region;

#if DEBUG_MALLOC
	if (LOG(szone, ptr)) {
		malloc_report(ASL_LEVEL_INFO, "in szone_free with %p\n", ptr);
	}
#endif
	if (!ptr) {
		return;
	}
	/*
	 * Try to free to a tiny region.
	 */
	if ((uintptr_t)ptr & (TINY_QUANTUM - 1)) {
		malloc_zone_error(szone->debug_flags, true, "Non-aligned pointer %p being freed\n", ptr);
		return;
	}
	if ((tiny_region = tiny_region_for_ptr_no_lock(&szone->tiny_rack, ptr)) != NULL) {
		if (TINY_INDEX_FOR_PTR(ptr) >= NUM_TINY_BLOCKS) {
			malloc_zone_error(szone->debug_flags, true, "Pointer %p to metadata being freed\n", ptr);
			return;
		}
		free_tiny(&szone->tiny_rack, ptr, tiny_region, 0, false);
		return;
	}

	/*
	 * Try to free to a small region.
	 */
	if ((uintptr_t)ptr & (SMALL_QUANTUM - 1)) {
		malloc_zone_error(szone->debug_flags, true, "Non-aligned pointer %p being freed (2)\n", ptr);
		return;
	}
	if ((small_region = small_region_for_ptr_no_lock(&szone->small_rack, ptr)) != NULL) {
		if (SMALL_META_INDEX_FOR_PTR(ptr) >= NUM_SMALL_BLOCKS) {
			malloc_zone_error(szone->debug_flags, true, "Pointer %p to metadata being freed (2)\n", ptr);
			return;
		}
		free_small(&szone->small_rack, ptr, small_region, 0);
		return;
	}

#if CONFIG_MEDIUM_ALLOCATOR
	region_t medium_region;

	if (szone->is_medium_engaged &&
			(medium_region = medium_region_for_ptr_no_lock(&szone->medium_rack, ptr)) != NULL) {
		if (MEDIUM_META_INDEX_FOR_PTR(ptr) >= NUM_MEDIUM_BLOCKS) {
			malloc_zone_error(szone->debug_flags, true, "Pointer %p to metadata being freed (2)\n", ptr);
			return;
		}
		free_medium(&szone->medium_rack, ptr, medium_region, 0);
		return;
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

	/* check that it's a legal large allocation */
	if ((uintptr_t)ptr & (vm_page_quanta_size - 1)) {
		malloc_zone_error(szone->debug_flags, true, "non-page-aligned, non-allocated pointer %p being freed\n", ptr);
		return;
	}
	free_large(szone, ptr);
}
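
/*
 * Dispatch on free (szone_free() above), illustrated: ownership is decided by
 * looking the pointer up in the tiny, small and (when engaged) medium region
 * tables in turn, with alignment checks as a fast sanity filter. For example,
 * a pointer that is not even TINY_QUANTUM-aligned cannot belong to any rack
 * and is reported as an error, and anything not claimed by a rack must be a
 * page-aligned large allocation handled by free_large().
 */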

void
szone_free_definite_size(szone_t *szone, void *ptr, size_t size)
{
#if DEBUG_MALLOC
	if (LOG(szone, ptr)) {
		malloc_report(ASL_LEVEL_INFO, "in szone_free_definite_size with %p\n", ptr);
	}

	if (0 == size) {
		malloc_zone_error(szone->debug_flags, true, "pointer %p of size zero being freed\n", ptr);
		return;
	}

#endif
	if (!ptr) {
		return;
	}

	/*
	 * Try to free to a tiny region.
	 */
	if ((uintptr_t)ptr & (TINY_QUANTUM - 1)) {
		malloc_zone_error(szone->debug_flags, true, "Non-aligned pointer %p being freed\n", ptr);
		return;
	}
	if (size <= TINY_LIMIT_THRESHOLD) {
		if (TINY_INDEX_FOR_PTR(ptr) >= NUM_TINY_BLOCKS) {
			malloc_zone_error(szone->debug_flags, true, "Pointer %p to metadata being freed\n", ptr);
			return;
		}
		free_tiny(&szone->tiny_rack, ptr, TINY_REGION_FOR_PTR(ptr), size, false);
		return;
	}

	/*
	 * Try to free to a small region.
	 */
	if ((uintptr_t)ptr & (SMALL_QUANTUM - 1)) {
		malloc_zone_error(szone->debug_flags, true, "Non-aligned pointer %p being freed (2)\n", ptr);
		return;
	}
	if (size <= SMALL_LIMIT_THRESHOLD) {
		if (SMALL_META_INDEX_FOR_PTR(ptr) >= NUM_SMALL_BLOCKS) {
			malloc_zone_error(szone->debug_flags, true, "Pointer %p to metadata being freed (2)\n", ptr);
			return;
		}
		free_small(&szone->small_rack, ptr, SMALL_REGION_FOR_PTR(ptr), size);
		return;
	}

#if CONFIG_MEDIUM_ALLOCATOR
	/*
	 * Try to free to a medium region.
	 */
	if (szone->is_medium_engaged && size <= MEDIUM_LIMIT_THRESHOLD) {
		if (MEDIUM_META_INDEX_FOR_PTR(ptr) >= NUM_MEDIUM_BLOCKS) {
			malloc_zone_error(szone->debug_flags, true, "Pointer %p to metadata being freed (2)\n", ptr);
			return;
		}
		free_medium(&szone->medium_rack, ptr, MEDIUM_REGION_FOR_PTR(ptr), size);
		return;
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

	/* check that it's a legal large allocation */
	if ((uintptr_t)ptr & (vm_page_quanta_size - 1)) {
		malloc_zone_error(szone->debug_flags, true, "non-page-aligned, non-allocated pointer %p being freed\n", ptr);
		return;
	}
	free_large(szone, ptr);
}

MALLOC_NOINLINE void *
szone_malloc_should_clear(szone_t *szone, size_t size, boolean_t cleared_requested)
{
	void *ptr;
	msize_t msize;

	if (size <= TINY_LIMIT_THRESHOLD) {
		msize = TINY_MSIZE_FOR_BYTES(size + TINY_QUANTUM - 1);
		if (!msize) {
			msize = 1;
		}
		ptr = tiny_malloc_should_clear(&szone->tiny_rack, msize, cleared_requested);
	} else if (size <= SMALL_LIMIT_THRESHOLD) {
		msize = SMALL_MSIZE_FOR_BYTES(size + SMALL_QUANTUM - 1);
		if (!msize) {
			msize = 1;
		}
		ptr = small_malloc_should_clear(&szone->small_rack, msize, cleared_requested);
#if CONFIG_MEDIUM_ALLOCATOR
	} else if (szone->is_medium_engaged && size <= MEDIUM_LIMIT_THRESHOLD) {
		msize = MEDIUM_MSIZE_FOR_BYTES(size + MEDIUM_QUANTUM - 1);
		if (!msize) {
			msize = 1;
		}
		ptr = medium_malloc_should_clear(&szone->medium_rack, msize, cleared_requested);
#endif
	} else {
		size_t num_kernel_pages = round_page_quanta(size) >> vm_page_quanta_shift;
		if (num_kernel_pages == 0) { /* Overflowed */
			ptr = 0;
		} else {
			ptr = large_malloc(szone, num_kernel_pages, 0, cleared_requested);
		}
	}
#if DEBUG_MALLOC
	if (LOG(szone, ptr)) {
		malloc_report(ASL_LEVEL_INFO, "szone_malloc returned %p\n", ptr);
	}
#endif
	/*
	 * If requested, scribble on allocated memory.
	 */
	if ((szone->debug_flags & MALLOC_DO_SCRIBBLE) && ptr && !cleared_requested && size) {
		memset(ptr, SCRIBBLE_BYTE, szone_size(szone, ptr));
	}

	return ptr;
}
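
/*
 * How szone_malloc_should_clear() above routes a request, illustrated
 * (quantum sizes are configuration-dependent; the common 16-byte TINY_QUANTUM
 * is assumed in the numbers below). The request is sent to the tiny, small,
 * medium (when engaged) or large allocator purely by size, and the byte count
 * is rounded up to a whole number of quanta ("msize") for the chosen rack:
 *
 *     szone_malloc(szone, 1);    // tiny rack, msize 1 -> 16-byte block
 *     szone_malloc(szone, 24);   // tiny rack, msize 2 -> 32-byte block
 *
 * Requests past the last threshold fall through to large_malloc(), which
 * works in whole kernel pages.
 */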

void *
szone_malloc(szone_t *szone, size_t size)
{
	return szone_malloc_should_clear(szone, size, 0);
}

void *
szone_calloc(szone_t *szone, size_t num_items, size_t size)
{
	size_t total_bytes;
	if (calloc_get_size(num_items, size, 0, &total_bytes)) {
		return NULL;
	}
	return szone_malloc_should_clear(szone, total_bytes, 1);
}
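
/*
 * calloc_get_size() in szone_calloc() above guards the num_items * size
 * multiplication against overflow. Illustrative 64-bit example:
 * calloc(1UL << 33, 1UL << 33) would naively wrap the product to 0 bytes;
 * the helper detects the wrap and the zone returns NULL instead of handing
 * back an undersized allocation.
 */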

void *
szone_valloc(szone_t *szone, size_t size)
{
	void *ptr;

	if (size <= MEDIUM_LIMIT_THRESHOLD) {
		ptr = szone_memalign(szone, vm_page_quanta_size, size);
	} else {
		size_t num_kernel_pages;

		num_kernel_pages = round_page_quanta(size) >> vm_page_quanta_shift;
		ptr = large_malloc(szone, num_kernel_pages, 0, 0);
	}

#if DEBUG_MALLOC
	if (LOG(szone, ptr)) {
		malloc_report(ASL_LEVEL_INFO, "szone_valloc returned %p\n", ptr);
	}
#endif
	return ptr;
}

/* Isolate PIC-base load here. */
size_t
szone_size_try_large(szone_t *szone, const void *ptr)
{
	size_t size = 0;
	large_entry_t *entry;

	SZONE_LOCK(szone);
	entry = large_entry_for_pointer_no_lock(szone, ptr);
	if (entry) {
		size = entry->size;
	}
	SZONE_UNLOCK(szone);
#if DEBUG_MALLOC
	if (LOG(szone, ptr)) {
		malloc_report(ASL_LEVEL_INFO, "szone_size for %p returned %d\n", ptr, (unsigned)size);
	}
#endif
	return size;
}

size_t
szone_size(szone_t *szone, const void *ptr)
{
	size_t sz = 0;

	if (!ptr) {
		return 0;
	}
#if DEBUG_MALLOC
	if (LOG(szone, ptr)) {
		malloc_report(ASL_LEVEL_INFO, "in szone_size for %p (szone=%p)\n", ptr, szone);
	}
#endif

	/*
	 * Look for it in a tiny region.
	 */
	if ((uintptr_t)ptr & (TINY_QUANTUM - 1)) {
		return 0;
	}

	sz = tiny_size(&szone->tiny_rack, ptr);
	if (sz) {
		return sz;
	}

	/*
	 * Look for it in a small region.
	 */
	if ((uintptr_t)ptr & (SMALL_QUANTUM - 1)) {
		return 0;
	}

	sz = small_size(&szone->small_rack, ptr);
	if (sz) {
		return sz;
	}

#if CONFIG_MEDIUM_ALLOCATOR
	/*
	 * Look for it in a medium region.
	 */
	if (szone->is_medium_engaged) {
		sz = medium_size(&szone->medium_rack, ptr);
		if (sz) {
			return sz;
		}
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

	/*
	 * If not page-aligned, it cannot have come from a large allocation.
	 */
	if ((uintptr_t)ptr & (vm_page_quanta_size - 1)) {
		return 0;
	}

	/*
	 * Look for it in a large entry.
	 */
	return szone_size_try_large(szone, ptr);
}

void *
szone_realloc(szone_t *szone, void *ptr, size_t new_size)
{
	size_t old_size, new_good_size, valid_size;
	void *new_ptr;

#if DEBUG_MALLOC
	if (LOG(szone, ptr)) {
		malloc_report(ASL_LEVEL_INFO, "in szone_realloc for %p, %d\n", ptr, (unsigned)new_size);
	}
#endif
	if (NULL == ptr) {
		// If ptr is a null pointer, realloc() shall be equivalent to malloc() for the specified size.
		return szone_malloc(szone, new_size);
	} else if (0 == new_size) {
		// If size is 0 and ptr is not a null pointer, the object pointed to is freed.
		szone_free(szone, ptr);
		// If size is 0, either a null pointer or a unique pointer that can be successfully passed
		// to free() shall be returned.
		return szone_malloc(szone, 1);
	}

	old_size = szone_size(szone, ptr);
	if (!old_size) {
		malloc_zone_error(szone->debug_flags, true, "pointer %p being reallocated was not allocated\n", ptr);
		return NULL;
	}

	new_good_size = szone_good_size(szone, new_size);
	if (new_good_size == old_size) { // Existing allocation is best fit evar?
		return ptr;
	}

	/*
	 * If the new size suits the tiny allocator and the pointer being resized
	 * belongs to a tiny region, try to reallocate in-place.
	 */
	if (new_good_size <= TINY_LIMIT_THRESHOLD) {
		if (old_size <= TINY_LIMIT_THRESHOLD) {
			if (new_good_size <= (old_size >> 1)) {
				/*
				 * Serious shrinkage (more than half). free() the excess.
				 */
				return tiny_try_shrink_in_place(&szone->tiny_rack, ptr, old_size, new_good_size);
			} else if (new_good_size <= old_size) {
				/*
				 * new_good_size smaller than old_size but not by much (less than half).
				 * Avoid thrashing at the expense of some wasted storage.
				 */
				if (szone->debug_flags & MALLOC_DO_SCRIBBLE) {
					memset(ptr + new_size, SCRIBBLE_BYTE, old_size - new_size);
				}
				return ptr;
			} else if (tiny_try_realloc_in_place(&szone->tiny_rack, ptr, old_size, new_good_size)) { // try to grow the allocation
				if (szone->debug_flags & MALLOC_DO_SCRIBBLE) {
					memset(ptr + old_size, SCRIBBLE_BYTE, new_good_size - old_size);
				}
				return ptr;
			}
		}

		/*
		 * Else if the new size suits the small allocator and the pointer being resized
		 * belongs to a small region, and we're not protecting the small allocations,
		 * try to reallocate in-place.
		 */
	} else if (new_good_size <= SMALL_LIMIT_THRESHOLD) {
		if (TINY_LIMIT_THRESHOLD < old_size && old_size <= SMALL_LIMIT_THRESHOLD) {
			if (new_good_size <= (old_size >> 1)) {
				return small_try_shrink_in_place(&szone->small_rack, ptr, old_size, new_good_size);
			} else if (new_good_size <= old_size) {
				if (szone->debug_flags & MALLOC_DO_SCRIBBLE) {
					memset(ptr + new_size, SCRIBBLE_BYTE, old_size - new_size);
				}
				return ptr;
			} else if (small_try_realloc_in_place(&szone->small_rack, ptr, old_size, new_good_size)) {
				if (szone->debug_flags & MALLOC_DO_SCRIBBLE) {
					memset(ptr + old_size, SCRIBBLE_BYTE, new_good_size - old_size);
				}
				return ptr;
			}
		}

#if CONFIG_MEDIUM_ALLOCATOR
	} else if (szone->is_medium_engaged && new_good_size <= MEDIUM_LIMIT_THRESHOLD) {
		if (SMALL_LIMIT_THRESHOLD < old_size && old_size <= MEDIUM_LIMIT_THRESHOLD) {
			if (new_good_size <= (old_size >> 1)) {
				return medium_try_shrink_in_place(&szone->medium_rack, ptr, old_size, new_good_size);
			} else if (new_good_size <= old_size) {
				if (szone->debug_flags & MALLOC_DO_SCRIBBLE) {
					memset(ptr + new_size, SCRIBBLE_BYTE, old_size - new_size);
				}
				return ptr;
			} else if (medium_try_realloc_in_place(&szone->medium_rack, ptr, old_size, new_good_size)) {
				if (szone->debug_flags & MALLOC_DO_SCRIBBLE) {
					memset(ptr + old_size, SCRIBBLE_BYTE, new_good_size - old_size);
				}
				return ptr;
			}
		}
#endif // CONFIG_MEDIUM_ALLOCATOR

		/*
		 * Else if the allocation's a large allocation, try to reallocate in-place there.
		 */
	} else if (!(szone->debug_flags & MALLOC_PURGEABLE) && // purgeable needs fresh allocation
			   (old_size > LARGE_THRESHOLD(szone)) && (new_good_size > LARGE_THRESHOLD(szone))) {
		if (new_good_size <= (old_size >> 1)) {
			return large_try_shrink_in_place(szone, ptr, old_size, new_good_size);
		} else if (new_good_size <= old_size) {
			if (szone->debug_flags & MALLOC_DO_SCRIBBLE) {
				memset(ptr + new_size, SCRIBBLE_BYTE, old_size - new_size);
			}
			return ptr;
		} else if (large_try_realloc_in_place(szone, ptr, old_size, new_good_size)) {
			if (szone->debug_flags & MALLOC_DO_SCRIBBLE) {
				memset(ptr + old_size, SCRIBBLE_BYTE, new_good_size - old_size);
			}
			return ptr;
		}
	}

	/*
	 * Can't reallocate in place for whatever reason; allocate a new buffer and copy.
	 */
	if (new_good_size <= (old_size >> 1)) {
		/* Serious shrinkage (more than half). FALL THROUGH to alloc/copy/free. */
	} else if (new_good_size <= old_size) {
		if (szone->debug_flags & MALLOC_DO_SCRIBBLE) {
			memset(ptr + new_size, SCRIBBLE_BYTE, old_size - new_size);
		}
		return ptr;
	}

	new_ptr = szone_malloc(szone, new_size);
	if (new_ptr == NULL) {
		return NULL;
	}

	/*
	 * If the allocation's large enough, try to copy using VM.  If that fails, or
	 * if it's too small, just copy by hand.
	 */
	valid_size = MIN(old_size, new_size);
#if CONFIG_REALLOC_CAN_USE_VMCOPY
	if ((valid_size <= VM_COPY_THRESHOLD) ||
			vm_copy(mach_task_self(), (vm_address_t)ptr, valid_size, (vm_address_t)new_ptr))
#endif
	{
		memcpy(new_ptr, ptr, valid_size);
	}
	szone_free(szone, ptr);

#if DEBUG_MALLOC
	if (LOG(szone, ptr)) {
		malloc_report(ASL_LEVEL_INFO, "szone_realloc returned %p for %d\n", new_ptr, (unsigned)new_size);
	}
#endif
	return new_ptr;
}
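
/*
 * Resizing policy of szone_realloc() above, illustrated (rounding to quanta
 * omitted for clarity; the sizes are hypothetical):
 *
 *     szone_realloc(szone, p, 200) on a 256-byte block: the new size is more
 *         than half the old one, so the original pointer is returned
 *         untouched -- some slack is tolerated to avoid thrashing.
 *     szone_realloc(szone, p, 64) on a 256-byte block: "serious shrinkage"
 *         (at most half), so the excess is given back, in place when the
 *         owning rack supports it, otherwise via allocate/copy/free.
 *     szone_realloc(szone, p, 512) on a 256-byte block: an in-place grow is
 *         attempted first; only if that fails is a new block allocated and
 *         the old contents copied (when configured, via vm_copy() for large
 *         enough regions).
 */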

void *
szone_memalign(szone_t *szone, size_t alignment, size_t size)
{
	if (size == 0) {
		size = 1; // Ensures we'll return an aligned free()-able pointer
	}
	if ((size + alignment) < size) { // size_t arithmetic wrapped!
		return NULL;
	}

	// alignment is a power of 2 at least as large as sizeof(void *), hence
	// non-zero.  Since size + alignment didn't wrap, 0 <= size + alignment - 1
	// < size + alignment
	size_t span = size + alignment - 1;

	if (alignment <= TINY_QUANTUM) {
		// Trivially satisfied by tiny, small, medium, or large.
		return szone_malloc(szone, size);
	}
	if (span <= TINY_LIMIT_THRESHOLD) {
		return tiny_memalign(szone, alignment, size, span);
	}
	if (TINY_LIMIT_THRESHOLD < size && alignment <= SMALL_QUANTUM) {
		// Trivially satisfied by small, medium or large.
		return szone_malloc(szone, size);
	}
	if (size <= TINY_LIMIT_THRESHOLD) {
		// The allocation asked for a size that TINY would normally fulfill
		// but it cannot guarantee the alignment. So bump it up to fit inside
		// SMALL and try again.
		size = TINY_LIMIT_THRESHOLD + TINY_QUANTUM;
		span = size + alignment - 1;
	}
	if (span <= SMALL_LIMIT_THRESHOLD) {
		return small_memalign(szone, alignment, size, span);
	}
#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		if (size <= SMALL_LIMIT_THRESHOLD) {
			size = SMALL_LIMIT_THRESHOLD + SMALL_QUANTUM;
			span = size + alignment - 1;
		}
		if (span <= MEDIUM_LIMIT_THRESHOLD) {
			return medium_memalign(szone, alignment, size, span);
		}
	}
#endif // CONFIG_MEDIUM_ALLOCATOR
	if (LARGE_THRESHOLD(szone) < size && alignment <= vm_page_quanta_size) {
		// Trivially satisfied by large (which rounds to a whole page).
		return szone_malloc(szone, size);
	}
	// Ensure that the block allocated by large does not have a size that one
	// of the smaller allocators could have satisfied.
	size_t num_kernel_pages = round_page_quanta(MAX(LARGE_THRESHOLD(szone) + 1,
			size)) >> vm_page_quanta_shift;
	if (num_kernel_pages == 0) { /* Overflowed */
		return NULL;
	} else {
		return large_malloc(szone, num_kernel_pages,
				MAX(vm_page_quanta_shift, __builtin_ctz((unsigned)alignment)), 0);
	}
	/* NOTREACHED */
	__builtin_unreachable();
}
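
/*
 * Span arithmetic in szone_memalign() above, illustrated: a request for size
 * bytes at alignment A is satisfied out of a block of span = size + A - 1
 * bytes, which is enough to guarantee an A-aligned sub-range of size bytes
 * wherever the block lands. For example (hypothetical numbers),
 * szone_memalign(szone, 64, 100) gives span = 163; if the span still fits
 * the tiny rack, the tiny allocator carves the aligned piece out, otherwise
 * the request is bumped to the next rack up, and ultimately to
 * large_malloc(), which can align to any requested power of two of at least
 * a page.
 */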

// Given a size, allocates as many as 'count' blocks capable of holding that
// size and returns the number actually allocated. The pointers are stored in
// the 'results' array, which must be allocated by the caller. May return
// zero, since this function is only a best attempt at allocating the
// pointers. Clients should be prepared to call malloc for any additional
// blocks they need.
unsigned
szone_batch_malloc(szone_t *szone, size_t size, void **results, unsigned count)
{
	// only bother implementing this for tiny
	if (size <= TINY_LIMIT_THRESHOLD) {
		return tiny_batch_malloc(szone, size, results, count);
	}
	return 0;
}
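
/*
 * Usage sketch for szone_batch_malloc()/szone_batch_free() above and below
 * (illustrative only; "blocks" is a caller-owned array and 48-byte requests
 * fall within the tiny range on common configurations):
 *
 *     void *blocks[32];
 *     unsigned got = szone_batch_malloc(szone, 48, blocks, 32);
 *     // got may be anywhere from 0 to 32; the caller is expected to call
 *     // malloc for the (32 - got) blocks that were not provided.
 *     ...
 *     szone_batch_free(szone, blocks, got);
 */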

void
szone_batch_free(szone_t *szone, void **to_be_freed, unsigned count)
{
	// frees all the pointers in to_be_freed
	// note that to_be_freed may be overwritten during the process
	if (!count) {
		return;
	}

	CHECK(szone, __PRETTY_FUNCTION__);

	// We only support batch malloc in tiny. Let it free all of the pointers
	// that belong to it, then let the standard free deal with the rest.
	tiny_batch_free(szone, to_be_freed, count);

	CHECK(szone, __PRETTY_FUNCTION__);
	while (count--) {
		void *ptr = to_be_freed[count];
		if (ptr) {
			szone_free(szone, ptr);
		}
	}
}

// FIXME: Suppose one of the locks is held?
static void
szone_destroy(szone_t *szone)
{
	size_t index;
	large_entry_t *large;
	vm_range_t range_to_deallocate;

#if CONFIG_LARGE_CACHE
	SZONE_LOCK(szone);

	/* disable any memory pressure responder */
	szone->flotsam_enabled = FALSE;

	// stack allocated copy of the death-row cache
	int idx = szone->large_entry_cache_oldest, idx_max = szone->large_entry_cache_newest;
	large_entry_t local_entry_cache[LARGE_ENTRY_CACHE_SIZE_HIGH];

	memcpy((void *)local_entry_cache, (void *)szone->large_entry_cache, sizeof(local_entry_cache));

	szone->large_entry_cache_oldest = szone->large_entry_cache_newest = 0;
	szone->large_entry_cache[0].address = 0x0;
	szone->large_entry_cache[0].size = 0;
	szone->large_entry_cache_bytes = 0;
	szone->large_entry_cache_reserve_bytes = 0;

	SZONE_UNLOCK(szone);

	// deallocate the death-row cache outside the zone lock
	while (idx != idx_max) {
		mvm_deallocate_pages((void *)local_entry_cache[idx].address, local_entry_cache[idx].size, szone->debug_flags);
		if (++idx == szone->large_cache_depth) {
			idx = 0;
		}
	}
	if (0 != local_entry_cache[idx].address && 0 != local_entry_cache[idx].size) {
		mvm_deallocate_pages((void *)local_entry_cache[idx].address, local_entry_cache[idx].size, szone->debug_flags);
	}
#endif

	/* destroy large entries */
	index = szone->num_large_entries;
	while (index--) {
		large = szone->large_entries + index;
		if (large->address) {
			// we deallocate_pages, including guard pages
			mvm_deallocate_pages((void *)(large->address), large->size, szone->debug_flags);
		}
	}
	large_entries_free_no_lock(szone, szone->large_entries, szone->num_large_entries, &range_to_deallocate);
	if (range_to_deallocate.size) {
		mvm_deallocate_pages((void *)range_to_deallocate.address, (size_t)range_to_deallocate.size, szone->debug_flags);
	}

	/* destroy allocator regions */
	rack_destroy_regions(&szone->tiny_rack, TINY_REGION_SIZE);
	rack_destroy_regions(&szone->small_rack, SMALL_REGION_SIZE);

	/* destroy rack region hash rings and racks themselves */
	rack_destroy(&szone->tiny_rack);
	rack_destroy(&szone->small_rack);

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		rack_destroy_regions(&szone->medium_rack, MEDIUM_REGION_SIZE);
		rack_destroy(&szone->medium_rack);
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

	mvm_deallocate_pages((void *)szone, SZONE_PAGED_SIZE, 0);
}

size_t
szone_good_size(szone_t *szone, size_t size)
{
	msize_t msize;

	// Find a good size for this tiny allocation.
	if (size <= TINY_LIMIT_THRESHOLD) {
		msize = TINY_MSIZE_FOR_BYTES(size + TINY_QUANTUM - 1);
		if (!msize) {
			msize = 1;
		}
		return TINY_BYTES_FOR_MSIZE(msize);
	}

	// Find a good size for this small allocation.
	if (size <= SMALL_LIMIT_THRESHOLD) {
		msize = SMALL_MSIZE_FOR_BYTES(size + SMALL_QUANTUM - 1);
		if (!msize) {
			msize = 1;
		}
		return SMALL_BYTES_FOR_MSIZE(msize);
	}

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged && size <= MEDIUM_LIMIT_THRESHOLD) {
		msize = MEDIUM_MSIZE_FOR_BYTES(size + MEDIUM_QUANTUM - 1);
		if (!msize) {
			msize = 1;
		}
		return MEDIUM_BYTES_FOR_MSIZE(msize);
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

	// Check for integer overflow on the size, since unlike the two cases above,
	// there is no upper bound on allocation size at this point.
	if (size > round_page_quanta(size)) {
		return (size_t)(-1LL);
	}

#if DEBUG_MALLOC
	// It is not acceptable to see a size of zero here, since that means we
	// failed to catch a request for zero bytes in the tiny check, or the size
	// overflowed to zero during some arithmetic.
	if (size == 0) {
		malloc_report(ASL_LEVEL_INFO, "szone_good_size() invariant broken %y\n", size);
	}
#endif
	return round_page_quanta(size);
}
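
/*
 * Rounding behavior of szone_good_size() above, illustrated (assumes the
 * common 16-byte tiny quantum and 512-byte small quantum):
 *
 *     szone_good_size(szone, 1)    -> 16    (one tiny quantum)
 *     szone_good_size(szone, 100)  -> 112   (rounded up to a multiple of 16)
 *     szone_good_size(szone, 2000) -> 2048  (past the tiny threshold,
 *                                            rounded up to a multiple of 512)
 *
 * Past the per-rack thresholds the answer is simply the request rounded up
 * to a whole page.
 */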

boolean_t
szone_claimed_address(szone_t *szone, void *ptr)
{
	return tiny_claimed_address(&szone->tiny_rack, ptr)
			|| small_claimed_address(&szone->small_rack, ptr)
#if CONFIG_MEDIUM_ALLOCATOR
			|| (szone->is_medium_engaged &&
					medium_claimed_address(&szone->medium_rack, ptr))
#endif // CONFIG_MEDIUM_ALLOCATOR
			|| large_claimed_address(szone, ptr);
}

unsigned szone_check_counter = 0;
unsigned szone_check_start = 0;
unsigned szone_check_modulo = 1;
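
// These counters gate how often szone_check() below runs the full
// consistency pass. Illustrative example: with szone_check_start = 0 and
// szone_check_modulo = 100, szone_check_all() runs on every 100th zone
// check; any call made before the counter reaches szone_check_start is
// skipped entirely.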

static MALLOC_NOINLINE boolean_t
szone_check_all(szone_t *szone, const char *function)
{
	size_t index;

	/* check tiny regions - could check region count */
	for (index = 0; index < szone->tiny_rack.region_generation->num_regions_allocated; ++index) {
		region_t tiny = szone->tiny_rack.region_generation->hashed_regions[index];

		if (HASHRING_REGION_DEALLOCATED == tiny) {
			continue;
		}

		if (tiny) {
			magazine_t *tiny_mag_ptr = mag_lock_zine_for_region_trailer(szone->tiny_rack.magazines,
					REGION_TRAILER_FOR_TINY_REGION(tiny),
					MAGAZINE_INDEX_FOR_TINY_REGION(tiny));

			if (!tiny_check_region(&szone->tiny_rack, tiny, index, szone_check_counter)) {
				SZONE_MAGAZINE_PTR_UNLOCK(tiny_mag_ptr);
				szone->debug_flags &= ~CHECK_REGIONS;
				return 0;
			}
			SZONE_MAGAZINE_PTR_UNLOCK(tiny_mag_ptr);
		}
	}
	/* check tiny free lists */
	for (index = 0; index < NUM_TINY_SLOTS; ++index) {
		if (!tiny_free_list_check(&szone->tiny_rack, (grain_t)index, szone_check_counter)) {
			szone->debug_flags &= ~CHECK_REGIONS;
			return 0;
		}
	}

	/* check small regions - could check region count */
	for (index = 0; index < szone->small_rack.region_generation->num_regions_allocated; ++index) {
		region_t small = szone->small_rack.region_generation->hashed_regions[index];

		if (HASHRING_REGION_DEALLOCATED == small) {
			continue;
		}

		if (small) {
			magazine_t *small_mag_ptr = mag_lock_zine_for_region_trailer(szone->small_rack.magazines,
					REGION_TRAILER_FOR_SMALL_REGION(small),
					MAGAZINE_INDEX_FOR_SMALL_REGION(small));

			if (!small_check_region(&szone->small_rack, small, index, szone_check_counter)) {
				SZONE_MAGAZINE_PTR_UNLOCK(small_mag_ptr);
				szone->debug_flags &= ~CHECK_REGIONS;
				return 0;
			}
			SZONE_MAGAZINE_PTR_UNLOCK(small_mag_ptr);
		}
	}
	/* check small free lists */
	for (index = 0; index < SMALL_FREE_SLOT_COUNT(&szone->small_rack); ++index) {
		if (!small_free_list_check(&szone->small_rack, (grain_t)index, szone_check_counter)) {
			szone->debug_flags &= ~CHECK_REGIONS;
			return 0;
		}
	}

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		/* check medium regions - could check region count */
		for (index = 0; index < szone->medium_rack.region_generation->num_regions_allocated; ++index) {
			region_t medium = szone->medium_rack.region_generation->hashed_regions[index];

			if (HASHRING_REGION_DEALLOCATED == medium) {
				continue;
			}

			if (medium) {
				magazine_t *medium_mag_ptr = mag_lock_zine_for_region_trailer(szone->medium_rack.magazines,
						REGION_TRAILER_FOR_MEDIUM_REGION(medium),
						MAGAZINE_INDEX_FOR_MEDIUM_REGION(medium));

				if (!medium_check_region(&szone->medium_rack, medium, index, szone_check_counter)) {
					SZONE_MAGAZINE_PTR_UNLOCK(medium_mag_ptr);
					szone->debug_flags &= ~CHECK_REGIONS;
					return 0;
				}
				SZONE_MAGAZINE_PTR_UNLOCK(medium_mag_ptr);
			}
		}
		/* check medium free lists */
		for (index = 0; index < MEDIUM_FREE_SLOT_COUNT(&szone->medium_rack); ++index) {
			if (!medium_free_list_check(&szone->medium_rack, (grain_t)index, szone_check_counter)) {
				szone->debug_flags &= ~CHECK_REGIONS;
				return 0;
			}
		}
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

	return 1;
}

static boolean_t
szone_check(szone_t *szone)
{
	if ((++szone_check_counter % 10000) == 0) {
		malloc_report(ASL_LEVEL_NOTICE, "at szone_check counter=%d\n", szone_check_counter);
	}

	if (szone_check_counter < szone_check_start) {
		return 1;
	}

	if (szone_check_counter % szone_check_modulo) {
		return 1;
	}

	return szone_check_all(szone, "");
}

static kern_return_t
szone_ptr_in_use_enumerator(task_t task,
		void *context,
		unsigned type_mask,
		vm_address_t zone_address,
		memory_reader_t reader,
		vm_range_recorder_t recorder)
{
	szone_t *szone;
	kern_return_t err;

	if (!reader) {
		reader = _malloc_default_reader;
	}

	err = reader(task, zone_address, sizeof(szone_t), (void **)&szone);
	if (err) {
		return err;
	}

	err = tiny_in_use_enumerator(task, context, type_mask, szone, reader, recorder);
	if (err) {
		return err;
	}

	err = small_in_use_enumerator(task, context, type_mask, szone, reader, recorder);
	if (err) {
		return err;
	}

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		err = medium_in_use_enumerator(task, context, type_mask, szone, reader, recorder);
		if (err) {
			return err;
		}
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

	err = large_in_use_enumerator(
			task, context, type_mask, (vm_address_t)szone->large_entries, szone->num_large_entries, reader, recorder);
	return err;
}

static boolean_t
scalable_zone_info_task(task_t task, memory_reader_t reader,
		malloc_zone_t *zone, unsigned *info_to_fill, unsigned count)
{
	szone_t *szone = (void *)zone;
	unsigned info[13];

	// We do not lock to facilitate debug

	size_t s = 0;
	unsigned t = 0;
	size_t u = 0;
	mag_index_t mag_index;

	magazine_t *mapped_magazines;
	if (reader(task, (vm_address_t)szone->tiny_rack.magazines,
			szone->tiny_rack.num_magazines * sizeof(magazine_t), (void **)&mapped_magazines)) {
		return false;
	}
	for (mag_index = -1; mag_index < szone->tiny_rack.num_magazines; mag_index++) {
		s += mapped_magazines[mag_index].mag_bytes_free_at_start;
		s += mapped_magazines[mag_index].mag_bytes_free_at_end;
		t += mapped_magazines[mag_index].mag_num_objects;
		u += mapped_magazines[mag_index].mag_num_bytes_in_objects;
	}

	info[4] = (unsigned)t;
	info[5] = (unsigned)u;

	if (reader(task, (vm_address_t)szone->small_rack.magazines,
			szone->small_rack.num_magazines * sizeof(magazine_t), (void **)&mapped_magazines)) {
		return false;
	}
	for (t = 0, u = 0, mag_index = -1; mag_index < szone->small_rack.num_magazines; mag_index++) {
		s += mapped_magazines[mag_index].mag_bytes_free_at_start;
		s += mapped_magazines[mag_index].mag_bytes_free_at_end;
		t += mapped_magazines[mag_index].mag_num_objects;
		u += mapped_magazines[mag_index].mag_num_bytes_in_objects;
	}

	info[6] = (unsigned)t;
	info[7] = (unsigned)u;

	info[8] = (unsigned)szone->num_large_objects_in_use;
	info[9] = (unsigned)szone->num_bytes_in_large_objects;

	info[10] = 0; // DEPRECATED szone->num_huge_entries;
	info[11] = 0; // DEPRECATED szone->num_bytes_in_huge_objects;

	info[12] = szone->debug_flags;

	info[0] = info[4] + info[6] + info[8] + info[10];
	info[1] = info[5] + info[7] + info[9] + info[11];

	info[3] = (unsigned)(szone->tiny_rack.num_regions - szone->tiny_rack.num_regions_dealloc) * TINY_REGION_SIZE +
			  (unsigned)(szone->small_rack.num_regions - szone->small_rack.num_regions_dealloc) * SMALL_REGION_SIZE + info[9] + info[11];

	info[2] = info[3] - (unsigned)s;
	memcpy(info_to_fill, info, sizeof(unsigned) * count);

	return true;
}

// The following method is deprecated: use scalable_zone_statistics instead.
// Required for backward compatibility.
void
scalable_zone_info(malloc_zone_t *zone, unsigned *info_to_fill, unsigned count) {
	scalable_zone_info_task(mach_task_self(), _malloc_default_reader, zone,
			info_to_fill, count);
}

// FIXME: consistent picture requires locking!
static MALLOC_NOINLINE void
szone_print(task_t task, unsigned level, vm_address_t zone_address,
		memory_reader_t reader, print_task_printer_t printer)
{
	unsigned info[13];
	size_t index;
	region_t region;
	region_t mapped_region;

	szone_t *szone = (szone_t *)zone_address;
	szone_t *mapped_szone;
	if (reader(task, zone_address, sizeof(szone_t), (void **)&mapped_szone)) {
		printer("Failed to read szone structure\n");
		return;
	}

	if (!scalable_zone_info_task(task, reader, (void *)mapped_szone, info, 13)) {
		printer("Failed to get scalable zone info\n");
		return;
	}
	printer("Scalable zone %p: inUse=%u(%u) touched=%u allocated=%u flags=0x%x\n",
			zone_address, info[0], info[1], info[2], info[3], info[12]);
	printer("\ttiny=%u(%u) small=%u(%u) large=%u(%u)\n", info[4],
			info[5], info[6], info[7], info[8], info[9]);
	// tiny
	printer("%lu tiny regions:\n", mapped_szone->tiny_rack.num_regions);
	if (mapped_szone->tiny_rack.num_regions_dealloc) {
		printer("[%lu tiny regions have been vm_deallocate'd]\n",
				mapped_szone->tiny_rack.num_regions_dealloc);
	}

	region_hash_generation_t *mapped_region_generation;
	region_t *mapped_hashed_regions;
	magazine_t *mapped_magazines;
	if (reader(task, (vm_address_t)mapped_szone->tiny_rack.region_generation,
			sizeof(region_hash_generation_t), (void **)&mapped_region_generation)) {
		printer("Failed to map tiny rack region_generation\n");
		return;
	}
	if (reader(task, (vm_address_t)mapped_region_generation->hashed_regions,
			sizeof(region_t), (void **)&mapped_hashed_regions)) {
		printer("Failed to map tiny rack hashed_regions\n");
		return;
	}
	if (reader(task, (vm_address_t)mapped_szone->tiny_rack.magazines,
			mapped_szone->tiny_rack.num_magazines * sizeof(magazine_t),
			(void **)&mapped_magazines)) {
		printer("Failed to map tiny rack magazines\n");
		return;
	}

	int recirc_regions = 0;
	for (index = 0; index < mapped_region_generation->num_regions_allocated; ++index) {
		region = mapped_hashed_regions[index];
		if (HASHRING_OPEN_ENTRY != region && HASHRING_REGION_DEALLOCATED != region) {
			if (reader(task, (vm_address_t)region, sizeof(struct tiny_region),
					(void **)&mapped_region)) {
				printer("Failed to map region %p\n", region);
				return;
			}
			mag_index_t mag_index = MAGAZINE_INDEX_FOR_TINY_REGION(mapped_region);
			if (mag_index == DEPOT_MAGAZINE_INDEX) {
				recirc_regions++;
			}
			print_tiny_region(task, reader, printer, level, region,
					(region == mapped_magazines[mag_index].mag_last_region)
						? mapped_magazines[mag_index].mag_bytes_free_at_start
						: 0,
					(region == mapped_magazines[mag_index].mag_last_region)
						? mapped_magazines[mag_index].mag_bytes_free_at_end
						: 0);
		}
	}

#if CONFIG_RECIRC_DEPOT
	magazine_t *mapped_recirc_depot = &mapped_magazines[DEPOT_MAGAZINE_INDEX];
	if (mapped_recirc_depot->mag_num_bytes_in_objects) {
		printer("Tiny recirc depot: total bytes: %llu, in-use bytes: %llu, "
				"allocations: %llu, regions: %d (min # retained regions: %d)\n",
				mapped_recirc_depot->num_bytes_in_magazine,
				mapped_recirc_depot->mag_num_bytes_in_objects,
				mapped_recirc_depot->mag_num_objects, recirc_regions,
				recirc_retained_regions);
	} else {
		printer("Tiny recirc depot is empty\n");
	}
#else // CONFIG_RECIRC_DEPOT
	printer("Tiny recirc depot not configured\n");
#endif // CONFIG_RECIRC_DEPOT

	if (level > 0) {
		print_tiny_free_list(task, reader, printer, &szone->tiny_rack);
	}

	// small
	printer("%lu small regions:\n", mapped_szone->small_rack.num_regions);
	if (mapped_szone->small_rack.num_regions_dealloc) {
		printer("[%lu small regions have been vm_deallocate'd]\n",
				mapped_szone->small_rack.num_regions_dealloc);
	}
	if (reader(task, (vm_address_t)mapped_szone->small_rack.region_generation,
			sizeof(region_hash_generation_t), (void **)&mapped_region_generation)) {
		printer("Failed to map small rack region_generation\n");
		return;
	}
	if (reader(task, (vm_address_t)mapped_region_generation->hashed_regions,
			sizeof(region_t), (void **)&mapped_hashed_regions)) {
		printer("Failed to map small rack hashed_regions\n");
		return;
	}
	if (reader(task, (vm_address_t)mapped_szone->small_rack.magazines,
			mapped_szone->small_rack.num_magazines * sizeof(magazine_t),
			(void **)&mapped_magazines)) {
		printer("Failed to map small rack magazines\n");
		return;
	}

	recirc_regions = 0;
	for (index = 0; index < mapped_region_generation->num_regions_allocated; ++index) {
		region = mapped_hashed_regions[index];
		if (HASHRING_OPEN_ENTRY != region && HASHRING_REGION_DEALLOCATED != region) {
			if (reader(task, (vm_address_t)region, sizeof(struct small_region),
					(void **)&mapped_region)) {
				printer("Failed to map region %p\n", region);
				return;
			}
			mag_index_t mag_index = MAGAZINE_INDEX_FOR_SMALL_REGION(mapped_region);
			if (mag_index == DEPOT_MAGAZINE_INDEX) {
				recirc_regions++;
			}
			print_small_region(task, reader, printer, mapped_szone, level, region,
					(region == mapped_magazines[mag_index].mag_last_region)
						? mapped_magazines[mag_index].mag_bytes_free_at_start
						: 0,
					(region == mapped_magazines[mag_index].mag_last_region)
						? mapped_magazines[mag_index].mag_bytes_free_at_end
						: 0);
		}
	}

#if CONFIG_RECIRC_DEPOT
	mapped_recirc_depot = &mapped_magazines[DEPOT_MAGAZINE_INDEX];
	if (mapped_recirc_depot->mag_num_bytes_in_objects) {
		printer("Small recirc depot: total bytes: %llu, in-use bytes: %llu, "
				"allocations: %llu, regions: %d (min # retained regions: %d)\n",
				mapped_recirc_depot->num_bytes_in_magazine,
				mapped_recirc_depot->mag_num_bytes_in_objects,
				mapped_recirc_depot->mag_num_objects, recirc_regions,
				recirc_retained_regions);
	} else {
		printer("Small recirc depot is empty\n");
	}
#else // CONFIG_RECIRC_DEPOT
	printer("Small recirc depot not configured\n");
#endif // CONFIG_RECIRC_DEPOT

	if (level > 0) {
		print_small_free_list(task, reader, printer, &szone->small_rack);
	}

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		// medium
		printer("%lu medium regions:\n", mapped_szone->medium_rack.num_regions);
		if (mapped_szone->medium_rack.num_regions_dealloc) {
			printer("[%lu medium regions have been vm_deallocate'd]\n",
					mapped_szone->medium_rack.num_regions_dealloc);
		}
		if (reader(task, (vm_address_t)mapped_szone->medium_rack.region_generation,
				sizeof(region_hash_generation_t), (void **)&mapped_region_generation)) {
			printer("Failed to map medium rack region_generation\n");
			return;
		}
		if (reader(task, (vm_address_t)mapped_region_generation->hashed_regions,
				sizeof(region_t), (void **)&mapped_hashed_regions)) {
			printer("Failed to map medium rack hashed_regions\n");
			return;
		}
		if (reader(task, (vm_address_t)mapped_szone->medium_rack.magazines,
				mapped_szone->medium_rack.num_magazines * sizeof(magazine_t),
				(void **)&mapped_magazines)) {
			printer("Failed to map medium rack magazines\n");
			return;
		}

		recirc_regions = 0;
		for (index = 0; index < mapped_region_generation->num_regions_allocated; ++index) {
			region = mapped_hashed_regions[index];
			if (HASHRING_OPEN_ENTRY != region && HASHRING_REGION_DEALLOCATED != region) {
				if (reader(task, (vm_address_t)region, sizeof(struct medium_region),
						(void **)&mapped_region)) {
					printer("Failed to map region %p\n", region);
					return;
				}
				mag_index_t mag_index = MAGAZINE_INDEX_FOR_MEDIUM_REGION(mapped_region);
				if (mag_index == DEPOT_MAGAZINE_INDEX) {
					recirc_regions++;
				}
				print_medium_region(task, reader, printer, mapped_szone, level,
						region,
						(region == mapped_magazines[mag_index].mag_last_region)
							? mapped_magazines[mag_index].mag_bytes_free_at_start
							: 0,
						(region == mapped_magazines[mag_index].mag_last_region)
							? mapped_magazines[mag_index].mag_bytes_free_at_end
							: 0);
			}
		}

#if CONFIG_RECIRC_DEPOT
		mapped_recirc_depot = &mapped_magazines[DEPOT_MAGAZINE_INDEX];
		if (mapped_recirc_depot->mag_num_bytes_in_objects) {
			printer("Medium recirc depot: total bytes: %llu, in-use bytes: %llu, "
					"allocations: %llu, regions: %d (min # retained regions: %d)\n",
					mapped_recirc_depot->num_bytes_in_magazine,
					mapped_recirc_depot->mag_num_bytes_in_objects,
					mapped_recirc_depot->mag_num_objects, recirc_regions,
					recirc_retained_regions);
		} else {
			printer("Medium recirc depot is empty\n");
		}
#else // CONFIG_RECIRC_DEPOT
		printer("Medium recirc depot not configured\n");
#endif // CONFIG_RECIRC_DEPOT

		if (level > 0) {
			print_medium_free_list(task, reader, printer, &szone->medium_rack);
		}
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

	// Large
	large_debug_print(task, level, zone_address, reader, printer);
}

static void
szone_print_self(szone_t *szone, boolean_t verbose)
{
	szone_print(mach_task_self(), verbose ? MALLOC_VERBOSE_PRINT_LEVEL : 0,
			(vm_address_t)szone, _malloc_default_reader, malloc_report_simple);
}

static void
szone_print_task(task_t task, unsigned level, vm_address_t zone_address,
		memory_reader_t reader, print_task_printer_t printer)
{
	szone_print(task, level, zone_address, reader, printer);
}

static void
szone_log(malloc_zone_t *zone, void *log_address)
{
	szone_t *szone = (szone_t *)zone;

	szone->log_address = log_address;
}

// <rdar://problem/18001324>
// When forcing the lock on the entire zone, make sure we are out of the critical section in each magazine
static MALLOC_INLINE void
szone_force_lock_magazine(szone_t *szone, magazine_t *mag)
{
	while (1) {
		SZONE_MAGAZINE_PTR_LOCK(mag);
		if (!mag->alloc_underway) {
			return;
		}

		SZONE_MAGAZINE_PTR_UNLOCK(mag);
		yield();
	}
}

static void
szone_force_lock(szone_t *szone)
{
	mag_index_t i;

	for (i = 0; i < szone->tiny_rack.num_magazines; ++i) {
		szone_force_lock_magazine(szone, &szone->tiny_rack.magazines[i]);
	}
	szone_force_lock_magazine(szone, &szone->tiny_rack.magazines[DEPOT_MAGAZINE_INDEX]);

	for (i = 0; i < szone->small_rack.num_magazines; ++i) {
		szone_force_lock_magazine(szone, &szone->small_rack.magazines[i]);
	}
	szone_force_lock_magazine(szone, &szone->small_rack.magazines[DEPOT_MAGAZINE_INDEX]);

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		for (i = 0; i < szone->medium_rack.num_magazines; ++i) {
			szone_force_lock_magazine(szone, &szone->medium_rack.magazines[i]);
		}
		szone_force_lock_magazine(szone, &szone->medium_rack.magazines[DEPOT_MAGAZINE_INDEX]);
	}
#endif

	SZONE_LOCK(szone);
}

static void
szone_force_unlock(szone_t *szone)
{
	mag_index_t i;

	SZONE_UNLOCK(szone);

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		for (i = -1; i < szone->medium_rack.num_magazines; ++i) {
			SZONE_MAGAZINE_PTR_UNLOCK((&(szone->medium_rack.magazines[i])));
		}
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

	for (i = -1; i < szone->small_rack.num_magazines; ++i) {
		SZONE_MAGAZINE_PTR_UNLOCK((&(szone->small_rack.magazines[i])));
	}

	for (i = -1; i < szone->tiny_rack.num_magazines; ++i) {
		SZONE_MAGAZINE_PTR_UNLOCK((&(szone->tiny_rack.magazines[i])));
	}
}

static void
szone_reinit_lock(szone_t *szone)
{
	mag_index_t i;

	SZONE_REINIT_LOCK(szone);

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		for (i = -1; i < szone->medium_rack.num_magazines; ++i) {
			SZONE_MAGAZINE_PTR_REINIT_LOCK((&(szone->medium_rack.magazines[i])));
		}
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

	for (i = -1; i < szone->small_rack.num_magazines; ++i) {
		SZONE_MAGAZINE_PTR_REINIT_LOCK((&(szone->small_rack.magazines[i])));
	}

	for (i = -1; i < szone->tiny_rack.num_magazines; ++i) {
		SZONE_MAGAZINE_PTR_REINIT_LOCK((&(szone->tiny_rack.magazines[i])));
	}
}

static boolean_t
szone_locked(szone_t *szone)
{
	mag_index_t i;
	int tookLock;

	tookLock = SZONE_TRY_LOCK(szone);
	if (tookLock == 0) {
		return 1;
	}
	SZONE_UNLOCK(szone);

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		for (i = -1; i < szone->medium_rack.num_magazines; ++i) {
			tookLock = SZONE_MAGAZINE_PTR_TRY_LOCK((&(szone->medium_rack.magazines[i])));
			if (tookLock == 0) {
				return 1;
			}
			SZONE_MAGAZINE_PTR_UNLOCK((&(szone->medium_rack.magazines[i])));
		}
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

	for (i = -1; i < szone->small_rack.num_magazines; ++i) {
		tookLock = SZONE_MAGAZINE_PTR_TRY_LOCK((&(szone->small_rack.magazines[i])));
		if (tookLock == 0) {
			return 1;
		}
		SZONE_MAGAZINE_PTR_UNLOCK((&(szone->small_rack.magazines[i])));
	}

	for (i = -1; i < szone->tiny_rack.num_magazines; ++i) {
		tookLock = SZONE_MAGAZINE_PTR_TRY_LOCK((&(szone->tiny_rack.magazines[i])));
		if (tookLock == 0) {
			return 1;
		}
		SZONE_MAGAZINE_PTR_UNLOCK((&(szone->tiny_rack.magazines[i])));
	}
	return 0;
}

size_t
szone_pressure_relief(szone_t *szone, size_t goal)
{
	size_t total = 0;

	MAGMALLOC_PRESSURERELIEFBEGIN((void *)szone, szone->basic_zone.zone_name, (int)goal); // DTrace USDT Probe
	MALLOC_TRACE(TRACE_malloc_memory_pressure | DBG_FUNC_START, (uint64_t)szone, goal, 0, 0);

#if CONFIG_MADVISE_PRESSURE_RELIEF
	tiny_madvise_pressure_relief(&szone->tiny_rack);
	small_madvise_pressure_relief(&szone->small_rack);

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		medium_madvise_pressure_relief(&szone->medium_rack);
	}
#endif // CONFIG_MEDIUM_ALLOCATOR
#endif // CONFIG_MADVISE_PRESSURE_RELIEF

#if CONFIG_LARGE_CACHE
	if (szone->flotsam_enabled) {
		SZONE_LOCK(szone);

		// stack allocated copy of the death-row cache
		int idx = szone->large_entry_cache_oldest, idx_max = szone->large_entry_cache_newest;
		large_entry_t local_entry_cache[LARGE_ENTRY_CACHE_SIZE_HIGH];

		memcpy((void *)local_entry_cache, (void *)szone->large_entry_cache, sizeof(local_entry_cache));

		szone->large_entry_cache_oldest = szone->large_entry_cache_newest = 0;
		szone->large_entry_cache[0].address = 0x0;
		szone->large_entry_cache[0].size = 0;
		szone->large_entry_cache_bytes = 0;
		szone->large_entry_cache_reserve_bytes = 0;

		szone->flotsam_enabled = FALSE;

		SZONE_UNLOCK(szone);

		// deallocate the death-row cache outside the zone lock
		while (idx != idx_max) {
			mvm_deallocate_pages((void *)local_entry_cache[idx].address, local_entry_cache[idx].size, szone->debug_flags);
			total += local_entry_cache[idx].size;
			if (++idx == szone->large_cache_depth) {
				idx = 0;
			}
		}
		if (0 != local_entry_cache[idx].address && 0 != local_entry_cache[idx].size) {
			mvm_deallocate_pages((void *)local_entry_cache[idx].address, local_entry_cache[idx].size, szone->debug_flags);
			total += local_entry_cache[idx].size;
		}
	}
#endif

	MAGMALLOC_PRESSURERELIEFEND((void *)szone, szone->basic_zone.zone_name, (int)goal, (int)total); // DTrace USDT Probe
	MALLOC_TRACE(TRACE_malloc_memory_pressure | DBG_FUNC_END, (uint64_t)szone, goal, total, 0);

	return total;
}
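
/*
 * Note on szone_pressure_relief() above (illustrative): the returned total
 * only counts pages released from the large death-row cache; bytes madvised
 * back by the tiny/small/medium racks under CONFIG_MADVISE_PRESSURE_RELIEF
 * are not added to it, and 'goal' is advisory only -- nothing in this path
 * stops early once 'goal' bytes have been released.
 */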

boolean_t
scalable_zone_statistics(malloc_zone_t *zone, malloc_statistics_t *stats, unsigned subzone)
{
	szone_t *szone = (szone_t *)zone;

	switch (subzone) {
	case 0: {
		size_t s = 0;
		unsigned t = 0;
		size_t u = 0;
		mag_index_t mag_index;

		for (mag_index = -1; mag_index < szone->tiny_rack.num_magazines; mag_index++) {
			s += szone->tiny_rack.magazines[mag_index].mag_bytes_free_at_start;
			s += szone->tiny_rack.magazines[mag_index].mag_bytes_free_at_end;
			t += szone->tiny_rack.magazines[mag_index].mag_num_objects;
			u += szone->tiny_rack.magazines[mag_index].mag_num_bytes_in_objects;
		}

		stats->blocks_in_use = t;
		stats->size_in_use = u;
		stats->size_allocated = (szone->tiny_rack.num_regions - szone->tiny_rack.num_regions_dealloc) * TINY_REGION_SIZE;
		stats->max_size_in_use = stats->size_allocated - s;
		return 1;
	}
	case 1: {
		size_t s = 0;
		unsigned t = 0;
		size_t u = 0;
		mag_index_t mag_index;

		for (mag_index = -1; mag_index < szone->small_rack.num_magazines; mag_index++) {
			s += szone->small_rack.magazines[mag_index].mag_bytes_free_at_start;
			s += szone->small_rack.magazines[mag_index].mag_bytes_free_at_end;
			t += szone->small_rack.magazines[mag_index].mag_num_objects;
			u += szone->small_rack.magazines[mag_index].mag_num_bytes_in_objects;
		}

		stats->blocks_in_use = t;
		stats->size_in_use = u;
		stats->size_allocated = (szone->small_rack.num_regions - szone->small_rack.num_regions_dealloc) * SMALL_REGION_SIZE;
		stats->max_size_in_use = stats->size_allocated - s;
		return 1;
	}
	case 2:
		stats->blocks_in_use = szone->num_large_objects_in_use;
		stats->size_in_use = szone->num_bytes_in_large_objects;
		stats->max_size_in_use = stats->size_allocated = stats->size_in_use;
		return 1;
	case 3:
		stats->blocks_in_use = 0; // DEPRECATED szone->num_huge_entries;
		stats->size_in_use = 0;   // DEPRECATED szone->num_bytes_in_huge_objects;
		stats->max_size_in_use = stats->size_allocated = 0;
		return 1;
	case 4: {
		size_t s = 0;
		unsigned t = 0;
		size_t u = 0;
		size_t sa = 0;

#if CONFIG_MEDIUM_ALLOCATOR
		mag_index_t mag_index;
		if (szone->is_medium_engaged) {
			for (mag_index = -1; mag_index < szone->medium_rack.num_magazines; mag_index++) {
				s += szone->medium_rack.magazines[mag_index].mag_bytes_free_at_start;
				s += szone->medium_rack.magazines[mag_index].mag_bytes_free_at_end;
				t += szone->medium_rack.magazines[mag_index].mag_num_objects;
				u += szone->medium_rack.magazines[mag_index].mag_num_bytes_in_objects;
			}
		}

		sa = (szone->medium_rack.num_regions - szone->medium_rack.num_regions_dealloc) * MEDIUM_REGION_SIZE;
#endif // CONFIG_MEDIUM_ALLOCATOR

		stats->blocks_in_use = t;
		stats->size_in_use = u;
		stats->size_allocated = sa;
		stats->max_size_in_use = stats->size_allocated - s;
		return 1;
	}}
	return 0;
}
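
/*
 * Usage sketch for scalable_zone_statistics() above (illustrative; 'zone' is
 * any zone created by create_scalable_zone()). The subzone argument selects
 * which allocator the statistics describe: 0 = tiny, 1 = small, 2 = large,
 * 3 = huge (deprecated, always zero), 4 = medium.
 *
 *     malloc_statistics_t st;
 *     for (unsigned sub = 0; sub < 5; sub++) {
 *         if (scalable_zone_statistics(zone, &st, sub)) {
 *             // st.blocks_in_use / st.size_in_use now describe subzone 'sub'
 *         }
 *     }
 */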

static kern_return_t
szone_statistics_task(task_t task, vm_address_t zone_address,
					  memory_reader_t reader, malloc_statistics_t *stats)
{
	reader = !reader && task == mach_task_self() ? _malloc_default_reader : reader;

	szone_t *szone;
	kern_return_t err;

	err = reader(task, zone_address, sizeof(szone_t), (void**)&szone);
	if (err) return err;

	size_t large;
	size_t s = 0;
	unsigned t = 0;
	size_t u = 0;
	mag_index_t mag_index;

	magazine_t *mags;
	err = reader(task, (vm_address_t)szone->tiny_rack.magazines, sizeof(magazine_t) * szone->tiny_rack.num_magazines, (void**)&mags);
	if (err) return err;

	for (mag_index = -1; mag_index < szone->tiny_rack.num_magazines; mag_index++) {
		s += mags[mag_index].mag_bytes_free_at_start;
		s += mags[mag_index].mag_bytes_free_at_end;
		t += mags[mag_index].mag_num_objects;
		u += mags[mag_index].mag_num_bytes_in_objects;
	}

	err = reader(task, (vm_address_t)szone->small_rack.magazines, sizeof(magazine_t) * szone->small_rack.num_magazines, (void**)&mags);
	if (err) return err;

	for (mag_index = -1; mag_index < szone->small_rack.num_magazines; mag_index++) {
		s += mags[mag_index].mag_bytes_free_at_start;
		s += mags[mag_index].mag_bytes_free_at_end;
		t += mags[mag_index].mag_num_objects;
		u += mags[mag_index].mag_num_bytes_in_objects;
	}

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		err = reader(task, (vm_address_t)szone->medium_rack.magazines, sizeof(magazine_t) * szone->medium_rack.num_magazines, (void**)&mags);
		if (err) return err;

		for (mag_index = -1; mag_index < szone->medium_rack.num_magazines; mag_index++) {
			s += mags[mag_index].mag_bytes_free_at_start;
			s += mags[mag_index].mag_bytes_free_at_end;
			t += mags[mag_index].mag_num_objects;
			u += mags[mag_index].mag_num_bytes_in_objects;
		}
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

	large = szone->num_bytes_in_large_objects;

	stats->blocks_in_use = t + szone->num_large_objects_in_use;
	stats->size_in_use = u + large;
	stats->max_size_in_use = stats->size_allocated =
			(szone->tiny_rack.num_regions - szone->tiny_rack.num_regions_dealloc) * TINY_REGION_SIZE +
			(szone->small_rack.num_regions - szone->small_rack.num_regions_dealloc) * SMALL_REGION_SIZE + large;

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		stats->max_size_in_use += (szone->medium_rack.num_regions -
				szone->medium_rack.num_regions_dealloc) * MEDIUM_REGION_SIZE;
	}
#endif
	// Now we account for the untouched areas
	stats->max_size_in_use -= s;

	return KERN_SUCCESS;
}

static void
szone_statistics(szone_t *szone, malloc_statistics_t *stats)
{
	szone_statistics_task(mach_task_self(), (vm_address_t)szone, NULL, stats);
}

const struct malloc_introspection_t szone_introspect = {
		(void *)szone_ptr_in_use_enumerator, (void *)szone_good_size, (void *)szone_check, (void *)szone_print_self, szone_log,
		(void *)szone_force_lock, (void *)szone_force_unlock, (void *)szone_statistics, (void *)szone_locked, NULL, NULL, NULL,
		NULL, /* Zone enumeration version 7 and forward. */
		(void *)szone_reinit_lock, // reinit_lock version 9 and forward
		(void *)szone_print_task,  // print task, version 11 and forward
		(void *)szone_statistics_task // stats for task, version 12 and forward
}; // marked as const to spare the DATA section

szone_t *
create_scalable_szone(size_t initial_size, unsigned debug_flags)
{
	szone_t *szone;

#if defined(__i386__) || defined(__x86_64__)
	if (_COMM_PAGE_VERSION_REQD > (*((uint16_t *)_COMM_PAGE_VERSION))) {
		MALLOC_REPORT_FATAL_ERROR((*((uint16_t *)_COMM_PAGE_VERSION)), "comm page version mismatch");
	}
#endif

	/* get memory for the zone. */
	szone = mvm_allocate_pages(SZONE_PAGED_SIZE, 0, DISABLE_ASLR, VM_MEMORY_MALLOC);
	if (!szone) {
		return NULL;
	}

/* set up the szone structure */
#if 0
#warning CHECK_REGIONS enabled
	debug_flags |= CHECK_REGIONS;
#endif
#if 0
#warning LOG enabled
	szone->log_address = ~0;
#endif

	if (mvm_aslr_enabled()) {
		debug_flags &= ~DISABLE_ASLR;
	} else {
		debug_flags |= DISABLE_ASLR;
	}

#if CONFIG_MEDIUM_ALLOCATOR || CONFIG_LARGE_CACHE
	uint64_t memsize = platform_hw_memsize();
#endif // CONFIG_MEDIUM_ALLOCATOR || CONFIG_LARGE_CACHE

#if CONFIG_MEDIUM_ALLOCATOR
	szone->is_medium_engaged = (magazine_medium_enabled &&
			(memsize >= magazine_medium_active_threshold));
#endif // CONFIG_MEDIUM_ALLOCATOR

	// Query the number of configured processors.
	// Uniprocessor case gets just one tiny and one small magazine (whose index is zero). This gives
	// the same behavior as the original scalable malloc. MP gets per-CPU magazines
	// that scale (way) better.
	unsigned int max_mags = mag_max_magazines();
	uint32_t num_magazines = (max_mags > 1) ? MIN(max_mags, TINY_MAX_MAGAZINES) : 1;
	rack_init(&szone->tiny_rack, RACK_TYPE_TINY, num_magazines, debug_flags);
	rack_init(&szone->small_rack, RACK_TYPE_SMALL, num_magazines, debug_flags);

#if CONFIG_MEDIUM_ALLOCATOR
	if (szone->is_medium_engaged) {
		unsigned max_medium_mags = mag_max_medium_magazines();
		uint32_t num_medium_mags = (max_medium_mags > 1) ?
				MIN(max_medium_mags, TINY_MAX_MAGAZINES) : 1;
		rack_init(&szone->medium_rack, RACK_TYPE_MEDIUM, num_medium_mags,
				debug_flags);
	}
#endif // CONFIG_MEDIUM_ALLOCATOR

#if CONFIG_LARGE_CACHE
	// madvise(..., MADV_REUSABLE) death-row arrivals above this threshold [~0.1%]
	szone->large_entry_cache_reserve_limit = (size_t)(memsize >> 10);
	if (memsize >= magazine_large_expanded_cache_threshold) {
		szone->large_cache_depth = LARGE_ENTRY_CACHE_SIZE_HIGH;
		szone->large_cache_entry_limit = LARGE_ENTRY_SIZE_ENTRY_LIMIT_HIGH;
	} else {
		szone->large_cache_depth = LARGE_ENTRY_CACHE_SIZE_LOW;
		szone->large_cache_entry_limit = LARGE_ENTRY_SIZE_ENTRY_LIMIT_LOW;
	}

	/* <rdar://problem/6610904> Reset protection when returning a previous large allocation? */
	int32_t libSystemVersion = NSVersionOfLinkTimeLibrary("System");
	if ((-1 != libSystemVersion) && ((libSystemVersion >> 16) < 112) /* CFSystemVersionSnowLeopard */) {
		szone->large_legacy_reset_mprotect = TRUE;
	} else {
		szone->large_legacy_reset_mprotect = FALSE;
	}
#endif

	// Initialize the security token.
	szone->cookie = (uintptr_t)malloc_entropy[0];

	szone->basic_zone.version = 12;
	szone->basic_zone.size = (void *)szone_size;
	szone->basic_zone.malloc = (void *)szone_malloc;
	szone->basic_zone.calloc = (void *)szone_calloc;
	szone->basic_zone.valloc = (void *)szone_valloc;
	szone->basic_zone.free = (void *)szone_free;
	szone->basic_zone.realloc = (void *)szone_realloc;
	szone->basic_zone.destroy = (void *)szone_destroy;
	szone->basic_zone.batch_malloc = (void *)szone_batch_malloc;
	szone->basic_zone.batch_free = (void *)szone_batch_free;
	szone->basic_zone.introspect = (struct malloc_introspection_t *)&szone_introspect;
	szone->basic_zone.memalign = (void *)szone_memalign;
	szone->basic_zone.free_definite_size = (void *)szone_free_definite_size;
	szone->basic_zone.pressure_relief = (void *)szone_pressure_relief;
	szone->basic_zone.claimed_address = (void *)szone_claimed_address;

	/* Set to zero once and for all as required by CFAllocator. */
	szone->basic_zone.reserved1 = 0;
	/* Set to zero once and for all as required by CFAllocator. */
	szone->basic_zone.reserved2 = 0;

	/* Prevent overwriting the function pointers in basic_zone. */
	mprotect(szone, sizeof(szone->basic_zone), PROT_READ);

	szone->debug_flags = debug_flags;
	_malloc_lock_init(&szone->large_szone_lock);

	szone->cpu_id_key = -1UL; // Unused.

	CHECK(szone, __PRETTY_FUNCTION__);
	return szone;
}

malloc_zone_t *
create_scalable_zone(size_t initial_size, unsigned debug_flags) {
	return (malloc_zone_t *) create_scalable_szone(initial_size, debug_flags);
}

/* vim: set noet:ts=4:sw=4:cindent: */