#include <mach/kern_return.h>
#include <mach/vm_param.h>
#include <kern/assert.h>
#include <kern/lock.h>
#include <kern/thread.h>
#include <vm/vm_kern.h>
#include <vm/vm_map.h>
#include <vm/vm_object.h>
#include <vm/vm_page.h>
#include <vm/vm_pageout.h>
#include <kern/misc_protos.h>
#include <vm/cpm.h>
#include <string.h>
#include <libkern/OSDebug.h>
#include <sys/kdebug.h>
vm_map_t kernel_map;
vm_map_t kernel_pageable_map;
extern boolean_t vm_kernel_ready;
extern kern_return_t kmem_alloc_pages(
register vm_object_t object,
register vm_object_offset_t offset,
register vm_object_size_t size);
extern void kmem_remap_pages(
register vm_object_t object,
register vm_object_offset_t offset,
register vm_offset_t start,
register vm_offset_t end,
vm_prot_t protection);
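/*
 *	kmem_alloc_contig:
 *
 *	Allocate wired-down memory in the kernel's address map
 *	or a submap.  The memory is not zero-filled.
 */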
kern_return_t
kmem_alloc_contig(
vm_map_t map,
vm_offset_t *addrp,
vm_size_t size,
vm_offset_t mask,
ppnum_t max_pnum,
ppnum_t pnum_mask,
int flags)
{
vm_object_t object;
vm_object_offset_t offset;
vm_map_offset_t map_addr;
vm_map_offset_t map_mask;
vm_map_size_t map_size, i;
vm_map_entry_t entry;
vm_page_t m, pages;
kern_return_t kr;
if (map == VM_MAP_NULL || (flags & ~(KMA_KOBJECT | KMA_LOMEM | KMA_NOPAGEWAIT)))
return KERN_INVALID_ARGUMENT;
if (size == 0) {
*addrp = 0;
return KERN_INVALID_ARGUMENT;
}
map_size = vm_map_round_page(size);
map_mask = (vm_map_offset_t)mask;
if ((flags & KMA_KOBJECT) != 0) {
object = kernel_object;
vm_object_reference(object);
} else {
object = vm_object_allocate(map_size);
}
kr = vm_map_find_space(map, &map_addr, map_size, map_mask, 0, &entry);
if (KERN_SUCCESS != kr) {
vm_object_deallocate(object);
return kr;
}
entry->object.vm_object = object;
entry->offset = offset = (object == kernel_object) ?
map_addr : 0;
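	/* Take an extra object ref in case the map entry gets deleted */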
vm_object_reference(object);
vm_map_unlock(map);
kr = cpm_allocate(CAST_DOWN(vm_size_t, map_size), &pages, max_pnum, pnum_mask, FALSE, flags);
if (kr != KERN_SUCCESS) {
vm_map_remove(map, vm_map_trunc_page(map_addr),
vm_map_round_page(map_addr + map_size), 0);
vm_object_deallocate(object);
*addrp = 0;
return kr;
}
vm_object_lock(object);
for (i = 0; i < map_size; i += PAGE_SIZE) {
m = pages;
pages = NEXT_PAGE(m);
*(NEXT_PAGE_PTR(m)) = VM_PAGE_NULL;
m->busy = FALSE;
vm_page_insert(m, object, offset + i);
}
vm_object_unlock(object);
if ((kr = vm_map_wire(map, vm_map_trunc_page(map_addr),
vm_map_round_page(map_addr + map_size), VM_PROT_DEFAULT, FALSE))
!= KERN_SUCCESS) {
if (object == kernel_object) {
vm_object_lock(object);
vm_object_page_remove(object, offset, offset + map_size);
vm_object_unlock(object);
}
vm_map_remove(map, vm_map_trunc_page(map_addr),
vm_map_round_page(map_addr + map_size), 0);
vm_object_deallocate(object);
return kr;
}
vm_object_deallocate(object);
if (object == kernel_object)
vm_map_simplify(map, map_addr);
*addrp = (vm_offset_t) map_addr;
assert((vm_map_offset_t) *addrp == map_addr);
return KERN_SUCCESS;
}
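/*
 *	Master entry point for allocating kernel memory.
 *	NOTE: this routine is _never_ interrupt safe.
 *
 *	map		: map to allocate into
 *	addrp		: pointer to start address of new memory
 *	size		: size of memory requested
 *	flags		: options
 *			  KMA_NOPAGEWAIT	don't wait for pages if unavailable
 *			  KMA_KOBJECT		use kernel_object
 *			  KMA_LOMEM		support for 32 bit devices in a 64 bit world
 *						if set and a lomemory pool is available
 *						grab pages from it... this also implies
 *						KMA_NOPAGEWAIT
 *			  KMA_GUARD_FIRST	place a guard page before the allocation
 *			  KMA_GUARD_LAST	place a guard page after the allocation
 *			  KMA_PERMANENT		mark the map entry permanent
 *			  KMA_NOENCRYPT		zero the pages and mark them not swap-encrypted
 */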
kern_return_t
kernel_memory_allocate(
register vm_map_t map,
register vm_offset_t *addrp,
register vm_size_t size,
register vm_offset_t mask,
int flags)
{
vm_object_t object;
vm_object_offset_t offset;
vm_object_offset_t pg_offset;
vm_map_entry_t entry;
vm_map_offset_t map_addr, fill_start;
vm_map_offset_t map_mask;
vm_map_size_t map_size, fill_size;
kern_return_t kr;
vm_page_t mem;
vm_page_t guard_page_list = NULL;
vm_page_t wired_page_list = NULL;
int guard_page_count = 0;
int wired_page_count = 0;
int i;
int vm_alloc_flags;
if (! vm_kernel_ready) {
panic("kernel_memory_allocate: VM is not ready");
}
if (size == 0) {
*addrp = 0;
return KERN_INVALID_ARGUMENT;
}
map_size = vm_map_round_page(size);
map_mask = (vm_map_offset_t) mask;
vm_alloc_flags = 0;
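	/*
	 * limit the size of a single extent of wired memory
	 * to try and limit the damage to the system if
	 * too many pages get wired down
	 */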
if (map_size > (1 << 30)) {
return KERN_RESOURCE_SHORTAGE;
}
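	/*
	 * Guard pages:
	 *
	 * Guard pages are implemented as fictitious pages.  By placing guard pages
	 * on either end of a stack, they can help detect cases where a thread walks
	 * off either end of its stack.  They are allocated and set up here and
	 * attempts to access those pages are trapped in vm_fault_page().
	 *
	 * The map_size we were passed may include extra space for
	 * guard pages.  If those were requested, then back it out of fill_size
	 * since vm_map_find_space() takes just the actual size not including
	 * guard pages.  Similarly, fill_start indicates where the actual pages
	 * will begin in the range.
	 */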
fill_start = 0;
fill_size = map_size;
if (flags & KMA_GUARD_FIRST) {
vm_alloc_flags |= VM_FLAGS_GUARD_BEFORE;
fill_start += PAGE_SIZE_64;
fill_size -= PAGE_SIZE_64;
if (map_size < fill_start + fill_size) {
*addrp = 0;
return KERN_INVALID_ARGUMENT;
}
guard_page_count++;
}
if (flags & KMA_GUARD_LAST) {
vm_alloc_flags |= VM_FLAGS_GUARD_AFTER;
fill_size -= PAGE_SIZE_64;
if (map_size <= fill_start + fill_size) {
*addrp = 0;
return KERN_INVALID_ARGUMENT;
}
guard_page_count++;
}
wired_page_count = (int) (fill_size / PAGE_SIZE_64);
assert(wired_page_count * PAGE_SIZE_64 == fill_size);
for (i = 0; i < guard_page_count; i++) {
for (;;) {
mem = vm_page_grab_guard();
if (mem != VM_PAGE_NULL)
break;
if (flags & KMA_NOPAGEWAIT) {
kr = KERN_RESOURCE_SHORTAGE;
goto out;
}
vm_page_more_fictitious();
}
mem->pageq.next = (queue_entry_t)guard_page_list;
guard_page_list = mem;
}
for (i = 0; i < wired_page_count; i++) {
uint64_t unavailable;
for (;;) {
if (flags & KMA_LOMEM)
mem = vm_page_grablo();
else
mem = vm_page_grab();
if (mem != VM_PAGE_NULL)
break;
if (flags & KMA_NOPAGEWAIT) {
kr = KERN_RESOURCE_SHORTAGE;
goto out;
}
if ((flags & KMA_LOMEM) && (vm_lopage_needed == TRUE)) {
kr = KERN_RESOURCE_SHORTAGE;
goto out;
}
unavailable = (vm_page_wire_count + vm_page_free_target) * PAGE_SIZE;
if (unavailable > max_mem || map_size > (max_mem - unavailable)) {
kr = KERN_RESOURCE_SHORTAGE;
goto out;
}
VM_PAGE_WAIT();
}
mem->pageq.next = (queue_entry_t)wired_page_list;
wired_page_list = mem;
}
if ((flags & KMA_KOBJECT) != 0) {
object = kernel_object;
vm_object_reference(object);
} else {
object = vm_object_allocate(map_size);
}
kr = vm_map_find_space(map, &map_addr,
fill_size, map_mask,
vm_alloc_flags, &entry);
if (KERN_SUCCESS != kr) {
vm_object_deallocate(object);
goto out;
}
entry->object.vm_object = object;
entry->offset = offset = (object == kernel_object) ?
map_addr : 0;
entry->wired_count++;
if (flags & KMA_PERMANENT)
entry->permanent = TRUE;
if (object != kernel_object)
vm_object_reference(object);
vm_object_lock(object);
vm_map_unlock(map);
pg_offset = 0;
if (fill_start) {
if (guard_page_list == NULL)
panic("kernel_memory_allocate: guard_page_list == NULL");
mem = guard_page_list;
guard_page_list = (vm_page_t)mem->pageq.next;
mem->pageq.next = NULL;
vm_page_insert(mem, object, offset + pg_offset);
mem->busy = FALSE;
pg_offset += PAGE_SIZE_64;
}
for (pg_offset = fill_start; pg_offset < fill_start + fill_size; pg_offset += PAGE_SIZE_64) {
if (wired_page_list == NULL)
panic("kernel_memory_allocate: wired_page_list == NULL");
mem = wired_page_list;
wired_page_list = (vm_page_t)mem->pageq.next;
mem->pageq.next = NULL;
mem->wire_count++;
vm_page_insert(mem, object, offset + pg_offset);
mem->busy = FALSE;
mem->pmapped = TRUE;
mem->wpmapped = TRUE;
PMAP_ENTER(kernel_pmap, map_addr + pg_offset, mem,
VM_PROT_READ | VM_PROT_WRITE, 0, TRUE);
if (flags & KMA_NOENCRYPT) {
bzero(CAST_DOWN(void *, (map_addr + pg_offset)), PAGE_SIZE);
pmap_set_noencrypt(mem->phys_page);
}
}
if ((fill_start + fill_size) < map_size) {
if (guard_page_list == NULL)
panic("kernel_memory_allocate: guard_page_list == NULL");
mem = guard_page_list;
guard_page_list = (vm_page_t)mem->pageq.next;
mem->pageq.next = NULL;
vm_page_insert(mem, object, offset + pg_offset);
mem->busy = FALSE;
}
if (guard_page_list || wired_page_list)
panic("kernel_memory_allocate: non empty list\n");
vm_page_lockspin_queues();
vm_page_wire_count += wired_page_count;
vm_page_unlock_queues();
vm_object_unlock(object);
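	/*
	 * now that the pages are wired, we no longer have to fear coalesce
	 */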
if (object == kernel_object)
vm_map_simplify(map, map_addr);
else
vm_object_deallocate(object);
*addrp = CAST_DOWN(vm_offset_t, map_addr);
return KERN_SUCCESS;
out:
if (guard_page_list)
vm_page_free_list(guard_page_list, FALSE);
if (wired_page_list)
vm_page_free_list(wired_page_list, FALSE);
return kr;
}
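/*
 *	kmem_alloc:
 *
 *	Allocate wired-down memory in the kernel's address map
 *	or a submap.  The memory is not zero-filled.
 */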
kern_return_t
kmem_alloc(
vm_map_t map,
vm_offset_t *addrp,
vm_size_t size)
{
kern_return_t kr = kernel_memory_allocate(map, addrp, size, 0, 0);
TRACE_MACHLEAKS(KMEM_ALLOC_CODE, KMEM_ALLOC_CODE_2, size, *addrp);
return kr;
}
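/*
 *	kmem_realloc:
 *
 *	Reallocate wired-down memory in the kernel's address map
 *	or a submap.  Newly allocated pages are not zeroed.
 *	This can only be used on regions allocated with kmem_alloc.
 *
 *	If successful, the pages in the old region are mapped twice.
 *	The old region is unchanged.  Use kmem_free to get rid of it.
 */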
kern_return_t
kmem_realloc(
vm_map_t map,
vm_offset_t oldaddr,
vm_size_t oldsize,
vm_offset_t *newaddrp,
vm_size_t newsize)
{
vm_object_t object;
vm_object_offset_t offset;
vm_map_offset_t oldmapmin;
vm_map_offset_t oldmapmax;
vm_map_offset_t newmapaddr;
vm_map_size_t oldmapsize;
vm_map_size_t newmapsize;
vm_map_entry_t oldentry;
vm_map_entry_t newentry;
vm_page_t mem;
kern_return_t kr;
oldmapmin = vm_map_trunc_page(oldaddr);
oldmapmax = vm_map_round_page(oldaddr + oldsize);
oldmapsize = oldmapmax - oldmapmin;
newmapsize = vm_map_round_page(newsize);
vm_map_lock(map);
if (!vm_map_lookup_entry(map, oldmapmin, &oldentry))
panic("kmem_realloc");
object = oldentry->object.vm_object;
vm_object_reference(object);
vm_object_lock(object);
vm_map_unlock(map);
if (object->vo_size != oldmapsize)
panic("kmem_realloc");
object->vo_size = newmapsize;
vm_object_unlock(object);
kmem_alloc_pages(object, vm_object_round_page(oldmapsize),
vm_object_round_page(newmapsize-oldmapsize));
kr = vm_map_find_space(map, &newmapaddr, newmapsize,
(vm_map_offset_t) 0, 0, &newentry);
if (kr != KERN_SUCCESS) {
vm_object_lock(object);
		for (offset = oldmapsize; offset < newmapsize; offset += PAGE_SIZE) {
if ((mem = vm_page_lookup(object, offset)) != VM_PAGE_NULL) {
VM_PAGE_FREE(mem);
}
}
object->vo_size = oldmapsize;
vm_object_unlock(object);
vm_object_deallocate(object);
return kr;
}
newentry->object.vm_object = object;
newentry->offset = 0;
assert (newentry->wired_count == 0);
vm_object_reference(object);
vm_map_unlock(map);
kr = vm_map_wire(map, newmapaddr, newmapaddr + newmapsize, VM_PROT_DEFAULT, FALSE);
if (KERN_SUCCESS != kr) {
vm_map_remove(map, newmapaddr, newmapaddr + newmapsize, 0);
vm_object_lock(object);
		/* start at the page-aligned old size so the lookups hit the pages just added */
		for (offset = oldmapsize; offset < newmapsize; offset += PAGE_SIZE) {
if ((mem = vm_page_lookup(object, offset)) != VM_PAGE_NULL) {
VM_PAGE_FREE(mem);
}
}
object->vo_size = oldmapsize;
vm_object_unlock(object);
vm_object_deallocate(object);
return (kr);
}
vm_object_deallocate(object);
*newaddrp = CAST_DOWN(vm_offset_t, newmapaddr);
return KERN_SUCCESS;
}
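/*
 *	kmem_alloc_kobject:
 *
 *	Allocate wired-down memory in the kernel's address map
 *	or a submap.  The memory is not zero-filled.
 *
 *	The memory is allocated in the kernel_object.
 *	It may not be copied with vm_map_copy, and
 *	it may not be reallocated with kmem_realloc.
 */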
kern_return_t
kmem_alloc_kobject(
vm_map_t map,
vm_offset_t *addrp,
vm_size_t size)
{
return kernel_memory_allocate(map, addrp, size, 0, KMA_KOBJECT);
}
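/*
 *	kmem_alloc_aligned:
 *
 *	Like kmem_alloc_kobject, except that the memory is aligned.
 *	The size should be a power-of-2.
 */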
kern_return_t
kmem_alloc_aligned(
vm_map_t map,
vm_offset_t *addrp,
vm_size_t size)
{
if ((size & (size - 1)) != 0)
panic("kmem_alloc_aligned: size not aligned");
return kernel_memory_allocate(map, addrp, size, size - 1, KMA_KOBJECT);
}
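/*
 *	kmem_alloc_pageable:
 *
 *	Allocate pageable memory in the kernel's address map.
 */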
kern_return_t
kmem_alloc_pageable(
vm_map_t map,
vm_offset_t *addrp,
vm_size_t size)
{
vm_map_offset_t map_addr;
vm_map_size_t map_size;
kern_return_t kr;
#ifndef normal
map_addr = (vm_map_min(map)) + 0x1000;
#else
map_addr = vm_map_min(map);
#endif
map_size = vm_map_round_page(size);
kr = vm_map_enter(map, &map_addr, map_size,
(vm_map_offset_t) 0, VM_FLAGS_ANYWHERE,
VM_OBJECT_NULL, (vm_object_offset_t) 0, FALSE,
VM_PROT_DEFAULT, VM_PROT_ALL, VM_INHERIT_DEFAULT);
if (kr != KERN_SUCCESS)
return kr;
*addrp = CAST_DOWN(vm_offset_t, map_addr);
return KERN_SUCCESS;
}
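/*
 *	kmem_free:
 *
 *	Release a region of kernel virtual memory allocated
 *	with kmem_alloc, kmem_alloc_kobject, or kmem_alloc_pageable,
 *	and return the physical pages associated with that region.
 */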
void
kmem_free(
vm_map_t map,
vm_offset_t addr,
vm_size_t size)
{
kern_return_t kr;
assert(addr >= VM_MIN_KERNEL_AND_KEXT_ADDRESS);
TRACE_MACHLEAKS(KMEM_FREE_CODE, KMEM_FREE_CODE_2, size, addr);
if(size == 0) {
#if MACH_ASSERT
printf("kmem_free called with size==0 for map: %p with addr: 0x%llx\n",map,(uint64_t)addr);
#endif
return;
}
kr = vm_map_remove(map, vm_map_trunc_page(addr),
vm_map_round_page(addr + size),
VM_MAP_REMOVE_KUNWIRE);
if (kr != KERN_SUCCESS)
panic("kmem_free");
}
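/*
 *	Allocate new pages in an object.
 */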
kern_return_t
kmem_alloc_pages(
register vm_object_t object,
register vm_object_offset_t offset,
register vm_object_size_t size)
{
vm_object_size_t alloc_size;
alloc_size = vm_object_round_page(size);
vm_object_lock(object);
while (alloc_size) {
register vm_page_t mem;
while (VM_PAGE_NULL ==
(mem = vm_page_alloc(object, offset))) {
vm_object_unlock(object);
VM_PAGE_WAIT();
vm_object_lock(object);
}
mem->busy = FALSE;
alloc_size -= PAGE_SIZE;
offset += PAGE_SIZE;
}
vm_object_unlock(object);
return KERN_SUCCESS;
}
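/*
 *	Remap wired pages in an object into a new region.
 *	The object is assumed to be mapped into the kernel map or
 *	a submap.
 */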
void
kmem_remap_pages(
register vm_object_t object,
register vm_object_offset_t offset,
register vm_offset_t start,
register vm_offset_t end,
vm_prot_t protection)
{
vm_map_offset_t map_start;
vm_map_offset_t map_end;
map_start = vm_map_trunc_page(start);
map_end = vm_map_round_page(end);
pmap_pageable(kernel_pmap, map_start, map_end, FALSE);
while (map_start < map_end) {
register vm_page_t mem;
vm_object_lock(object);
if ((mem = vm_page_lookup(object, offset)) == VM_PAGE_NULL)
panic("kmem_remap_pages");
vm_page_lockspin_queues();
vm_page_wire(mem);
vm_page_unlock_queues();
vm_object_unlock(object);
ASSERT_PAGE_DECRYPTED(mem);
mem->pmapped = TRUE;
mem->wpmapped = TRUE;
PMAP_ENTER(kernel_pmap, map_start, mem, protection, 0, TRUE);
map_start += PAGE_SIZE;
offset += PAGE_SIZE;
}
}
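/*
 *	kmem_suballoc:
 *
 *	Allocates a map to manage a subrange
 *	of the kernel virtual address space.
 *
 *	Arguments are as follows:
 *
 *	parent		Map to take range from
 *	addr		Address of start of range (IN/OUT)
 *	size		Size of range to find
 *	pageable	Can region be paged
 *	flags		VM flags (e.g. VM_FLAGS_ANYWHERE)
 *	new_map		Pointer to new submap
 */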
kern_return_t
kmem_suballoc(
vm_map_t parent,
vm_offset_t *addr,
vm_size_t size,
boolean_t pageable,
int flags,
vm_map_t *new_map)
{
vm_map_t map;
vm_map_offset_t map_addr;
vm_map_size_t map_size;
kern_return_t kr;
map_size = vm_map_round_page(size);
vm_object_reference(vm_submap_object);
map_addr = (flags & VM_FLAGS_ANYWHERE) ?
vm_map_min(parent) : vm_map_trunc_page(*addr);
kr = vm_map_enter(parent, &map_addr, map_size,
(vm_map_offset_t) 0, flags,
vm_submap_object, (vm_object_offset_t) 0, FALSE,
VM_PROT_DEFAULT, VM_PROT_ALL, VM_INHERIT_DEFAULT);
if (kr != KERN_SUCCESS) {
vm_object_deallocate(vm_submap_object);
return (kr);
}
pmap_reference(vm_map_pmap(parent));
map = vm_map_create(vm_map_pmap(parent), map_addr, map_addr + map_size, pageable);
if (map == VM_MAP_NULL)
panic("kmem_suballoc: vm_map_create failed");
kr = vm_map_submap(parent, map_addr, map_addr + map_size, map, map_addr, FALSE);
if (kr != KERN_SUCCESS) {
vm_map_remove(parent, map_addr, map_addr + map_size, VM_MAP_NO_FLAGS);
vm_map_deallocate(map);
vm_object_deallocate(vm_submap_object);
return (kr);
}
*addr = CAST_DOWN(vm_offset_t, map_addr);
*new_map = map;
return (KERN_SUCCESS);
}
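/*
 *	kmem_init:
 *
 *	Initialize the kernel's virtual memory map, taking
 *	into account all memory allocated up to this time.
 */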
void
kmem_init(
vm_offset_t start,
vm_offset_t end)
{
vm_map_offset_t map_start;
vm_map_offset_t map_end;
map_start = vm_map_trunc_page(start);
map_end = vm_map_round_page(end);
	kernel_map = vm_map_create(pmap_kernel(), VM_MIN_KERNEL_AND_KEXT_ADDRESS,
map_end, FALSE);
if (start != VM_MIN_KERNEL_AND_KEXT_ADDRESS) {
vm_map_offset_t map_addr;
kern_return_t kr;
map_addr = VM_MIN_KERNEL_AND_KEXT_ADDRESS;
kr = vm_map_enter(kernel_map,
&map_addr,
(vm_map_size_t)(map_start - VM_MIN_KERNEL_AND_KEXT_ADDRESS),
(vm_map_offset_t) 0,
VM_FLAGS_FIXED | VM_FLAGS_NO_PMAP_CHECK,
VM_OBJECT_NULL,
(vm_object_offset_t) 0, FALSE,
VM_PROT_NONE, VM_PROT_NONE,
VM_INHERIT_DEFAULT);
if (kr != KERN_SUCCESS) {
panic("kmem_init(0x%llx,0x%llx): vm_map_enter(0x%llx,0x%llx) error 0x%x\n",
(uint64_t) start, (uint64_t) end,
(uint64_t) VM_MIN_KERNEL_AND_KEXT_ADDRESS,
(uint64_t) (map_start - VM_MIN_KERNEL_AND_KEXT_ADDRESS),
kr);
}
}
vm_global_no_user_wire_amount = MIN(max_mem*20/100,
VM_NOT_USER_WIREABLE);
vm_global_user_wire_limit = max_mem - vm_global_no_user_wire_amount;
vm_user_wire_limit = vm_global_user_wire_limit;
}
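/*
 *	Routine:	copyinmap
 *	Purpose:
 *		Like copyin, except that fromaddr is an address
 *		in the specified VM map.  This implies that the
 *		pmap is not the current one.
 *	Returns:
 *		KERN_SUCCESS, KERN_INVALID_ADDRESS
 */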
kern_return_t
copyinmap(
vm_map_t map,
vm_map_offset_t fromaddr,
void *todata,
vm_size_t length)
{
kern_return_t kr = KERN_SUCCESS;
vm_map_t oldmap;
if (vm_map_pmap(map) == pmap_kernel())
{
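		/* assume a correct copy */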
memcpy(todata, CAST_DOWN(void *, fromaddr), length);
}
else if (current_map() == map)
{
if (copyin(fromaddr, todata, length) != 0)
kr = KERN_INVALID_ADDRESS;
}
else
{
vm_map_reference(map);
oldmap = vm_map_switch(map);
if (copyin(fromaddr, todata, length) != 0)
kr = KERN_INVALID_ADDRESS;
vm_map_switch(oldmap);
vm_map_deallocate(map);
}
return kr;
}
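/*
 *	Routine:	copyoutmap
 *	Purpose:
 *		Like copyout, except that toaddr is an address
 *		in the specified VM map.  This implies that the
 *		pmap is not the current one.
 */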
kern_return_t
copyoutmap(
vm_map_t map,
void *fromdata,
vm_map_address_t toaddr,
vm_size_t length)
{
if (vm_map_pmap(map) == pmap_kernel()) {
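		/* assume a correct copyout */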
memcpy(CAST_DOWN(void *, toaddr), fromdata, length);
return KERN_SUCCESS;
}
if (current_map() != map)
return KERN_NOT_SUPPORTED;
if (copyout(fromdata, toaddr, length) != 0)
return KERN_INVALID_ADDRESS;
return KERN_SUCCESS;
}
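/*
 *	Routine:	vm_conflict_check
 *	Purpose:
 *		Check whether the given range of the map already maps the
 *		file identified by (pager, file_off).  Returns KERN_SUCCESS
 *		if the range does not map that file at all,
 *		KERN_ALREADY_WAITING if it maps exactly the same pages of
 *		the file, and KERN_FAILURE on a partial or misaligned
 *		overlap.
 */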
kern_return_t
vm_conflict_check(
vm_map_t map,
vm_map_offset_t off,
vm_map_size_t len,
memory_object_t pager,
vm_object_offset_t file_off)
{
vm_map_entry_t entry;
vm_object_t obj;
vm_object_offset_t obj_off;
vm_map_t base_map;
vm_map_offset_t base_offset;
vm_map_offset_t original_offset;
kern_return_t kr;
vm_map_size_t local_len;
base_map = map;
base_offset = off;
original_offset = off;
kr = KERN_SUCCESS;
vm_map_lock(map);
while(vm_map_lookup_entry(map, off, &entry)) {
local_len = len;
if (entry->object.vm_object == VM_OBJECT_NULL) {
vm_map_unlock(map);
return KERN_SUCCESS;
}
if (entry->is_sub_map) {
vm_map_t old_map;
old_map = map;
vm_map_lock(entry->object.sub_map);
map = entry->object.sub_map;
off = entry->offset + (off - entry->vme_start);
vm_map_unlock(old_map);
continue;
}
obj = entry->object.vm_object;
obj_off = (off - entry->vme_start) + entry->offset;
while(obj->shadow) {
obj_off += obj->vo_shadow_offset;
obj = obj->shadow;
}
if((obj->pager_created) && (obj->pager == pager)) {
if(((obj->paging_offset) + obj_off) == file_off) {
if(off != base_offset) {
vm_map_unlock(map);
return KERN_FAILURE;
}
kr = KERN_ALREADY_WAITING;
} else {
vm_object_offset_t obj_off_aligned;
vm_object_offset_t file_off_aligned;
obj_off_aligned = obj_off & ~PAGE_MASK;
file_off_aligned = file_off & ~PAGE_MASK;
if (file_off_aligned == (obj->paging_offset + obj_off_aligned)) {
vm_map_unlock(map);
return KERN_FAILURE;
}
if ((file_off < (obj->paging_offset + obj_off_aligned)) &&
((file_off + len) > (obj->paging_offset + obj_off_aligned))) {
vm_map_unlock(map);
return KERN_FAILURE;
}
if ((file_off_aligned > (obj->paging_offset + obj_off)) &&
(file_off_aligned < (obj->paging_offset + obj_off) + len)) {
vm_map_unlock(map);
return KERN_FAILURE;
}
}
} else if(kr != KERN_SUCCESS) {
vm_map_unlock(map);
return KERN_FAILURE;
}
if(len <= ((entry->vme_end - entry->vme_start) -
(off - entry->vme_start))) {
vm_map_unlock(map);
return kr;
} else {
len -= (entry->vme_end - entry->vme_start) -
(off - entry->vme_start);
}
base_offset = base_offset + (local_len - len);
file_off = file_off + (local_len - len);
off = base_offset;
if(map != base_map) {
vm_map_unlock(map);
vm_map_lock(base_map);
map = base_map;
}
}
vm_map_unlock(map);
return kr;
}