/* vm_shared_region.c */
#include <debug.h>
#include <kern/ipc_tt.h>
#include <kern/kalloc.h>
#include <kern/thread_call.h>
#include <mach/mach_vm.h>
#include <vm/vm_map.h>
#include <vm/vm_shared_region.h>
#include <vm/vm_protos.h>
#include <machine/commpage.h>
#include <machine/cpu_capabilities.h>
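/*
 * A shared region is a pre-configured submap shared by all tasks running
 * against the same environment (same root directory, CPU type and 32/64-bit
 * address space).  Regions are kept on "vm_shared_region_queue", protected by
 * the global lock below, reference-counted, and torn down
 * "shared_region_destroy_delay" seconds after their last reference is
 * released (unless "shared_region_persistence" keeps the system's default
 * region alive).
 */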
int shared_region_version = 3;
int shared_region_trace_level = SHARED_REGION_TRACE_ERROR_LVL;
int shared_region_persistence = 0;
int shared_region_destroy_delay = 120;
boolean_t shared_region_completed_slide = FALSE;
lck_grp_t *vm_shared_region_lck_grp;
lck_mtx_t vm_shared_region_lock;
#define vm_shared_region_lock() lck_mtx_lock(&vm_shared_region_lock)
#define vm_shared_region_unlock() lck_mtx_unlock(&vm_shared_region_lock)
#define vm_shared_region_sleep(event, interruptible) \
lck_mtx_sleep(&vm_shared_region_lock, \
LCK_SLEEP_DEFAULT, \
(event_t) (event), \
(interruptible))
queue_head_t vm_shared_region_queue;
static void vm_shared_region_reference_locked(vm_shared_region_t shared_region);
static vm_shared_region_t vm_shared_region_create(
void *root_dir,
cpu_type_t cputype,
boolean_t is_64bit);
static void vm_shared_region_destroy(vm_shared_region_t shared_region);
static void vm_shared_region_timeout(thread_call_param_t param0,
thread_call_param_t param1);
static int __commpage_setup = 0;
#if defined(__i386__) || defined(__x86_64__)
static int __system_power_source = 1;
static void post_sys_powersource_internal(int i, int internal);
#endif
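/*
 * Initialize the module: allocate the lock group, set up the global lock and
 * the queue of shared regions.  Expected to be called once during VM
 * subsystem initialization.
 */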
void
vm_shared_region_init(void)
{
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> init\n"));
vm_shared_region_lck_grp = lck_grp_alloc_init("vm shared region",
LCK_GRP_ATTR_NULL);
lck_mtx_init(&vm_shared_region_lock,
vm_shared_region_lck_grp,
LCK_ATTR_NULL);
queue_init(&vm_shared_region_queue);
SHARED_REGION_TRACE_DEBUG(
("shared_region: <- init\n"));
}
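/*
 * Return the shared region the given task is using, taking an extra
 * reference on it for the caller, or NULL if the task has none.  The caller
 * must release that reference via vm_shared_region_deallocate().
 */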
vm_shared_region_t
vm_shared_region_get(
task_t task)
{
vm_shared_region_t shared_region;
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> get(%p)\n",
task));
task_lock(task);
vm_shared_region_lock();
shared_region = task->shared_region;
if (shared_region) {
assert(shared_region->sr_ref_count > 0);
vm_shared_region_reference_locked(shared_region);
}
vm_shared_region_unlock();
task_unlock(task);
SHARED_REGION_TRACE_DEBUG(
("shared_region: get(%p) <- %p\n",
task, shared_region));
return shared_region;
}
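/*
 * The following accessors return fields that are set when the shared region
 * is created and never modified afterwards, so no locking is needed; the
 * caller must hold an extra reference on the shared region to keep it from
 * being destroyed.
 */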
mach_vm_offset_t
vm_shared_region_base_address(
vm_shared_region_t shared_region)
{
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> base_address(%p)\n",
shared_region));
assert(shared_region->sr_ref_count > 1);
SHARED_REGION_TRACE_DEBUG(
("shared_region: base_address(%p) <- 0x%llx\n",
shared_region, (long long)shared_region->sr_base_address));
return shared_region->sr_base_address;
}
mach_vm_size_t
vm_shared_region_size(
vm_shared_region_t shared_region)
{
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> size(%p)\n",
shared_region));
assert(shared_region->sr_ref_count > 1);
SHARED_REGION_TRACE_DEBUG(
("shared_region: size(%p) <- 0x%llx\n",
shared_region, (long long)shared_region->sr_size));
return shared_region->sr_size;
}
ipc_port_t
vm_shared_region_mem_entry(
vm_shared_region_t shared_region)
{
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> mem_entry(%p)\n",
shared_region));
assert(shared_region->sr_ref_count > 1);
SHARED_REGION_TRACE_DEBUG(
("shared_region: mem_entry(%p) <- %p\n",
shared_region, shared_region->sr_mem_entry));
return shared_region->sr_mem_entry;
}
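/*
 * Install the given shared region on the given task.  The caller's reference
 * on the new region is transferred to the task, and the reference held on
 * the task's previous region, if any, is released.
 */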
void
vm_shared_region_set(
task_t task,
vm_shared_region_t new_shared_region)
{
vm_shared_region_t old_shared_region;
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> set(%p, %p)\n",
task, new_shared_region));
task_lock(task);
vm_shared_region_lock();
old_shared_region = task->shared_region;
if (new_shared_region) {
assert(new_shared_region->sr_ref_count > 0);
}
task->shared_region = new_shared_region;
vm_shared_region_unlock();
task_unlock(task);
if (old_shared_region) {
assert(old_shared_region->sr_ref_count > 0);
vm_shared_region_deallocate(old_shared_region);
}
SHARED_REGION_TRACE_DEBUG(
("shared_region: set(%p) <- old=%p new=%p\n",
task, old_shared_region, new_shared_region));
}
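/*
 * Find the shared region matching the given environment, creating a new one
 * if none exists yet.  The global lock has to be dropped while creating, so
 * two threads can race; the loser's freshly created region is destroyed at
 * "done".  The region is returned with an extra reference for the caller.
 */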
vm_shared_region_t
vm_shared_region_lookup(
void *root_dir,
cpu_type_t cputype,
boolean_t is_64bit)
{
vm_shared_region_t shared_region;
vm_shared_region_t new_shared_region;
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> lookup(root=%p,cpu=%d,64bit=%d)\n",
root_dir, cputype, is_64bit));
shared_region = NULL;
new_shared_region = NULL;
vm_shared_region_lock();
for (;;) {
queue_iterate(&vm_shared_region_queue,
shared_region,
vm_shared_region_t,
sr_q) {
assert(shared_region->sr_ref_count > 0);
if (shared_region->sr_cpu_type == cputype &&
shared_region->sr_root_dir == root_dir &&
shared_region->sr_64bit == is_64bit) {
vm_shared_region_reference_locked(shared_region);
goto done;
}
}
if (new_shared_region == NULL) {
vm_shared_region_unlock();
new_shared_region = vm_shared_region_create(root_dir,
cputype,
is_64bit);
vm_shared_region_lock();
continue;
}
shared_region = new_shared_region;
new_shared_region = NULL;
queue_enter(&vm_shared_region_queue,
shared_region,
vm_shared_region_t,
sr_q);
break;
}
done:
vm_shared_region_unlock();
if (new_shared_region) {
assert(new_shared_region->sr_ref_count == 1);
new_shared_region->sr_ref_count--;
vm_shared_region_destroy(new_shared_region);
new_shared_region = NULL;
}
SHARED_REGION_TRACE_DEBUG(
("shared_region: lookup(root=%p,cpu=%d,64bit=%d) <- %p\n",
root_dir, cputype, is_64bit, shared_region));
assert(shared_region->sr_ref_count > 0);
return shared_region;
}
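/*
 * Take an extra reference on a shared region.  Called with the global lock
 * held.  If a destruction timer was armed, try to cancel it; on success,
 * drop the reference the timer was holding.
 */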
static void
vm_shared_region_reference_locked(
vm_shared_region_t shared_region)
{
#if DEBUG
lck_mtx_assert(&vm_shared_region_lock, LCK_MTX_ASSERT_OWNED);
#endif
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> reference_locked(%p)\n",
shared_region));
assert(shared_region->sr_ref_count > 0);
shared_region->sr_ref_count++;
if (shared_region->sr_timer_call != NULL) {
boolean_t cancelled;
cancelled = thread_call_cancel(shared_region->sr_timer_call);
if (cancelled) {
thread_call_free(shared_region->sr_timer_call);
shared_region->sr_timer_call = NULL;
shared_region->sr_ref_count--;
} else {
	/*
	 * The timer is already firing: vm_shared_region_timeout() will
	 * drop the timer's reference itself, so leave the reference
	 * count alone.
	 */
}
}
SHARED_REGION_TRACE_DEBUG(
("shared_region: reference_locked(%p) <- %d\n",
shared_region, shared_region->sr_ref_count));
}
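/*
 * Release a reference on a shared region.  When the last reference goes
 * away, arm a timer that holds its own reference and destroys the region
 * "shared_region_destroy_delay" seconds later; if that timer has already
 * fired, remove the region from the queue and destroy it now.  The
 * "shared_region_persistence" tunable can pin regions for the system's
 * default environment (NULL root directory).
 */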
void
vm_shared_region_deallocate(
vm_shared_region_t shared_region)
{
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> deallocate(%p)\n",
shared_region));
vm_shared_region_lock();
assert(shared_region->sr_ref_count > 0);
if (shared_region->sr_root_dir == NULL) {
if (shared_region_persistence &&
!shared_region->sr_persists) {
shared_region->sr_ref_count++;
shared_region->sr_persists = TRUE;
} else if (!shared_region_persistence &&
shared_region->sr_persists) {
assert(shared_region->sr_ref_count > 1);
shared_region->sr_ref_count--;
shared_region->sr_persists = FALSE;
}
}
assert(shared_region->sr_ref_count > 0);
shared_region->sr_ref_count--;
SHARED_REGION_TRACE_DEBUG(
("shared_region: deallocate(%p): ref now %d\n",
shared_region, shared_region->sr_ref_count));
if (shared_region->sr_ref_count == 0) {
uint64_t deadline;
if (shared_region->sr_timer_call == NULL) {
assert(! shared_region->sr_mapping_in_progress);
shared_region->sr_ref_count++;
shared_region->sr_timer_call = thread_call_allocate(
(thread_call_func_t) vm_shared_region_timeout,
(thread_call_param_t) shared_region);
clock_interval_to_deadline(shared_region_destroy_delay,
1000 * 1000 * 1000,
&deadline);
thread_call_enter_delayed(shared_region->sr_timer_call,
deadline);
SHARED_REGION_TRACE_DEBUG(
("shared_region: deallocate(%p): armed timer\n",
shared_region));
vm_shared_region_unlock();
} else {
queue_remove(&vm_shared_region_queue,
shared_region,
vm_shared_region_t,
sr_q);
vm_shared_region_unlock();
vm_shared_region_destroy(shared_region);
shared_region = NULL;
}
} else {
vm_shared_region_unlock();
}
SHARED_REGION_TRACE_DEBUG(
("shared_region: deallocate(%p) <-\n",
shared_region));
}
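/*
 * Destruction timer callback: release the reference held by the timer,
 * which triggers the actual tear-down of the shared region.
 */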
void
vm_shared_region_timeout(
thread_call_param_t param0,
__unused thread_call_param_t param1)
{
vm_shared_region_t shared_region;
shared_region = (vm_shared_region_t) param0;
vm_shared_region_deallocate(shared_region);
}
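/*
 * Create a new shared region for the given environment: select the
 * platform-specific base address, size and pmap-nesting range, then back the
 * region with a named memory entry wrapping a freshly created submap.  The
 * new region starts with one reference, for the caller.
 */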
static vm_shared_region_t
vm_shared_region_create(
void *root_dir,
cpu_type_t cputype,
boolean_t is_64bit)
{
kern_return_t kr;
vm_named_entry_t mem_entry;
ipc_port_t mem_entry_port;
vm_shared_region_t shared_region;
vm_map_t sub_map;
mach_vm_offset_t base_address, pmap_nesting_start;
mach_vm_size_t size, pmap_nesting_size;
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> create(root=%p,cpu=%d,64bit=%d)\n",
root_dir, cputype, is_64bit));
base_address = 0;
size = 0;
mem_entry = NULL;
mem_entry_port = IPC_PORT_NULL;
sub_map = VM_MAP_NULL;
shared_region = kalloc(sizeof (*shared_region));
if (shared_region == NULL) {
SHARED_REGION_TRACE_ERROR(
("shared_region: create: couldn't allocate\n"));
goto done;
}
if (is_64bit) {
switch (cputype) {
case CPU_TYPE_I386:
base_address = SHARED_REGION_BASE_X86_64;
size = SHARED_REGION_SIZE_X86_64;
pmap_nesting_start = SHARED_REGION_NESTING_BASE_X86_64;
pmap_nesting_size = SHARED_REGION_NESTING_SIZE_X86_64;
break;
case CPU_TYPE_POWERPC:
base_address = SHARED_REGION_BASE_PPC64;
size = SHARED_REGION_SIZE_PPC64;
pmap_nesting_start = SHARED_REGION_NESTING_BASE_PPC64;
pmap_nesting_size = SHARED_REGION_NESTING_SIZE_PPC64;
break;
default:
SHARED_REGION_TRACE_ERROR(
("shared_region: create: unknown cpu type %d\n",
cputype));
kfree(shared_region, sizeof (*shared_region));
shared_region = NULL;
goto done;
}
} else {
switch (cputype) {
case CPU_TYPE_I386:
base_address = SHARED_REGION_BASE_I386;
size = SHARED_REGION_SIZE_I386;
pmap_nesting_start = SHARED_REGION_NESTING_BASE_I386;
pmap_nesting_size = SHARED_REGION_NESTING_SIZE_I386;
break;
case CPU_TYPE_POWERPC:
base_address = SHARED_REGION_BASE_PPC;
size = SHARED_REGION_SIZE_PPC;
pmap_nesting_start = SHARED_REGION_NESTING_BASE_PPC;
pmap_nesting_size = SHARED_REGION_NESTING_SIZE_PPC;
break;
#ifdef CPU_TYPE_ARM
case CPU_TYPE_ARM:
base_address = SHARED_REGION_BASE_ARM;
size = SHARED_REGION_SIZE_ARM;
pmap_nesting_start = SHARED_REGION_NESTING_BASE_ARM;
pmap_nesting_size = SHARED_REGION_NESTING_SIZE_ARM;
break;
#endif
default:
SHARED_REGION_TRACE_ERROR(
("shared_region: create: unknown cpu type %d\n",
cputype));
kfree(shared_region, sizeof (*shared_region));
shared_region = NULL;
goto done;
}
}
kr = mach_memory_entry_allocate(&mem_entry,
&mem_entry_port);
if (kr != KERN_SUCCESS) {
kfree(shared_region, sizeof (*shared_region));
shared_region = NULL;
SHARED_REGION_TRACE_ERROR(
("shared_region: create: "
"couldn't allocate mem_entry\n"));
goto done;
}
sub_map = vm_map_create(pmap_create(NULL, 0, is_64bit),
0, size,
TRUE);
if (sub_map == VM_MAP_NULL) {
ipc_port_release_send(mem_entry_port);
kfree(shared_region, sizeof (*shared_region));
shared_region = NULL;
SHARED_REGION_TRACE_ERROR(
("shared_region: create: "
"couldn't allocate map\n"));
goto done;
}
mem_entry->is_sub_map = TRUE;
mem_entry->backing.map = sub_map;
mem_entry->size = size;
mem_entry->protection = VM_PROT_ALL;
shared_region->sr_mem_entry = mem_entry_port;
shared_region->sr_base_address = base_address;
shared_region->sr_size = size;
shared_region->sr_pmap_nesting_start = pmap_nesting_start;
shared_region->sr_pmap_nesting_size = pmap_nesting_size;
shared_region->sr_cpu_type = cputype;
shared_region->sr_64bit = is_64bit;
shared_region->sr_root_dir = root_dir;
queue_init(&shared_region->sr_q);
shared_region->sr_mapping_in_progress = FALSE;
shared_region->sr_persists = FALSE;
shared_region->sr_timer_call = NULL;
shared_region->sr_first_mapping = (mach_vm_offset_t) -1;
shared_region->sr_ref_count = 1;
done:
if (shared_region) {
SHARED_REGION_TRACE_INFO(
("shared_region: create(root=%p,cpu=%d,64bit=%d,"
"base=0x%llx,size=0x%llx) <- "
"%p mem=(%p,%p) map=%p pmap=%p\n",
root_dir, cputype, is_64bit, (long long)base_address,
(long long)size, shared_region,
mem_entry_port, mem_entry, sub_map, sub_map->pmap));
} else {
SHARED_REGION_TRACE_INFO(
("shared_region: create(root=%p,cpu=%d,64bit=%d,"
"base=0x%llx,size=0x%llx) <- NULL",
root_dir, cputype, is_64bit, (long long)base_address,
(long long)size));
}
return shared_region;
}
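/*
 * Destroy a shared region whose reference count has reached zero: remove its
 * pmap mappings, release the named entry (and with it the submap), free any
 * leftover destruction timer, and reset the global slide info if it belonged
 * to this region.
 */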
static void
vm_shared_region_destroy(
vm_shared_region_t shared_region)
{
vm_named_entry_t mem_entry;
vm_map_t map;
SHARED_REGION_TRACE_INFO(
("shared_region: -> destroy(%p) (root=%p,cpu=%d,64bit=%d)\n",
shared_region,
shared_region->sr_root_dir,
shared_region->sr_cpu_type,
shared_region->sr_64bit));
assert(shared_region->sr_ref_count == 0);
assert(!shared_region->sr_persists);
mem_entry = (vm_named_entry_t) shared_region->sr_mem_entry->ip_kobject;
assert(mem_entry->is_sub_map);
assert(!mem_entry->internal);
assert(!mem_entry->is_pager);
map = mem_entry->backing.map;
if (map->pmap) {
pmap_remove(map->pmap,
shared_region->sr_base_address,
(shared_region->sr_base_address +
shared_region->sr_size));
}
mach_memory_entry_port_release(shared_region->sr_mem_entry);
mem_entry = NULL;
shared_region->sr_mem_entry = IPC_PORT_NULL;
if (shared_region->sr_timer_call) {
thread_call_free(shared_region->sr_timer_call);
}
if ((slide_info.slide_info_entry != NULL) && (slide_info.sr == shared_region)) {
kmem_free(kernel_map,
(vm_offset_t) slide_info.slide_info_entry,
(vm_size_t) slide_info.slide_info_size);
vm_object_deallocate(slide_info.slide_object);
slide_info.slide_object = NULL;
slide_info.start = 0;
slide_info.end = 0;
slide_info.slide = 0;
slide_info.sr = NULL;
slide_info.slide_info_entry = NULL;
slide_info.slide_info_size = 0;
shared_region_completed_slide = FALSE;
}
kfree(shared_region, sizeof (*shared_region));
SHARED_REGION_TRACE_DEBUG(
("shared_region: destroy(%p) <-\n",
shared_region));
shared_region = NULL;
}
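/*
 * Return the address of the first mapping established in the shared region
 * (base address plus first-mapping offset), waiting for any mapping
 * operation in progress to complete first.  Returns KERN_INVALID_ADDRESS if
 * nothing has been mapped yet.
 */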
kern_return_t
vm_shared_region_start_address(
vm_shared_region_t shared_region,
mach_vm_offset_t *start_address)
{
kern_return_t kr;
mach_vm_offset_t sr_base_address;
mach_vm_offset_t sr_first_mapping;
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> start_address(%p)\n",
shared_region));
assert(shared_region->sr_ref_count > 1);
vm_shared_region_lock();
while (shared_region->sr_mapping_in_progress) {
assert(shared_region->sr_ref_count > 1);
vm_shared_region_sleep(&shared_region->sr_mapping_in_progress,
THREAD_UNINT);
}
assert(! shared_region->sr_mapping_in_progress);
assert(shared_region->sr_ref_count > 1);
sr_base_address = shared_region->sr_base_address;
sr_first_mapping = shared_region->sr_first_mapping;
if (sr_first_mapping == (mach_vm_offset_t) -1) {
kr = KERN_INVALID_ADDRESS;
} else {
kr = KERN_SUCCESS;
*start_address = sr_base_address + sr_first_mapping;
}
vm_shared_region_unlock();
SHARED_REGION_TRACE_DEBUG(
("shared_region: start_address(%p) <- 0x%llx\n",
shared_region, (long long)shared_region->sr_base_address));
return kr;
}
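/*
 * Deallocate the first "mappings_count" entries of the given mappings array
 * from the shared region, typically to back out after a partial failure in
 * vm_shared_region_map_file().  If no map is supplied, the current task's
 * shared region is used, following the "sr_mapping_in_progress" protocol.
 */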
void
vm_shared_region_undo_mappings(
vm_map_t sr_map,
mach_vm_offset_t sr_base_address,
struct shared_file_mapping_np *mappings,
unsigned int mappings_count)
{
unsigned int j = 0;
vm_shared_region_t shared_region = NULL;
boolean_t reset_shared_region_state = FALSE;
shared_region = vm_shared_region_get(current_task());
if (shared_region == NULL) {
printf("Failed to undo mappings because of NULL shared region.\n");
return;
}
if (sr_map == NULL) {
ipc_port_t sr_handle;
vm_named_entry_t sr_mem_entry;
vm_shared_region_lock();
assert(shared_region->sr_ref_count > 1);
while (shared_region->sr_mapping_in_progress) {
vm_shared_region_sleep(&shared_region->sr_mapping_in_progress,
THREAD_UNINT);
}
assert(! shared_region->sr_mapping_in_progress);
assert(shared_region->sr_ref_count > 1);
shared_region->sr_mapping_in_progress = TRUE;
vm_shared_region_unlock();
reset_shared_region_state = TRUE;
sr_handle = shared_region->sr_mem_entry;
sr_mem_entry = (vm_named_entry_t) sr_handle->ip_kobject;
sr_map = sr_mem_entry->backing.map;
sr_base_address = shared_region->sr_base_address;
}
for (j = 0; j < mappings_count; j++) {
kern_return_t kr2;
if (mappings[j].sfm_size == 0) {
continue;
}
SHARED_REGION_TRACE_INFO(
("shared_region: mapping[%d]: "
"address:0x%016llx "
"size:0x%016llx "
"offset:0x%016llx "
"maxprot:0x%x prot:0x%x: "
"undoing...\n",
j,
(long long)mappings[j].sfm_address,
(long long)mappings[j].sfm_size,
(long long)mappings[j].sfm_file_offset,
mappings[j].sfm_max_prot,
mappings[j].sfm_init_prot));
kr2 = mach_vm_deallocate(
sr_map,
(mappings[j].sfm_address -
sr_base_address),
mappings[j].sfm_size);
assert(kr2 == KERN_SUCCESS);
}
shared_region->sr_first_mapping = (mach_vm_offset_t) -1;
if (reset_shared_region_state) {
vm_shared_region_lock();
assert(shared_region->sr_ref_count > 1);
assert(shared_region->sr_mapping_in_progress);
shared_region->sr_mapping_in_progress = FALSE;
thread_wakeup((event_t) &shared_region->sr_mapping_in_progress);
vm_shared_region_unlock();
reset_shared_region_state = FALSE;
}
vm_shared_region_deallocate(shared_region);
}
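/*
 * Establish the requested mappings of the given file in the shared region,
 * serialized against other mappers via "sr_mapping_in_progress".  Zero-fill
 * mappings (VM_PROT_ZF) are backed by fresh anonymous objects; the others
 * map the file's pager.  At most one mapping may be tagged VM_PROT_SLIDE; it
 * is reported through "mapping_to_slide".  Mappings that are already present
 * are skipped; any other failure backs out the mappings made so far.
 */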
kern_return_t
vm_shared_region_map_file(
vm_shared_region_t shared_region,
unsigned int mappings_count,
struct shared_file_mapping_np *mappings,
memory_object_control_t file_control,
memory_object_size_t file_size,
void *root_dir,
struct shared_file_mapping_np *mapping_to_slide)
{
kern_return_t kr;
vm_object_t file_object;
ipc_port_t sr_handle;
vm_named_entry_t sr_mem_entry;
vm_map_t sr_map;
mach_vm_offset_t sr_base_address;
unsigned int i;
mach_port_t map_port;
vm_map_offset_t target_address;
vm_object_t object;
vm_object_size_t obj_size;
boolean_t found_mapping_to_slide = FALSE;
kr = KERN_SUCCESS;
vm_shared_region_lock();
assert(shared_region->sr_ref_count > 1);
if (shared_region->sr_root_dir != root_dir) {
vm_shared_region_unlock();
kr = KERN_PROTECTION_FAILURE;
goto done;
}
while (shared_region->sr_mapping_in_progress) {
vm_shared_region_sleep(&shared_region->sr_mapping_in_progress,
THREAD_UNINT);
}
assert(! shared_region->sr_mapping_in_progress);
assert(shared_region->sr_ref_count > 1);
shared_region->sr_mapping_in_progress = TRUE;
vm_shared_region_unlock();
sr_handle = shared_region->sr_mem_entry;
sr_mem_entry = (vm_named_entry_t) sr_handle->ip_kobject;
sr_map = sr_mem_entry->backing.map;
sr_base_address = shared_region->sr_base_address;
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> map(%p,%d,%p,%p,0x%llx)\n",
shared_region, mappings_count, mappings,
file_control, file_size));
file_object = memory_object_control_to_vm_object(file_control);
for (i = 0; i < mappings_count; i++) {
SHARED_REGION_TRACE_INFO(
("shared_region: mapping[%d]: "
"address:0x%016llx size:0x%016llx offset:0x%016llx "
"maxprot:0x%x prot:0x%x\n",
i,
(long long)mappings[i].sfm_address,
(long long)mappings[i].sfm_size,
(long long)mappings[i].sfm_file_offset,
mappings[i].sfm_max_prot,
mappings[i].sfm_init_prot));
if (mappings[i].sfm_init_prot & VM_PROT_ZF) {
map_port = MACH_PORT_NULL;
} else {
map_port = (ipc_port_t) file_object->pager;
}
if (mappings[i].sfm_init_prot & VM_PROT_SLIDE) {
if (found_mapping_to_slide == TRUE) {
SHARED_REGION_TRACE_INFO(
("shared_region: mapping[%d]: "
"address:0x%016llx size:0x%016llx "
"offset:0x%016llx "
"maxprot:0x%x prot:0x%x "
"will not be slid as only one such mapping is allowed...\n",
i,
(long long)mappings[i].sfm_address,
(long long)mappings[i].sfm_size,
(long long)mappings[i].sfm_file_offset,
mappings[i].sfm_max_prot,
mappings[i].sfm_init_prot));
} else {
if (mapping_to_slide != NULL) {
mapping_to_slide->sfm_file_offset = mappings[i].sfm_file_offset;
mapping_to_slide->sfm_size = mappings[i].sfm_size;
found_mapping_to_slide = TRUE;
}
}
}
target_address =
mappings[i].sfm_address - sr_base_address;
if (map_port == MACH_PORT_NULL) {
obj_size = vm_map_round_page(mappings[i].sfm_size);
object = vm_object_allocate(obj_size);
if (object == VM_OBJECT_NULL) {
kr = KERN_RESOURCE_SHORTAGE;
} else {
kr = vm_map_enter(
sr_map,
&target_address,
vm_map_round_page(mappings[i].sfm_size),
0,
VM_FLAGS_FIXED | VM_FLAGS_ALREADY,
object,
0,
TRUE,
mappings[i].sfm_init_prot & VM_PROT_ALL,
mappings[i].sfm_max_prot & VM_PROT_ALL,
VM_INHERIT_DEFAULT);
}
} else {
object = VM_OBJECT_NULL;
kr = vm_map_enter_mem_object(
sr_map,
&target_address,
vm_map_round_page(mappings[i].sfm_size),
0,
VM_FLAGS_FIXED | VM_FLAGS_ALREADY,
map_port,
mappings[i].sfm_file_offset,
TRUE,
mappings[i].sfm_init_prot & VM_PROT_ALL,
mappings[i].sfm_max_prot & VM_PROT_ALL,
VM_INHERIT_DEFAULT);
}
if (kr != KERN_SUCCESS) {
if (map_port == MACH_PORT_NULL) {
vm_object_deallocate(object);
object = VM_OBJECT_NULL;
}
if (kr == KERN_MEMORY_PRESENT) {
SHARED_REGION_TRACE_INFO(
("shared_region: mapping[%d]: "
"address:0x%016llx size:0x%016llx "
"offset:0x%016llx "
"maxprot:0x%x prot:0x%x "
"already mapped...\n",
i,
(long long)mappings[i].sfm_address,
(long long)mappings[i].sfm_size,
(long long)mappings[i].sfm_file_offset,
mappings[i].sfm_max_prot,
mappings[i].sfm_init_prot));
mappings[i].sfm_size = 0;
kr = KERN_SUCCESS;
} else {
SHARED_REGION_TRACE_ERROR(
("shared_region: mapping[%d]: "
"address:0x%016llx size:0x%016llx "
"offset:0x%016llx "
"maxprot:0x%x prot:0x%x failed 0x%x\n",
i,
(long long)mappings[i].sfm_address,
(long long)mappings[i].sfm_size,
(long long)mappings[i].sfm_file_offset,
mappings[i].sfm_max_prot,
mappings[i].sfm_init_prot,
kr));
vm_shared_region_undo_mappings(sr_map, sr_base_address, mappings, i);
break;
}
}
if (shared_region->sr_first_mapping == (mach_vm_offset_t) -1) {
shared_region->sr_first_mapping = target_address;
}
}
vm_shared_region_lock();
assert(shared_region->sr_ref_count > 1);
assert(shared_region->sr_mapping_in_progress);
shared_region->sr_mapping_in_progress = FALSE;
thread_wakeup((event_t) &shared_region->sr_mapping_in_progress);
vm_shared_region_unlock();
done:
SHARED_REGION_TRACE_DEBUG(
("shared_region: map(%p,%d,%p,%p,0x%llx) <- 0x%x \n",
shared_region, mappings_count, mappings,
file_control, file_size, kr));
return kr;
}
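/*
 * Map the task's shared region into the given address map, in up to three
 * pieces: the range before the pmap-nested area (if any), the nested area
 * itself in chunks of at most "pmap_nesting_size_max", and the remainder
 * after it.
 */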
kern_return_t
vm_shared_region_enter(
struct _vm_map *map,
struct task *task,
void *fsroot,
cpu_type_t cpu)
{
kern_return_t kr;
vm_shared_region_t shared_region;
vm_map_offset_t sr_address, sr_offset, target_address;
vm_map_size_t sr_size, mapping_size;
vm_map_offset_t sr_pmap_nesting_start;
vm_map_size_t sr_pmap_nesting_size;
ipc_port_t sr_handle;
boolean_t is_64bit;
is_64bit = task_has_64BitAddr(task);
SHARED_REGION_TRACE_DEBUG(
("shared_region: -> "
"enter(map=%p,task=%p,root=%p,cpu=%d,64bit=%d)\n",
map, task, fsroot, cpu, is_64bit));
shared_region = vm_shared_region_lookup(fsroot, cpu, is_64bit);
if (shared_region == NULL) {
SHARED_REGION_TRACE_ERROR(
("shared_region: -> "
"enter(map=%p,task=%p,root=%p,cpu=%d,64bit=%d): "
"lookup failed !\n",
map, task, fsroot, cpu, is_64bit));
return KERN_FAILURE;
}
vm_shared_region_set(task, shared_region);
kr = KERN_SUCCESS;
sr_address = shared_region->sr_base_address;
sr_size = shared_region->sr_size;
sr_handle = shared_region->sr_mem_entry;
sr_pmap_nesting_start = shared_region->sr_pmap_nesting_start;
sr_pmap_nesting_size = shared_region->sr_pmap_nesting_size;
sr_offset = 0;
if (sr_pmap_nesting_start > sr_address) {
target_address = sr_address;
mapping_size = sr_pmap_nesting_start - sr_address;
kr = vm_map_enter_mem_object(
map,
&target_address,
mapping_size,
0,
VM_FLAGS_FIXED,
sr_handle,
sr_offset,
TRUE,
VM_PROT_READ,
VM_PROT_ALL,
VM_INHERIT_SHARE);
if (kr != KERN_SUCCESS) {
SHARED_REGION_TRACE_ERROR(
("shared_region: enter(%p,%p,%p,%d,%d): "
"vm_map_enter(0x%llx,0x%llx,%p) error 0x%x\n",
map, task, fsroot, cpu, is_64bit,
(long long)target_address,
(long long)mapping_size, sr_handle, kr));
goto done;
}
SHARED_REGION_TRACE_DEBUG(
("shared_region: enter(%p,%p,%p,%d,%d): "
"vm_map_enter(0x%llx,0x%llx,%p) error 0x%x\n",
map, task, fsroot, cpu, is_64bit,
(long long)target_address, (long long)mapping_size,
sr_handle, kr));
sr_offset += mapping_size;
sr_size -= mapping_size;
}
for (;
sr_pmap_nesting_size > 0;
sr_offset += mapping_size,
sr_size -= mapping_size,
sr_pmap_nesting_size -= mapping_size) {
target_address = sr_address + sr_offset;
mapping_size = sr_pmap_nesting_size;
if (mapping_size > pmap_nesting_size_max) {
mapping_size = (vm_map_offset_t) pmap_nesting_size_max;
}
kr = vm_map_enter_mem_object(
map,
&target_address,
mapping_size,
0,
(VM_FLAGS_FIXED | VM_MAKE_TAG(VM_MEMORY_SHARED_PMAP)),
sr_handle,
sr_offset,
TRUE,
VM_PROT_READ,
VM_PROT_ALL,
VM_INHERIT_SHARE);
if (kr != KERN_SUCCESS) {
SHARED_REGION_TRACE_ERROR(
("shared_region: enter(%p,%p,%p,%d,%d): "
"vm_map_enter(0x%llx,0x%llx,%p) error 0x%x\n",
map, task, fsroot, cpu, is_64bit,
(long long)target_address,
(long long)mapping_size, sr_handle, kr));
goto done;
}
SHARED_REGION_TRACE_DEBUG(
("shared_region: enter(%p,%p,%p,%d,%d): "
"nested vm_map_enter(0x%llx,0x%llx,%p) error 0x%x\n",
map, task, fsroot, cpu, is_64bit,
(long long)target_address, (long long)mapping_size,
sr_handle, kr));
}
if (sr_size > 0) {
target_address = sr_address + sr_offset;
mapping_size = sr_size;
kr = vm_map_enter_mem_object(
map,
&target_address,
mapping_size,
0,
VM_FLAGS_FIXED,
sr_handle,
sr_offset,
TRUE,
VM_PROT_READ,
VM_PROT_ALL,
VM_INHERIT_SHARE);
if (kr != KERN_SUCCESS) {
SHARED_REGION_TRACE_ERROR(
("shared_region: enter(%p,%p,%p,%d,%d): "
"vm_map_enter(0x%llx,0x%llx,%p) error 0x%x\n",
map, task, fsroot, cpu, is_64bit,
(long long)target_address,
(long long)mapping_size, sr_handle, kr));
goto done;
}
SHARED_REGION_TRACE_DEBUG(
("shared_region: enter(%p,%p,%p,%d,%d): "
"vm_map_enter(0x%llx,0x%llx,%p) error 0x%x\n",
map, task, fsroot, cpu, is_64bit,
(long long)target_address, (long long)mapping_size,
sr_handle, kr));
sr_offset += mapping_size;
sr_size -= mapping_size;
}
assert(sr_size == 0);
done:
SHARED_REGION_TRACE_DEBUG(
("shared_region: enter(%p,%p,%p,%d,%d) <- 0x%x\n",
map, task, fsroot, cpu, is_64bit, kr));
return kr;
}
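/*
 * Shared region sliding (address-space randomization of the shared cache).
 * Only one region can be slid at a time; its parameters are kept in the
 * global "slide_info", and the slide info blob provided from user space is
 * capped at a sane size.
 */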
#define SANE_SLIDE_INFO_SIZE (1024*1024)
struct vm_shared_region_slide_info slide_info;
kern_return_t
vm_shared_region_sliding_valid(uint32_t slide)
{
kern_return_t kr = KERN_SUCCESS;
	if ((shared_region_completed_slide == TRUE) && slide) {
		if (slide != slide_info.slide) {
			printf("Only one shared region can be slid\n");
			kr = KERN_FAILURE;
		} else {
			/*
			 * Same slide as the one already applied: nothing to
			 * do.  Callers turn KERN_INVALID_ARGUMENT back into
			 * KERN_SUCCESS.
			 */
			kr = KERN_INVALID_ARGUMENT;
		}
	}
return kr;
}
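/*
 * Validate a slide request and record the sliding parameters: locate the VM
 * object backing the range to be slid (either via the supplied file control
 * port or by walking the current map down to the bottom of the shadow
 * chain), then allocate kernel memory to hold the slide info blob.
 */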
kern_return_t
vm_shared_region_slide_init(
mach_vm_size_t slide_info_size,
mach_vm_offset_t start,
mach_vm_size_t size,
uint32_t slide,
memory_object_control_t sr_file_control)
{
kern_return_t kr = KERN_SUCCESS;
vm_object_t object = VM_OBJECT_NULL;
vm_object_offset_t offset = 0;
vm_map_t map = NULL, cur_map = NULL;
boolean_t is_map_locked = FALSE;
if ((kr = vm_shared_region_sliding_valid(slide)) != KERN_SUCCESS) {
if (kr == KERN_INVALID_ARGUMENT) {
kr = KERN_SUCCESS;
}
return kr;
}
if (slide_info_size > SANE_SLIDE_INFO_SIZE) {
printf("Slide_info_size too large: %lx\n", (uintptr_t)slide_info_size);
kr = KERN_FAILURE;
return kr;
}
if (sr_file_control != MEMORY_OBJECT_CONTROL_NULL) {
object = memory_object_control_to_vm_object(sr_file_control);
vm_object_reference(object);
offset = start;
vm_object_lock_shared(object);
} else {
vm_map_entry_t entry = VM_MAP_ENTRY_NULL;
map = current_map();
vm_map_lock_read(map);
is_map_locked = TRUE;
Retry:
cur_map = map;
	if (!vm_map_lookup_entry(map, start, &entry)) {
		/*
		 * No mapping at that address: nothing to slide.  Bail out
		 * here rather than falling through and dereferencing a
		 * NULL object below.
		 */
		vm_map_unlock_read(map);
		return KERN_INVALID_ARGUMENT;
	} else {
vm_object_t shadow_obj = VM_OBJECT_NULL;
if (entry->is_sub_map == TRUE) {
map = entry->object.sub_map;
start -= entry->vme_start;
start += entry->offset;
vm_map_lock_read(map);
vm_map_unlock_read(cur_map);
goto Retry;
} else {
object = entry->object.vm_object;
offset = (start - entry->vme_start) + entry->offset;
}
vm_object_lock_shared(object);
while (object->shadow != VM_OBJECT_NULL) {
shadow_obj = object->shadow;
vm_object_lock_shared(shadow_obj);
vm_object_unlock(object);
object = shadow_obj;
}
}
}
if (object->internal == TRUE) {
kr = KERN_INVALID_ADDRESS;
} else {
kr = kmem_alloc(kernel_map,
(vm_offset_t *) &slide_info.slide_info_entry,
(vm_size_t) slide_info_size);
if (kr == KERN_SUCCESS) {
slide_info.slide_info_size = slide_info_size;
slide_info.slide_object = object;
slide_info.start = offset;
slide_info.end = slide_info.start + size;
slide_info.slide = slide;
slide_info.sr = vm_shared_region_get(current_task());
shared_region_completed_slide = TRUE;
} else {
kr = KERN_FAILURE;
}
}
vm_object_unlock(object);
if (is_map_locked == TRUE) {
vm_map_unlock_read(map);
}
return kr;
}
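/*
 * Accessors for the global slide info structure and its kernel-allocated
 * slide info blob.
 */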
void *
vm_shared_region_get_slide_info(void)
{
	return (void *) &slide_info;
}
void *
vm_shared_region_get_slide_info_entry(void)
{
	return (void *) slide_info.slide_info_entry;
}
kern_return_t
vm_shared_region_slide_sanity_check(void)
{
uint32_t pageIndex = 0;
uint16_t entryIndex = 0;
uint16_t *toc = NULL;
vm_shared_region_slide_info_entry_t s_info;
kern_return_t kr;
s_info = vm_shared_region_get_slide_info_entry();
toc = (uint16_t*)((uintptr_t)s_info + s_info->toc_offset);
kr = mach_vm_protect(kernel_map,
	(mach_vm_offset_t)(vm_offset_t) slide_info.slide_info_entry,
	(mach_vm_size_t) slide_info.slide_info_size,
	TRUE, VM_PROT_READ);
if (kr != KERN_SUCCESS) {
panic("vm_shared_region_slide_sanity_check: vm_protect() error 0x%x\n", kr);
}
for (; pageIndex < s_info->toc_count; pageIndex++) {
entryIndex = (uint16_t)(toc[pageIndex]);
if (entryIndex >= s_info->entry_count) {
printf("No sliding bitmap entry for pageIndex: %d at entryIndex: %d amongst %d entries\n", pageIndex, entryIndex, s_info->entry_count);
goto fail;
}
}
return KERN_SUCCESS;
fail:
if (slide_info.slide_info_entry != NULL) {
kmem_free(kernel_map,
(vm_offset_t) slide_info.slide_info_entry,
(vm_size_t) slide_info.slide_info_size);
vm_object_deallocate(slide_info.slide_object);
slide_info.slide_object = NULL;
slide_info.start = 0;
slide_info.end = 0;
slide_info.slide = 0;
slide_info.slide_info_entry = NULL;
slide_info.slide_info_size = 0;
shared_region_completed_slide = FALSE;
}
return KERN_FAILURE;
}
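/*
 * Slide one page: for each bit set in the page's sliding bitmap, add the
 * slide amount to the corresponding 32-bit word.  For a 64-bit task, an
 * overflow of the low 32 bits would need a carry into the upper half, which
 * cannot be done here, so it is reported as a failure.
 */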
kern_return_t
vm_shared_region_slide(vm_offset_t vaddr, uint32_t pageIndex)
{
uint16_t *toc = NULL;
slide_info_entry_toc_t bitmap = NULL;
uint32_t i = 0, j = 0;
uint8_t b = 0;
uint32_t slide = slide_info.slide;
int is_64 = task_has_64BitAddr(current_task());
vm_shared_region_slide_info_entry_t s_info = vm_shared_region_get_slide_info_entry();
toc = (uint16_t*)((uintptr_t)s_info + s_info->toc_offset);
if (pageIndex >= s_info->toc_count) {
printf("No slide entry for this page in toc. PageIndex: %d Toc Count: %d\n", pageIndex, s_info->toc_count);
} else {
uint16_t entryIndex = (uint16_t)(toc[pageIndex]);
slide_info_entry_toc_t slide_info_entries = (slide_info_entry_toc_t)((uintptr_t)s_info + s_info->entry_offset);
if (entryIndex >= s_info->entry_count) {
printf("No sliding bitmap entry for entryIndex: %d amongst %d entries\n", entryIndex, s_info->entry_count);
} else {
bitmap = &slide_info_entries[entryIndex];
for (i = 0; i < NUM_SLIDING_BITMAPS_PER_PAGE; ++i) {
	b = bitmap->entry[i];
	if (b != 0) {
		for (j = 0; j < 8; ++j) {
			if (b & (1 << j)) {
				uint32_t *ptr_to_slide;
				uint32_t old_value;
				ptr_to_slide = (uint32_t *)((uintptr_t)(vaddr) + (sizeof(uint32_t) * (i * 8 + j)));
old_value = *ptr_to_slide;
*ptr_to_slide += slide;
if (is_64 && *ptr_to_slide < old_value) {
printf("vm_shared_region_slide() carry over: i=%d j=%d b=0x%x slide=0x%x old=0x%x new=0x%x\n",
i, j, b, slide, old_value, *ptr_to_slide);
return KERN_FAILURE;
}
}
}
}
}
}
}
return KERN_SUCCESS;
}
ipc_port_t commpage32_handle = IPC_PORT_NULL;
ipc_port_t commpage64_handle = IPC_PORT_NULL;
vm_named_entry_t commpage32_entry = NULL;
vm_named_entry_t commpage64_entry = NULL;
vm_map_t commpage32_map = VM_MAP_NULL;
vm_map_t commpage64_map = VM_MAP_NULL;
ipc_port_t commpage_text32_handle = IPC_PORT_NULL;
ipc_port_t commpage_text64_handle = IPC_PORT_NULL;
vm_named_entry_t commpage_text32_entry = NULL;
vm_named_entry_t commpage_text64_entry = NULL;
vm_map_t commpage_text32_map = VM_MAP_NULL;
vm_map_t commpage_text64_map = VM_MAP_NULL;
user32_addr_t commpage_text32_location = (user32_addr_t) _COMM_PAGE32_TEXT_START;
user64_addr_t commpage_text64_location = (user64_addr_t) _COMM_PAGE64_TEXT_START;
#if defined(__i386__) || defined(__x86_64__)
static void
_vm_commpage_init(
ipc_port_t *handlep,
vm_map_size_t size)
{
kern_return_t kr;
vm_named_entry_t mem_entry;
vm_map_t new_map;
SHARED_REGION_TRACE_DEBUG(
("commpage: -> _init(0x%llx)\n",
(long long)size));
kr = mach_memory_entry_allocate(&mem_entry,
handlep);
if (kr != KERN_SUCCESS) {
panic("_vm_commpage_init: could not allocate mem_entry");
}
new_map = vm_map_create(pmap_create(NULL, 0, FALSE), 0, size, TRUE);
if (new_map == VM_MAP_NULL) {
panic("_vm_commpage_init: could not allocate VM map");
}
mem_entry->backing.map = new_map;
mem_entry->internal = TRUE;
mem_entry->is_sub_map = TRUE;
mem_entry->offset = 0;
mem_entry->protection = VM_PROT_ALL;
mem_entry->size = size;
SHARED_REGION_TRACE_DEBUG(
("commpage: _init(0x%llx) <- %p\n",
(long long)size, *handlep));
}
#endif
extern u_int32_t random(void);
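/*
 * Initialize the commpage text areas, sliding each one by a random
 * page-aligned offset within its slide range before populating it.
 */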
void
vm_commpage_text_init(void)
{
SHARED_REGION_TRACE_DEBUG(
("commpage text: ->init()\n"));
#if defined(__i386__) || defined(__x86_64__)
unsigned int offset = (random() % _PFZ32_SLIDE_RANGE) << PAGE_SHIFT;
_vm_commpage_init(&commpage_text32_handle, _COMM_PAGE_TEXT_AREA_LENGTH);
commpage_text32_entry = (vm_named_entry_t) commpage_text32_handle->ip_kobject;
commpage_text32_map = commpage_text32_entry->backing.map;
commpage_text32_location = (user32_addr_t) (_COMM_PAGE32_TEXT_START + offset);
offset = (random() % _PFZ64_SLIDE_RANGE) << PAGE_SHIFT;
_vm_commpage_init(&commpage_text64_handle, _COMM_PAGE_TEXT_AREA_LENGTH);
commpage_text64_entry = (vm_named_entry_t) commpage_text64_handle->ip_kobject;
commpage_text64_map = commpage_text64_entry->backing.map;
commpage_text64_location = (user64_addr_t) (_COMM_PAGE64_TEXT_START + offset);
commpage_text_populate();
#else
#error Unknown architecture.
#endif
SHARED_REGION_TRACE_DEBUG(
("commpage text: init() <-\n"));
}
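/*
 * Initialize and populate the 32-bit and 64-bit commpage areas, then replay
 * any power-source change that was posted before setup completed.
 */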
void
vm_commpage_init(void)
{
SHARED_REGION_TRACE_DEBUG(
("commpage: -> init()\n"));
#if defined(__i386__) || defined(__x86_64__)
_vm_commpage_init(&commpage32_handle, _COMM_PAGE32_AREA_LENGTH);
commpage32_entry = (vm_named_entry_t) commpage32_handle->ip_kobject;
commpage32_map = commpage32_entry->backing.map;
_vm_commpage_init(&commpage64_handle, _COMM_PAGE64_AREA_LENGTH);
commpage64_entry = (vm_named_entry_t) commpage64_handle->ip_kobject;
commpage64_map = commpage64_entry->backing.map;
#endif
commpage_populate();
__commpage_setup = 1;
#if defined(__i386__) || defined(__x86_64__)
if (__system_power_source == 0) {
post_sys_powersource_internal(0, 1);
}
#endif
SHARED_REGION_TRACE_DEBUG(
("commpage: init() <-\n"));
}
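/*
 * Map the commpage (read-only), the commpage text (read/execute) and, for
 * environments that define one, a zero-filled ObjC area into the given
 * task's address map.  VM_FLAGS_BEYOND_MAX allows these mappings to live
 * above the map's normal maximum address.
 */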
kern_return_t
vm_commpage_enter(
vm_map_t map,
task_t task)
{
ipc_port_t commpage_handle, commpage_text_handle;
vm_map_offset_t commpage_address, objc_address, commpage_text_address;
vm_map_size_t commpage_size, objc_size, commpage_text_size;
int vm_flags;
kern_return_t kr;
SHARED_REGION_TRACE_DEBUG(
("commpage: -> enter(%p,%p)\n",
map, task));
commpage_text_size = _COMM_PAGE_TEXT_AREA_LENGTH;
vm_flags = VM_FLAGS_FIXED | VM_FLAGS_BEYOND_MAX;
assert(! (task_has_64BitAddr(task) ^ vm_map_is_64bit(map)));
if (task_has_64BitAddr(task)) {
commpage_handle = commpage64_handle;
commpage_address = (vm_map_offset_t) _COMM_PAGE64_BASE_ADDRESS;
commpage_size = _COMM_PAGE64_AREA_LENGTH;
objc_size = _COMM_PAGE64_OBJC_SIZE;
objc_address = _COMM_PAGE64_OBJC_BASE;
commpage_text_handle = commpage_text64_handle;
commpage_text_address = (vm_map_offset_t) commpage_text64_location;
} else {
commpage_handle = commpage32_handle;
commpage_address =
(vm_map_offset_t)(unsigned) _COMM_PAGE32_BASE_ADDRESS;
commpage_size = _COMM_PAGE32_AREA_LENGTH;
objc_size = _COMM_PAGE32_OBJC_SIZE;
objc_address = _COMM_PAGE32_OBJC_BASE;
commpage_text_handle = commpage_text32_handle;
commpage_text_address = (vm_map_offset_t) commpage_text32_location;
}
if ((commpage_address & (pmap_nesting_size_min - 1)) == 0 &&
(commpage_size & (pmap_nesting_size_min - 1)) == 0) {
vm_flags |= VM_MAKE_TAG(VM_MEMORY_SHARED_PMAP);
}
assert(commpage_handle != IPC_PORT_NULL);
kr = vm_map_enter_mem_object(
map,
&commpage_address,
commpage_size,
0,
vm_flags,
commpage_handle,
0,
FALSE,
VM_PROT_READ,
VM_PROT_READ,
VM_INHERIT_SHARE);
if (kr != KERN_SUCCESS) {
SHARED_REGION_TRACE_ERROR(
("commpage: enter(%p,0x%llx,0x%llx) "
"commpage %p mapping failed 0x%x\n",
map, (long long)commpage_address,
(long long)commpage_size, commpage_handle, kr));
}
assert(commpage_text_handle != IPC_PORT_NULL);
kr = vm_map_enter_mem_object(
map,
&commpage_text_address,
commpage_text_size,
0,
vm_flags,
commpage_text_handle,
0,
FALSE,
VM_PROT_READ|VM_PROT_EXECUTE,
VM_PROT_READ|VM_PROT_EXECUTE,
VM_INHERIT_SHARE);
if (kr != KERN_SUCCESS) {
SHARED_REGION_TRACE_ERROR(
("commpage text: enter(%p,0x%llx,0x%llx) "
"commpage text %p mapping failed 0x%x\n",
map, (long long)commpage_text_address,
(long long)commpage_text_size, commpage_text_handle, kr));
}
if (objc_size != 0) {
kr = vm_map_enter_mem_object(
map,
&objc_address,
objc_size,
0,
VM_FLAGS_FIXED | VM_FLAGS_BEYOND_MAX,
IPC_PORT_NULL,
0,
FALSE,
VM_PROT_ALL,
VM_PROT_ALL,
VM_INHERIT_DEFAULT);
if (kr != KERN_SUCCESS) {
SHARED_REGION_TRACE_ERROR(
("commpage: enter(%p,0x%llx,0x%llx) "
"objc mapping failed 0x%x\n",
map, (long long)objc_address,
(long long)objc_size, kr));
}
}
SHARED_REGION_TRACE_DEBUG(
("commpage: enter(%p,%p) <- 0x%x\n",
map, task, kr));
return kr;
}
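/*
 * Record the system's power source (0 = battery) and adjust the commpage
 * spin count: spinning is disabled on battery power to save energy.
 */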
void
#if defined(__i386__) || defined(__x86_64__)
post_sys_powersource(int i)
#else
post_sys_powersource(__unused int i)
#endif
{
#if defined(__i386__) || defined(__x86_64__)
post_sys_powersource_internal(i, 0);
#endif
}
#if defined(__i386__) || defined(__x86_64__)
static void
post_sys_powersource_internal(int i, int internal)
{
if (internal == 0)
__system_power_source = i;
if (__commpage_setup != 0) {
if (__system_power_source != 0)
	commpage_set_spin_count(MP_SPIN_TRIES);
else
	commpage_set_spin_count(0);
}
}
#endif