toaruos/kernel/mem/mem.c
2018-10-25 23:23:29 +09:00

567 lines
14 KiB
C

/* vim: tabstop=4 shiftwidth=4 noexpandtab
* This file is part of ToaruOS and is released under the terms
* of the NCSA / University of Illinois License - see LICENSE.md
* Copyright (C) 2011-2018 K. Lange
* Copyright (C) 2012 Markus Schober
*
* Kernel Memory Manager
*/
#include <kernel/mem.h>
#include <kernel/system.h>
#include <kernel/process.h>
#include <kernel/logging.h>
#include <kernel/signal.h>
#include <kernel/module.h>
#include <toaru/hashmap.h>
#define KERNEL_HEAP_INIT 0x00800000
#define KERNEL_HEAP_END 0x20000000
extern void *end;
uintptr_t placement_pointer = (uintptr_t)&end;
uintptr_t heap_end = (uintptr_t)NULL;
uintptr_t kernel_heap_alloc_point = KERNEL_HEAP_INIT;
//static volatile uint8_t frame_alloc_lock = 0;
static spin_lock_t frame_alloc_lock = { 0 };
uint32_t first_n_frames(int n);
void
kmalloc_startat(
uintptr_t address
) {
placement_pointer = address;
}
/*
* kmalloc() is the kernel's dumb placement allocator
*/
uintptr_t
kmalloc_real(
size_t size,
int align,
uintptr_t * phys
) {
if (heap_end) {
void * address;
if (align) {
address = valloc(size);
} else {
address = malloc(size);
}
if (phys) {
if (align && size >= 0x3000) {
debug_print(NOTICE, "Requested large aligned alloc of size 0x%x", size);
for (uintptr_t i = (uintptr_t)address; i < (uintptr_t)address + size; i += 0x1000) {
clear_frame(map_to_physical(i));
}
/* XXX This is going to get touchy... */
spin_lock(frame_alloc_lock);
uint32_t index = first_n_frames((size + 0xFFF) / 0x1000);
if (index == 0xFFFFFFFF) {
spin_unlock(frame_alloc_lock);
return 0;
}
for (unsigned int i = 0; i < (size + 0xFFF) / 0x1000; ++i) {
set_frame((index + i) * 0x1000);
page_t * page = get_page((uintptr_t)address + (i * 0x1000),0,kernel_directory);
ASSUME(page != NULL);
page->frame = index + i;
page->writethrough = 1;
page->cachedisable = 1;
}
spin_unlock(frame_alloc_lock);
}
*phys = map_to_physical((uintptr_t)address);
}
return (uintptr_t)address;
}
if (align && (placement_pointer & 0x00000FFF)) {
placement_pointer &= 0xFFFFF000;
placement_pointer += 0x1000;
}
if (phys) {
*phys = placement_pointer;
}
uintptr_t address = placement_pointer;
placement_pointer += size;
return (uintptr_t)address;
}
/*
* Normal
*/
uintptr_t
kmalloc(
size_t size
) {
return kmalloc_real(size, 0, NULL);
}
/*
* Aligned
*/
uintptr_t
kvmalloc(
size_t size
) {
return kmalloc_real(size, 1, NULL);
}
/*
* With a physical address
*/
uintptr_t
kmalloc_p(
size_t size,
uintptr_t *phys
) {
return kmalloc_real(size, 0, phys);
}
/*
* Aligned, with a physical address
*/
uintptr_t
kvmalloc_p(
size_t size,
uintptr_t *phys
) {
return kmalloc_real(size, 1, phys);
}
/*
* Frame Allocation
*/
uint32_t *frames;
uint32_t nframes;
#define INDEX_FROM_BIT(b) (b / 0x20)
#define OFFSET_FROM_BIT(b) (b % 0x20)
void
set_frame(
uintptr_t frame_addr
) {
if (frame_addr < nframes * 4 * 0x400) {
uint32_t frame = frame_addr / 0x1000;
uint32_t index = INDEX_FROM_BIT(frame);
uint32_t offset = OFFSET_FROM_BIT(frame);
frames[index] |= ((uint32_t)0x1 << offset);
}
}
void
clear_frame(
uintptr_t frame_addr
) {
uint32_t frame = frame_addr / 0x1000;
uint32_t index = INDEX_FROM_BIT(frame);
uint32_t offset = OFFSET_FROM_BIT(frame);
frames[index] &= ~((uint32_t)0x1 << offset);
}
uint32_t test_frame(uintptr_t frame_addr) {
uint32_t frame = frame_addr / 0x1000;
uint32_t index = INDEX_FROM_BIT(frame);
uint32_t offset = OFFSET_FROM_BIT(frame);
return (frames[index] & ((uint32_t)0x1 << offset));
}
uint32_t first_n_frames(int n) {
for (uint32_t i = 0; i < nframes * 0x1000; i += 0x1000) {
int bad = 0;
for (int j = 0; j < n; ++j) {
if (test_frame(i + 0x1000 * j)) {
bad = j+1;
}
}
if (!bad) {
return i / 0x1000;
}
}
return 0xFFFFFFFF;
}
uint32_t first_frame(void) {
uint32_t i, j;
for (i = 0; i < INDEX_FROM_BIT(nframes); ++i) {
if (frames[i] != 0xFFFFFFFF) {
for (j = 0; j < 32; ++j) {
uint32_t testFrame = (uint32_t)0x1 << j;
if (!(frames[i] & testFrame)) {
return i * 0x20 + j;
}
}
}
}
debug_print(CRITICAL, "System claims to be out of usable memory, which means we probably overwrote the page frames.\033[0m");
if (debug_video_crash) {
char * msgs[] = {"Out of memory.", NULL};
debug_video_crash(msgs);
}
STOP;
return -1;
}
void
alloc_frame(
page_t *page,
int is_kernel,
int is_writeable
) {
ASSUME(page != NULL);
if (page->frame != 0) {
page->present = 1;
page->rw = (is_writeable == 1) ? 1 : 0;
page->user = (is_kernel == 1) ? 0 : 1;
return;
} else {
spin_lock(frame_alloc_lock);
uint32_t index = first_frame();
assert(index != (uint32_t)-1 && "Out of frames.");
set_frame(index * 0x1000);
page->frame = index;
spin_unlock(frame_alloc_lock);
page->present = 1;
page->rw = (is_writeable == 1) ? 1 : 0;
page->user = (is_kernel == 1) ? 0 : 1;
}
}
void
dma_frame(
page_t *page,
int is_kernel,
int is_writeable,
uintptr_t address
) {
ASSUME(page != NULL);
/* Page this address directly */
page->present = 1;
page->rw = (is_writeable) ? 1 : 0;
page->user = (is_kernel) ? 0 : 1;
page->frame = address / 0x1000;
set_frame(address);
}
void
free_frame(
page_t *page
) {
uint32_t frame;
if (!(frame = page->frame)) {
assert(0);
return;
} else {
clear_frame(frame * 0x1000);
page->frame = 0x0;
}
}
uintptr_t memory_use(void ) {
uintptr_t ret = 0;
uint32_t i, j;
for (i = 0; i < INDEX_FROM_BIT(nframes); ++i) {
for (j = 0; j < 32; ++j) {
uint32_t testFrame = (uint32_t)0x1 << j;
if (frames[i] & testFrame) {
ret++;
}
}
}
return ret * 4;
}
uintptr_t memory_total(){
return nframes * 4;
}
void paging_install(uint32_t memsize) {
nframes = memsize / 4;
frames = (uint32_t *)kmalloc(INDEX_FROM_BIT(nframes * 8));
memset(frames, 0, INDEX_FROM_BIT(nframes * 8));
uintptr_t phys;
kernel_directory = (page_directory_t *)kvmalloc_p(sizeof(page_directory_t),&phys);
memset(kernel_directory, 0, sizeof(page_directory_t));
/* Set PAT 111b to Write-Combining */
asm volatile (
"mov $0x277, %%ecx\n" /* IA32_MSR_PAT */
"rdmsr\n"
"or $0x1000000, %%edx\n" /* set bit 56 */
"and $0xf9ffffff, %%edx\n" /* unset bits 57, 58 */
"wrmsr\n"
: : : "ecx", "edx", "eax"
);
}
void paging_mark_system(uint64_t addr) {
set_frame(addr);
}
void paging_finalize(void) {
debug_print(INFO, "Placement pointer is at 0x%x", placement_pointer);
#if 1
get_page(0,1,kernel_directory)->present = 0;
set_frame(0);
for (uintptr_t i = 0x1000; i < 0x80000; i += 0x1000) {
#else
for (uintptr_t i = 0x0; i < 0x80000; i += 0x1000) {
#endif
dma_frame(get_page(i, 1, kernel_directory), 1, 0, i);
}
for (uintptr_t i = 0x80000; i < 0x100000; i += 0x1000) {
dma_frame(get_page(i, 1, kernel_directory), 1, 0, i);
}
for (uintptr_t i = 0x100000; i < placement_pointer + 0x3000; i += 0x1000) {
dma_frame(get_page(i, 1, kernel_directory), 1, 0, i);
}
debug_print(INFO, "Mapping VGA text-mode directly.");
for (uintptr_t j = 0xb8000; j < 0xc0000; j += 0x1000) {
dma_frame(get_page(j, 0, kernel_directory), 0, 1, j);
}
isrs_install_handler(14, page_fault);
kernel_directory->physical_address = (uintptr_t)kernel_directory->physical_tables;
uintptr_t tmp_heap_start = KERNEL_HEAP_INIT;
if (tmp_heap_start <= placement_pointer + 0x3000) {
debug_print(ERROR, "Foo: 0x%x, 0x%x", tmp_heap_start, placement_pointer + 0x3000);
tmp_heap_start = placement_pointer + 0x100000;
kernel_heap_alloc_point = tmp_heap_start;
}
/* Kernel Heap Space */
for (uintptr_t i = placement_pointer + 0x3000; i < tmp_heap_start; i += 0x1000) {
alloc_frame(get_page(i, 1, kernel_directory), 1, 0);
}
/* And preallocate the page entries for all the rest of the kernel heap as well */
for (uintptr_t i = tmp_heap_start; i < KERNEL_HEAP_END; i += 0x1000) {
get_page(i, 1, kernel_directory);
}
for (unsigned int i = 0xE000; i <= 0xFFF0; i += 0x40) {
get_page(i << 16UL, 1, kernel_directory);
}
debug_print(NOTICE, "Setting directory.");
current_directory = clone_directory(kernel_directory);
switch_page_directory(kernel_directory);
}
uintptr_t map_to_physical(uintptr_t virtual) {
uintptr_t remaining = virtual % 0x1000;
uintptr_t frame = virtual / 0x1000;
uintptr_t table = frame / 1024;
uintptr_t subframe = frame % 1024;
if (current_directory->tables[table]) {
page_t * p = &current_directory->tables[table]->pages[subframe];
return p->frame * 0x1000 + remaining;
} else {
return 0;
}
}
void debug_print_directory(page_directory_t * arg) {
page_directory_t * current_directory = arg;
debug_print(INSANE, " ---- [k:0x%x u:0x%x]", kernel_directory, current_directory);
for (uintptr_t i = 0; i < 1024; ++i) {
if (!current_directory->tables[i] || (uintptr_t)current_directory->tables[i] == (uintptr_t)0xFFFFFFFF) {
continue;
}
if (kernel_directory->tables[i] == current_directory->tables[i]) {
debug_print(INSANE, " 0x%x - kern [0x%x/0x%x] 0x%x", current_directory->tables[i], &current_directory->tables[i], &kernel_directory->tables[i], i * 0x1000 * 1024);
for (uint16_t j = 0; j < 1024; ++j) {
#if 1
page_t * p= &current_directory->tables[i]->pages[j];
if (p->frame) {
debug_print(INSANE, " k 0x%x 0x%x %s", (i * 1024 + j) * 0x1000, p->frame * 0x1000, p->present ? "[present]" : "");
}
#endif
}
} else {
debug_print(INSANE, " 0x%x - user [0x%x] 0x%x [0x%x]", current_directory->tables[i], &current_directory->tables[i], i * 0x1000 * 1024, kernel_directory->tables[i]);
for (uint16_t j = 0; j < 1024; ++j) {
#if 1
page_t * p= &current_directory->tables[i]->pages[j];
if (p->frame) {
debug_print(INSANE, " 0x%x 0x%x %s", (i * 1024 + j) * 0x1000, p->frame * 0x1000, p->present ? "[present]" : "");
}
#endif
}
}
}
debug_print(INFO, " ---- [done]");
}
void
switch_page_directory(
page_directory_t * dir
) {
current_directory = dir;
asm volatile (
"mov %0, %%cr3\n"
"mov %%cr0, %%eax\n"
"orl $0x80000000, %%eax\n"
"mov %%eax, %%cr0\n"
:: "r"(dir->physical_address)
: "%eax");
}
void invalidate_page_tables(void) {
asm volatile (
"movl %%cr3, %%eax\n"
"movl %%eax, %%cr3\n"
::: "%eax");
}
void invalidate_tables_at(uintptr_t addr) {
asm volatile (
"movl %0,%%eax\n"
"invlpg (%%eax)\n"
:: "r"(addr) : "%eax");
}
page_t *
get_page(
uintptr_t address,
int make,
page_directory_t * dir
) {
address /= 0x1000;
uint32_t table_index = address / 1024;
if (dir->tables[table_index]) {
return &dir->tables[table_index]->pages[address % 1024];
} else if(make) {
uint32_t temp;
dir->tables[table_index] = (page_table_t *)kvmalloc_p(sizeof(page_table_t), (uintptr_t *)(&temp));
ASSUME(dir->tables[table_index] != NULL);
memset(dir->tables[table_index], 0, sizeof(page_table_t));
dir->physical_tables[table_index] = temp | 0x7; /* Present, R/w, User */
return &dir->tables[table_index]->pages[address % 1024];
} else {
return 0;
}
}
void
page_fault(
struct regs *r) {
ASSUME(r != NULL);
uint32_t faulting_address;
asm volatile("mov %%cr2, %0" : "=r"(faulting_address));
if (r->eip == SIGNAL_RETURN) {
return_from_signal_handler();
} else if (r->eip == THREAD_RETURN) {
debug_print(INFO, "Returned from thread.");
kexit(0);
}
#if 1
int present = !(r->err_code & 0x1) ? 1 : 0;
int rw = r->err_code & 0x2 ? 1 : 0;
int user = r->err_code & 0x4 ? 1 : 0;
int reserved = r->err_code & 0x8 ? 1 : 0;
int id = r->err_code & 0x10 ? 1 : 0;
debug_print(ERROR, "\033[1;37;41mSegmentation fault. (p:%d,rw:%d,user:%d,res:%d,id:%d) at 0x%x eip: 0x%x pid=%d,%d [%s]\033[0m",
present, rw, user, reserved, id, faulting_address, r->eip, current_process->id, current_process->group, current_process->name);
if (r->eip < heap_end) {
/* find closest symbol */
char * closest = NULL;
size_t distance = 0xFFFFFFFF;
uintptr_t addr = 0;
if (modules_get_symbols()) {
list_t * hash_keys = hashmap_keys(modules_get_symbols());
foreach(_key, hash_keys) {
char * key = (char *)_key->value;
uintptr_t a = (uintptr_t)hashmap_get(modules_get_symbols(), key);
if (!a) continue;
size_t d;
if (a <= r->eip) {
d = r->eip - a;
if (d < distance) {
closest = key;
distance = d;
addr = a;
}
}
}
free(hash_keys);
debug_print(ERROR, "\033[1;31mClosest symbol to faulting address:\033[0m %s [0x%x]", closest, addr);
hash_keys = hashmap_keys(modules_get_list());
foreach(_key, hash_keys) {
char * key = (char *)_key->value;
module_data_t * m = (module_data_t *)hashmap_get(modules_get_list(), key);
if ((r->eip >= (uintptr_t)m->bin_data) && (r->eip < m->end)) {
debug_print(ERROR, "\033[1;31mIn module:\033[0m %s (starts at 0x%x)", m->mod_info->name, m->bin_data);
break;
}
}
free(hash_keys);
debug_print(ERROR, "User EIP: 0x%x", current_process->syscall_registers->eip);
}
} else {
debug_print(ERROR, "\033[1;31m(In userspace)\033[0m");
}
#endif
send_signal(current_process->id, SIGSEGV, 1);
}
/*
* Heap
* Stop using kalloc and friends after installing the heap
* otherwise shit will break. I've conveniently broken
* kalloc when installing the heap, just for those of you
* who feel the need to screw up.
*/
void heap_install(void ) {
heap_end = (placement_pointer + 0x1000) & ~0xFFF;
}
void * sbrk(uintptr_t increment) {
assert((increment % 0x1000 == 0) && "Kernel requested to expand heap by a non-page-multiple value");
assert((heap_end % 0x1000 == 0) && "Kernel heap is not page-aligned!");
assert((heap_end + increment <= KERNEL_HEAP_END - 1) && "The kernel has attempted to allocate beyond the end of its heap.");
uintptr_t address = heap_end;
if (heap_end + increment > kernel_heap_alloc_point) {
debug_print(INFO, "Hit the end of available kernel heap, going to allocate more (at 0x%x, want to be at 0x%x)", heap_end, heap_end + increment);
for (uintptr_t i = heap_end; i < heap_end + increment; i += 0x1000) {
debug_print(INFO, "Allocating frame at 0x%x...", i);
page_t * page = get_page(i, 0, kernel_directory);
assert(page && "Kernel heap allocation fault.");
alloc_frame(page, 1, 0);
}
invalidate_page_tables();
debug_print(INFO, "Done.");
}
heap_end += increment;
memset((void *)address, 0x0, increment);
return (void *)address;
}