Implement paging subsystem with identity mapping and kernel heap (AI)

- Created two-level x86 paging (page directory + page tables) with 4 KiB pages.
- Identity maps all detected physical memory in two phases:
  1) Static: first 16 MiB using 4 BSS-allocated page tables (avoids
     chicken-and-egg with PMM bitmap in BSS).
  2) Dynamic: memory above 16 MiB using PMM-allocated page tables,
     created before paging is enabled so physical addresses still work.
- Provides kernel heap at 0xD0000000–0xF0000000 for virtual page allocation.
- API: paging_map_page, paging_unmap_page, paging_alloc_page, paging_free_page,
  paging_get_physical.
- Added pmm_get_memory_size() to expose detected RAM for paging init.
- Kernel tests paging by allocating a virtual page, writing 0xDEADBEEF, and
  reading it back, then freeing it.
- Added documentation in docs/paging.md.

Tested: boots and passes paging test with both 4 MiB and 128 MiB RAM in QEMU.
This commit is contained in:
AI
2026-02-23 11:03:27 +00:00
parent f2e7d6c5d7
commit fb61ab7c15
8 changed files with 467 additions and 9 deletions

278
src/paging.c Normal file
View File

@@ -0,0 +1,278 @@
/**
* @file paging.c
* @brief Virtual memory paging subsystem implementation.
*
* Implements two-level x86 paging (page directory + page tables) with 4 KiB
* pages. At initialization, all detected physical memory is identity-mapped
* so that physical addresses equal virtual addresses. Drivers and the kernel
* can then allocate additional virtual pages as needed.
*
* The kernel heap region starts at KERNEL_HEAP_START (0xD0000000) and grows
* upward as pages are requested through paging_alloc_page().
*/
#include "paging.h"
#include "pmm.h"
#include "port_io.h"
#include <stddef.h>
#include <string.h>
/* Debug print helpers defined in kernel.c */
extern void offset_print(const char *str);
extern void print_hex(uint32_t val);
/** Kernel heap starts at 0xD0000000 (above the 0xC0000000 higher-half region). */
#define KERNEL_HEAP_START 0xD0000000
/** Kernel heap ends at 0xF0000000 (768 MiB of virtual space for kernel heap). */
#define KERNEL_HEAP_END 0xF0000000
/**
* The page directory. Must be page-aligned (4 KiB).
* Each entry either points to a page table or is zero (not present).
*/
static uint32_t page_directory[PAGE_ENTRIES] __attribute__((aligned(4096)));
/**
* Storage for page tables. We pre-allocate enough for identity mapping.
* For a system with up to 4 GiB, we'd need 1024 page tables, but we
* only use these for the first 16 MiB during early boot. Additional page
* tables are allocated from the PMM as needed.
*
* The first 16 MiB must be statically allocated because the PMM bitmap
* itself lives in BSS within this region.
*/
#define STATIC_PT_COUNT 4
static uint32_t static_page_tables[STATIC_PT_COUNT][PAGE_ENTRIES] __attribute__((aligned(4096)));
/**
* Dynamically allocated page tables for memory above 16 MiB.
* Before paging is enabled, we allocate these from the PMM and store
* their physical addresses here so we can access them after paging.
*/
#define MAX_DYNAMIC_PT 256
static uint32_t *dynamic_page_tables[MAX_DYNAMIC_PT];
static uint32_t dynamic_pt_count = 0;
/** Next virtual address to hand out from the kernel heap. */
static uint32_t heap_next = KERNEL_HEAP_START;
/**
* Flush a single TLB entry for the given virtual address.
*
* @param vaddr The virtual address whose TLB entry to invalidate.
*/
static inline void tlb_flush_single(uint32_t vaddr) {
__asm__ volatile("invlpg (%0)" : : "r"(vaddr) : "memory");
}
/**
* Reload CR3 to flush the entire TLB.
*/
static inline void tlb_flush_all(void) {
uint32_t cr3;
__asm__ volatile("mov %%cr3, %0" : "=r"(cr3));
__asm__ volatile("mov %0, %%cr3" : : "r"(cr3) : "memory");
}
/**
* Get a page table for a given page directory index.
*
* If the page directory entry is not present, allocate a new page table
* from the PMM and install it.
*
* @param pd_idx Page directory index (01023).
* @param create If non-zero, create the page table if it doesn't exist.
* @return Pointer to the page table, or NULL if not present and !create.
*/
static uint32_t *get_page_table(uint32_t pd_idx, int create) {
if (page_directory[pd_idx] & PAGE_PRESENT) {
return (uint32_t *)(page_directory[pd_idx] & 0xFFFFF000);
}
if (!create) {
return NULL;
}
/* Allocate a new page table from the PMM */
phys_addr_t pt_phys = pmm_alloc_page(PMM_ZONE_NORMAL);
if (pt_phys == 0) {
offset_print(" PAGING: FATAL - could not allocate page table\n");
return NULL;
}
/* Zero the new page table */
memset((void *)pt_phys, 0, 4096);
/* Install it in the page directory */
page_directory[pd_idx] = pt_phys | PAGE_PRESENT | PAGE_WRITE;
return (uint32_t *)pt_phys;
}
void paging_map_page(uint32_t vaddr, uint32_t paddr, uint32_t flags) {
uint32_t pd_idx = PD_INDEX(vaddr);
uint32_t pt_idx = PT_INDEX(vaddr);
uint32_t *pt = get_page_table(pd_idx, 1);
if (!pt) {
return;
}
pt[pt_idx] = (paddr & 0xFFFFF000) | (flags & 0xFFF);
tlb_flush_single(vaddr);
}
void paging_unmap_page(uint32_t vaddr) {
uint32_t pd_idx = PD_INDEX(vaddr);
uint32_t pt_idx = PT_INDEX(vaddr);
uint32_t *pt = get_page_table(pd_idx, 0);
if (!pt) {
return;
}
pt[pt_idx] = 0;
tlb_flush_single(vaddr);
}
uint32_t paging_get_physical(uint32_t vaddr) {
uint32_t pd_idx = PD_INDEX(vaddr);
uint32_t pt_idx = PT_INDEX(vaddr);
uint32_t *pt = get_page_table(pd_idx, 0);
if (!pt) {
return 0;
}
if (!(pt[pt_idx] & PAGE_PRESENT)) {
return 0;
}
return (pt[pt_idx] & 0xFFFFF000) | (vaddr & 0xFFF);
}
void *paging_alloc_page(void) {
if (heap_next >= KERNEL_HEAP_END) {
offset_print(" PAGING: kernel heap exhausted\n");
return NULL;
}
/* Allocate a physical page */
phys_addr_t paddr = pmm_alloc_page(PMM_ZONE_NORMAL);
if (paddr == 0) {
offset_print(" PAGING: out of physical memory\n");
return NULL;
}
/* Map it into the kernel heap */
uint32_t vaddr = heap_next;
paging_map_page(vaddr, paddr, PAGE_PRESENT | PAGE_WRITE);
heap_next += 4096;
return (void *)vaddr;
}
void paging_free_page(void *vaddr) {
uint32_t va = (uint32_t)vaddr;
/* Look up the physical address before unmapping */
uint32_t paddr = paging_get_physical(va);
if (paddr == 0) {
return;
}
/* Unmap the virtual page */
paging_unmap_page(va);
/* Return the physical page to the PMM */
pmm_free_page(paddr & 0xFFFFF000);
}
void init_paging(void) {
/* 1. Zero the page directory */
memset(page_directory, 0, sizeof(page_directory));
/* 2. Identity map the first 16 MiB using static page tables.
* This covers the kernel (loaded at 1 MiB), the PMM bitmap (in BSS),
* the stack, and typical BIOS/device regions.
* Each page table maps 4 MiB (1024 entries × 4 KiB).
*/
for (uint32_t i = 0; i < STATIC_PT_COUNT; i++) {
memset(static_page_tables[i], 0, sizeof(static_page_tables[i]));
for (uint32_t j = 0; j < PAGE_ENTRIES; j++) {
uint32_t paddr = (i * PAGE_ENTRIES + j) * 4096;
static_page_tables[i][j] = paddr | PAGE_PRESENT | PAGE_WRITE;
}
page_directory[i] = (uint32_t)static_page_tables[i] | PAGE_PRESENT | PAGE_WRITE;
}
offset_print(" PAGING: identity mapped first 16 MiB\n");
/* 3. Identity map memory above 16 MiB using dynamically allocated page
* tables. We do this BEFORE enabling paging, so physical addresses
* are still directly accessible.
*
* mem_upper is in KiB and starts at 1 MiB, so total memory is
* approximately (mem_upper + 1024) KiB.
*/
uint32_t mem_kb = pmm_get_memory_size() + 1024; /* total memory in KiB */
uint32_t total_bytes = mem_kb * 1024;
uint32_t pd_entries_needed = (total_bytes + (4 * 1024 * 1024 - 1)) / (4 * 1024 * 1024);
if (pd_entries_needed > PAGE_ENTRIES) {
pd_entries_needed = PAGE_ENTRIES;
}
dynamic_pt_count = 0;
for (uint32_t i = STATIC_PT_COUNT; i < pd_entries_needed; i++) {
if (dynamic_pt_count >= MAX_DYNAMIC_PT) {
break;
}
/* Allocate a page for this page table from the DMA zone,
* since we need it to be accessible before paging is enabled
* (i.e., within the first 16 MiB identity map won't help for
* the page table itself, but we haven't enabled paging yet so
* ALL physical memory is accessible). */
phys_addr_t pt_phys = pmm_alloc_page(PMM_ZONE_DMA);
if (pt_phys == 0) {
pt_phys = pmm_alloc_page(PMM_ZONE_NORMAL);
}
if (pt_phys == 0) {
offset_print(" PAGING: WARNING - could not alloc page table\n");
break;
}
uint32_t *pt = (uint32_t *)pt_phys;
dynamic_page_tables[dynamic_pt_count++] = pt;
/* Fill the page table with identity mappings */
for (uint32_t j = 0; j < PAGE_ENTRIES; j++) {
uint32_t paddr = (i * PAGE_ENTRIES + j) * 4096;
pt[j] = paddr | PAGE_PRESENT | PAGE_WRITE;
}
page_directory[i] = pt_phys | PAGE_PRESENT | PAGE_WRITE;
}
if (dynamic_pt_count > 0) {
offset_print(" PAGING: identity mapped ");
print_hex(pd_entries_needed * 4);
offset_print(" PAGING: MiB total using ");
print_hex(dynamic_pt_count);
offset_print(" PAGING: additional page tables\n");
}
/* 4. Load the page directory into CR3 */
__asm__ volatile("mov %0, %%cr3" : : "r"(page_directory) : "memory");
/* 5. Enable paging by setting bit 31 (PG) of CR0 */
uint32_t cr0;
__asm__ volatile("mov %%cr0, %0" : "=r"(cr0));
cr0 |= 0x80000000;
__asm__ volatile("mov %0, %%cr0" : : "r"(cr0) : "memory");
offset_print(" PAGING: enabled\n");
}