| #include "hf/mm.h" |
| |
| #include <assert.h> |
| #include <stdatomic.h> |
| #include <stdint.h> |
| |
| #include "hf/alloc.h" |
| #include "hf/dlog.h" |
| |
| /* The type of addresses stored in the page table. */ |
| typedef uintvaddr_t ptable_addr_t; |
| |
| /* For stage 2, the input is an intermediate physical address rather than a |
| * virtual address, so: */ |
| static_assert( |
| sizeof(ptable_addr_t) == sizeof(uintpaddr_t), |
| "Currently, the same code manages the stage 1 and stage 2 page tables " |
| "which only works if the virtual and intermediate physical addresses " |
| "are the same size. It looks like that assumption might not be holding " |
| "so we need to check that everything is going to be ok."); |
| |
| /* Keep macro alignment */ |
| /* clang-format off */ |
| |
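| /* |
| * MAP_FLAG_SYNC: use the synchronised allocator when new tables are needed. |
| * MAP_FLAG_COMMIT: write the new mappings to the table rather than only |
| * allocating any tables that the update would need. |
| */ |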
| #define MAP_FLAG_SYNC 0x01 |
| #define MAP_FLAG_COMMIT 0x02 |
| |
| /* clang-format on */ |
| |
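| /* |
| * Symbols provided by the linker script marking the boundaries of the |
| * hypervisor's text, rodata and data sections. |
| */ |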
| extern uint8_t text_begin[]; |
| extern uint8_t text_end[]; |
| extern uint8_t rodata_begin[]; |
| extern uint8_t rodata_end[]; |
| extern uint8_t data_begin[]; |
| extern uint8_t data_end[]; |
| |
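| /* The hypervisor's stage 1 page table. */ |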
| static struct mm_ptable ptable; |
| |
| /** |
| * Rounds an address down to a page boundary. |
| */ |
| static ptable_addr_t mm_round_down_to_page(ptable_addr_t addr) |
| { |
| return addr & ~((ptable_addr_t)(PAGE_SIZE - 1)); |
| } |
| |
| /** |
| * Rounds an address up to a page boundary. |
| */ |
| static ptable_addr_t mm_round_up_to_page(ptable_addr_t addr) |
| { |
| return mm_round_down_to_page(addr + PAGE_SIZE - 1); |
| } |
| |
| /** |
| * Calculates the size of the address space represented by a page table entry at |
| * the given level. |
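| * |
| * For example, with a 4KiB granule (PAGE_BITS == 12 and PAGE_LEVEL_BITS == 9) |
| * a level 0 entry covers 4KiB, a level 1 entry 2MiB and a level 2 entry 1GiB. |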
| */ |
| static inline size_t mm_entry_size(int level) |
| { |
| return UINT64_C(1) << (PAGE_BITS + level * PAGE_LEVEL_BITS); |
| } |
| |
| /** |
| * For a given address, calculates the maximum (plus one) address that can be |
| * represented by the same table at the given level. |
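| * |
| * For example, with a 4KiB granule a level 1 table spans 1GiB of address |
| * space, so for any address within it this returns the next 1GiB boundary. |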
| */ |
| static inline ptable_addr_t mm_level_end(ptable_addr_t addr, int level) |
| { |
| size_t offset = PAGE_BITS + (level + 1) * PAGE_LEVEL_BITS; |
| return ((addr >> offset) + 1) << offset; |
| } |
| |
| /** |
| * For a given address, calculates the index at which its entry is stored in a |
| * table at the given level. |
| */ |
| static inline size_t mm_index(ptable_addr_t addr, int level) |
| { |
| ptable_addr_t v = addr >> (PAGE_BITS + level * PAGE_LEVEL_BITS); |
| return v & ((UINT64_C(1) << PAGE_LEVEL_BITS) - 1); |
| } |
| |
| /** |
| * Populates the provided page table entry with a reference to another table if |
| * needed, that is, if it does not yet point to another table. |
| * |
| * Returns a pointer to the table the entry now points to. |
| */ |
| static pte_t *mm_populate_table_pte(pte_t *pte, int level, bool sync_alloc) |
| { |
| pte_t *ntable; |
| pte_t v = *pte; |
| pte_t new_pte; |
| size_t i; |
| size_t inc; |
| |
| /* Just return pointer to table if it's already populated. */ |
| if (arch_mm_pte_is_table(v, level)) { |
| return ptr_from_va(va_from_pa(arch_mm_table_from_pte(v))); |
| } |
| |
| /* Allocate a new table. */ |
| ntable = (sync_alloc ? halloc_aligned : halloc_aligned_nosync)( |
| PAGE_SIZE, PAGE_SIZE); |
| if (!ntable) { |
| dlog("Failed to allocate memory for page table\n"); |
| return NULL; |
| } |
| |
| /* |
| * Determine the template for the new pte and its increment: a block is |
| * split into smaller blocks that preserve the original mapping, anything |
| * else starts out absent. |
| */ |
| if (arch_mm_pte_is_block(v, level)) { |
| int level_below = level - 1; |
| inc = mm_entry_size(level_below); |
| new_pte = arch_mm_block_pte(level_below, |
| arch_mm_block_from_pte(v), |
| arch_mm_pte_attrs(v)); |
| } else { |
| inc = 0; |
| new_pte = arch_mm_absent_pte(level); |
| } |
| |
| /* Initialise entries in the new table. */ |
| for (i = 0; i < PAGE_SIZE / sizeof(pte_t); i++) { |
| ntable[i] = new_pte; |
| new_pte += inc; |
| } |
| |
| /* |
| * Ensure initialisation is visible before updating the actual pte, then |
| * update it. |
| */ |
| atomic_thread_fence(memory_order_release); |
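| /* |
| * Note: converting the pointer with a plain cast assumes the allocator |
| * returns memory whose address can be used directly as a physical |
| * address (see the TODO in mm_ptable_init). |
| */ |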
| *pte = arch_mm_table_pte(level, pa_init((uintpaddr_t)ntable)); |
| |
| return ntable; |
| } |
| |
| /** |
| * Frees all page-table-related memory associated with the given pte at the |
| * given level, including any subtables recursively. |
| */ |
| static void mm_free_page_pte(pte_t pte, int level) |
| { |
| pte_t *table; |
| uint64_t i; |
| |
| if (!arch_mm_pte_is_table(pte, level)) { |
| return; |
| } |
| |
| table = ptr_from_va(va_from_pa(arch_mm_table_from_pte(pte))); |
| /* Recursively free any subtables. */ |
| for (i = 0; i < PAGE_SIZE / sizeof(pte_t); ++i) { |
| mm_free_page_pte(table[i], level - 1); |
| } |
| |
| /* Free the table itself. */ |
| hfree(table); |
| } |
| |
| /** |
| * Updates the page table at the given level to map the given address range to |
| * the physical range starting at pa, using the provided architecture-specific |
| * attributes. |
| * |
| * This function calls itself recursively if it needs to update additional |
| * levels, but the recursion is bound by the maximum number of levels in a page |
| * table. |
| */ |
| static bool mm_map_level(ptable_addr_t begin, ptable_addr_t end, paddr_t pa, |
| uint64_t attrs, pte_t *table, int level, int flags) |
| { |
| pte_t *pte = &table[mm_index(begin, level)]; |
| ptable_addr_t level_end = mm_level_end(begin, level); |
| size_t entry_size = mm_entry_size(level); |
| bool commit = flags & MAP_FLAG_COMMIT; |
| bool sync = flags & MAP_FLAG_SYNC; |
| |
| /* Cap end so that we don't go over the current level max. */ |
| if (end > level_end) { |
| end = level_end; |
| } |
| |
| /* Fill each entry in the table. */ |
| while (begin < end) { |
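| /* |
| * If the entry is aligned, fully covered by the range and blocks |
| * are allowed at this level, map it as a block (when committing); |
| * otherwise descend into a subtable, populating it if necessary. |
| */ |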
| if ((end - begin) >= entry_size && |
| arch_mm_is_block_allowed(level) && |
| (begin & (entry_size - 1)) == 0) { |
| if (commit) { |
| pte_t v = *pte; |
| *pte = arch_mm_block_pte(level, pa, attrs); |
| /* TODO: Add barrier. How do we ensure this |
| * isn't in use by another CPU? Send IPI? */ |
| mm_free_page_pte(v, level); |
| } |
| } else { |
| pte_t *nt = mm_populate_table_pte(pte, level, sync); |
| if (!nt) { |
| return false; |
| } |
| |
| if (!mm_map_level(begin, end, pa, attrs, nt, level - 1, |
| flags)) { |
| return false; |
| } |
| } |
| |
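| /* Advance begin and pa to the start of the next entry at this level. */ |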
| begin = (begin + entry_size) & ~(entry_size - 1); |
| pa = pa_init((pa_addr(pa) + entry_size) & ~(entry_size - 1)); |
| pte++; |
| } |
| |
| return true; |
| } |
| |
| /** |
| * Invalidates the TLB for the given address range. |
| */ |
| static void mm_invalidate_tlb(ptable_addr_t begin, ptable_addr_t end, |
| bool stage1) |
| { |
| if (stage1) { |
| arch_mm_invalidate_stage1_range(va_init(begin), va_init(end)); |
| } else { |
| arch_mm_invalidate_stage2_range(ipa_init(begin), ipa_init(end)); |
| } |
| } |
| |
| /** |
| * Updates the given table such that the given physical address range is mapped |
| * into the address space with the corresponding address range in the |
| * architecture-agnostic mode provided. |
| */ |
| static bool mm_ptable_identity_map(struct mm_ptable *t, paddr_t pa_begin, |
| paddr_t pa_end, int mode) |
| { |
| uint64_t attrs = arch_mm_mode_to_attrs(mode); |
| int flags = (mode & MM_MODE_NOSYNC) ? 0 : MAP_FLAG_SYNC; |
| int level = arch_mm_max_level(mode); |
| pte_t *table = ptr_from_va(va_from_pa(t->table)); |
| ptable_addr_t begin; |
| ptable_addr_t end; |
| |
| pa_begin = arch_mm_clear_pa(pa_begin); |
| begin = pa_addr(pa_begin); |
| end = mm_round_up_to_page(pa_addr(pa_end)); |
| |
| /* |
| * Do the update in two steps so that the table is never left in a |
| * half-updated state. On failure it may be left with extra internal |
| * tables, but the mapping itself is unchanged. |
| */ |
| if (!mm_map_level(begin, end, pa_begin, attrs, table, level, flags)) { |
| return false; |
| } |
| |
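| /* |
| * The commit pass is not expected to fail as any tables it needs were |
| * already allocated by the first pass above. |
| */ |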
| mm_map_level(begin, end, pa_begin, attrs, table, level, |
| flags | MAP_FLAG_COMMIT); |
| |
| /* Invalidate the tlb. */ |
| if (!(mode & MM_MODE_NOINVALIDATE)) { |
| mm_invalidate_tlb(begin, end, (mode & MM_MODE_STAGE1) != 0); |
| } |
| |
| return true; |
| } |
| |
| /** |
| * Updates the given table such that the given physical address range is not |
| * mapped into the address space. |
| */ |
| static bool mm_ptable_unmap(struct mm_ptable *t, paddr_t pa_begin, |
| paddr_t pa_end, int mode) |
| { |
| int flags = (mode & MM_MODE_NOSYNC) ? 0 : MAP_FLAG_SYNC; |
| int level = arch_mm_max_level(mode); |
| pte_t *table = ptr_from_va(va_from_pa(t->table)); |
| ptable_addr_t begin; |
| ptable_addr_t end; |
| |
| pa_begin = arch_mm_clear_pa(pa_begin); |
| begin = pa_addr(pa_begin); |
| end = mm_round_up_to_page(pa_addr(pa_end)); |
| |
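| /* |
| * Unmapping is done by mapping the range again with attributes of 0, |
| * which the architecture-specific layer is expected to treat as an |
| * absent entry. |
| */ |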
| /* Also do updates in two steps, similarly to mm_ptable_identity_map. */ |
| if (!mm_map_level(begin, end, pa_begin, 0, table, level, flags)) { |
| return false; |
| } |
| |
| mm_map_level(begin, end, pa_begin, 0, table, level, |
| flags | MAP_FLAG_COMMIT); |
| |
| /* Invalidate the tlb. */ |
| if (!(mode & MM_MODE_NOINVALIDATE)) { |
| mm_invalidate_tlb(begin, end, (mode & MM_MODE_STAGE1) != 0); |
| } |
| |
| return true; |
| } |
| |
| /** |
| * Updates the given table such that a single physical address page is mapped |
| * into the address space with the corresponding address page in the provided |
| * architecture-agnostic mode. |
| */ |
| static bool mm_ptable_identity_map_page(struct mm_ptable *t, paddr_t pa, |
| int mode) |
| { |
| size_t i; |
| uint64_t attrs = arch_mm_mode_to_attrs(mode); |
| pte_t *table = ptr_from_va(va_from_pa(t->table)); |
| bool sync = !(mode & MM_MODE_NOSYNC); |
| ptable_addr_t addr; |
| |
| pa = arch_mm_clear_pa(pa); |
| addr = pa_addr(pa); |
| |
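| /* |
| * Walk down from the highest level, populating intermediate tables as |
| * needed, until a level 0 table is reached. |
| */ |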
| for (i = arch_mm_max_level(mode); i > 0; i--) { |
| table = mm_populate_table_pte(&table[mm_index(addr, i)], i, |
| sync); |
| if (!table) { |
| return false; |
| } |
| } |
| |
| i = mm_index(addr, 0); |
| table[i] = arch_mm_block_pte(0, pa, attrs); |
| return true; |
| } |
| |
| /** |
| * Writes the given table to the debug log, calling itself recursively to |
| * write sub-tables. |
| */ |
| static void mm_dump_table_recursive(pte_t *table, int level, int max_level) |
| { |
| uint64_t i; |
| for (i = 0; i < PAGE_SIZE / sizeof(pte_t); i++) { |
| if (!arch_mm_pte_is_present(table[i], level)) { |
| continue; |
| } |
| |
| dlog("%*s%x: %x\n", 4 * (max_level - level), "", i, table[i]); |
| |
| if (arch_mm_pte_is_table(table[i], level)) { |
| mm_dump_table_recursive( |
| ptr_from_va(va_from_pa( |
| arch_mm_table_from_pte(table[i]))), |
| level - 1, max_level); |
| } |
| } |
| } |
| |
| /** |
| * Writes the given table to the debug log. |
| */ |
| void mm_ptable_dump(struct mm_ptable *t, int mode) |
| { |
| pte_t *table = ptr_from_va(va_from_pa(t->table)); |
| int max_level = arch_mm_max_level(mode); |
| mm_dump_table_recursive(table, max_level, max_level); |
| } |
| |
| /** |
| * Defragments the given page table by converting page table references to |
| * blocks whenever possible. |
| */ |
| void mm_ptable_defrag(struct mm_ptable *t, int mode) |
| { |
| /* TODO: Implement. */ |
| (void)t; |
| (void)mode; |
| } |
| |
| /** |
| * Unmaps the hypervisor pages from the given page table. |
| */ |
| bool mm_ptable_unmap_hypervisor(struct mm_ptable *t, int mode) |
| { |
| /* TODO: If we add pages dynamically, they must be included here too. */ |
| return mm_ptable_unmap(t, pa_init((uintpaddr_t)text_begin), |
| pa_init((uintpaddr_t)text_end), mode) && |
| mm_ptable_unmap(t, pa_init((uintpaddr_t)rodata_begin), |
| pa_init((uintpaddr_t)rodata_end), mode) && |
| mm_ptable_unmap(t, pa_init((uintpaddr_t)data_begin), |
| pa_init((uintpaddr_t)data_end), mode); |
| } |
| |
| /** |
| * Determines if the given address is mapped in the given page table by |
| * recursively traversing all levels of the page table. |
| */ |
| static bool mm_is_mapped_recursive(const pte_t *table, ptable_addr_t addr, |
| int level) |
| { |
| pte_t pte; |
| ptable_addr_t va_level_end = mm_level_end(addr, level); |
| |
| /* It isn't mapped if it doesn't fit in the table. */ |
| if (addr >= va_level_end) { |
| return false; |
| } |
| |
| pte = table[mm_index(addr, level)]; |
| |
| if (arch_mm_pte_is_block(pte, level)) { |
| return true; |
| } |
| |
| if (arch_mm_pte_is_table(pte, level)) { |
| return mm_is_mapped_recursive( |
| ptr_from_va(va_from_pa(arch_mm_table_from_pte(pte))), |
| addr, level - 1); |
| } |
| |
| /* The entry is not present. */ |
| return false; |
| } |
| |
| /** |
| * Determines if the given address is mapped in the given page table. |
| */ |
| static bool mm_ptable_is_mapped(struct mm_ptable *t, ptable_addr_t addr, |
| int mode) |
| { |
| pte_t *table = ptr_from_va(va_from_pa(t->table)); |
| int level = arch_mm_max_level(mode); |
| |
| addr = mm_round_down_to_page(addr); |
| |
| return mm_is_mapped_recursive(table, addr, level); |
| } |
| |
| /** |
| * Initialises the given page table. |
| */ |
| bool mm_ptable_init(struct mm_ptable *t, int mode) |
| { |
| size_t i; |
| pte_t *table; |
| |
| if (mode & MM_MODE_NOSYNC) { |
| table = halloc_aligned_nosync(PAGE_SIZE, PAGE_SIZE); |
| } else { |
| table = halloc_aligned(PAGE_SIZE, PAGE_SIZE); |
| } |
| |
| if (!table) { |
| return false; |
| } |
| |
| for (i = 0; i < PAGE_SIZE / sizeof(pte_t); i++) { |
| table[i] = arch_mm_absent_pte(arch_mm_max_level(mode)); |
| } |
| |
| /* TODO: halloc could return a virtual or physical address if mm not |
| * enabled? */ |
| t->table = pa_init((uintpaddr_t)table); |
| |
| return true; |
| } |
| |
| /** |
| * Updates a VM's page table such that the given physical address range is |
| * mapped in the address space at the corresponding address range in the |
| * architecture-agnostic mode provided. |
| */ |
| bool mm_vm_identity_map(struct mm_ptable *t, paddr_t begin, paddr_t end, |
| int mode, ipaddr_t *ipa) |
| { |
| bool success = |
| mm_ptable_identity_map(t, begin, end, mode & ~MM_MODE_STAGE1); |
| |
| if (success && ipa != NULL) { |
| *ipa = ipa_from_pa(begin); |
| } |
| |
| return success; |
| } |
| |
| /** |
| * Updates a VM's page table such that the given physical address page is |
| * mapped in the address space at the corresponding address page in the |
| * architecture-agnostic mode provided. |
| */ |
| bool mm_vm_identity_map_page(struct mm_ptable *t, paddr_t begin, int mode, |
| ipaddr_t *ipa) |
| { |
| bool success = |
| mm_ptable_identity_map_page(t, begin, mode & ~MM_MODE_STAGE1); |
| |
| if (success && ipa != NULL) { |
| *ipa = ipa_from_pa(begin); |
| } |
| |
| return success; |
| } |
| |
| /** |
| * Updates the VM's table such that the given physical address range is not |
| * mapped in the address space. |
| */ |
| bool mm_vm_unmap(struct mm_ptable *t, paddr_t begin, paddr_t end, int mode) |
| { |
| return mm_ptable_unmap(t, begin, end, mode & ~MM_MODE_STAGE1); |
| } |
| |
| /** |
| * Checks whether the given intermediate physical address is mapped in the given |
| * page table of a VM. |
| */ |
| bool mm_vm_is_mapped(struct mm_ptable *t, ipaddr_t ipa, int mode) |
| { |
| return mm_ptable_is_mapped(t, ipa_addr(ipa), mode & ~MM_MODE_STAGE1); |
| } |
| |
| /** |
| * Translates an intermediate physical address to a physical address. Addresses |
| * are currently identity mapped, so this is a simple type conversion. Returns |
| * true if the address was mapped in the table and the address was converted. |
| */ |
| bool mm_vm_translate(struct mm_ptable *t, ipaddr_t ipa, paddr_t *pa) |
| { |
| bool mapped = mm_vm_is_mapped(t, ipa, 0); |
| |
| if (mapped) { |
| *pa = pa_init(ipa_addr(ipa)); |
| } |
| |
| return mapped; |
| } |
| |
| /** |
| * Updates the hypervisor page table such that the given physical address range |
| * is mapped into the address space at the corresponding address range in the |
| * architecture-agnostic mode provided. |
| */ |
| void *mm_identity_map(paddr_t begin, paddr_t end, int mode) |
| { |
| if (mm_ptable_identity_map(&ptable, begin, end, |
| mode | MM_MODE_STAGE1)) { |
| return ptr_from_va(va_from_pa(begin)); |
| } |
| |
| return NULL; |
| } |
| |
| /** |
| * Updates the hypervisor table such that the given physical address range is |
| * not mapped in the address space. |
| */ |
| bool mm_unmap(paddr_t begin, paddr_t end, int mode) |
| { |
| return mm_ptable_unmap(&ptable, begin, end, mode | MM_MODE_STAGE1); |
| } |
| |
| /** |
| * Initialises memory management for the hypervisor itself. |
| */ |
| bool mm_init(void) |
| { |
| dlog("text: 0x%x - 0x%x\n", text_begin, text_end); |
| dlog("rodata: 0x%x - 0x%x\n", rodata_begin, rodata_end); |
| dlog("data: 0x%x - 0x%x\n", data_begin, data_end); |
| |
| if (!mm_ptable_init(&ptable, MM_MODE_NOSYNC | MM_MODE_STAGE1)) { |
| dlog("Unable to allocate memory for page table.\n"); |
| return false; |
| } |
| |
| /* Map page for uart. */ |
| /* TODO: We may not want to map this. */ |
| mm_ptable_identity_map_page(&ptable, pa_init(PL011_BASE), |
| MM_MODE_R | MM_MODE_W | MM_MODE_D | |
| MM_MODE_NOSYNC | MM_MODE_STAGE1); |
| |
| /* Map each section. */ |
| mm_identity_map(pa_init((uintpaddr_t)text_begin), |
| pa_init((uintpaddr_t)text_end), |
| MM_MODE_X | MM_MODE_NOSYNC); |
| |
| mm_identity_map(pa_init((uintpaddr_t)rodata_begin), |
| pa_init((uintpaddr_t)rodata_end), |
| MM_MODE_R | MM_MODE_NOSYNC); |
| |
| mm_identity_map(pa_init((uintpaddr_t)data_begin), |
| pa_init((uintpaddr_t)data_end), |
| MM_MODE_R | MM_MODE_W | MM_MODE_NOSYNC); |
| |
| return arch_mm_init(ptable.table, true); |
| } |
| |
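| /** |
| * Initialises the architectural memory management state of the current CPU, |
| * using the hypervisor page table set up by mm_init. |
| */ |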
| bool mm_cpu_init(void) |
| { |
| return arch_mm_init(ptable.table, false); |
| } |
| |
| /** |
| * Defragments the hypervisor page table. |
| */ |
| void mm_defrag(void) |
| { |
| mm_ptable_defrag(&ptable, MM_MODE_STAGE1); |
| } |