From dc580f1c115015f3d909c0b539042ae343d7ab50 Mon Sep 17 00:00:00 2001 From: Graham MacDonald Date: Tue, 23 Jul 2024 21:23:23 +0100 Subject: [PATCH 1/8] Initial vmem code (wip) Signed-off-by: Graham MacDonald --- aarch64/lib/kernel.ld | 6 + aarch64/src/kmem.rs | 112 ++++- aarch64/src/main.rs | 45 +- aarch64/src/pagealloc.rs | 2 +- aarch64/src/runtime.rs | 6 +- aarch64/src/vm.rs | 24 +- aarch64/src/vmalloc.rs | 54 +++ port/src/lib.rs | 1 + port/src/mem.rs | 11 + port/src/vmem.rs | 894 +++++++++++++++++++++++++++++++++++++++ rust-toolchain.toml | 2 +- 11 files changed, 1102 insertions(+), 55 deletions(-) create mode 100644 aarch64/src/vmalloc.rs create mode 100644 port/src/vmem.rs diff --git a/aarch64/lib/kernel.ld b/aarch64/lib/kernel.ld index 4e1cd05..0be01b7 100644 --- a/aarch64/lib/kernel.ld +++ b/aarch64/lib/kernel.ld @@ -51,6 +51,12 @@ SECTIONS { } ebss = .; + heap = .; + .heap : ALIGN(4096) { + . = ALIGN(8*2097152); + } + eheap = .; + /* Reserve section for early pagetables. Align to 2MiB to allow us to map as a 2MiB page.Note that this won't be needed once we transition to recursive pagetables. diff --git a/aarch64/src/kmem.rs b/aarch64/src/kmem.rs index e7a7a28..9c9efbe 100644 --- a/aarch64/src/kmem.rs +++ b/aarch64/src/kmem.rs @@ -1,36 +1,86 @@ use crate::param::KZERO; -use port::mem::{PhysAddr, PhysRange}; +use port::mem::{PhysAddr, PhysRange, VirtRange}; // These map to definitions in kernel.ld extern "C" { + static boottext: [u64; 0]; + static eboottext: [u64; 0]; + static text: [u64; 0]; static etext: [u64; 0]; + static rodata: [u64; 0]; static erodata: [u64; 0]; + static data: [u64; 0]; + static edata: [u64; 0]; + static bss: [u64; 0]; static ebss: [u64; 0]; static early_pagetables: [u64; 0]; static eearly_pagetables: [u64; 0]; + static heap: [u64; 0]; + static eheap: [u64; 0]; + static end: [u64; 0]; } -pub fn text_addr() -> usize { - 0xffff_8000_0000_0000 +fn start_addr() -> usize { + unsafe { boottext.as_ptr().addr() } } -pub fn etext_addr() -> usize { +fn end_addr() -> usize { + unsafe { end.as_ptr().addr() } +} + +fn boottext_addr() -> usize { + unsafe { boottext.as_ptr().addr() } +} + +fn eboottext_addr() -> usize { + unsafe { eboottext.as_ptr().addr() } +} + +fn text_addr() -> usize { + unsafe { text.as_ptr().addr() } +} + +fn etext_addr() -> usize { unsafe { etext.as_ptr().addr() } } -pub fn erodata_addr() -> usize { +fn rodata_addr() -> usize { + unsafe { rodata.as_ptr().addr() } +} + +fn erodata_addr() -> usize { unsafe { erodata.as_ptr().addr() } } -pub fn ebss_addr() -> usize { +fn data_addr() -> usize { + unsafe { data.as_ptr().addr() } +} + +fn edata_addr() -> usize { + unsafe { edata.as_ptr().addr() } +} + +fn bss_addr() -> usize { + unsafe { bss.as_ptr().addr() } +} + +fn ebss_addr() -> usize { unsafe { ebss.as_ptr().addr() } } -pub fn early_pagetables_addr() -> usize { +fn heap_addr() -> usize { + unsafe { heap.as_ptr().addr() } +} + +fn eheap_addr() -> usize { + unsafe { eheap.as_ptr().addr() } +} + +fn early_pagetables_addr() -> usize { unsafe { early_pagetables.as_ptr().addr() } } -pub fn eearly_pagetables_addr() -> usize { +fn eearly_pagetables_addr() -> usize { unsafe { eearly_pagetables.as_ptr().addr() } } @@ -50,7 +100,51 @@ pub fn from_ptr_to_physaddr(a: *const T) -> PhysAddr { from_virt_to_physaddr(a.addr()) } -pub fn early_pages_range() -> PhysRange { +pub fn kernel_text_physrange() -> PhysRange { + PhysRange(from_virt_to_physaddr(text_addr())..from_virt_to_physaddr(etext_addr())) +} + +pub fn kernel_data_physrange() -> PhysRange { + 
PhysRange::with_len(from_virt_to_physaddr(etext_addr()).addr(), erodata_addr() - etext_addr()) +} + +pub fn kernel_bss_physrange() -> PhysRange { + PhysRange::with_len(from_virt_to_physaddr(erodata_addr()).addr(), ebss_addr() - erodata_addr()) +} + +pub fn kernel_heap_physrange() -> PhysRange { + PhysRange::with_len(from_virt_to_physaddr(heap_addr()).addr(), eheap_addr() - heap_addr()) +} + +pub fn total_virtrange() -> VirtRange { + VirtRange(start_addr()..end_addr()) +} + +pub fn boottext_virtrange() -> VirtRange { + VirtRange(boottext_addr()..eboottext_addr()) +} + +pub fn text_virtrange() -> VirtRange { + VirtRange(text_addr()..etext_addr()) +} + +pub fn rodata_virtrange() -> VirtRange { + VirtRange(rodata_addr()..erodata_addr()) +} + +pub fn data_virtrange() -> VirtRange { + VirtRange(data_addr()..edata_addr()) +} + +pub fn bss_virtrange() -> VirtRange { + VirtRange(bss_addr()..ebss_addr()) +} + +pub fn heap_virtrange() -> VirtRange { + VirtRange::with_len(heap_addr(), eheap_addr() - heap_addr()) +} + +pub fn early_pages_physrange() -> PhysRange { PhysRange::new( from_virt_to_physaddr(early_pagetables_addr()), from_virt_to_physaddr(eearly_pagetables_addr()), diff --git a/aarch64/src/main.rs b/aarch64/src/main.rs index 2edce89..1eab130 100644 --- a/aarch64/src/main.rs +++ b/aarch64/src/main.rs @@ -19,13 +19,13 @@ mod trap; mod uartmini; mod uartpl011; mod vm; +mod vmalloc; use crate::kmem::from_virt_to_physaddr; use crate::vm::kernel_root; -use core::ffi::c_void; use core::ptr; use port::fdt::DeviceTree; -use port::mem::PhysRange; +use port::mem::{PhysRange, VirtRange}; use port::println; use vm::PageTable; @@ -34,35 +34,23 @@ core::arch::global_asm!(include_str!("l.S")); static mut KPGTBL: PageTable = PageTable::empty(); -unsafe fn print_memory_range(name: &str, start: &*const c_void, end: &*const c_void) { - let start = start as *const _ as u64; - let end = end as *const _ as u64; - let size = end - start; +unsafe fn print_memory_range(name: &str, range: VirtRange) { + let start = range.start(); + let end = range.end(); + let size = range.size(); println!(" {name}{start:#x}..{end:#x} ({size:#x})"); } fn print_binary_sections() { - extern "C" { - static boottext: *const c_void; - static eboottext: *const c_void; - static text: *const c_void; - static etext: *const c_void; - static rodata: *const c_void; - static erodata: *const c_void; - static data: *const c_void; - static edata: *const c_void; - static bss: *const c_void; - static end: *const c_void; - } - println!("Binary sections:"); unsafe { - print_memory_range("boottext:\t", &boottext, &eboottext); - print_memory_range("text:\t\t", &text, &etext); - print_memory_range("rodata:\t", &rodata, &erodata); - print_memory_range("data:\t\t", &data, &edata); - print_memory_range("bss:\t\t", &bss, &end); - print_memory_range("total:\t", &boottext, &end); + print_memory_range("boottext:\t", kmem::boottext_virtrange()); + print_memory_range("text:\t\t", kmem::text_virtrange()); + print_memory_range("rodata:\t", kmem::rodata_virtrange()); + print_memory_range("data:\t\t", kmem::data_virtrange()); + print_memory_range("bss:\t\t", kmem::bss_virtrange()); + print_memory_range("heap:\t\t", kmem::heap_virtrange()); + print_memory_range("total:\t", kmem::total_virtrange()); } } @@ -145,6 +133,13 @@ pub extern "C" fn main9(dtb_va: usize) { println!("looping now"); + { + let test = vmalloc::alloc(1024); + println!("test alloc: {:p}", test); + let test2 = vmalloc::alloc(1024); + println!("test alloc: {:p}", test2); + } + #[allow(clippy::empty_loop)] 
loop {} } diff --git a/aarch64/src/pagealloc.rs b/aarch64/src/pagealloc.rs index f3ca378..9d8367a 100644 --- a/aarch64/src/pagealloc.rs +++ b/aarch64/src/pagealloc.rs @@ -33,7 +33,7 @@ pub fn init_page_allocator() { let mut lock = PAGE_ALLOC.lock(&node); let page_alloc = &mut *lock; - let early_pages_range = kmem::early_pages_range(); + let early_pages_range = kmem::early_pages_physrange(); if let Err(err) = page_alloc.mark_free(&early_pages_range) { panic!("Couldn't mark early pages free: range: {} err: {:?}", early_pages_range, err); } diff --git a/aarch64/src/runtime.rs b/aarch64/src/runtime.rs index aa65a36..a5740fb 100644 --- a/aarch64/src/runtime.rs +++ b/aarch64/src/runtime.rs @@ -40,9 +40,9 @@ fn oom(_layout: Layout) -> ! { panic!("oom"); } -struct FakeAlloc; +struct VmemAllocator; -unsafe impl GlobalAlloc for FakeAlloc { +unsafe impl GlobalAlloc for VmemAllocator { unsafe fn alloc(&self, _layout: Layout) -> *mut u8 { panic!("fake alloc"); } @@ -52,4 +52,4 @@ unsafe impl GlobalAlloc for FakeAlloc { } #[global_allocator] -static FAKE_ALLOCATOR: FakeAlloc = FakeAlloc {}; +static VMEM_ALLOCATOR: VmemAllocator = VmemAllocator {}; diff --git a/aarch64/src/vm.rs b/aarch64/src/vm.rs index 02c8c52..27b3a06 100644 --- a/aarch64/src/vm.rs +++ b/aarch64/src/vm.rs @@ -2,11 +2,12 @@ use crate::{ kmem::{ - ebss_addr, erodata_addr, etext_addr, from_ptr_to_physaddr, from_virt_to_physaddr, - physaddr_as_ptr_mut, physaddr_as_virt, text_addr, + from_ptr_to_physaddr, heap_virtrange, kernel_bss_physrange, kernel_data_physrange, + kernel_heap_physrange, kernel_text_physrange, physaddr_as_ptr_mut, physaddr_as_virt, }, pagealloc, registers::rpi_mmio, + vmalloc, }; use bitstruct::bitstruct; use core::fmt; @@ -468,6 +469,7 @@ fn print_pte(indent: usize, i: usize, level: Level, pte: Entry) { pub unsafe fn init(kpage_table: &mut PageTable, dtb_range: PhysRange, available_mem: PhysRange) { pagealloc::init_page_allocator(); + vmalloc::init(heap_virtrange()); // We use recursive page tables, but we have to be careful in the init call, // since the kpage_table is not currently pointed to by ttbr1_el1. 
Any @@ -485,24 +487,14 @@ pub unsafe fn init(kpage_table: &mut PageTable, dtb_range: PhysRange, available_ // TODO leave the first page unmapped to catch null pointer dereferences in unsafe code let custom_map = { - let text_range = - PhysRange(from_virt_to_physaddr(text_addr())..from_virt_to_physaddr(etext_addr())); - let data_range = PhysRange::with_len( - from_virt_to_physaddr(etext_addr()).addr(), - erodata_addr() - etext_addr(), - ); - let bss_range = PhysRange::with_len( - from_virt_to_physaddr(erodata_addr()).addr(), - ebss_addr() - erodata_addr(), - ); - let mmio_range = rpi_mmio().expect("mmio base detect failed"); let mut map = [ ("DTB", dtb_range, Entry::ro_kernel_data(), PageSize::Page4K), - ("Kernel Text", text_range, Entry::ro_kernel_text(), PageSize::Page2M), - ("Kernel Data", data_range, Entry::ro_kernel_data(), PageSize::Page2M), - ("Kernel BSS", bss_range, Entry::rw_kernel_data(), PageSize::Page2M), + ("Kernel Text", kernel_text_physrange(), Entry::ro_kernel_text(), PageSize::Page2M), + ("Kernel Data", kernel_data_physrange(), Entry::ro_kernel_data(), PageSize::Page2M), + ("Kernel BSS", kernel_bss_physrange(), Entry::rw_kernel_data(), PageSize::Page2M), + ("Kernel Heap", kernel_heap_physrange(), Entry::rw_kernel_data(), PageSize::Page2M), ("MMIO", mmio_range, Entry::ro_kernel_device(), PageSize::Page2M), ]; map.sort_by_key(|a| a.1.start()); diff --git a/aarch64/src/vmalloc.rs b/aarch64/src/vmalloc.rs new file mode 100644 index 0000000..f978f12 --- /dev/null +++ b/aarch64/src/vmalloc.rs @@ -0,0 +1,54 @@ +use core::{mem::MaybeUninit, ptr::addr_of}; + +use port::{ + mcslock::{Lock, LockNode}, + mem::VirtRange, + vmem::{Arena, Boundary}, +}; + +static VMALLOC: Lock> = Lock::new("vmalloc", None); + +static mut EARLY_TAGS_PAGE: [u8; 4096] = [0; 4096]; + +struct VmAlloc { + heap_arena: Arena, +} + +impl VmAlloc { + fn new(heap_range: VirtRange) -> Self { + let quantum = 4096; + + let early_tags_ptr = unsafe { addr_of!(EARLY_TAGS_PAGE) as usize }; + let early_tags_size = unsafe { EARLY_TAGS_PAGE.len() }; + let early_tags_range = VirtRange::with_len(early_tags_ptr, early_tags_size); + + Self { + heap_arena: Arena::new_with_static_range( + "heap", + Some(Boundary::from(heap_range)), + quantum, + None, + early_tags_range, + ), + } + } +} + +pub fn init(heap_range: VirtRange) { + let node = LockNode::new(); + let mut vmalloc = VMALLOC.lock(&node); + *vmalloc = Some({ + static mut MAYBE_VMALLOC: MaybeUninit = MaybeUninit::uninit(); + unsafe { + MAYBE_VMALLOC.write(VmAlloc::new(heap_range)); + MAYBE_VMALLOC.assume_init_mut() + } + }); +} + +pub fn alloc(size: usize) -> *mut u8 { + let node = LockNode::new(); + let mut lock = VMALLOC.lock(&node); + let vmalloc = lock.as_deref_mut().unwrap(); + vmalloc.heap_arena.alloc(size) +} diff --git a/port/src/lib.rs b/port/src/lib.rs index 8120f05..44a9e6e 100644 --- a/port/src/lib.rs +++ b/port/src/lib.rs @@ -10,3 +10,4 @@ pub mod devcons; pub mod fdt; pub mod mcslock; pub mod mem; +pub mod vmem; diff --git a/port/src/mem.rs b/port/src/mem.rs index 40154ee..92d03b1 100644 --- a/port/src/mem.rs +++ b/port/src/mem.rs @@ -32,6 +32,10 @@ impl VirtRange { pub fn end(&self) -> usize { self.0.end } + + pub fn size(&self) -> usize { + self.0.end - self.0.start + } } impl From<&RegBlock> for VirtRange { @@ -42,6 +46,13 @@ impl From<&RegBlock> for VirtRange { } } +impl fmt::Debug for VirtRange { + fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { + write!(f, "VirtRange({:#016x}..{:#016x})", self.start(), self.end())?; + Ok(()) + } +} + 
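// A minimal sketch (not authoritative) of how the pieces added in this patch fit together:
// once vm::init has seeded the heap arena via vmalloc::init, vmalloc::alloc hands out
// quantum-rounded addresses from the linker-provided heap range. The names come from this
// patch; the 1024-byte request size is arbitrary.
//
//     vmalloc::init(kmem::heap_virtrange());   // called from vm::init above
//     let p = vmalloc::alloc(1024);            // rounded up to the 4096-byte quantum
//     let q = vmalloc::alloc(1024);
//     assert!(!p.is_null() && p != q);         // distinct blocks carved from the heap arena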
#[derive(Clone, Copy, PartialEq, PartialOrd, Eq, Ord)] #[repr(transparent)] pub struct PhysAddr(pub u64); diff --git a/port/src/vmem.rs b/port/src/vmem.rs new file mode 100644 index 0000000..f7b2bd5 --- /dev/null +++ b/port/src/vmem.rs @@ -0,0 +1,894 @@ +use core::{ops::Range, ptr::null_mut, slice}; + +use crate::mem::VirtRange; + +#[cfg(not(test))] +use crate::println; + +// TODO reserve recursive area in vmem(?) +// TODO Add hashtable for allocated tags - makes it faster when freeing, given only an address. +// TODO Add support for quantum caches once we have slab allocators implemented. +// TODO Add power-of-two freelists for freed allocations. + +#[derive(Debug, PartialEq)] +pub enum BoundaryError { + ZeroSize, +} + +#[derive(Debug, PartialEq)] +pub enum AllocError { + NoSpace, + AllocationNotFound, +} + +#[cfg(test)] +type BoundaryResult = core::result::Result; + +#[derive(Clone, Copy, Debug, PartialEq)] +pub struct Boundary { + start: usize, + size: usize, +} + +impl Boundary { + #[cfg(test)] + fn new(start: usize, size: usize) -> BoundaryResult { + if size == 0 { + Err(BoundaryError::ZeroSize) + } else { + Ok(Self { start, size }) + } + } + + fn new_unchecked(start: usize, size: usize) -> Self { + Self { start, size } + } + + #[allow(dead_code)] + fn overlaps(&self, other: &Boundary) -> bool { + let boundary_end = self.start + self.size; + let tag_end = other.start + other.size; + (self.start <= other.start && boundary_end > other.start) + || (self.start < tag_end && boundary_end >= tag_end) + || (self.start <= other.start && boundary_end >= tag_end) + } + + #[allow(dead_code)] + fn end(&self) -> usize { + self.start + self.size + } +} + +impl From for Boundary { + fn from(r: VirtRange) -> Self { + Boundary::new_unchecked(r.start(), r.size()) + } +} + +impl From> for Boundary { + fn from(r: Range) -> Self { + Boundary::new_unchecked(r.start, r.end - r.start) + } +} + +#[derive(Clone, Copy, Debug, PartialEq)] +enum TagType { + Allocated, + Free, + Span, +} + +#[derive(Clone, Copy, Debug, PartialEq)] +struct Tag { + tag_type: TagType, + boundary: Boundary, +} + +impl Tag { + fn new(tag_type: TagType, boundary: Boundary) -> Self { + Self { tag_type, boundary } + } + + #[cfg(test)] + fn new_allocated(boundary: Boundary) -> Self { + Tag::new(TagType::Allocated, boundary) + } + + fn new_free(boundary: Boundary) -> Self { + Tag::new(TagType::Free, boundary) + } + + fn new_span(boundary: Boundary) -> Self { + Tag::new(TagType::Span, boundary) + } +} + +// impl fmt::Debug for Tag { +// fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { +// write!( +// f, +// "Tag({:?} {}..{} (size: {}))", +// self.tag_type, +// self.boundary.start, +// self.boundary.start + self.boundary.size, +// self.boundary.size +// )?; +// Ok(()) +// } +// } + +#[derive(Debug)] +struct TagItem { + tag: Tag, + next: *mut TagItem, + prev: *mut TagItem, +} + +impl TagItem { + #[cfg(test)] + fn new_allocated(boundary: Boundary) -> Self { + Self { tag: Tag::new_allocated(boundary), next: null_mut(), prev: null_mut() } + } +} + +/// Pool of boundary tags. Vmem uses external boundary tags. We allocate a page +/// of tags at a time, making them available via this pool. This allows us to +/// set up the pool initially with a static page, before we have any kind of +/// allocator. The pool can later be populated dynamically. 
+struct TagPool { + tags: *mut TagItem, +} + +impl TagPool { + fn new() -> Self { + Self { tags: null_mut() } + } + + fn add(&mut self, tag: &mut TagItem) { + if self.tags.is_null() { + self.tags = tag; + } else { + tag.next = self.tags; + unsafe { (*tag.next).prev = tag }; + self.tags = tag; + } + } + + fn take(&mut self, tag: Tag) -> *mut TagItem { + if let Some(tag_item) = unsafe { self.tags.as_mut() } { + self.tags = tag_item.next; + if let Some(next_tag) = unsafe { self.tags.as_mut() } { + next_tag.prev = null_mut(); + } + tag_item.next = null_mut(); + tag_item.prev = null_mut(); + tag_item.tag = tag; + tag_item as *mut TagItem + } else { + null_mut() + } + } + + #[allow(dead_code)] + fn len(&self) -> usize { + let mut n = 0; + let mut free_tag = self.tags; + while let Some(tag) = unsafe { free_tag.as_ref() } { + n += 1; + free_tag = tag.next; + } + n + } +} + +/// Ordered list of tags (by Tag::start) +/// This is a simple linked list that assumes no overlaps. +struct TagList { + tags: *mut TagItem, +} + +impl TagList { + fn new() -> Self { + Self { tags: null_mut() } + } + + fn push(&mut self, new_tag: &mut TagItem) { + if self.tags.is_null() { + self.tags = new_tag; + } else { + let mut curr_tag_item = self.tags; + while let Some(item) = unsafe { curr_tag_item.as_mut() } { + if item.tag.boundary.start > new_tag.tag.boundary.start { + // Insert before tag + if let Some(prev_tag) = unsafe { item.prev.as_mut() } { + prev_tag.next = new_tag; + } else { + // Inserting as first tag + self.tags = new_tag; + } + new_tag.next = item; + item.prev = new_tag; + return; + } + if item.next.is_null() { + // Inserting as last tag + new_tag.prev = item; + item.next = new_tag; + return; + } + curr_tag_item = item.next; + } + } + } + + /// Remove tag_item from the list. Placing tag_item onto the free list is + /// the callers responsibility. 
+ fn unlink(tag_item: &mut TagItem) { + if let Some(prev) = unsafe { tag_item.prev.as_mut() } { + prev.next = tag_item.next; + } + if let Some(next) = unsafe { tag_item.next.as_mut() } { + next.prev = tag_item.prev; + } + tag_item.next = null_mut(); + tag_item.prev = null_mut(); + } + + fn len(&self) -> usize { + let mut n = 0; + let mut curr_tag = self.tags; + while let Some(tag) = unsafe { curr_tag.as_ref() } { + n += 1; + curr_tag = tag.next; + } + n + } + + fn tags_iter(&self) -> impl Iterator + '_ { + let mut curr_tag_item = self.tags; + core::iter::from_fn(move || { + if let Some(item) = unsafe { curr_tag_item.as_ref() } { + curr_tag_item = item.next; + return Some(item.tag); + } else { + return None; + } + }) + } + + // fn add_tag(&mut self, boundary: Boundary, free_tags: &mut TagStack) -> BoundaryResult<()> { + // // Code to pop a tag + // // let tag = unsafe { + // // arena.free_tags.pop().as_mut().expect("Arena::new_with_tags no free tags") + // // }; + + // if boundary.size == 0 { + // return Err(BoundaryError::ZeroSize); + // } + + // let bstart = boundary.start; + // let bend = boundary.start + boundary.size; + + // let mut curr_tag = self.tags; + // while let Some(tag) = unsafe { curr_tag.as_ref() } { + // let tag_start = tag.boundary.start; + // let tag_end = tag_start + tag.boundary.size; + // if (bstart <= tag_start && bend > tag_start) + // || (bstart < tag_end && bend >= tag_end) + // || (bstart <= tag_start && bend >= tag_end) + // {} + // curr_tag = tag.next; + // } + + // Ok(()) + // } +} + +pub struct Arena { + _name: &'static str, + quantum: usize, + + tag_pool: TagPool, // Pool of available tags + segment_list: TagList, // List of all segments in address order +} + +impl Arena { + /// Only to be used for creation of initial heap + pub fn new_with_static_range( + name: &'static str, + initial_span: Option, + quantum: usize, + parent: Option, + static_range: VirtRange, + ) -> Self { + let tags_addr = unsafe { &mut *(static_range.start() as *mut TagItem) }; + let tags = unsafe { + slice::from_raw_parts_mut(tags_addr, static_range.size() / size_of::()) + }; + + println!( + "Arena::new_with_static_range name:{} initial_span:{:?} quantum:{:x}", + name, initial_span, quantum + ); + + Self::new_with_tags(name, initial_span, quantum, parent, tags) + } + + /// Create a new arena, assuming there is no dynamic allocation available, + /// and all free tags come from the free_tags provided. 
+ fn new_with_tags( + name: &'static str, + initial_span: Option, + quantum: usize, + _parent: Option, + free_tags: &mut [TagItem], + ) -> Self { + let mut arena = Self { + _name: name, + quantum: quantum, + segment_list: TagList::new(), + tag_pool: TagPool::new(), + }; + arena.add_tags_to_pool(free_tags); + + if let Some(span) = initial_span { + assert_eq!(span.start % quantum, 0); + assert_eq!(span.size % quantum, 0); + assert!(span.start.checked_add(span.size).is_some()); + arena.add_free_span(span); + } + + arena + } + + fn add_free_span(&mut self, boundary: Boundary) { + self.segment_list.push(unsafe { + self.tag_pool.take(Tag::new_span(boundary)).as_mut().expect("no free tags") + }); + self.segment_list.push(unsafe { + self.tag_pool.take(Tag::new_free(boundary)).as_mut().expect("no free tags") + }); + } + + fn add_tags_to_pool(&mut self, tags: &mut [TagItem]) { + for tag in tags { + tag.next = null_mut(); + tag.prev = null_mut(); + self.tag_pool.add(tag); + } + } + + pub fn alloc(&mut self, size: usize) -> *mut u8 { + let boundary = self.alloc_segment(size); + if boundary.is_ok() { + boundary.unwrap().start as *mut u8 + } else { + null_mut() + } + } + + pub fn free(&mut self, addr: *mut u8) { + let _ = self.free_segment(addr as usize); + } + + /// Allocate a segment, returned as a boundary + fn alloc_segment(&mut self, size: usize) -> Result { + println!("alloc_segment size: {}", size); + + // Round size up to a multiple of quantum + let size = { + let rem = size % self.quantum; + if rem == 0 { + size + } else { + size + (self.quantum - rem) + } + }; + + // Find the first free tag that's large enough + let mut curr_item = self.segment_list.tags; + while let Some(item) = unsafe { curr_item.as_mut() } { + if item.tag.tag_type == TagType::Free && item.tag.boundary.size >= size { + // Mark this tag as allocated, and if there's any left over space, + // create and insert a new tag + item.tag.tag_type = TagType::Allocated; + if item.tag.boundary.size > size { + // Work out the size of the new free item, and change the size + // of the current, now allocated, item + let remainder = item.tag.boundary.size - size; + item.tag.boundary.size = size; + + let new_tag = Tag::new_free(Boundary::new_unchecked( + item.tag.boundary.start + size, + remainder, + )); + let new_item = + unsafe { self.tag_pool.take(new_tag).as_mut().expect("no free tags") }; + + // Insert new_item after item + new_item.next = item.next; + new_item.prev = item; + item.next = new_item; + if !new_item.next.is_null() { + unsafe { (*new_item.next).prev = new_item }; + } + } + return Ok(item.tag.boundary); + } + curr_item = item.next; + } + Err(AllocError::NoSpace) + } + + // Free addr. We don't need to know size because we don't merge allocations. 
+ // (We only merge freed segments) + // TODO Error on precondition fail + fn free_segment(&mut self, addr: usize) -> Result<(), AllocError> { + // Need to manually scan the used tags + let mut curr_item = self.segment_list.tags; + while let Some(item) = unsafe { curr_item.as_mut() } { + if item.tag.boundary.start == addr && item.tag.tag_type == TagType::Allocated { + break; + } + curr_item = item.next; + } + + if curr_item.is_null() { + return Err(AllocError::AllocationNotFound); + } + + let mut curr_tag: &mut TagItem = unsafe { curr_item.as_mut() }.unwrap(); + + // Found tag to free + let prev_type = unsafe { curr_tag.prev.as_ref() }.map(|t| t.tag.tag_type); + let next_type = unsafe { curr_tag.next.as_ref() }.map(|t| t.tag.tag_type); + + match (prev_type, next_type) { + (Some(TagType::Allocated), Some(TagType::Allocated)) + | (Some(TagType::Span), Some(TagType::Span)) + | (Some(TagType::Span), Some(TagType::Allocated)) + | (Some(TagType::Allocated), Some(TagType::Span)) + | (Some(TagType::Span), None) + | (Some(TagType::Allocated), None) => { + // No frees on either side + // -> Change curr_tag to free + curr_tag.tag.tag_type = TagType::Free; + } + (Some(TagType::Span), Some(TagType::Free)) + | (Some(TagType::Allocated), Some(TagType::Free)) => { + // Prev non-free, next free + // Change next tag start to merge with curr_tag, release curr_tag + let next = unsafe { curr_tag.next.as_mut() }.unwrap(); + next.tag.boundary.start = curr_tag.tag.boundary.start; + next.tag.boundary.size += curr_tag.tag.boundary.size; + TagList::unlink(&mut curr_tag); + self.tag_pool.add(&mut curr_tag); + } + (Some(TagType::Free), None) + | (Some(TagType::Free), Some(TagType::Span)) + | (Some(TagType::Free), Some(TagType::Allocated)) => { + // Prev free, next non-free + // Change prev tag size to merge with curr_tag, release curr_tag + let prev = unsafe { curr_tag.prev.as_mut() }.unwrap(); + prev.tag.boundary.size += curr_tag.tag.boundary.size; + TagList::unlink(&mut curr_tag); + self.tag_pool.add(&mut curr_tag); + } + (Some(TagType::Free), Some(TagType::Free)) => { + // Prev and next both free + // Change prev size to merge with both curr_tag and next, release curr_tag + let prev = unsafe { curr_tag.prev.as_mut() }.unwrap(); + let mut next = unsafe { curr_tag.next.as_mut() }.unwrap(); + prev.tag.boundary.size += curr_tag.tag.boundary.size + next.tag.boundary.size; + TagList::unlink(&mut curr_tag); + TagList::unlink(&mut next); + self.tag_pool.add(&mut curr_tag); + self.tag_pool.add(&mut next); + } + (None, None) + | (None, Some(TagType::Span)) + | (None, Some(TagType::Allocated)) + | (None, Some(TagType::Free)) => { + self.assert_tags_are_consistent(); + panic!("Unexpected tags when freeing"); + } + } + + Ok(()) + } + + fn tags_iter(&self) -> impl Iterator + '_ { + self.segment_list.tags_iter() + } + + /// Checks that all invariants are correct. 
+ fn assert_tags_are_consistent(&self) { + // There must be at least 2 tags + debug_assert!(self.segment_list.len() >= 2); + + // Tags must be in order, without gaps + let mut last_tag: Option = None; + let mut last_span: Option = None; + let mut last_span_total = 0; + for (i, tag) in self.tags_iter().enumerate() { + debug_assert!(tag.boundary.size > 0); + + if i == 0 { + debug_assert_eq!(tag.tag_type, TagType::Span); + debug_assert!(last_tag.is_none()); + debug_assert!(last_span.is_none()); + debug_assert_eq!(last_span_total, 0); + } else { + debug_assert!(last_tag.is_some()); + debug_assert!(last_span.is_some()); + + // Tags should be ordered + let last_tag = last_tag.unwrap(); + let out_of_order = (last_tag.tag_type == TagType::Span + && tag.boundary.start >= last_tag.boundary.start) + || (last_tag.tag_type != TagType::Span + && tag.boundary.start > last_tag.boundary.start); + debug_assert!( + out_of_order, + "Tags out of order: tag{}: {:?}, tag{}: {:?}", + i - 1, + last_tag, + i, + tag, + ); + } + + match tag.tag_type { + TagType::Span => { + // Spans must not overlap + if last_span.is_some() { + debug_assert_eq!(last_span_total, last_span.unwrap().boundary.size); + } + last_span = Some(tag); + } + TagType::Allocated | TagType::Free => { + last_span_total += tag.boundary.size; + // First tag after span should have same start as span + if last_tag.is_some_and(|t| t.tag_type == TagType::Span) { + debug_assert_eq!(tag.boundary.start, last_tag.unwrap().boundary.start); + } + } + } + last_tag = Some(tag); + } + } +} + +#[cfg(test)] +mod tests { + + use super::*; + + #[test] + fn ensure_sizes() { + assert_eq!(size_of::(), 24); + assert_eq!(size_of::(), 40); + } + + #[test] + fn test_boundary() { + assert!(Boundary::new(10, 1).is_ok()); + assert_eq!(Boundary::new(10, 0), BoundaryResult::Err(BoundaryError::ZeroSize)); + + // Overlap left + assert!(!Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(2, 5).unwrap())); + assert!(!Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(0, 10).unwrap())); + assert!(Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(0, 11).unwrap())); + + // Overlap right + assert!(!Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(25, 5).unwrap())); + assert!(!Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(20, 10).unwrap())); + assert!(Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(19, 1).unwrap())); + + // Exact match + assert!(Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(10, 10).unwrap())); + + // Inside + assert!(Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(15, 1).unwrap())); + assert!(Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(10, 1).unwrap())); + assert!(Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(19, 1).unwrap())); + + // Outside left + assert!(!Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(0, 1).unwrap())); + assert!(!Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(0, 10).unwrap())); + + // Outside right + assert!(!Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(20, 1).unwrap())); + assert!(!Boundary::new(10, 10).unwrap().overlaps(&Boundary::new(25, 1).unwrap())); + } + + // Page4K would normally be in the arch crate, but we define something + // similar here for testing. 
+ #[repr(C, align(4096))] + #[derive(Clone, Copy)] + pub struct Page4K([u8; 4096]); + + #[test] + fn test_tagstack() { + let mut page = Page4K([0; 4096]); + const NUM_TAGS: usize = size_of::() / size_of::(); + let tags = unsafe { &mut *(&mut page as *mut Page4K as *mut [TagItem; NUM_TAGS]) }; + let mut tag_stack = TagPool::new(); + + assert_eq!(tag_stack.len(), 0); + for tag in tags { + tag_stack.add(tag); + } + assert_eq!(tag_stack.len(), NUM_TAGS); + } + + #[test] + fn test_taglist() { + let mut list = TagList::new(); + assert_eq!(list.len(), 0); + assert_eq!(list.tags_iter().collect::>(), []); + + let mut tag1 = TagItem::new_allocated(Boundary::new(100, 100).unwrap()); + list.push(&mut tag1); + assert_eq!(list.len(), 1); + assert_eq!( + list.tags_iter().collect::>(), + [Tag::new_allocated(Boundary::new(100, 100).unwrap())] + ); + + // Insert new at end + let mut tag2 = TagItem::new_allocated(Boundary::new(500, 100).unwrap()); + list.push(&mut tag2); + assert_eq!(list.len(), 2); + assert_eq!( + list.tags_iter().collect::>(), + [ + Tag::new_allocated(Boundary::new(100, 100).unwrap()), + Tag::new_allocated(Boundary::new(500, 100).unwrap()) + ] + ); + + // Insert new at start + let mut tag3 = TagItem::new_allocated(Boundary::new(0, 100).unwrap()); + list.push(&mut tag3); + assert_eq!(list.len(), 3); + assert_eq!( + list.tags_iter().collect::>(), + [ + Tag::new_allocated(Boundary::new(0, 100).unwrap()), + Tag::new_allocated(Boundary::new(100, 100).unwrap()), + Tag::new_allocated(Boundary::new(500, 100).unwrap()) + ] + ); + + // Insert new in middle + let mut tag4 = TagItem::new_allocated(Boundary::new(200, 100).unwrap()); + list.push(&mut tag4); + assert_eq!(list.len(), 4); + assert_eq!( + list.tags_iter().collect::>(), + [ + Tag::new_allocated(Boundary::new(0, 100).unwrap()), + Tag::new_allocated(Boundary::new(100, 100).unwrap()), + Tag::new_allocated(Boundary::new(200, 100).unwrap()), + Tag::new_allocated(Boundary::new(500, 100).unwrap()) + ] + ); + } + + fn create_arena_with_static_tags( + name: &'static str, + initial_span: Option, + quantum: usize, + _parent_arena: Option<&mut Arena>, + ) -> Arena { + let mut page = Page4K([0; 4096]); + const NUM_TAGS: usize = size_of::() / size_of::(); + let tags = unsafe { &mut *(&mut page as *mut Page4K as *mut [TagItem; NUM_TAGS]) }; + Arena::new_with_tags(name, initial_span, quantum, None, tags) + } + + fn assert_tags_eq(arena: &Arena, expected: &[Tag]) { + arena.assert_tags_are_consistent(); + let actual_tags = arena.tags_iter().collect::>(); + assert_eq!(actual_tags, expected, "arena tag mismatch"); + } + + #[test] + fn test_arena_create() { + let arena = create_arena_with_static_tags( + "test", + Some(Boundary::new_unchecked(4096, 4096 * 20)), + 4096, + None, + ); + assert_eq!(arena.tag_pool.len(), 100); + + assert_tags_eq( + &arena, + &[ + Tag::new_span(Boundary::new(4096, 4096 * 20).unwrap()), + Tag::new_free(Boundary::new(4096, 4096 * 20).unwrap()), + ], + ); + } + + #[test] + fn test_arena_alloc() { + let mut arena = create_arena_with_static_tags( + "test", + Some(Boundary::new_unchecked(4096, 4096 * 20)), + 4096, + None, + ); + + arena.alloc(4096 * 2); + + assert_tags_eq( + &arena, + &[ + Tag::new_span(Boundary::new(4096, 4096 * 20).unwrap()), + Tag::new_allocated(Boundary::new(4096, 4096 * 2).unwrap()), + Tag::new_free(Boundary::new(4096 * 3, 4096 * 18).unwrap()), + ], + ); + } + + #[test] + fn test_arena_alloc_rounds_if_wrong_granule() { + let mut arena = create_arena_with_static_tags( + "test", + Some(Boundary::new_unchecked(4096, 4096 * 
20)), + 4096, + None, + ); + let a = arena.alloc_segment(1024); + assert_eq!(a.unwrap().size, 4096); + } + + #[test] + fn test_arena_free() { + let mut arena = create_arena_with_static_tags( + "test", + Some(Boundary::new_unchecked(4096, 4096 * 20)), + 4096, + None, + ); + assert_eq!(arena.tag_pool.len(), 100); + + // We need to test each case where we're freeing by scanning the tags linearly. + // To do this we run through each case (comments from the `free` function) + + // Prev and next both non-free + let a1 = arena.alloc(4096); + let a2 = arena.alloc(4096); + assert_eq!(arena.tag_pool.len(), 98); + assert_tags_eq( + &arena, + &[ + Tag::new(TagType::Span, Boundary::new(4096, 4096 * 20).unwrap()), + Tag::new(TagType::Allocated, Boundary::new(4096, 4096).unwrap()), + Tag::new(TagType::Allocated, Boundary::new(4096 * 2, 4096).unwrap()), + Tag::new(TagType::Free, Boundary::new(4096 * 3, 4096 * 18).unwrap()), + ], + ); + arena.free(a1); + assert_eq!(arena.tag_pool.len(), 98); + assert_tags_eq( + &arena, + &[ + Tag::new(TagType::Span, Boundary::new(4096, 4096 * 20).unwrap()), + Tag::new(TagType::Free, Boundary::new(4096, 4096).unwrap()), + Tag::new(TagType::Allocated, Boundary::new(4096 * 2, 4096).unwrap()), + Tag::new(TagType::Free, Boundary::new(4096 * 3, 4096 * 18).unwrap()), + ], + ); + + // Prev and next both free + arena.free(a2); + assert_eq!(arena.tag_pool.len(), 100); + assert_tags_eq( + &arena, + &[ + Tag::new(TagType::Span, Boundary::new(4096, 4096 * 20).unwrap()), + Tag::new(TagType::Free, Boundary::new(4096, 4096 * 20).unwrap()), + ], + ); + + // Prev free, next non-free + let a1 = arena.alloc(4096); + let a2 = arena.alloc(4096); + let a3 = arena.alloc(4096); + arena.free(a1); + assert_eq!(arena.tag_pool.len(), 97); + assert_tags_eq( + &arena, + &[ + Tag::new(TagType::Span, Boundary::new(4096, 4096 * 20).unwrap()), + Tag::new(TagType::Free, Boundary::new(4096, 4096).unwrap()), + Tag::new(TagType::Allocated, Boundary::new(4096 * 2, 4096).unwrap()), + Tag::new(TagType::Allocated, Boundary::new(4096 * 3, 4096).unwrap()), + Tag::new(TagType::Free, Boundary::new(4096 * 4, 4096 * 17).unwrap()), + ], + ); + arena.free(a2); + assert_eq!(arena.tag_pool.len(), 98); + assert_tags_eq( + &arena, + &[ + Tag::new(TagType::Span, Boundary::new(4096, 4096 * 20).unwrap()), + Tag::new(TagType::Free, Boundary::new(4096, 4096 * 2).unwrap()), + Tag::new(TagType::Allocated, Boundary::new(4096 * 3, 4096).unwrap()), + Tag::new(TagType::Free, Boundary::new(4096 * 4, 4096 * 17).unwrap()), + ], + ); + + // Prev non-free, next free + arena.free(a3); + let a1 = arena.alloc(4096); + assert_eq!(arena.tag_pool.len(), 99); + assert_tags_eq( + &arena, + &[ + Tag::new(TagType::Span, Boundary::new(4096, 4096 * 20).unwrap()), + Tag::new(TagType::Allocated, Boundary::new(4096, 4096).unwrap()), + Tag::new(TagType::Free, Boundary::new(4096 * 2, 4096 * 19).unwrap()), + ], + ); + arena.free(a1); + assert_eq!(arena.tag_pool.len(), 100); + assert_tags_eq( + &arena, + &[ + Tag::new(TagType::Span, Boundary::new(4096, 4096 * 20).unwrap()), + Tag::new(TagType::Free, Boundary::new(4096, 4096 * 20).unwrap()), + ], + ); + } + + #[test] + fn test_arena_nesting() { + // Create a page of tags we can share amongst the first arenas + let mut page = Page4K([0; 4096]); + const NUM_TAGS: usize = size_of::() / size_of::(); + let all_tags = unsafe { &mut *(&mut page as *mut Page4K as *mut [TagItem; NUM_TAGS]) }; + + const NUM_ARENAS: usize = 4; + const NUM_TAGS_PER_ARENA: usize = NUM_TAGS / NUM_ARENAS; + let (arena1_tags, all_tags) = 
all_tags.split_at_mut(NUM_TAGS_PER_ARENA); + let (arena2_tags, all_tags) = all_tags.split_at_mut(NUM_TAGS_PER_ARENA); + let (arena3a_tags, all_tags) = all_tags.split_at_mut(NUM_TAGS_PER_ARENA); + let (arena3b_tags, _) = all_tags.split_at_mut(NUM_TAGS_PER_ARENA); + + let mut arena1 = Arena::new_with_tags( + "arena1", + Some(Boundary::new_unchecked(4096, 4096 * 20)), + 4096, + None, + arena1_tags, + ); + + // Import all + let mut arena2 = Arena::new_with_tags("arena2", None, 4096, None, arena2_tags); + + // Import first half + let mut arena3a = Arena::new_with_tags( + "arena3a", + Some(Boundary::from(4096..4096 * 10)), + 4096, + None, + arena3a_tags, + ); + + // Import second half + let mut arena3b = Arena::new_with_tags( + "arena3b", + Some(Boundary::from(4096 * 10..4096 * 21)), + 4096, + None, + arena3b_tags, + ); + + // Let's do some allocations + } +} diff --git a/rust-toolchain.toml b/rust-toolchain.toml index edc3dd8..cdd3635 100644 --- a/rust-toolchain.toml +++ b/rust-toolchain.toml @@ -1,5 +1,5 @@ [toolchain] -channel = "nightly-2024-06-08" +channel = "nightly-2024-07-01" components = [ "rustfmt", "rust-src", "clippy", "llvm-tools" ] targets = [ "aarch64-unknown-none", From 9fc921d1111abb004d566b3e7ed6d51bcfa8e501 Mon Sep 17 00:00:00 2001 From: Graham MacDonald Date: Sat, 3 Aug 2024 15:02:52 +0100 Subject: [PATCH 2/8] Add bump alloc, restructure init code Signed-off-by: Graham MacDonald --- aarch64/src/init.rs | 143 +++++++++++++++++++++++++++ aarch64/src/main.rs | 126 +++--------------------- aarch64/src/runtime.rs | 46 +++++++-- aarch64/src/vm.rs | 6 +- aarch64/src/vmalloc.rs | 58 ++++++++--- port/src/bumpalloc.rs | 97 ++++++++++++++++++ port/src/lib.rs | 1 + port/src/mem.rs | 8 +- port/src/vmem.rs | 219 ++++++++++++++++++++++++----------------- rust-toolchain.toml | 6 +- 10 files changed, 477 insertions(+), 233 deletions(-) create mode 100644 aarch64/src/init.rs create mode 100644 port/src/bumpalloc.rs diff --git a/aarch64/src/init.rs b/aarch64/src/init.rs new file mode 100644 index 0000000..d8f74cd --- /dev/null +++ b/aarch64/src/init.rs @@ -0,0 +1,143 @@ +use crate::devcons; +use crate::kmem; +use crate::kmem::from_virt_to_physaddr; +use crate::kmem::heap_virtrange; +use crate::mailbox; +use crate::pagealloc; +use crate::registers; +use crate::runtime; +use crate::trap; +use crate::vm; +use crate::vm::kernel_root; +use crate::vm::PageTable; +use crate::vmalloc; +use alloc::boxed::Box; +use core::ptr; +use port::fdt::DeviceTree; +use port::mem::{PhysRange, VirtRange}; +use port::println; + +static mut KPGTBL: PageTable = PageTable::empty(); + +unsafe fn print_memory_range(name: &str, range: VirtRange) { + let start = range.start(); + let end = range.end(); + let size = range.size(); + println!(" {name}{start:#x}..{end:#x} ({size:#x})"); +} + +fn print_binary_sections() { + println!("Binary sections:"); + unsafe { + print_memory_range("boottext:\t", kmem::boottext_virtrange()); + print_memory_range("text:\t\t", kmem::text_virtrange()); + print_memory_range("rodata:\t", kmem::rodata_virtrange()); + print_memory_range("data:\t\t", kmem::data_virtrange()); + print_memory_range("bss:\t\t", kmem::bss_virtrange()); + print_memory_range("heap:\t\t", kmem::heap_virtrange()); + print_memory_range("total:\t", kmem::total_virtrange()); + } +} + +fn print_physical_memory_info() { + println!("Physical memory map:"); + let arm_mem = mailbox::get_arm_memory(); + println!(" Memory:\t{arm_mem} ({:#x})", arm_mem.size()); + let vc_mem = mailbox::get_vc_memory(); + println!(" Video:\t{vc_mem} 
({:#x})", vc_mem.size()); +} + +fn print_memory_info() { + println!("Memory usage:"); + let (used, total) = pagealloc::usage_bytes(); + println!(" Used:\t\t{used:#016x}"); + println!(" Total:\t{total:#016x}"); +} + +// https://github.com/raspberrypi/documentation/blob/develop/documentation/asciidoc/computers/raspberry-pi/revision-codes.adoc +fn print_pi_name(board_revision: u32) { + let name = match board_revision { + 0xa21041 => "Raspberry Pi 2B", + 0xa02082 => "Raspberry Pi 3B", + 0xb03115 => "Raspberry Pi 4B", + 0xa220a0 => "Raspberry Compute Module 3", + _ => "Unrecognised", + }; + println!(" Board Name:\t{name}"); +} + +fn print_board_info() { + println!("Board information:"); + let board_revision = mailbox::get_board_revision(); + print_pi_name(board_revision); + println!(" Board Rev:\t{board_revision:#010x}"); + let model = mailbox::get_board_model(); + println!(" Board Model:\t{model:#010x}"); + let serial = mailbox::get_board_serial(); + println!(" Serial Num:\t{serial:#010x}"); + let mailbox::MacAddress { a, b, c, d, e, f } = mailbox::get_board_macaddr(); + println!(" MAC Address:\t{a:02x}:{b:02x}:{c:02x}:{d:02x}:{e:02x}:{f:02x}"); + let fw_revision = mailbox::get_firmware_revision(); + println!(" Firmware Rev:\t{fw_revision:#010x}"); +} + +/// This function is concerned with preparing the system to the point where an +/// allocator can be set up and allocation is available. We can't assume +/// there's any allocator available when executing this function. +fn init_pre_allocator(dtb_va: usize) { + trap::init(); + + // Parse the DTB before we set up memory so we can correctly map it + let dt = unsafe { DeviceTree::from_usize(dtb_va).unwrap() }; + + // Set up uart so we can log as early as possible + mailbox::init(&dt); + devcons::init(&dt); + + println!(); + println!("r9 from the Internet"); + println!("DTB found at: {:#x}", dtb_va); + println!("midr_el1: {:?}", registers::MidrEl1::read()); + + print_binary_sections(); + print_physical_memory_info(); + print_board_info(); + + // Map address space accurately using rust VM code to manage page tables + unsafe { + let dtb_range = PhysRange::with_len(from_virt_to_physaddr(dtb_va).addr(), dt.size()); + vm::init(&mut *ptr::addr_of_mut!(KPGTBL), dtb_range, mailbox::get_arm_memory()); + vm::switch(&*ptr::addr_of!(KPGTBL)); + } +} + +pub fn init(dtb_va: usize) { + init_pre_allocator(dtb_va); + + // From this point we can use the global allocator. Initially it uses a + // bump allocator that makes permanent allocations. This can be used to + // create the more complex vmem allocator. Once the vmem allocator is + // available, we switch to that. 
+ runtime::enable_bump_allocator(); + + vmalloc::init(heap_virtrange()); + //runtime::enable_vmem_allocator(); + + let _b = Box::new("ddododo"); + + print_memory_info(); + + kernel_root().print_recursive_tables(); + + println!("looping now"); + + { + let test = vmalloc::alloc(1024); + println!("test alloc: {:p}", test); + let test2 = vmalloc::alloc(1024); + println!("test alloc: {:p}", test2); + } + + #[allow(clippy::empty_loop)] + loop {} +} diff --git a/aarch64/src/main.rs b/aarch64/src/main.rs index 1eab130..3249950 100644 --- a/aarch64/src/main.rs +++ b/aarch64/src/main.rs @@ -4,11 +4,19 @@ #![cfg_attr(not(test), no_main)] #![feature(alloc_error_handler)] #![feature(asm_const)] +#![feature(const_refs_to_static)] #![feature(core_intrinsics)] #![feature(strict_provenance)] +#![feature(sync_unsafe_cell)] #![forbid(unsafe_op_in_unsafe_fn)] +/// Keep this file as sparse as possible for two reasons: +/// 1. We keep the rust main weirdness isolated +/// 2. rust-analyzer gets confused about cfgs and thinks none of this code is +/// enabled and is therefore greyed out in VS Code, so let's move the bulk +/// of the code elsewhere. mod devcons; +mod init; mod io; mod kmem; mod mailbox; @@ -21,126 +29,18 @@ mod uartpl011; mod vm; mod vmalloc; -use crate::kmem::from_virt_to_physaddr; -use crate::vm::kernel_root; -use core::ptr; -use port::fdt::DeviceTree; -use port::mem::{PhysRange, VirtRange}; -use port::println; -use vm::PageTable; +extern crate alloc; + +use crate::init::init; #[cfg(not(test))] core::arch::global_asm!(include_str!("l.S")); -static mut KPGTBL: PageTable = PageTable::empty(); - -unsafe fn print_memory_range(name: &str, range: VirtRange) { - let start = range.start(); - let end = range.end(); - let size = range.size(); - println!(" {name}{start:#x}..{end:#x} ({size:#x})"); -} - -fn print_binary_sections() { - println!("Binary sections:"); - unsafe { - print_memory_range("boottext:\t", kmem::boottext_virtrange()); - print_memory_range("text:\t\t", kmem::text_virtrange()); - print_memory_range("rodata:\t", kmem::rodata_virtrange()); - print_memory_range("data:\t\t", kmem::data_virtrange()); - print_memory_range("bss:\t\t", kmem::bss_virtrange()); - print_memory_range("heap:\t\t", kmem::heap_virtrange()); - print_memory_range("total:\t", kmem::total_virtrange()); - } -} - -fn print_physical_memory_info() { - println!("Physical memory map:"); - let arm_mem = mailbox::get_arm_memory(); - println!(" Memory:\t{arm_mem} ({:#x})", arm_mem.size()); - let vc_mem = mailbox::get_vc_memory(); - println!(" Video:\t{vc_mem} ({:#x})", vc_mem.size()); -} - -fn print_memory_info() { - println!("Memory usage:"); - let (used, total) = pagealloc::usage_bytes(); - println!(" Used:\t\t{used:#016x}"); - println!(" Total:\t{total:#016x}"); -} - -// https://github.com/raspberrypi/documentation/blob/develop/documentation/asciidoc/computers/raspberry-pi/revision-codes.adoc -fn print_pi_name(board_revision: u32) { - let name = match board_revision { - 0xa21041 => "Raspberry Pi 2B", - 0xa02082 => "Raspberry Pi 3B", - 0xb03115 => "Raspberry Pi 4B", - 0xa220a0 => "Raspberry Compute Module 3", - _ => "Unrecognised", - }; - println!(" Board Name:\t{name}"); -} - -fn print_board_info() { - println!("Board information:"); - let board_revision = mailbox::get_board_revision(); - print_pi_name(board_revision); - println!(" Board Rev:\t{board_revision:#010x}"); - let model = mailbox::get_board_model(); - println!(" Board Model:\t{model:#010x}"); - let serial = mailbox::get_board_serial(); - println!(" Serial 
Num:\t{serial:#010x}"); - let mailbox::MacAddress { a, b, c, d, e, f } = mailbox::get_board_macaddr(); - println!(" MAC Address:\t{a:02x}:{b:02x}:{c:02x}:{d:02x}:{e:02x}:{f:02x}"); - let fw_revision = mailbox::get_firmware_revision(); - println!(" Firmware Rev:\t{fw_revision:#010x}"); -} - /// dtb_va is the virtual address of the DTB structure. The physical address is /// assumed to be dtb_va-KZERO. #[no_mangle] pub extern "C" fn main9(dtb_va: usize) { - trap::init(); - - // Parse the DTB before we set up memory so we can correctly map it - let dt = unsafe { DeviceTree::from_usize(dtb_va).unwrap() }; - - // Set up uart so we can log as early as possible - mailbox::init(&dt); - devcons::init(&dt); - - println!(); - println!("r9 from the Internet"); - println!("DTB found at: {:#x}", dtb_va); - println!("midr_el1: {:?}", registers::MidrEl1::read()); - - print_binary_sections(); - print_physical_memory_info(); - print_board_info(); - - // Map address space accurately using rust VM code to manage page tables - unsafe { - let dtb_range = PhysRange::with_len(from_virt_to_physaddr(dtb_va).addr(), dt.size()); - vm::init(&mut *ptr::addr_of_mut!(KPGTBL), dtb_range, mailbox::get_arm_memory()); - vm::switch(&*ptr::addr_of!(KPGTBL)); - } - - // From this point we can use the global allocator - - print_memory_info(); - - kernel_root().print_recursive_tables(); - - println!("looping now"); - - { - let test = vmalloc::alloc(1024); - println!("test alloc: {:p}", test); - let test2 = vmalloc::alloc(1024); - println!("test alloc: {:p}", test2); - } - - #[allow(clippy::empty_loop)] - loop {} + init(dtb_va); } + mod runtime; diff --git a/aarch64/src/runtime.rs b/aarch64/src/runtime.rs index a5740fb..efc3c57 100644 --- a/aarch64/src/runtime.rs +++ b/aarch64/src/runtime.rs @@ -8,8 +8,11 @@ use crate::uartmini::MiniUart; use alloc::alloc::{GlobalAlloc, Layout}; use core::fmt::Write; use core::panic::PanicInfo; +use core::sync::atomic::{AtomicU8, Ordering::Relaxed}; +use num_enum::{FromPrimitive, IntoPrimitive}; +use port::bumpalloc::Bump; use port::devcons::PanicConsole; -use port::mem::VirtRange; +use port::mem::{VirtRange, PAGE_SIZE_4K}; // TODO // - Add qemu integration test @@ -40,16 +43,43 @@ fn oom(_layout: Layout) -> ! { panic!("oom"); } -struct VmemAllocator; +#[derive(Debug, IntoPrimitive, FromPrimitive)] +#[repr(u8)] +enum AllocatorType { + #[num_enum(default)] + None = 0, + Bump, +} + +/// A simple wrapper that allows the allocator to be changed at runtime. 
+#[repr(C, align(4096))] +struct Allocator { + bump_alloc: Bump, + enabled_allocator: AtomicU8, +} -unsafe impl GlobalAlloc for VmemAllocator { - unsafe fn alloc(&self, _layout: Layout) -> *mut u8 { - panic!("fake alloc"); +pub fn enable_bump_allocator() { + ALLOCATOR.enabled_allocator.store(AllocatorType::Bump as u8, Relaxed); +} + +unsafe impl GlobalAlloc for Allocator { + unsafe fn alloc(&self, layout: Layout) -> *mut u8 { + match AllocatorType::try_from(self.enabled_allocator.load(Relaxed)) { + Ok(AllocatorType::None) | Err(_) => panic!("no allocator available for alloc"), + Ok(AllocatorType::Bump) => unsafe { self.bump_alloc.alloc(layout) }, + } } - unsafe fn dealloc(&self, _ptr: *mut u8, _layout: Layout) { - panic!("fake dealloc"); + + unsafe fn dealloc(&self, ptr: *mut u8, layout: Layout) { + match AllocatorType::try_from(self.enabled_allocator.load(Relaxed)) { + Ok(AllocatorType::None) | Err(_) => panic!("no allocator available for dealloc"), + Ok(AllocatorType::Bump) => unsafe { self.bump_alloc.dealloc(ptr, layout) }, + } } } #[global_allocator] -static VMEM_ALLOCATOR: VmemAllocator = VmemAllocator {}; +static ALLOCATOR: Allocator = Allocator { + bump_alloc: Bump::new(0), + enabled_allocator: AtomicU8::new(AllocatorType::None as u8), +}; diff --git a/aarch64/src/vm.rs b/aarch64/src/vm.rs index 27b3a06..6619d7f 100644 --- a/aarch64/src/vm.rs +++ b/aarch64/src/vm.rs @@ -2,12 +2,11 @@ use crate::{ kmem::{ - from_ptr_to_physaddr, heap_virtrange, kernel_bss_physrange, kernel_data_physrange, - kernel_heap_physrange, kernel_text_physrange, physaddr_as_ptr_mut, physaddr_as_virt, + from_ptr_to_physaddr, kernel_bss_physrange, kernel_data_physrange, kernel_heap_physrange, + kernel_text_physrange, physaddr_as_ptr_mut, physaddr_as_virt, }, pagealloc, registers::rpi_mmio, - vmalloc, }; use bitstruct::bitstruct; use core::fmt; @@ -469,7 +468,6 @@ fn print_pte(indent: usize, i: usize, level: Level, pte: Entry) { pub unsafe fn init(kpage_table: &mut PageTable, dtb_range: PhysRange, available_mem: PhysRange) { pagealloc::init_page_allocator(); - vmalloc::init(heap_virtrange()); // We use recursive page tables, but we have to be careful in the init call, // since the kpage_table is not currently pointed to by ttbr1_el1. Any diff --git a/aarch64/src/vmalloc.rs b/aarch64/src/vmalloc.rs index f978f12..0577dd7 100644 --- a/aarch64/src/vmalloc.rs +++ b/aarch64/src/vmalloc.rs @@ -2,34 +2,66 @@ use core::{mem::MaybeUninit, ptr::addr_of}; use port::{ mcslock::{Lock, LockNode}, - mem::VirtRange, - vmem::{Arena, Boundary}, + mem::{VirtRange, PAGE_SIZE_4K}, + vmem::{Allocator, Arena, Boundary}, }; +// TODO replace with some sort of OnceLock? We need this to be dynamically created, +// but we're assuming VmAlloc is Sync. static VMALLOC: Lock> = Lock::new("vmalloc", None); +// The core arenas are statically allocated. They cannot be created in const +// functions, so the we declare them as MaybeUninit before intialising and +// referening them from VmAlloc, from where they can be used in the global allocator. +//static mut MAYBE_HEAP_ARENA: MaybeUninit = MaybeUninit::uninit(); + static mut EARLY_TAGS_PAGE: [u8; 4096] = [0; 4096]; struct VmAlloc { heap_arena: Arena, + //heap_arena: Lock>, + // heap_arena: Lock>, + // va_arena: Lock>, } impl VmAlloc { fn new(heap_range: VirtRange) -> Self { - let quantum = 4096; + // Heap_arena is the lowest level arena. We pass an address range from which + // it can allocate a block of tags to build the initial structures. 
+ // let heap_arena = unsafe { + // let early_tags_ptr = addr_of!(EARLY_TAGS_PAGE) as usize; + // let early_tags_size = EARLY_TAGS_PAGE.len(); + // let early_tags_range = VirtRange::with_len(early_tags_ptr, early_tags_size); + + // MAYBE_HEAP_ARENA.write(Arena::new_with_static_range( + // "heap", + // Some(Boundary::from(heap_range)), + // PAGE_SIZE_4K, + // early_tags_range, + // )); + // MAYBE_HEAP_ARENA.assume_init_mut() + // }; - let early_tags_ptr = unsafe { addr_of!(EARLY_TAGS_PAGE) as usize }; + let early_tags_ptr = addr_of!(EARLY_TAGS_PAGE) as usize; let early_tags_size = unsafe { EARLY_TAGS_PAGE.len() }; let early_tags_range = VirtRange::with_len(early_tags_ptr, early_tags_size); + let heap_arena = Arena::new_with_static_range( + "heap", + Some(Boundary::from(heap_range)), + PAGE_SIZE_4K, + early_tags_range, + ); + + // va_arena imports from heap_arena, so can use allocations from that heap to + // allocate blocks of tags. + // let va_arena = Arena::new("kmem_va", None, QUANTUM, Some(&heap_arena)); + Self { - heap_arena: Arena::new_with_static_range( - "heap", - Some(Boundary::from(heap_range)), - quantum, - None, - early_tags_range, - ), + heap_arena, + //heap_arena, + //heap_arena: Lock::new(heap_arena.name(), heap_arena), + //va_arena: Lock::new(va_arena.name(), va_arena), } } } @@ -50,5 +82,9 @@ pub fn alloc(size: usize) -> *mut u8 { let node = LockNode::new(); let mut lock = VMALLOC.lock(&node); let vmalloc = lock.as_deref_mut().unwrap(); + + // let node = LockNode::new(); + // let mut guard = vmalloc.heap_arena.lock(&node); + //guard.alloc(size) vmalloc.heap_arena.alloc(size) } diff --git a/port/src/bumpalloc.rs b/port/src/bumpalloc.rs new file mode 100644 index 0000000..72eefcc --- /dev/null +++ b/port/src/bumpalloc.rs @@ -0,0 +1,97 @@ +use core::alloc::{GlobalAlloc, Layout}; +use core::cell::UnsafeCell; +use core::ptr::null_mut; +use core::sync::atomic::{AtomicUsize, Ordering::Relaxed}; + +/// Bump allocator to be used for earliest allocations in r9. These allocations +/// can never be freed - attempting to do so will panic. +/// This has been originally based on the example here: +/// https://doc.rust-lang.org/std/alloc/trait.GlobalAlloc.html +#[repr(C, align(4096))] +pub struct Bump { + bytes: UnsafeCell<[u8; SIZE_BYTES]>, + remaining: AtomicUsize, +} + +unsafe impl Send + for Bump +{ +} +unsafe impl Sync + for Bump +{ +} + +impl + Bump +{ + pub const fn new(init_value: u8) -> Self { + Self { + bytes: UnsafeCell::new([init_value; SIZE_BYTES]), + remaining: AtomicUsize::new(SIZE_BYTES), + } + } +} + +unsafe impl GlobalAlloc + for Bump +{ + unsafe fn alloc(&self, layout: Layout) -> *mut u8 { + let size = layout.size(); + let align = layout.align(); + + if align > MAX_SUPPORTED_ALIGN { + return null_mut(); + } + + let mut allocated = 0; + if self + .remaining + .fetch_update(Relaxed, Relaxed, |mut remaining| { + if size > remaining { + return None; + } + + // `Layout` contract forbids making a `Layout` with align=0, or + // align not power of 2. So we can safely use a mask to ensure + // alignment without worrying about UB. 
+ let align_mask_to_round_down = !(align - 1); + + remaining -= size; + remaining &= align_mask_to_round_down; + allocated = remaining; + Some(remaining) + }) + .is_err() + { + null_mut() + } else { + unsafe { self.bytes.get().cast::().add(allocated) } + } + } + + unsafe fn dealloc(&self, ptr: *mut u8, layout: Layout) { + panic!("Can't dealloc from Bump allocator (ptr: {:p}, layout: {:?})", ptr, layout) + } +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn bump_new() { + let bump = Bump::<4096, 4096>::new(0); + let ptr = unsafe { bump.alloc(Layout::from_size_align_unchecked(4096, 4096)) }; + assert!(!ptr.is_null()); + let ptr = unsafe { bump.alloc(Layout::from_size_align_unchecked(1, 1)) }; + assert!(ptr.is_null()); + } + + #[test] + fn align_too_high() { + let bump = Bump::<4096, 4096>::new(0); + let ptr = unsafe { bump.alloc(Layout::from_size_align_unchecked(4096, 8192)) }; + assert!(ptr.is_null()); + } +} diff --git a/port/src/lib.rs b/port/src/lib.rs index 44a9e6e..ec83b5e 100644 --- a/port/src/lib.rs +++ b/port/src/lib.rs @@ -5,6 +5,7 @@ #![forbid(unsafe_op_in_unsafe_fn)] pub mod bitmapalloc; +pub mod bumpalloc; pub mod dat; pub mod devcons; pub mod fdt; diff --git a/port/src/mem.rs b/port/src/mem.rs index 92d03b1..3232d4b 100644 --- a/port/src/mem.rs +++ b/port/src/mem.rs @@ -12,7 +12,13 @@ pub const PAGE_SIZE_1G: usize = 1 << 30; pub struct VirtRange(pub Range); impl VirtRange { - pub fn with_len(start: usize, len: usize) -> Self { + pub fn from_any(a: T) -> Self { + let addr = &a as *const _ as usize; + let size = core::mem::size_of_val(&a); + Self(addr..addr + size) + } + + pub const fn with_len(start: usize, len: usize) -> Self { Self(start..start + len) } diff --git a/port/src/vmem.rs b/port/src/vmem.rs index f7b2bd5..de44df1 100644 --- a/port/src/vmem.rs +++ b/port/src/vmem.rs @@ -249,9 +249,9 @@ impl TagList { core::iter::from_fn(move || { if let Some(item) = unsafe { curr_tag_item.as_ref() } { curr_tag_item = item.next; - return Some(item.tag); + Some(item.tag) } else { - return None; + None } }) } @@ -284,21 +284,51 @@ impl TagList { // } } +// TODO this needs to be Sync, so actually make it sync pub struct Arena { - _name: &'static str, + name: &'static str, quantum: usize, - tag_pool: TagPool, // Pool of available tags + tag_pool: TagPool, // Pool of available tags segment_list: TagList, // List of all segments in address order + + //parent: Option<&Arena>, // Parent arena to import from +} + +unsafe impl Send for Arena {} +unsafe impl Sync for Arena {} + +pub trait Allocator { + fn alloc(&mut self, size: usize) -> *mut u8; + fn free(&mut self, addr: *mut u8); } impl Arena { + pub fn new( + name: &'static str, + initial_span: Option, + quantum: usize, + _parent: Option, + ) -> Self { + println!("Arena::new name:{} initial_span:{:?} quantum:{:x}", name, initial_span, quantum); + + let mut arena = + Self { name, quantum, segment_list: TagList::new(), tag_pool: TagPool::new() }; + + if let Some(span) = initial_span { + arena.add_initial_span(span); + } + + arena + } + /// Only to be used for creation of initial heap + /// Create a new arena, assuming there is no dynamic allocation available, + /// and all free tags come from the free_tags provided. 
pub fn new_with_static_range( name: &'static str, initial_span: Option, quantum: usize, - parent: Option, static_range: VirtRange, ) -> Self { let tags_addr = unsafe { &mut *(static_range.start() as *mut TagItem) }; @@ -306,41 +336,45 @@ impl Arena { slice::from_raw_parts_mut(tags_addr, static_range.size() / size_of::()) }; - println!( - "Arena::new_with_static_range name:{} initial_span:{:?} quantum:{:x}", - name, initial_span, quantum - ); - - Self::new_with_tags(name, initial_span, quantum, parent, tags) + Self::new_with_tags(name, initial_span, quantum, tags) } + /// Only to be used for creation of initial heap /// Create a new arena, assuming there is no dynamic allocation available, /// and all free tags come from the free_tags provided. fn new_with_tags( name: &'static str, initial_span: Option, quantum: usize, - _parent: Option, - free_tags: &mut [TagItem], + tags: &mut [TagItem], ) -> Self { - let mut arena = Self { - _name: name, - quantum: quantum, - segment_list: TagList::new(), - tag_pool: TagPool::new(), - }; - arena.add_tags_to_pool(free_tags); + println!( + "Arena::new_with_tags name:{} initial_span:{:?} quantum:{:x}", + name, initial_span, quantum + ); + + let mut arena = + Self { name, quantum, segment_list: TagList::new(), tag_pool: TagPool::new() }; + arena.add_tags_to_pool(tags); if let Some(span) = initial_span { - assert_eq!(span.start % quantum, 0); - assert_eq!(span.size % quantum, 0); - assert!(span.start.checked_add(span.size).is_some()); - arena.add_free_span(span); + arena.add_initial_span(span); } arena } + fn add_initial_span(&mut self, span: Boundary) { + assert_eq!(span.start % self.quantum, 0); + assert_eq!(span.size % self.quantum, 0); + assert!(span.start.checked_add(span.size).is_some()); + self.add_free_span(span); + } + + pub fn name(&self) -> &'static str { + self.name + } + fn add_free_span(&mut self, boundary: Boundary) { self.segment_list.push(unsafe { self.tag_pool.take(Tag::new_span(boundary)).as_mut().expect("no free tags") @@ -358,19 +392,6 @@ impl Arena { } } - pub fn alloc(&mut self, size: usize) -> *mut u8 { - let boundary = self.alloc_segment(size); - if boundary.is_ok() { - boundary.unwrap().start as *mut u8 - } else { - null_mut() - } - } - - pub fn free(&mut self, addr: *mut u8) { - let _ = self.free_segment(addr as usize); - } - /// Allocate a segment, returned as a boundary fn alloc_segment(&mut self, size: usize) -> Result { println!("alloc_segment size: {}", size); @@ -437,7 +458,7 @@ impl Arena { return Err(AllocError::AllocationNotFound); } - let mut curr_tag: &mut TagItem = unsafe { curr_item.as_mut() }.unwrap(); + let curr_tag: &mut TagItem = unsafe { curr_item.as_mut() }.unwrap(); // Found tag to free let prev_type = unsafe { curr_tag.prev.as_ref() }.map(|t| t.tag.tag_type); @@ -461,8 +482,8 @@ impl Arena { let next = unsafe { curr_tag.next.as_mut() }.unwrap(); next.tag.boundary.start = curr_tag.tag.boundary.start; next.tag.boundary.size += curr_tag.tag.boundary.size; - TagList::unlink(&mut curr_tag); - self.tag_pool.add(&mut curr_tag); + TagList::unlink(curr_tag); + self.tag_pool.add(curr_tag); } (Some(TagType::Free), None) | (Some(TagType::Free), Some(TagType::Span)) @@ -471,19 +492,19 @@ impl Arena { // Change prev tag size to merge with curr_tag, release curr_tag let prev = unsafe { curr_tag.prev.as_mut() }.unwrap(); prev.tag.boundary.size += curr_tag.tag.boundary.size; - TagList::unlink(&mut curr_tag); - self.tag_pool.add(&mut curr_tag); + TagList::unlink(curr_tag); + self.tag_pool.add(curr_tag); } (Some(TagType::Free), 
Some(TagType::Free)) => { // Prev and next both free // Change prev size to merge with both curr_tag and next, release curr_tag let prev = unsafe { curr_tag.prev.as_mut() }.unwrap(); - let mut next = unsafe { curr_tag.next.as_mut() }.unwrap(); + let next = unsafe { curr_tag.next.as_mut() }.unwrap(); prev.tag.boundary.size += curr_tag.tag.boundary.size + next.tag.boundary.size; - TagList::unlink(&mut curr_tag); - TagList::unlink(&mut next); - self.tag_pool.add(&mut curr_tag); - self.tag_pool.add(&mut next); + TagList::unlink(curr_tag); + TagList::unlink(next); + self.tag_pool.add(curr_tag); + self.tag_pool.add(next); } (None, None) | (None, Some(TagType::Span)) @@ -559,6 +580,21 @@ impl Arena { } } +impl Allocator for Arena { + fn alloc(&mut self, size: usize) -> *mut u8 { + let boundary = self.alloc_segment(size); + if let Ok(boundary) = boundary { + boundary.start as *mut u8 + } else { + null_mut() + } + } + + fn free(&mut self, addr: *mut u8) { + let _ = self.free_segment(addr as usize); + } +} + #[cfg(test)] mod tests { @@ -685,7 +721,7 @@ mod tests { let mut page = Page4K([0; 4096]); const NUM_TAGS: usize = size_of::() / size_of::(); let tags = unsafe { &mut *(&mut page as *mut Page4K as *mut [TagItem; NUM_TAGS]) }; - Arena::new_with_tags(name, initial_span, quantum, None, tags) + Arena::new_with_tags(name, initial_span, quantum, tags) } fn assert_tags_eq(arena: &Arena, expected: &[Tag]) { @@ -846,49 +882,46 @@ mod tests { ); } - #[test] - fn test_arena_nesting() { - // Create a page of tags we can share amongst the first arenas - let mut page = Page4K([0; 4096]); - const NUM_TAGS: usize = size_of::() / size_of::(); - let all_tags = unsafe { &mut *(&mut page as *mut Page4K as *mut [TagItem; NUM_TAGS]) }; - - const NUM_ARENAS: usize = 4; - const NUM_TAGS_PER_ARENA: usize = NUM_TAGS / NUM_ARENAS; - let (arena1_tags, all_tags) = all_tags.split_at_mut(NUM_TAGS_PER_ARENA); - let (arena2_tags, all_tags) = all_tags.split_at_mut(NUM_TAGS_PER_ARENA); - let (arena3a_tags, all_tags) = all_tags.split_at_mut(NUM_TAGS_PER_ARENA); - let (arena3b_tags, _) = all_tags.split_at_mut(NUM_TAGS_PER_ARENA); - - let mut arena1 = Arena::new_with_tags( - "arena1", - Some(Boundary::new_unchecked(4096, 4096 * 20)), - 4096, - None, - arena1_tags, - ); - - // Import all - let mut arena2 = Arena::new_with_tags("arena2", None, 4096, None, arena2_tags); - - // Import first half - let mut arena3a = Arena::new_with_tags( - "arena3a", - Some(Boundary::from(4096..4096 * 10)), - 4096, - None, - arena3a_tags, - ); - - // Import second half - let mut arena3b = Arena::new_with_tags( - "arena3b", - Some(Boundary::from(4096 * 10..4096 * 21)), - 4096, - None, - arena3b_tags, - ); - - // Let's do some allocations - } + // #[test] + // fn test_arena_nesting() { + // // Create a page of tags we can share amongst the first arenas + // let mut page = Page4K([0; 4096]); + // const NUM_TAGS: usize = size_of::() / size_of::(); + // let all_tags = unsafe { &mut *(&mut page as *mut Page4K as *mut [TagItem; NUM_TAGS]) }; + + // const NUM_ARENAS: usize = 4; + // const NUM_TAGS_PER_ARENA: usize = NUM_TAGS / NUM_ARENAS; + // let (arena1_tags, all_tags) = all_tags.split_at_mut(NUM_TAGS_PER_ARENA); + // let (arena2_tags, all_tags) = all_tags.split_at_mut(NUM_TAGS_PER_ARENA); + // let (arena3a_tags, all_tags) = all_tags.split_at_mut(NUM_TAGS_PER_ARENA); + // let (arena3b_tags, _) = all_tags.split_at_mut(NUM_TAGS_PER_ARENA); + + // let mut arena1 = Arena::new_with_tags( + // "arena1", + // Some(Boundary::new_unchecked(4096, 4096 * 20)), + // 4096, 
+ // arena1_tags, + // ); + + // // Import all + // let mut arena2 = Arena::new_with_tags("arena2", None, 4096, arena2_tags); + + // // Import first half + // let mut arena3a = Arena::new_with_tags( + // "arena3a", + // Some(Boundary::from(4096..4096 * 10)), + // 4096, + // arena3a_tags, + // ); + + // // Import second half + // let mut arena3b = Arena::new_with_tags( + // "arena3b", + // Some(Boundary::from(4096 * 10..4096 * 21)), + // 4096, + // arena3b_tags, + // ); + + // // Let's do some allocations + // } } diff --git a/rust-toolchain.toml b/rust-toolchain.toml index cdd3635..b6cd1b9 100644 --- a/rust-toolchain.toml +++ b/rust-toolchain.toml @@ -1,8 +1,8 @@ [toolchain] -channel = "nightly-2024-07-01" -components = [ "rustfmt", "rust-src", "clippy", "llvm-tools" ] +channel = "nightly-2024-07-24" +components = ["rustfmt", "rust-src", "clippy", "llvm-tools"] targets = [ "aarch64-unknown-none", "riscv64gc-unknown-none-elf", - "x86_64-unknown-none" + "x86_64-unknown-none", ] From 12f67146696f9888714004f358ada4a97e92f363 Mon Sep 17 00:00:00 2001 From: Graham MacDonald Date: Sat, 3 Aug 2024 19:53:53 +0100 Subject: [PATCH 3/8] Fix all warnings, lints, etc Signed-off-by: Graham MacDonald --- aarch64/src/init.rs | 8 ++++++-- aarch64/src/main.rs | 3 +-- riscv64/Cargo.toml | 5 +++++ riscv64/src/main.rs | 1 - riscv64/src/runtime.rs | 2 +- 5 files changed, 13 insertions(+), 6 deletions(-) diff --git a/aarch64/src/init.rs b/aarch64/src/init.rs index d8f74cd..80956a0 100644 --- a/aarch64/src/init.rs +++ b/aarch64/src/init.rs @@ -5,7 +5,6 @@ use crate::kmem::heap_virtrange; use crate::mailbox; use crate::pagealloc; use crate::registers; -use crate::runtime; use crate::trap; use crate::vm; use crate::vm::kernel_root; @@ -81,6 +80,11 @@ fn print_board_info() { println!(" Firmware Rev:\t{fw_revision:#010x}"); } +fn enable_bump_allocator() { + #[cfg(not(test))] + crate::runtime::enable_bump_allocator(); +} + /// This function is concerned with preparing the system to the point where an /// allocator can be set up and allocation is available. We can't assume /// there's any allocator available when executing this function. @@ -118,7 +122,7 @@ pub fn init(dtb_va: usize) { // bump allocator that makes permanent allocations. This can be used to // create the more complex vmem allocator. Once the vmem allocator is // available, we switch to that. 
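    // Editor's note: per the comment above, everything after this point is
    // allowed to heap-allocate (e.g. the Box::new smoke test further down), so
    // the bump allocator has to be switched in before vmalloc::init runs.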
- runtime::enable_bump_allocator(); + enable_bump_allocator(); vmalloc::init(heap_virtrange()); //runtime::enable_vmem_allocator(); diff --git a/aarch64/src/main.rs b/aarch64/src/main.rs index 3249950..23a3151 100644 --- a/aarch64/src/main.rs +++ b/aarch64/src/main.rs @@ -23,6 +23,7 @@ mod mailbox; mod pagealloc; mod param; mod registers; +mod runtime; mod trap; mod uartmini; mod uartpl011; @@ -42,5 +43,3 @@ core::arch::global_asm!(include_str!("l.S")); pub extern "C" fn main9(dtb_va: usize) { init(dtb_va); } - -mod runtime; diff --git a/riscv64/Cargo.toml b/riscv64/Cargo.toml index 2ea5ad9..7a81798 100644 --- a/riscv64/Cargo.toml +++ b/riscv64/Cargo.toml @@ -11,3 +11,8 @@ port = { path = "../port" } [features] opensbi = [] + +[lints.rust] +unexpected_cfgs = { level = "warn", check-cfg = [ + 'cfg(platform, values("nezha", "virt"))', +] } diff --git a/riscv64/src/main.rs b/riscv64/src/main.rs index 19f1621..73dd10d 100644 --- a/riscv64/src/main.rs +++ b/riscv64/src/main.rs @@ -1,6 +1,5 @@ #![feature(alloc_error_handler)] #![feature(asm_const)] -#![feature(panic_info_message)] #![cfg_attr(not(any(test)), no_std)] #![cfg_attr(not(test), no_main)] #![allow(clippy::upper_case_acronyms)] diff --git a/riscv64/src/runtime.rs b/riscv64/src/runtime.rs index 78eef68..d228373 100644 --- a/riscv64/src/runtime.rs +++ b/riscv64/src/runtime.rs @@ -18,7 +18,7 @@ extern "C" fn eh_personality() {} fn panic(info: &PanicInfo) -> ! { print!("Panic: "); if let Some(p) = info.location() { - println!("line {}, file {}: {}", p.line(), p.file(), info.message().unwrap()); + println!("line {}, file {}: {}", p.line(), p.file(), info.message()); } else { println!("no information available."); } From 2f7a3a685ae92a92c1a19cae3e3c362e734d9837 Mon Sep 17 00:00:00 2001 From: Graham MacDonald Date: Sun, 4 Aug 2024 23:11:35 +0100 Subject: [PATCH 4/8] arena arc Signed-off-by: Graham MacDonald --- aarch64/src/init.rs | 7 ++++- aarch64/src/vmalloc.rs | 61 ++++++++++++++++-------------------------- port/src/lib.rs | 2 ++ port/src/vmem.rs | 11 ++++---- 4 files changed, 37 insertions(+), 44 deletions(-) diff --git a/aarch64/src/init.rs b/aarch64/src/init.rs index 80956a0..7a7421e 100644 --- a/aarch64/src/init.rs +++ b/aarch64/src/init.rs @@ -85,6 +85,11 @@ fn enable_bump_allocator() { crate::runtime::enable_bump_allocator(); } +// fn enable_vmem_allocator() { +// #[cfg(not(test))] +// crate::runtime::enable_vmem_allocator(); +// } + /// This function is concerned with preparing the system to the point where an /// allocator can be set up and allocation is available. We can't assume /// there's any allocator available when executing this function. @@ -125,7 +130,7 @@ pub fn init(dtb_va: usize) { enable_bump_allocator(); vmalloc::init(heap_virtrange()); - //runtime::enable_vmem_allocator(); + //enable_vmem_allocator(); let _b = Box::new("ddododo"); diff --git a/aarch64/src/vmalloc.rs b/aarch64/src/vmalloc.rs index 0577dd7..5347d3d 100644 --- a/aarch64/src/vmalloc.rs +++ b/aarch64/src/vmalloc.rs @@ -1,5 +1,5 @@ +use alloc::sync::Arc; use core::{mem::MaybeUninit, ptr::addr_of}; - use port::{ mcslock::{Lock, LockNode}, mem::{VirtRange, PAGE_SIZE_4K}, @@ -17,52 +17,38 @@ static VMALLOC: Lock> = Lock::new("vmalloc", None); static mut EARLY_TAGS_PAGE: [u8; 4096] = [0; 4096]; +/// VmAlloc is an attempt to write a Bonwick vmem-style allocator. It currently +/// expects another allocator to exist beforehand. +/// TODO Use the allocator api trait. 
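/// (Editor's aside, summarising the comments in this series: heap_arena is the
/// lowest-level arena, seeded from a statically reserved page of boundary tags
/// and spanning the kernel heap range; va_arena then imports from heap_arena,
/// so its own blocks of tags can be allocated dynamically once the heap works.)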
struct VmAlloc { - heap_arena: Arena, - //heap_arena: Lock>, - // heap_arena: Lock>, - // va_arena: Lock>, + heap_arena: Arc>, + va_arena: Arc>, } impl VmAlloc { fn new(heap_range: VirtRange) -> Self { - // Heap_arena is the lowest level arena. We pass an address range from which - // it can allocate a block of tags to build the initial structures. - // let heap_arena = unsafe { - // let early_tags_ptr = addr_of!(EARLY_TAGS_PAGE) as usize; - // let early_tags_size = EARLY_TAGS_PAGE.len(); - // let early_tags_range = VirtRange::with_len(early_tags_ptr, early_tags_size); - - // MAYBE_HEAP_ARENA.write(Arena::new_with_static_range( - // "heap", - // Some(Boundary::from(heap_range)), - // PAGE_SIZE_4K, - // early_tags_range, - // )); - // MAYBE_HEAP_ARENA.assume_init_mut() - // }; - let early_tags_ptr = addr_of!(EARLY_TAGS_PAGE) as usize; let early_tags_size = unsafe { EARLY_TAGS_PAGE.len() }; let early_tags_range = VirtRange::with_len(early_tags_ptr, early_tags_size); - let heap_arena = Arena::new_with_static_range( - "heap", - Some(Boundary::from(heap_range)), - PAGE_SIZE_4K, - early_tags_range, - ); + let heap_arena = Arc::new(Lock::new( + "heap_arena", + Arena::new_with_static_range( + "heap", + Some(Boundary::from(heap_range)), + PAGE_SIZE_4K, + early_tags_range, + ), + )); // va_arena imports from heap_arena, so can use allocations from that heap to // allocate blocks of tags. - // let va_arena = Arena::new("kmem_va", None, QUANTUM, Some(&heap_arena)); + let va_arena = Arc::new(Lock::new( + "heap_arena", + Arena::new("kmem_va", None, PAGE_SIZE_4K, Some(heap_arena.clone())), + )); - Self { - heap_arena, - //heap_arena, - //heap_arena: Lock::new(heap_arena.name(), heap_arena), - //va_arena: Lock::new(va_arena.name(), va_arena), - } + Self { heap_arena, va_arena } } } @@ -83,8 +69,7 @@ pub fn alloc(size: usize) -> *mut u8 { let mut lock = VMALLOC.lock(&node); let vmalloc = lock.as_deref_mut().unwrap(); - // let node = LockNode::new(); - // let mut guard = vmalloc.heap_arena.lock(&node); - //guard.alloc(size) - vmalloc.heap_arena.alloc(size) + let node = LockNode::new(); + let mut guard = vmalloc.heap_arena.lock(&node); + guard.alloc(size) } diff --git a/port/src/lib.rs b/port/src/lib.rs index ec83b5e..e08d6f5 100644 --- a/port/src/lib.rs +++ b/port/src/lib.rs @@ -12,3 +12,5 @@ pub mod fdt; pub mod mcslock; pub mod mem; pub mod vmem; + +extern crate alloc; diff --git a/port/src/vmem.rs b/port/src/vmem.rs index de44df1..f53266e 100644 --- a/port/src/vmem.rs +++ b/port/src/vmem.rs @@ -1,6 +1,7 @@ -use core::{ops::Range, ptr::null_mut, slice}; - +use crate::mcslock::Lock; use crate::mem::VirtRange; +use alloc::sync::Arc; +use core::{ops::Range, ptr::null_mut, slice}; #[cfg(not(test))] use crate::println; @@ -295,8 +296,8 @@ pub struct Arena { //parent: Option<&Arena>, // Parent arena to import from } -unsafe impl Send for Arena {} -unsafe impl Sync for Arena {} +// unsafe impl Send for Arena {} +// unsafe impl Sync for Arena {} pub trait Allocator { fn alloc(&mut self, size: usize) -> *mut u8; @@ -308,7 +309,7 @@ impl Arena { name: &'static str, initial_span: Option, quantum: usize, - _parent: Option, + _parent: Option>>, ) -> Self { println!("Arena::new name:{} initial_span:{:?} quantum:{:x}", name, initial_span, quantum); From 39a350817da1cdec5db85e3618c1ccdbe014af89 Mon Sep 17 00:00:00 2001 From: Graham MacDonald Date: Sat, 17 Aug 2024 16:50:24 +0100 Subject: [PATCH 5/8] Bump allocator reports wasted space Signed-off-by: Graham MacDonald --- aarch64/src/init.rs | 30 ++++------ 
aarch64/src/main.rs | 1 + aarch64/src/runtime.rs | 42 +++---------- aarch64/src/vmalloc.rs | 49 ++++++++------- port/src/bumpalloc.rs | 133 ++++++++++++++++++++++++++++++----------- port/src/lib.rs | 1 + port/src/vmem.rs | 2 +- 7 files changed, 146 insertions(+), 112 deletions(-) diff --git a/aarch64/src/init.rs b/aarch64/src/init.rs index 7a7421e..34aa0bf 100644 --- a/aarch64/src/init.rs +++ b/aarch64/src/init.rs @@ -11,8 +11,11 @@ use crate::vm::kernel_root; use crate::vm::PageTable; use crate::vmalloc; use alloc::boxed::Box; +use core::alloc::Layout; use core::ptr; +use port::bumpalloc::Bump; use port::fdt::DeviceTree; +use port::mem::PAGE_SIZE_4K; use port::mem::{PhysRange, VirtRange}; use port::println; @@ -80,16 +83,6 @@ fn print_board_info() { println!(" Firmware Rev:\t{fw_revision:#010x}"); } -fn enable_bump_allocator() { - #[cfg(not(test))] - crate::runtime::enable_bump_allocator(); -} - -// fn enable_vmem_allocator() { -// #[cfg(not(test))] -// crate::runtime::enable_vmem_allocator(); -// } - /// This function is concerned with preparing the system to the point where an /// allocator can be set up and allocation is available. We can't assume /// there's any allocator available when executing this function. @@ -123,14 +116,11 @@ fn init_pre_allocator(dtb_va: usize) { pub fn init(dtb_va: usize) { init_pre_allocator(dtb_va); - // From this point we can use the global allocator. Initially it uses a - // bump allocator that makes permanent allocations. This can be used to - // create the more complex vmem allocator. Once the vmem allocator is - // available, we switch to that. - enable_bump_allocator(); + static BUMP_ALLOC: Bump<{ 4 * PAGE_SIZE_4K }, PAGE_SIZE_4K> = Bump::new(0); + vmalloc::init(&BUMP_ALLOC, heap_virtrange()); + BUMP_ALLOC.print_status(); - vmalloc::init(heap_virtrange()); - //enable_vmem_allocator(); + // From this point we can use the global allocator let _b = Box::new("ddododo"); @@ -141,10 +131,12 @@ pub fn init(dtb_va: usize) { println!("looping now"); { - let test = vmalloc::alloc(1024); + let test = vmalloc::alloc(unsafe { Layout::from_size_align_unchecked(1024, 16) }); println!("test alloc: {:p}", test); - let test2 = vmalloc::alloc(1024); + let test2 = vmalloc::alloc(unsafe { Layout::from_size_align_unchecked(1024, 16) }); println!("test alloc: {:p}", test2); + let test3 = vmalloc::alloc(unsafe { Layout::from_size_align_unchecked(1024, 4096) }); + println!("test alloc: {:p}", test3); } #[allow(clippy::empty_loop)] diff --git a/aarch64/src/main.rs b/aarch64/src/main.rs index 23a3151..4929c11 100644 --- a/aarch64/src/main.rs +++ b/aarch64/src/main.rs @@ -2,6 +2,7 @@ #![allow(internal_features)] #![cfg_attr(not(any(test)), no_std)] #![cfg_attr(not(test), no_main)] +#![feature(allocator_api)] #![feature(alloc_error_handler)] #![feature(asm_const)] #![feature(const_refs_to_static)] diff --git a/aarch64/src/runtime.rs b/aarch64/src/runtime.rs index efc3c57..b844348 100644 --- a/aarch64/src/runtime.rs +++ b/aarch64/src/runtime.rs @@ -5,14 +5,12 @@ extern crate alloc; use crate::kmem::physaddr_as_virt; use crate::registers::rpi_mmio; use crate::uartmini::MiniUart; +use crate::vmalloc; use alloc::alloc::{GlobalAlloc, Layout}; use core::fmt::Write; use core::panic::PanicInfo; -use core::sync::atomic::{AtomicU8, Ordering::Relaxed}; -use num_enum::{FromPrimitive, IntoPrimitive}; -use port::bumpalloc::Bump; use port::devcons::PanicConsole; -use port::mem::{VirtRange, PAGE_SIZE_4K}; +use port::mem::VirtRange; // TODO // - Add qemu integration test @@ -43,43 +41,17 @@ fn 
oom(_layout: Layout) -> ! { panic!("oom"); } -#[derive(Debug, IntoPrimitive, FromPrimitive)] -#[repr(u8)] -enum AllocatorType { - #[num_enum(default)] - None = 0, - Bump, -} - -/// A simple wrapper that allows the allocator to be changed at runtime. -#[repr(C, align(4096))] -struct Allocator { - bump_alloc: Bump, - enabled_allocator: AtomicU8, -} - -pub fn enable_bump_allocator() { - ALLOCATOR.enabled_allocator.store(AllocatorType::Bump as u8, Relaxed); -} +struct Allocator {} unsafe impl GlobalAlloc for Allocator { unsafe fn alloc(&self, layout: Layout) -> *mut u8 { - match AllocatorType::try_from(self.enabled_allocator.load(Relaxed)) { - Ok(AllocatorType::None) | Err(_) => panic!("no allocator available for alloc"), - Ok(AllocatorType::Bump) => unsafe { self.bump_alloc.alloc(layout) }, - } + vmalloc::alloc(layout) } - unsafe fn dealloc(&self, ptr: *mut u8, layout: Layout) { - match AllocatorType::try_from(self.enabled_allocator.load(Relaxed)) { - Ok(AllocatorType::None) | Err(_) => panic!("no allocator available for dealloc"), - Ok(AllocatorType::Bump) => unsafe { self.bump_alloc.dealloc(ptr, layout) }, - } + unsafe fn dealloc(&self, _ptr: *mut u8, _layout: Layout) { + panic!("fake dealloc"); } } #[global_allocator] -static ALLOCATOR: Allocator = Allocator { - bump_alloc: Bump::new(0), - enabled_allocator: AtomicU8::new(AllocatorType::None as u8), -}; +static ALLOCATOR: Allocator = Allocator {}; diff --git a/aarch64/src/vmalloc.rs b/aarch64/src/vmalloc.rs index 5347d3d..8abef30 100644 --- a/aarch64/src/vmalloc.rs +++ b/aarch64/src/vmalloc.rs @@ -1,5 +1,5 @@ use alloc::sync::Arc; -use core::{mem::MaybeUninit, ptr::addr_of}; +use core::{alloc::Layout, mem::MaybeUninit, ptr::addr_of}; use port::{ mcslock::{Lock, LockNode}, mem::{VirtRange, PAGE_SIZE_4K}, @@ -21,55 +21,62 @@ static mut EARLY_TAGS_PAGE: [u8; 4096] = [0; 4096]; /// expects another allocator to exist beforehand. /// TODO Use the allocator api trait. struct VmAlloc { - heap_arena: Arc>, - va_arena: Arc>, + heap_arena: Arc, &'static dyn core::alloc::Allocator>, + _va_arena: Arc, &'static dyn core::alloc::Allocator>, } impl VmAlloc { - fn new(heap_range: VirtRange) -> Self { + fn new(early_allocator: &'static dyn core::alloc::Allocator, heap_range: VirtRange) -> Self { let early_tags_ptr = addr_of!(EARLY_TAGS_PAGE) as usize; let early_tags_size = unsafe { EARLY_TAGS_PAGE.len() }; let early_tags_range = VirtRange::with_len(early_tags_ptr, early_tags_size); - let heap_arena = Arc::new(Lock::new( - "heap_arena", - Arena::new_with_static_range( - "heap", - Some(Boundary::from(heap_range)), - PAGE_SIZE_4K, - early_tags_range, + let heap_arena = Arc::new_in( + Lock::new( + "heap_arena", + Arena::new_with_static_range( + "heap", + Some(Boundary::from(heap_range)), + PAGE_SIZE_4K, + early_tags_range, + ), ), - )); + early_allocator, + ); // va_arena imports from heap_arena, so can use allocations from that heap to // allocate blocks of tags. 
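        // Editor's note: `Arc::new_in` (nightly allocator_api) places the Arc's
        // own allocation in `early_allocator` - the static bump allocator - so
        // none of this bootstrap relies on the global allocator already being a
        // working vmem allocator.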
- let va_arena = Arc::new(Lock::new( - "heap_arena", - Arena::new("kmem_va", None, PAGE_SIZE_4K, Some(heap_arena.clone())), - )); + let va_arena = Arc::new_in( + Lock::new( + "kmem_va_arena", + Arena::new("kmem_va_arena", None, PAGE_SIZE_4K, Some(heap_arena.clone())), + ), + early_allocator, + ); - Self { heap_arena, va_arena } + Self { heap_arena, _va_arena: va_arena } } } -pub fn init(heap_range: VirtRange) { +pub fn init(early_allocator: &'static dyn core::alloc::Allocator, heap_range: VirtRange) { let node = LockNode::new(); let mut vmalloc = VMALLOC.lock(&node); *vmalloc = Some({ static mut MAYBE_VMALLOC: MaybeUninit = MaybeUninit::uninit(); unsafe { - MAYBE_VMALLOC.write(VmAlloc::new(heap_range)); + MAYBE_VMALLOC.write(VmAlloc::new(early_allocator, heap_range)); MAYBE_VMALLOC.assume_init_mut() } }); } -pub fn alloc(size: usize) -> *mut u8 { +pub fn alloc(layout: Layout) -> *mut u8 { let node = LockNode::new(); let mut lock = VMALLOC.lock(&node); let vmalloc = lock.as_deref_mut().unwrap(); let node = LockNode::new(); let mut guard = vmalloc.heap_arena.lock(&node); - guard.alloc(size) + // TODO use layout properly + guard.alloc(layout.size()) } diff --git a/port/src/bumpalloc.rs b/port/src/bumpalloc.rs index 72eefcc..8ba7b06 100644 --- a/port/src/bumpalloc.rs +++ b/port/src/bumpalloc.rs @@ -1,16 +1,18 @@ -use core::alloc::{GlobalAlloc, Layout}; +use core::alloc::{AllocError, Allocator, Layout}; use core::cell::UnsafeCell; -use core::ptr::null_mut; +use core::ptr::NonNull; use core::sync::atomic::{AtomicUsize, Ordering::Relaxed}; +#[cfg(not(test))] +use crate::println; + /// Bump allocator to be used for earliest allocations in r9. These allocations /// can never be freed - attempting to do so will panic. -/// This has been originally based on the example here: -/// https://doc.rust-lang.org/std/alloc/trait.GlobalAlloc.html #[repr(C, align(4096))] pub struct Bump { bytes: UnsafeCell<[u8; SIZE_BYTES]>, - remaining: AtomicUsize, + next_offset: AtomicUsize, + wasted: AtomicUsize, } unsafe impl Send @@ -28,70 +30,129 @@ impl pub const fn new(init_value: u8) -> Self { Self { bytes: UnsafeCell::new([init_value; SIZE_BYTES]), - remaining: AtomicUsize::new(SIZE_BYTES), + next_offset: AtomicUsize::new(0), + wasted: AtomicUsize::new(0), + } + } + + pub fn print_status(&self) { + let allocated = self.next_offset.load(Relaxed); + let remaining = SIZE_BYTES - allocated; + let wasted = self.wasted.load(Relaxed); + println!( + "Bump: allocated: {allocated} free: {remaining} total: {SIZE_BYTES} wasted: {wasted}" + ); + } + + /// Test helper to get the offset of the result in the buffer + #[cfg(test)] + fn result_offset(&self, result: Result, AllocError>) -> Option { + unsafe { + result + .ok() + .map(|bytes| bytes.byte_offset_from(NonNull::new_unchecked(self.bytes.get()))) } } } -unsafe impl GlobalAlloc +unsafe impl Allocator for Bump { - unsafe fn alloc(&self, layout: Layout) -> *mut u8 { + fn allocate(&self, layout: Layout) -> Result, AllocError> { let size = layout.size(); let align = layout.align(); if align > MAX_SUPPORTED_ALIGN { - return null_mut(); + return Err(AllocError {}); } - let mut allocated = 0; + let mut wasted = 0; + let mut alloc_offset = 0; if self - .remaining - .fetch_update(Relaxed, Relaxed, |mut remaining| { - if size > remaining { - return None; - } + .next_offset + .fetch_update(Relaxed, Relaxed, |last_offset| { + let align_mask = !(align - 1); + alloc_offset = if last_offset & !align_mask != 0 { + (last_offset + align) & align_mask + } else { + last_offset + }; + wasted = 
alloc_offset - last_offset; - // `Layout` contract forbids making a `Layout` with align=0, or - // align not power of 2. So we can safely use a mask to ensure - // alignment without worrying about UB. - let align_mask_to_round_down = !(align - 1); - - remaining -= size; - remaining &= align_mask_to_round_down; - allocated = remaining; - Some(remaining) + let new_offset = alloc_offset + size; + if new_offset > SIZE_BYTES { + None + } else { + Some(new_offset) + } }) .is_err() { - null_mut() + Err(AllocError {}) } else { - unsafe { self.bytes.get().cast::().add(allocated) } + self.wasted.fetch_add(wasted, Relaxed); + Ok(unsafe { NonNull::new_unchecked(self.bytes.get().byte_add(alloc_offset)) }) } } - unsafe fn dealloc(&self, ptr: *mut u8, layout: Layout) { - panic!("Can't dealloc from Bump allocator (ptr: {:p}, layout: {:?})", ptr, layout) + unsafe fn deallocate(&self, ptr: NonNull, layout: Layout) { + panic!("Can't deallocate from Bump allocator (ptr: {:p}, layout: {:?})", ptr, layout) } } #[cfg(test)] mod tests { + use crate::mem::PAGE_SIZE_4K; + use super::*; #[test] fn bump_new() { - let bump = Bump::<4096, 4096>::new(0); - let ptr = unsafe { bump.alloc(Layout::from_size_align_unchecked(4096, 4096)) }; - assert!(!ptr.is_null()); - let ptr = unsafe { bump.alloc(Layout::from_size_align_unchecked(1, 1)) }; - assert!(ptr.is_null()); + let bump = Bump::::new(0); + let result = unsafe { bump.allocate(Layout::from_size_align_unchecked(4096, 4096)) }; + assert!(result.is_ok()); + assert_eq!(bump.result_offset(result), Some(0)); + assert_eq!(bump.wasted.load(Relaxed), 0); + assert_eq!(bump.next_offset.load(Relaxed), 4096); + + // Next should fail - out of space + let result = unsafe { bump.allocate(Layout::from_size_align_unchecked(1, 1)) }; + assert!(result.is_err()); + } + + #[test] + fn bump_alignment() { + let bump = Bump::<{ 3 * PAGE_SIZE_4K }, PAGE_SIZE_4K>::new(0); + + // Small allocation + let mut expected_waste = 0; + let result = unsafe { bump.allocate(Layout::from_size_align_unchecked(16, 1)) }; + assert!(result.is_ok()); + assert_eq!(bump.result_offset(result), Some(0)); + assert_eq!(bump.wasted.load(Relaxed), expected_waste); + assert_eq!(bump.next_offset.load(Relaxed), 16); + + // Align next allocation to 4096, wasting space + expected_waste += 4096 - 16; + let result = unsafe { bump.allocate(Layout::from_size_align_unchecked(16, 4096)) }; + assert!(result.is_ok()); + assert_eq!(bump.result_offset(result), Some(4096)); + assert_eq!(bump.wasted.load(Relaxed), expected_waste); + assert_eq!(bump.next_offset.load(Relaxed), 4096 + 16); + + // Align next allocation to 4096, wasting space + expected_waste += 4096 - 16; + let result = unsafe { bump.allocate(Layout::from_size_align_unchecked(4096, 4096)) }; + assert!(result.is_ok()); + assert_eq!(bump.result_offset(result), Some(2 * 4096)); + assert_eq!(bump.wasted.load(Relaxed), expected_waste); + assert_eq!(bump.next_offset.load(Relaxed), 3 * 4096); } #[test] fn align_too_high() { - let bump = Bump::<4096, 4096>::new(0); - let ptr = unsafe { bump.alloc(Layout::from_size_align_unchecked(4096, 8192)) }; - assert!(ptr.is_null()); + let bump = Bump::::new(0); + let result = unsafe { bump.allocate(Layout::from_size_align_unchecked(4096, 8192)) }; + assert!(result.is_err()); } } diff --git a/port/src/lib.rs b/port/src/lib.rs index e08d6f5..39e99ac 100644 --- a/port/src/lib.rs +++ b/port/src/lib.rs @@ -1,5 +1,6 @@ #![allow(clippy::upper_case_acronyms)] #![cfg_attr(not(any(test)), no_std)] +#![feature(allocator_api)] 
#![feature(maybe_uninit_slice)] #![feature(step_trait)] #![forbid(unsafe_op_in_unsafe_fn)] diff --git a/port/src/vmem.rs b/port/src/vmem.rs index f53266e..d989b13 100644 --- a/port/src/vmem.rs +++ b/port/src/vmem.rs @@ -309,7 +309,7 @@ impl Arena { name: &'static str, initial_span: Option, quantum: usize, - _parent: Option>>, + _parent: Option, &dyn core::alloc::Allocator>>, ) -> Self { println!("Arena::new name:{} initial_span:{:?} quantum:{:x}", name, initial_span, quantum); From 44decce91c39a5212015df2102282e0441851e9f Mon Sep 17 00:00:00 2001 From: Graham MacDonald Date: Sat, 17 Aug 2024 20:52:06 +0100 Subject: [PATCH 6/8] Use allocator for early tags Signed-off-by: Graham MacDonald --- aarch64/src/vmalloc.rs | 12 +++--------- port/src/lib.rs | 1 + port/src/vmem.rs | 17 +++++++++++------ 3 files changed, 15 insertions(+), 15 deletions(-) diff --git a/aarch64/src/vmalloc.rs b/aarch64/src/vmalloc.rs index 8abef30..7860b91 100644 --- a/aarch64/src/vmalloc.rs +++ b/aarch64/src/vmalloc.rs @@ -1,5 +1,5 @@ use alloc::sync::Arc; -use core::{alloc::Layout, mem::MaybeUninit, ptr::addr_of}; +use core::{alloc::Layout, mem::MaybeUninit}; use port::{ mcslock::{Lock, LockNode}, mem::{VirtRange, PAGE_SIZE_4K}, @@ -15,8 +15,6 @@ static VMALLOC: Lock> = Lock::new("vmalloc", None); // referening them from VmAlloc, from where they can be used in the global allocator. //static mut MAYBE_HEAP_ARENA: MaybeUninit = MaybeUninit::uninit(); -static mut EARLY_TAGS_PAGE: [u8; 4096] = [0; 4096]; - /// VmAlloc is an attempt to write a Bonwick vmem-style allocator. It currently /// expects another allocator to exist beforehand. /// TODO Use the allocator api trait. @@ -27,18 +25,14 @@ struct VmAlloc { impl VmAlloc { fn new(early_allocator: &'static dyn core::alloc::Allocator, heap_range: VirtRange) -> Self { - let early_tags_ptr = addr_of!(EARLY_TAGS_PAGE) as usize; - let early_tags_size = unsafe { EARLY_TAGS_PAGE.len() }; - let early_tags_range = VirtRange::with_len(early_tags_ptr, early_tags_size); - let heap_arena = Arc::new_in( Lock::new( "heap_arena", - Arena::new_with_static_range( + Arena::new_with_allocator( "heap", Some(Boundary::from(heap_range)), PAGE_SIZE_4K, - early_tags_range, + early_allocator, ), ), early_allocator, diff --git a/port/src/lib.rs b/port/src/lib.rs index 39e99ac..e5e17d6 100644 --- a/port/src/lib.rs +++ b/port/src/lib.rs @@ -2,6 +2,7 @@ #![cfg_attr(not(any(test)), no_std)] #![feature(allocator_api)] #![feature(maybe_uninit_slice)] +#![feature(slice_ptr_get)] #![feature(step_trait)] #![forbid(unsafe_op_in_unsafe_fn)] diff --git a/port/src/vmem.rs b/port/src/vmem.rs index d989b13..ee16575 100644 --- a/port/src/vmem.rs +++ b/port/src/vmem.rs @@ -1,7 +1,7 @@ -use crate::mcslock::Lock; use crate::mem::VirtRange; +use crate::{mcslock::Lock, mem::PAGE_SIZE_4K}; use alloc::sync::Arc; -use core::{ops::Range, ptr::null_mut, slice}; +use core::{alloc::Layout, ops::Range, ptr::null_mut, slice}; #[cfg(not(test))] use crate::println; @@ -326,15 +326,20 @@ impl Arena { /// Only to be used for creation of initial heap /// Create a new arena, assuming there is no dynamic allocation available, /// and all free tags come from the free_tags provided. 
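    /// Sketch of how this ends up being called from the kernel side (editor's
    /// illustration; `heap_range` stands in for whatever VirtRange the caller
    /// wants the arena to manage):
    ///
    ///     static BUMP: Bump<{ 4 * PAGE_SIZE_4K }, PAGE_SIZE_4K> = Bump::new(0);
    ///     let heap_arena = Arena::new_with_allocator(
    ///         "heap",
    ///         Some(Boundary::from(heap_range)),
    ///         PAGE_SIZE_4K,
    ///         &BUMP,
    ///     );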
- pub fn new_with_static_range( + pub fn new_with_allocator( name: &'static str, initial_span: Option, quantum: usize, - static_range: VirtRange, + allocator: &'static dyn core::alloc::Allocator, ) -> Self { - let tags_addr = unsafe { &mut *(static_range.start() as *mut TagItem) }; + let layout = unsafe { Layout::from_size_align_unchecked(PAGE_SIZE_4K, PAGE_SIZE_4K) }; + let tags_buffer = + allocator.allocate_zeroed(layout).expect("unable to allocate initial vmem tags"); let tags = unsafe { - slice::from_raw_parts_mut(tags_addr, static_range.size() / size_of::()) + slice::from_raw_parts_mut( + tags_buffer.as_mut_ptr() as *mut TagItem, + layout.size() / size_of::(), + ) }; Self::new_with_tags(name, initial_span, quantum, tags) From d8954156045ff4627f61d197023613d9597b57f1 Mon Sep 17 00:00:00 2001 From: Graham MacDonald Date: Thu, 29 Aug 2024 08:18:23 +0100 Subject: [PATCH 7/8] Upgrade rust, fix lintx, clippy Signed-off-by: Graham MacDonald --- aarch64/src/main.rs | 1 - lib/aarch64-unknown-none-elf.json | 2 +- port/src/bumpalloc.rs | 4 ++-- port/src/fdt.rs | 1 + riscv64/src/main.rs | 1 - rust-toolchain.toml | 2 +- x86_64/src/main.rs | 1 - 7 files changed, 5 insertions(+), 7 deletions(-) diff --git a/aarch64/src/main.rs b/aarch64/src/main.rs index 4929c11..984304e 100644 --- a/aarch64/src/main.rs +++ b/aarch64/src/main.rs @@ -4,7 +4,6 @@ #![cfg_attr(not(test), no_main)] #![feature(allocator_api)] #![feature(alloc_error_handler)] -#![feature(asm_const)] #![feature(const_refs_to_static)] #![feature(core_intrinsics)] #![feature(strict_provenance)] diff --git a/lib/aarch64-unknown-none-elf.json b/lib/aarch64-unknown-none-elf.json index ee81954..c12cb41 100644 --- a/lib/aarch64-unknown-none-elf.json +++ b/lib/aarch64-unknown-none-elf.json @@ -1,6 +1,6 @@ { "arch": "aarch64", - "data-layout": "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128", + "data-layout": "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128-Fn32", "disable-redzone": true, "executables": true, "features": "+strict-align,+neon,+fp-armv8", diff --git a/port/src/bumpalloc.rs b/port/src/bumpalloc.rs index 8ba7b06..dd53783 100644 --- a/port/src/bumpalloc.rs +++ b/port/src/bumpalloc.rs @@ -95,8 +95,8 @@ unsafe impl Allocator } } - unsafe fn deallocate(&self, ptr: NonNull, layout: Layout) { - panic!("Can't deallocate from Bump allocator (ptr: {:p}, layout: {:?})", ptr, layout) + unsafe fn deallocate(&self, _ptr: NonNull, _layout: Layout) { + // panic!("Can't deallocate from Bump allocator (ptr: {:p}, layout: {:?})", ptr, layout) } } diff --git a/port/src/fdt.rs b/port/src/fdt.rs index b4a6251..f05900b 100644 --- a/port/src/fdt.rs +++ b/port/src/fdt.rs @@ -46,6 +46,7 @@ fn align4(n: usize) -> usize { } /// DeviceTree is the class entrypoint to the Devicetree operations. +/// /// This code focuses only on parsing a Flattened Devicetree without using the heap. 
/// The Devicetree specification can be found here: /// https://www.devicetree.org/specifications/ diff --git a/riscv64/src/main.rs b/riscv64/src/main.rs index 73dd10d..8551859 100644 --- a/riscv64/src/main.rs +++ b/riscv64/src/main.rs @@ -1,5 +1,4 @@ #![feature(alloc_error_handler)] -#![feature(asm_const)] #![cfg_attr(not(any(test)), no_std)] #![cfg_attr(not(test), no_main)] #![allow(clippy::upper_case_acronyms)] diff --git a/rust-toolchain.toml b/rust-toolchain.toml index b6cd1b9..43c30b6 100644 --- a/rust-toolchain.toml +++ b/rust-toolchain.toml @@ -1,5 +1,5 @@ [toolchain] -channel = "nightly-2024-07-24" +channel = "nightly-2024-08-27" components = ["rustfmt", "rust-src", "clippy", "llvm-tools"] targets = [ "aarch64-unknown-none", diff --git a/x86_64/src/main.rs b/x86_64/src/main.rs index cd85932..ebd4a42 100644 --- a/x86_64/src/main.rs +++ b/x86_64/src/main.rs @@ -1,5 +1,4 @@ #![feature(alloc_error_handler)] -#![feature(asm_const)] #![feature(naked_functions)] #![feature(sync_unsafe_cell)] #![cfg_attr(not(any(test)), no_std)] From 4a11bbb98046430d8de2bb46f0364f3ba542310a Mon Sep 17 00:00:00 2001 From: Graham MacDonald Date: Wed, 25 Sep 2024 22:15:22 +0100 Subject: [PATCH 8/8] wip Signed-off-by: Graham MacDonald --- aarch64/src/init.rs | 17 +++--- aarch64/src/runtime.rs | 20 ++----- aarch64/src/vmalloc.rs | 88 ++++++++++----------------- port/src/lib.rs | 1 + port/src/vmem.rs | 16 +++-- port/src/vmemalloc.rs | 131 +++++++++++++++++++++++++++++++++++++++++ rust-toolchain.toml | 2 +- 7 files changed, 182 insertions(+), 93 deletions(-) create mode 100644 port/src/vmemalloc.rs diff --git a/aarch64/src/init.rs b/aarch64/src/init.rs index 34aa0bf..ae05f8c 100644 --- a/aarch64/src/init.rs +++ b/aarch64/src/init.rs @@ -11,7 +11,6 @@ use crate::vm::kernel_root; use crate::vm::PageTable; use crate::vmalloc; use alloc::boxed::Box; -use core::alloc::Layout; use core::ptr; use port::bumpalloc::Bump; use port::fdt::DeviceTree; @@ -130,14 +129,14 @@ pub fn init(dtb_va: usize) { println!("looping now"); - { - let test = vmalloc::alloc(unsafe { Layout::from_size_align_unchecked(1024, 16) }); - println!("test alloc: {:p}", test); - let test2 = vmalloc::alloc(unsafe { Layout::from_size_align_unchecked(1024, 16) }); - println!("test alloc: {:p}", test2); - let test3 = vmalloc::alloc(unsafe { Layout::from_size_align_unchecked(1024, 4096) }); - println!("test alloc: {:p}", test3); - } + // { + // let test = vmalloc::alloc(unsafe { Layout::from_size_align_unchecked(1024, 16) }); + // println!("test alloc: {:p}", test); + // let test2 = vmalloc::alloc(unsafe { Layout::from_size_align_unchecked(1024, 16) }); + // println!("test alloc: {:p}", test2); + // let test3 = vmalloc::alloc(unsafe { Layout::from_size_align_unchecked(1024, 4096) }); + // println!("test alloc: {:p}", test3); + // } #[allow(clippy::empty_loop)] loop {} diff --git a/aarch64/src/runtime.rs b/aarch64/src/runtime.rs index b844348..665b4ad 100644 --- a/aarch64/src/runtime.rs +++ b/aarch64/src/runtime.rs @@ -6,12 +6,15 @@ use crate::kmem::physaddr_as_virt; use crate::registers::rpi_mmio; use crate::uartmini::MiniUart; use crate::vmalloc; -use alloc::alloc::{GlobalAlloc, Layout}; +use alloc::alloc::Layout; use core::fmt::Write; use core::panic::PanicInfo; use port::devcons::PanicConsole; use port::mem::VirtRange; +#[global_allocator] +static ALLOCATOR: vmalloc::Allocator = vmalloc::Allocator {}; + // TODO // - Add qemu integration test // - Use Console via println!() macro once available @@ -40,18 +43,3 @@ pub fn panic(info: &PanicInfo) -> ! 
{ fn oom(_layout: Layout) -> ! { panic!("oom"); } - -struct Allocator {} - -unsafe impl GlobalAlloc for Allocator { - unsafe fn alloc(&self, layout: Layout) -> *mut u8 { - vmalloc::alloc(layout) - } - - unsafe fn dealloc(&self, _ptr: *mut u8, _layout: Layout) { - panic!("fake dealloc"); - } -} - -#[global_allocator] -static ALLOCATOR: Allocator = Allocator {}; diff --git a/aarch64/src/vmalloc.rs b/aarch64/src/vmalloc.rs index 7860b91..438a06c 100644 --- a/aarch64/src/vmalloc.rs +++ b/aarch64/src/vmalloc.rs @@ -1,76 +1,48 @@ -use alloc::sync::Arc; -use core::{alloc::Layout, mem::MaybeUninit}; +use alloc::alloc::{GlobalAlloc, Layout}; +use core::mem::MaybeUninit; use port::{ mcslock::{Lock, LockNode}, - mem::{VirtRange, PAGE_SIZE_4K}, - vmem::{Allocator, Arena, Boundary}, + mem::VirtRange, + vmemalloc::VmemAlloc, }; +#[cfg(not(test))] +use port::println; + // TODO replace with some sort of OnceLock? We need this to be dynamically created, // but we're assuming VmAlloc is Sync. -static VMALLOC: Lock> = Lock::new("vmalloc", None); - -// The core arenas are statically allocated. They cannot be created in const -// functions, so the we declare them as MaybeUninit before intialising and -// referening them from VmAlloc, from where they can be used in the global allocator. -//static mut MAYBE_HEAP_ARENA: MaybeUninit = MaybeUninit::uninit(); - -/// VmAlloc is an attempt to write a Bonwick vmem-style allocator. It currently -/// expects another allocator to exist beforehand. -/// TODO Use the allocator api trait. -struct VmAlloc { - heap_arena: Arc, &'static dyn core::alloc::Allocator>, - _va_arena: Arc, &'static dyn core::alloc::Allocator>, -} - -impl VmAlloc { - fn new(early_allocator: &'static dyn core::alloc::Allocator, heap_range: VirtRange) -> Self { - let heap_arena = Arc::new_in( - Lock::new( - "heap_arena", - Arena::new_with_allocator( - "heap", - Some(Boundary::from(heap_range)), - PAGE_SIZE_4K, - early_allocator, - ), - ), - early_allocator, - ); - - // va_arena imports from heap_arena, so can use allocations from that heap to - // allocate blocks of tags. 
- let va_arena = Arc::new_in( - Lock::new( - "kmem_va_arena", - Arena::new("kmem_va_arena", None, PAGE_SIZE_4K, Some(heap_arena.clone())), - ), - early_allocator, - ); - - Self { heap_arena, _va_arena: va_arena } - } -} +static VMEM_ALLOC: Lock> = Lock::new("vmemalloc", None); pub fn init(early_allocator: &'static dyn core::alloc::Allocator, heap_range: VirtRange) { let node = LockNode::new(); - let mut vmalloc = VMALLOC.lock(&node); + let mut vmalloc = VMEM_ALLOC.lock(&node); *vmalloc = Some({ - static mut MAYBE_VMALLOC: MaybeUninit = MaybeUninit::uninit(); + static mut MAYBE_VMALLOC: MaybeUninit = MaybeUninit::uninit(); unsafe { - MAYBE_VMALLOC.write(VmAlloc::new(early_allocator, heap_range)); + MAYBE_VMALLOC.write({ + let vmemalloc = VmemAlloc::new(early_allocator, heap_range); + vmemalloc.init(); + vmemalloc + }); MAYBE_VMALLOC.assume_init_mut() } }); } -pub fn alloc(layout: Layout) -> *mut u8 { - let node = LockNode::new(); - let mut lock = VMALLOC.lock(&node); - let vmalloc = lock.as_deref_mut().unwrap(); +pub struct Allocator {} - let node = LockNode::new(); - let mut guard = vmalloc.heap_arena.lock(&node); - // TODO use layout properly - guard.alloc(layout.size()) +unsafe impl GlobalAlloc for Allocator { + unsafe fn alloc(&self, layout: Layout) -> *mut u8 { + println!("vmalloc::alloc"); + + // Get the main allocator + let node = LockNode::new(); + let mut lock = VMEM_ALLOC.lock(&node); + let vmemalloc = lock.as_deref_mut().unwrap(); + vmemalloc.alloc(layout) + } + + unsafe fn dealloc(&self, _ptr: *mut u8, _layout: Layout) { + panic!("fake dealloc"); + } } diff --git a/port/src/lib.rs b/port/src/lib.rs index e5e17d6..fb0704f 100644 --- a/port/src/lib.rs +++ b/port/src/lib.rs @@ -14,5 +14,6 @@ pub mod fdt; pub mod mcslock; pub mod mem; pub mod vmem; +pub mod vmemalloc; extern crate alloc; diff --git a/port/src/vmem.rs b/port/src/vmem.rs index ee16575..91c5c90 100644 --- a/port/src/vmem.rs +++ b/port/src/vmem.rs @@ -3,9 +3,6 @@ use crate::{mcslock::Lock, mem::PAGE_SIZE_4K}; use alloc::sync::Arc; use core::{alloc::Layout, ops::Range, ptr::null_mut, slice}; -#[cfg(not(test))] -use crate::println; - // TODO reserve recursive area in vmem(?) // TODO Add hashtable for allocated tags - makes it faster when freeing, given only an address. // TODO Add support for quantum caches once we have slab allocators implemented. 
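// (Editor's note on the TODO above: in the Bonwick/Adams vmem design a
// "quantum cache" fronts an arena with small object caches for allocations of
// one to a few quanta, so the most common small requests avoid the arena's
// segment list entirely.)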
@@ -311,10 +308,11 @@ impl Arena { quantum: usize, _parent: Option, &dyn core::alloc::Allocator>>, ) -> Self { - println!("Arena::new name:{} initial_span:{:?} quantum:{:x}", name, initial_span, quantum); + // println!("Arena::new name:{} initial_span:{:?} quantum:{:x}", name, initial_span, quantum); let mut arena = Self { name, quantum, segment_list: TagList::new(), tag_pool: TagPool::new() }; + //arena.add_tags_to_pool(tags); if let Some(span) = initial_span { arena.add_initial_span(span); @@ -354,10 +352,10 @@ impl Arena { quantum: usize, tags: &mut [TagItem], ) -> Self { - println!( - "Arena::new_with_tags name:{} initial_span:{:?} quantum:{:x}", - name, initial_span, quantum - ); + // println!( + // "Arena::new_with_tags name:{} initial_span:{:?} quantum:{:x}", + // name, initial_span, quantum + // ); let mut arena = Self { name, quantum, segment_list: TagList::new(), tag_pool: TagPool::new() }; @@ -400,7 +398,7 @@ impl Arena { /// Allocate a segment, returned as a boundary fn alloc_segment(&mut self, size: usize) -> Result { - println!("alloc_segment size: {}", size); + // println!("alloc_segment size: {}", size); // Round size up to a multiple of quantum let size = { diff --git a/port/src/vmemalloc.rs b/port/src/vmemalloc.rs new file mode 100644 index 0000000..96b1125 --- /dev/null +++ b/port/src/vmemalloc.rs @@ -0,0 +1,131 @@ +use crate::{ + mcslock::{Lock, LockNode}, + mem::{VirtRange, PAGE_SIZE_4K}, + vmem::{Allocator, Arena, Boundary}, +}; +use alloc::sync::Arc; +use core::alloc::{AllocError, Layout}; +use core::ptr::NonNull; + +/// VmAlloc is an attempt to write a Bonwick vmem-style allocator. It currently +/// expects another allocator to exist beforehand. +/// TODO Use the allocator api trait. +pub struct VmemAlloc { + heap_arena: Arc, &'static dyn core::alloc::Allocator>, + va_arena: Option, &'static dyn core::alloc::Allocator>>, + kmem_default_arena: Option, &'static dyn core::alloc::Allocator>>, +} + +impl VmemAlloc { + // TODO Specify quantum caching + pub fn new( + early_allocator: &'static dyn core::alloc::Allocator, + heap_range: VirtRange, + ) -> Self { + let heap_arena = Arc::new_in( + Lock::new( + "heap_arena", + Arena::new_with_allocator( + "heap", + Some(Boundary::from(heap_range)), + PAGE_SIZE_4K, + early_allocator, + ), + ), + early_allocator, + ); + + // va_arena imports from heap_arena, so can use allocations from that heap to + // allocate blocks of tags. + let va_arena = Arc::new_in( + Lock::new( + "kmem_va", + Arena::new("kmem_va_arena", None, PAGE_SIZE_4K, Some(heap_arena.clone())), + ), + early_allocator, + ); + + // kmem_default_arena - backing store for most object caches + let kmem_default_arena = Arc::new_in( + Lock::new( + "kmem_default_arena", + Arena::new("kmem_default", None, PAGE_SIZE_4K, Some(va_arena.clone())), + ), + early_allocator, + ); + + Self { heap_arena, va_arena: Some(va_arena), kmem_default_arena: Some(kmem_default_arena) } + } + + /// Create the remaining early arenas. To be called immediately after new() + /// as it uses self as the allocator. + pub fn init(&self) { + // va_arena imports from heap_arena, so can use allocations from that heap to + // allocate blocks of tags. 
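        // Editor's note: in init() the Arcs are created with `self` as the
        // allocator, i.e. the later arenas' bookkeeping is meant to live in
        // vmem-backed memory rather than in the static bump allocator that
        // backed new().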
+ let va_arena = Arc::new_in( + Lock::new( + "kmem_va", + Arena::new("kmem_va_arena", None, PAGE_SIZE_4K, Some(self.heap_arena.clone())), + ), + self, + ); + + // kmem_default_arena - backing store for most object caches + // let kmem_default_arena = Arc::new_in( + // Lock::new( + // "kmem_default_arena", + // Arena::new("kmem_default", None, PAGE_SIZE_4K, Some(va_arena.clone())), + // ), + // self, + // ); + //self.va_arena = Some(va_arena as Allocator); + } + + pub fn alloc(&self, layout: Layout) -> *mut u8 { + let node = LockNode::new(); + let mut guard = self + .kmem_default_arena + .as_deref() + .expect("kmem_default_arena not yet created") + .lock(&node); + // TODO use layout properly + guard.alloc(layout.size()) + } +} + +unsafe impl core::alloc::Allocator for VmemAlloc { + fn allocate( + &self, + layout: Layout, + ) -> Result, core::alloc::AllocError> { + let bytes = self.alloc(layout); + if bytes.is_null() { + Err(AllocError {}) + } else { + let nonnull_bytes_ptr = NonNull::new(bytes).unwrap(); + Ok(NonNull::slice_from_raw_parts(nonnull_bytes_ptr, layout.size())) + } + } + + unsafe fn deallocate(&self, _ptr: core::ptr::NonNull, _layout: Layout) { + todo!() + } +} + +#[cfg(test)] +mod tests { + + use crate::bumpalloc::Bump; + + use super::*; + + #[test] + fn alloc_with_importing() { + static BUMP_ALLOC: Bump<{ 4 * PAGE_SIZE_4K }, PAGE_SIZE_4K> = Bump::new(0); + let vmalloc = + VmemAlloc::new(&BUMP_ALLOC, VirtRange::with_len(0xffff800000800000, 0x1000000)); + vmalloc.init(); + let b = vmalloc.alloc(unsafe { Layout::from_size_align_unchecked(1024, 1) }); + assert_ne!(b, 0 as *mut u8); + } +} diff --git a/rust-toolchain.toml b/rust-toolchain.toml index 43c30b6..a179883 100644 --- a/rust-toolchain.toml +++ b/rust-toolchain.toml @@ -1,5 +1,5 @@ [toolchain] -channel = "nightly-2024-08-27" +channel = "nightly-2024-09-08" components = ["rustfmt", "rust-src", "clippy", "llvm-tools"] targets = [ "aarch64-unknown-none",