MemoryManager.cpp 28 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815
  1. #include "CMOS.h"
  2. #include "Process.h"
  3. #include "StdLib.h"
  4. #include <AK/Assertions.h>
  5. #include <AK/kstdio.h>
  6. #include <Kernel/Arch/i386/CPU.h>
  7. #include <Kernel/FileSystem/Inode.h>
  8. #include <Kernel/Multiboot.h>
  9. #include <Kernel/VM/AnonymousVMObject.h>
  10. #include <Kernel/VM/InodeVMObject.h>
  11. #include <Kernel/VM/MemoryManager.h>
  12. //#define MM_DEBUG
  13. //#define PAGE_FAULT_DEBUG
  14. static MemoryManager* s_the;
  15. MemoryManager& MM
  16. {
  17. return *s_the;
  18. }
  19. MemoryManager::MemoryManager()
  20. {
  21. m_kernel_page_directory = PageDirectory::create_at_fixed_address(PhysicalAddress(0x4000));
  22. m_page_table_zero = (PageTableEntry*)0x6000;
  23. m_page_table_one = (PageTableEntry*)0x7000;
  24. initialize_paging();
  25. kprintf("MM initialized.\n");
  26. }
  27. MemoryManager::~MemoryManager()
  28. {
  29. }
  30. void MemoryManager::populate_page_directory(PageDirectory& page_directory)
  31. {
  32. page_directory.m_directory_page = allocate_supervisor_physical_page();
  33. page_directory.entries()[0].copy_from({}, kernel_page_directory().entries()[0]);
  34. page_directory.entries()[1].copy_from({}, kernel_page_directory().entries()[1]);
  35. // Defer to the kernel page tables for 0xC0000000-0xFFFFFFFF
  36. for (int i = 768; i < 1024; ++i)
  37. page_directory.entries()[i].copy_from({}, kernel_page_directory().entries()[i]);
  38. }
  39. void MemoryManager::initialize_paging()
  40. {
  41. memset(m_page_table_zero, 0, PAGE_SIZE);
  42. memset(m_page_table_one, 0, PAGE_SIZE);
  43. #ifdef MM_DEBUG
  44. dbgprintf("MM: Kernel page directory @ %p\n", kernel_page_directory().cr3());
  45. #endif
  46. #ifdef MM_DEBUG
  47. dbgprintf("MM: Protect against null dereferences\n");
  48. #endif
  49. // Make null dereferences crash.
  50. map_protected(VirtualAddress(0), PAGE_SIZE);
  51. #ifdef MM_DEBUG
  52. dbgprintf("MM: Identity map bottom 5MB\n");
  53. #endif
  54. // The bottom 5 MB (except for the null page) are identity mapped & supervisor only.
  55. // Every process shares these mappings.
  56. create_identity_mapping(kernel_page_directory(), VirtualAddress(PAGE_SIZE), (5 * MB) - PAGE_SIZE);
  57. // Basic memory map:
  58. // 0 -> 512 kB Kernel code. Root page directory & PDE 0.
  59. // (last page before 1MB) Used by quickmap_page().
  60. // 1 MB -> 3 MB kmalloc_eternal() space.
  61. // 3 MB -> 4 MB kmalloc() space.
  62. // 4 MB -> 5 MB Supervisor physical pages (available for allocation!)
  63. // 5 MB -> 0xc0000000 Userspace physical pages (available for allocation!)
  64. // 0xc0000000-0xffffffff Kernel-only virtual address space
  65. #ifdef MM_DEBUG
  66. dbgprintf("MM: Quickmap will use %p\n", m_quickmap_addr.get());
  67. #endif
  68. m_quickmap_addr = VirtualAddress((1 * MB) - PAGE_SIZE);
  69. RefPtr<PhysicalRegion> region;
  70. bool region_is_super = false;
  71. for (auto* mmap = (multiboot_memory_map_t*)multiboot_info_ptr->mmap_addr; (unsigned long)mmap < multiboot_info_ptr->mmap_addr + multiboot_info_ptr->mmap_length; mmap = (multiboot_memory_map_t*)((unsigned long)mmap + mmap->size + sizeof(mmap->size))) {
  72. kprintf("MM: Multiboot mmap: base_addr = 0x%x%08x, length = 0x%x%08x, type = 0x%x\n",
  73. (u32)(mmap->addr >> 32),
  74. (u32)(mmap->addr & 0xffffffff),
  75. (u32)(mmap->len >> 32),
  76. (u32)(mmap->len & 0xffffffff),
  77. (u32)mmap->type);
  78. if (mmap->type != MULTIBOOT_MEMORY_AVAILABLE)
  79. continue;
  80. // FIXME: Maybe make use of stuff below the 1MB mark?
  81. if (mmap->addr < (1 * MB))
  82. continue;
  83. if ((mmap->addr + mmap->len) > 0xffffffff)
  84. continue;
  85. auto diff = (u32)mmap->addr % PAGE_SIZE;
  86. if (diff != 0) {
  87. kprintf("MM: got an unaligned region base from the bootloader; correcting %p by %d bytes\n", mmap->addr, diff);
  88. diff = PAGE_SIZE - diff;
  89. mmap->addr += diff;
  90. mmap->len -= diff;
  91. }
  92. if ((mmap->len % PAGE_SIZE) != 0) {
  93. kprintf("MM: got an unaligned region length from the bootloader; correcting %d by %d bytes\n", mmap->len, mmap->len % PAGE_SIZE);
  94. mmap->len -= mmap->len % PAGE_SIZE;
  95. }
  96. if (mmap->len < PAGE_SIZE) {
  97. kprintf("MM: memory region from bootloader is too small; we want >= %d bytes, but got %d bytes\n", PAGE_SIZE, mmap->len);
  98. continue;
  99. }
  100. #ifdef MM_DEBUG
  101. kprintf("MM: considering memory at %p - %p\n",
  102. (u32)mmap->addr, (u32)(mmap->addr + mmap->len));
  103. #endif
  104. for (size_t page_base = mmap->addr; page_base < (mmap->addr + mmap->len); page_base += PAGE_SIZE) {
  105. auto addr = PhysicalAddress(page_base);
  106. if (page_base < 4 * MB) {
  107. // nothing
  108. } else if (page_base >= 4 * MB && page_base < 5 * MB) {
  109. if (region.is_null() || !region_is_super || region->upper().offset(PAGE_SIZE) != addr) {
  110. m_super_physical_regions.append(PhysicalRegion::create(addr, addr));
  111. region = m_super_physical_regions.last();
  112. region_is_super = true;
  113. } else {
  114. region->expand(region->lower(), addr);
  115. }
  116. } else {
  117. if (region.is_null() || region_is_super || region->upper().offset(PAGE_SIZE) != addr) {
  118. m_user_physical_regions.append(PhysicalRegion::create(addr, addr));
  119. region = &m_user_physical_regions.last();
  120. region_is_super = false;
  121. } else {
  122. region->expand(region->lower(), addr);
  123. }
  124. }
  125. }
  126. }
  127. for (auto& region : m_super_physical_regions)
  128. m_super_physical_pages += region.finalize_capacity();
  129. for (auto& region : m_user_physical_regions)
  130. m_user_physical_pages += region.finalize_capacity();
  131. #ifdef MM_DEBUG
  132. dbgprintf("MM: Installing page directory\n");
  133. #endif
  134. asm volatile("movl %%eax, %%cr3" ::"a"(kernel_page_directory().cr3()));
  135. asm volatile(
  136. "movl %%cr0, %%eax\n"
  137. "orl $0x80000001, %%eax\n"
  138. "movl %%eax, %%cr0\n" ::
  139. : "%eax", "memory");
  140. #ifdef MM_DEBUG
  141. dbgprintf("MM: Paging initialized.\n");
  142. #endif
  143. }
  144. PageTableEntry& MemoryManager::ensure_pte(PageDirectory& page_directory, VirtualAddress vaddr)
  145. {
  146. ASSERT_INTERRUPTS_DISABLED();
  147. u32 page_directory_index = (vaddr.get() >> 22) & 0x3ff;
  148. u32 page_table_index = (vaddr.get() >> 12) & 0x3ff;
  149. PageDirectoryEntry& pde = page_directory.entries()[page_directory_index];
  150. if (!pde.is_present()) {
  151. #ifdef MM_DEBUG
  152. dbgprintf("MM: PDE %u not present (requested for V%p), allocating\n", page_directory_index, vaddr.get());
  153. #endif
  154. if (page_directory_index == 0) {
  155. ASSERT(&page_directory == m_kernel_page_directory);
  156. pde.set_page_table_base((u32)m_page_table_zero);
  157. pde.set_user_allowed(false);
  158. pde.set_present(true);
  159. pde.set_writable(true);
  160. } else if (page_directory_index == 1) {
  161. ASSERT(&page_directory == m_kernel_page_directory);
  162. pde.set_page_table_base((u32)m_page_table_one);
  163. pde.set_user_allowed(false);
  164. pde.set_present(true);
  165. pde.set_writable(true);
  166. } else {
  167. //ASSERT(&page_directory != m_kernel_page_directory.ptr());
  168. auto page_table = allocate_supervisor_physical_page();
  169. #ifdef MM_DEBUG
  170. dbgprintf("MM: PD K%p (%s) at P%p allocated page table #%u (for V%p) at P%p\n",
  171. &page_directory,
  172. &page_directory == m_kernel_page_directory ? "Kernel" : "User",
  173. page_directory.cr3(),
  174. page_directory_index,
  175. vaddr.get(),
  176. page_table->paddr().get());
  177. #endif
  178. pde.set_page_table_base(page_table->paddr().get());
  179. pde.set_user_allowed(true);
  180. pde.set_present(true);
  181. pde.set_writable(true);
  182. page_directory.m_physical_pages.set(page_directory_index, move(page_table));
  183. }
  184. }
  185. return pde.page_table_base()[page_table_index];
  186. }
  187. void MemoryManager::map_protected(VirtualAddress vaddr, size_t length)
  188. {
  189. InterruptDisabler disabler;
  190. ASSERT(vaddr.is_page_aligned());
  191. for (u32 offset = 0; offset < length; offset += PAGE_SIZE) {
  192. auto pte_address = vaddr.offset(offset);
  193. auto& pte = ensure_pte(kernel_page_directory(), pte_address);
  194. pte.set_physical_page_base(pte_address.get());
  195. pte.set_user_allowed(false);
  196. pte.set_present(false);
  197. pte.set_writable(false);
  198. flush_tlb(pte_address);
  199. }
  200. }
  201. void MemoryManager::create_identity_mapping(PageDirectory& page_directory, VirtualAddress vaddr, size_t size)
  202. {
  203. InterruptDisabler disabler;
  204. ASSERT((vaddr.get() & ~PAGE_MASK) == 0);
  205. for (u32 offset = 0; offset < size; offset += PAGE_SIZE) {
  206. auto pte_address = vaddr.offset(offset);
  207. auto& pte = ensure_pte(page_directory, pte_address);
  208. pte.set_physical_page_base(pte_address.get());
  209. pte.set_user_allowed(false);
  210. pte.set_present(true);
  211. pte.set_writable(true);
  212. page_directory.flush(pte_address);
  213. }
  214. }
  215. void MemoryManager::initialize()
  216. {
  217. s_the = new MemoryManager;
  218. }
  219. Region* MemoryManager::kernel_region_from_vaddr(VirtualAddress vaddr)
  220. {
  221. if (vaddr.get() < 0xc0000000)
  222. return nullptr;
  223. for (auto& region : MM.m_kernel_regions) {
  224. if (region.contains(vaddr))
  225. return &region;
  226. }
  227. return nullptr;
  228. }
  229. Region* MemoryManager::user_region_from_vaddr(Process& process, VirtualAddress vaddr)
  230. {
  231. // FIXME: Use a binary search tree (maybe red/black?) or some other more appropriate data structure!
  232. for (auto& region : process.m_regions) {
  233. if (region.contains(vaddr))
  234. return &region;
  235. }
  236. dbg() << process << " Couldn't find user region for " << vaddr;
  237. return nullptr;
  238. }
  239. Region* MemoryManager::region_from_vaddr(Process& process, VirtualAddress vaddr)
  240. {
  241. ASSERT_INTERRUPTS_DISABLED();
  242. if (auto* region = kernel_region_from_vaddr(vaddr))
  243. return region;
  244. return user_region_from_vaddr(process, vaddr);
  245. }
  246. const Region* MemoryManager::region_from_vaddr(const Process& process, VirtualAddress vaddr)
  247. {
  248. if (auto* region = kernel_region_from_vaddr(vaddr))
  249. return region;
  250. return user_region_from_vaddr(const_cast<Process&>(process), vaddr);
  251. }
  252. bool MemoryManager::zero_page(Region& region, unsigned page_index_in_region)
  253. {
  254. ASSERT_INTERRUPTS_DISABLED();
  255. auto& vmo = region.vmobject();
  256. auto& vmo_page = vmo.physical_pages()[region.first_page_index() + page_index_in_region];
  257. sti();
  258. LOCKER(vmo.m_paging_lock);
  259. cli();
  260. if (!vmo_page.is_null()) {
  261. #ifdef PAGE_FAULT_DEBUG
  262. dbgprintf("MM: zero_page() but page already present. Fine with me!\n");
  263. #endif
  264. remap_region_page(region, page_index_in_region);
  265. return true;
  266. }
  267. if (current)
  268. current->process().did_zero_fault();
  269. auto physical_page = allocate_user_physical_page(ShouldZeroFill::Yes);
  270. #ifdef PAGE_FAULT_DEBUG
  271. dbgprintf(" >> ZERO P%p\n", physical_page->paddr().get());
  272. #endif
  273. vmo.physical_pages()[page_index_in_region] = move(physical_page);
  274. remap_region_page(region, page_index_in_region);
  275. return true;
  276. }
  277. bool MemoryManager::copy_on_write(Region& region, unsigned page_index_in_region)
  278. {
  279. ASSERT_INTERRUPTS_DISABLED();
  280. auto& vmo = region.vmobject();
  281. if (vmo.physical_pages()[page_index_in_region]->ref_count() == 1) {
  282. #ifdef PAGE_FAULT_DEBUG
  283. dbgprintf(" >> It's a COW page but nobody is sharing it anymore. Remap r/w\n");
  284. #endif
  285. region.set_should_cow(page_index_in_region, false);
  286. remap_region_page(region, page_index_in_region);
  287. return true;
  288. }
  289. if (current)
  290. current->process().did_cow_fault();
  291. #ifdef PAGE_FAULT_DEBUG
  292. dbgprintf(" >> It's a COW page and it's time to COW!\n");
  293. #endif
  294. auto physical_page_to_copy = move(vmo.physical_pages()[page_index_in_region]);
  295. auto physical_page = allocate_user_physical_page(ShouldZeroFill::No);
  296. u8* dest_ptr = quickmap_page(*physical_page);
  297. const u8* src_ptr = region.vaddr().offset(page_index_in_region * PAGE_SIZE).as_ptr();
  298. #ifdef PAGE_FAULT_DEBUG
  299. dbgprintf(" >> COW P%p <- P%p\n", physical_page->paddr().get(), physical_page_to_copy->paddr().get());
  300. #endif
  301. memcpy(dest_ptr, src_ptr, PAGE_SIZE);
  302. vmo.physical_pages()[page_index_in_region] = move(physical_page);
  303. unquickmap_page();
  304. region.set_should_cow(page_index_in_region, false);
  305. remap_region_page(region, page_index_in_region);
  306. return true;
  307. }
  308. bool MemoryManager::page_in_from_inode(Region& region, unsigned page_index_in_region)
  309. {
  310. ASSERT(region.page_directory());
  311. auto& vmo = region.vmobject();
  312. ASSERT(vmo.is_inode());
  313. auto& inode_vmobject = static_cast<InodeVMObject&>(vmo);
  314. auto& vmo_page = inode_vmobject.physical_pages()[region.first_page_index() + page_index_in_region];
  315. InterruptFlagSaver saver;
  316. sti();
  317. LOCKER(vmo.m_paging_lock);
  318. cli();
  319. if (!vmo_page.is_null()) {
  320. #ifdef PAGE_FAULT_DEBUG
  321. dbgprintf("MM: page_in_from_inode() but page already present. Fine with me!\n");
  322. #endif
  323. remap_region_page(region, page_index_in_region);
  324. return true;
  325. }
  326. if (current)
  327. current->process().did_inode_fault();
  328. #ifdef MM_DEBUG
  329. dbgprintf("MM: page_in_from_inode ready to read from inode\n");
  330. #endif
  331. sti();
  332. u8 page_buffer[PAGE_SIZE];
  333. auto& inode = inode_vmobject.inode();
  334. auto nread = inode.read_bytes((region.first_page_index() + page_index_in_region) * PAGE_SIZE, PAGE_SIZE, page_buffer, nullptr);
  335. if (nread < 0) {
  336. kprintf("MM: page_in_from_inode had error (%d) while reading!\n", nread);
  337. return false;
  338. }
  339. if (nread < PAGE_SIZE) {
  340. // If we read less than a page, zero out the rest to avoid leaking uninitialized data.
  341. memset(page_buffer + nread, 0, PAGE_SIZE - nread);
  342. }
  343. cli();
  344. vmo_page = allocate_user_physical_page(ShouldZeroFill::No);
  345. if (vmo_page.is_null()) {
  346. kprintf("MM: page_in_from_inode was unable to allocate a physical page\n");
  347. return false;
  348. }
  349. remap_region_page(region, page_index_in_region);
  350. u8* dest_ptr = region.vaddr().offset(page_index_in_region * PAGE_SIZE).as_ptr();
  351. memcpy(dest_ptr, page_buffer, PAGE_SIZE);
  352. return true;
  353. }
  354. Region* MemoryManager::region_from_vaddr(VirtualAddress vaddr)
  355. {
  356. if (auto* region = kernel_region_from_vaddr(vaddr))
  357. return region;
  358. auto page_directory = PageDirectory::find_by_pdb(cpu_cr3());
  359. if (!page_directory)
  360. return nullptr;
  361. ASSERT(page_directory->process());
  362. return user_region_from_vaddr(*page_directory->process(), vaddr);
  363. }
  364. PageFaultResponse MemoryManager::handle_page_fault(const PageFault& fault)
  365. {
  366. ASSERT_INTERRUPTS_DISABLED();
  367. ASSERT(current);
  368. #ifdef PAGE_FAULT_DEBUG
  369. dbgprintf("MM: handle_page_fault(%w) at V%p\n", fault.code(), fault.vaddr().get());
  370. #endif
  371. ASSERT(fault.vaddr() != m_quickmap_addr);
  372. if (fault.type() == PageFault::Type::PageNotPresent && fault.vaddr().get() >= 0xc0000000) {
  373. auto* current_page_directory = reinterpret_cast<PageDirectoryEntry*>(cpu_cr3());
  374. u32 page_directory_index = (fault.vaddr().get() >> 22) & 0x3ff;
  375. auto& kernel_pde = kernel_page_directory().entries()[page_directory_index];
  376. auto& current_pde = current_page_directory[page_directory_index];
  377. if (kernel_pde.is_present() && !current_pde.is_present()) {
  378. dbg() << "NP(kernel): Copying new kernel mapping for " << fault.vaddr() << " into current page directory";
  379. current_pde.copy_from({}, kernel_pde);
  380. flush_tlb(fault.vaddr().page_base());
  381. return PageFaultResponse::Continue;
  382. }
  383. }
  384. auto* region = region_from_vaddr(fault.vaddr());
  385. if (!region) {
  386. kprintf("NP(error) fault at invalid address V%p\n", fault.vaddr().get());
  387. return PageFaultResponse::ShouldCrash;
  388. }
  389. auto page_index_in_region = region->page_index_from_address(fault.vaddr());
  390. if (fault.type() == PageFault::Type::PageNotPresent) {
  391. if (region->vmobject().is_inode()) {
  392. #ifdef PAGE_FAULT_DEBUG
  393. dbgprintf("NP(inode) fault in Region{%p}[%u]\n", region, page_index_in_region);
  394. #endif
  395. page_in_from_inode(*region, page_index_in_region);
  396. return PageFaultResponse::Continue;
  397. }
  398. #ifdef PAGE_FAULT_DEBUG
  399. dbgprintf("NP(zero) fault in Region{%p}[%u]\n", region, page_index_in_region);
  400. #endif
  401. zero_page(*region, page_index_in_region);
  402. return PageFaultResponse::Continue;
  403. }
  404. ASSERT(fault.type() == PageFault::Type::ProtectionViolation);
  405. if (fault.access() == PageFault::Access::Write && region->should_cow(page_index_in_region)) {
  406. #ifdef PAGE_FAULT_DEBUG
  407. dbgprintf("PV(cow) fault in Region{%p}[%u]\n", region, page_index_in_region);
  408. #endif
  409. bool success = copy_on_write(*region, page_index_in_region);
  410. ASSERT(success);
  411. return PageFaultResponse::Continue;
  412. }
  413. kprintf("PV(error) fault in Region{%p}[%u] at V%p\n", region, page_index_in_region, fault.vaddr().get());
  414. return PageFaultResponse::ShouldCrash;
  415. }
  416. OwnPtr<Region> MemoryManager::allocate_kernel_region(size_t size, const StringView& name, bool user_accessible, bool should_commit)
  417. {
  418. InterruptDisabler disabler;
  419. ASSERT(!(size % PAGE_SIZE));
  420. auto range = kernel_page_directory().range_allocator().allocate_anywhere(size);
  421. ASSERT(range.is_valid());
  422. OwnPtr<Region> region;
  423. if (user_accessible)
  424. region = Region::create_user_accessible(range, name, PROT_READ | PROT_WRITE | PROT_EXEC);
  425. else
  426. region = Region::create_kernel_only(range, name, PROT_READ | PROT_WRITE | PROT_EXEC);
  427. MM.map_region_at_address(*m_kernel_page_directory, *region, range.base());
  428. // FIXME: It would be cool if these could zero-fill on demand instead.
  429. if (should_commit)
  430. region->commit();
  431. return region;
  432. }
  433. OwnPtr<Region> MemoryManager::allocate_user_accessible_kernel_region(size_t size, const StringView& name)
  434. {
  435. return allocate_kernel_region(size, name, true);
  436. }
  437. void MemoryManager::deallocate_user_physical_page(PhysicalPage&& page)
  438. {
  439. for (auto& region : m_user_physical_regions) {
  440. if (!region.contains(page)) {
  441. kprintf(
  442. "MM: deallocate_user_physical_page: %p not in %p -> %p\n",
  443. page.paddr(), region.lower().get(), region.upper().get());
  444. continue;
  445. }
  446. region.return_page(move(page));
  447. --m_user_physical_pages_used;
  448. return;
  449. }
  450. kprintf("MM: deallocate_user_physical_page couldn't figure out region for user page @ %p\n", page.paddr());
  451. ASSERT_NOT_REACHED();
  452. }
  453. RefPtr<PhysicalPage> MemoryManager::allocate_user_physical_page(ShouldZeroFill should_zero_fill)
  454. {
  455. InterruptDisabler disabler;
  456. RefPtr<PhysicalPage> page;
  457. for (auto& region : m_user_physical_regions) {
  458. page = region.take_free_page(false);
  459. if (page.is_null())
  460. continue;
  461. }
  462. if (!page) {
  463. if (m_user_physical_regions.is_empty()) {
  464. kprintf("MM: no user physical regions available (?)\n");
  465. }
  466. kprintf("MM: no user physical pages available\n");
  467. ASSERT_NOT_REACHED();
  468. return {};
  469. }
  470. #ifdef MM_DEBUG
  471. dbgprintf("MM: allocate_user_physical_page vending P%p\n", page->paddr().get());
  472. #endif
  473. if (should_zero_fill == ShouldZeroFill::Yes) {
  474. auto* ptr = (u32*)quickmap_page(*page);
  475. fast_u32_fill(ptr, 0, PAGE_SIZE / sizeof(u32));
  476. unquickmap_page();
  477. }
  478. ++m_user_physical_pages_used;
  479. return page;
  480. }
  481. void MemoryManager::deallocate_supervisor_physical_page(PhysicalPage&& page)
  482. {
  483. for (auto& region : m_super_physical_regions) {
  484. if (!region.contains(page)) {
  485. kprintf(
  486. "MM: deallocate_supervisor_physical_page: %p not in %p -> %p\n",
  487. page.paddr(), region.lower().get(), region.upper().get());
  488. continue;
  489. }
  490. region.return_page(move(page));
  491. --m_super_physical_pages_used;
  492. return;
  493. }
  494. kprintf("MM: deallocate_supervisor_physical_page couldn't figure out region for super page @ %p\n", page.paddr());
  495. ASSERT_NOT_REACHED();
  496. }
  497. RefPtr<PhysicalPage> MemoryManager::allocate_supervisor_physical_page()
  498. {
  499. InterruptDisabler disabler;
  500. RefPtr<PhysicalPage> page;
  501. for (auto& region : m_super_physical_regions) {
  502. page = region.take_free_page(true);
  503. if (page.is_null())
  504. continue;
  505. }
  506. if (!page) {
  507. if (m_super_physical_regions.is_empty()) {
  508. kprintf("MM: no super physical regions available (?)\n");
  509. }
  510. kprintf("MM: no super physical pages available\n");
  511. ASSERT_NOT_REACHED();
  512. return {};
  513. }
  514. #ifdef MM_DEBUG
  515. dbgprintf("MM: allocate_supervisor_physical_page vending P%p\n", page->paddr().get());
  516. #endif
  517. fast_u32_fill((u32*)page->paddr().as_ptr(), 0, PAGE_SIZE / sizeof(u32));
  518. ++m_super_physical_pages_used;
  519. return page;
  520. }
  521. void MemoryManager::enter_process_paging_scope(Process& process)
  522. {
  523. ASSERT(current);
  524. InterruptDisabler disabler;
  525. current->tss().cr3 = process.page_directory().cr3();
  526. asm volatile("movl %%eax, %%cr3" ::"a"(process.page_directory().cr3())
  527. : "memory");
  528. }
  529. void MemoryManager::flush_entire_tlb()
  530. {
  531. asm volatile(
  532. "mov %%cr3, %%eax\n"
  533. "mov %%eax, %%cr3\n" ::
  534. : "%eax", "memory");
  535. }
  536. void MemoryManager::flush_tlb(VirtualAddress vaddr)
  537. {
  538. asm volatile("invlpg %0"
  539. :
  540. : "m"(*(char*)vaddr.get())
  541. : "memory");
  542. }
  543. void MemoryManager::map_for_kernel(VirtualAddress vaddr, PhysicalAddress paddr, bool cache_disabled)
  544. {
  545. auto& pte = ensure_pte(kernel_page_directory(), vaddr);
  546. pte.set_physical_page_base(paddr.get());
  547. pte.set_present(true);
  548. pte.set_writable(true);
  549. pte.set_user_allowed(false);
  550. pte.set_cache_disabled(cache_disabled);
  551. flush_tlb(vaddr);
  552. }
  553. u8* MemoryManager::quickmap_page(PhysicalPage& physical_page)
  554. {
  555. ASSERT_INTERRUPTS_DISABLED();
  556. ASSERT(!m_quickmap_in_use);
  557. m_quickmap_in_use = true;
  558. auto page_vaddr = m_quickmap_addr;
  559. auto& pte = ensure_pte(kernel_page_directory(), page_vaddr);
  560. pte.set_physical_page_base(physical_page.paddr().get());
  561. pte.set_present(true);
  562. pte.set_writable(true);
  563. pte.set_user_allowed(false);
  564. flush_tlb(page_vaddr);
  565. ASSERT((u32)pte.physical_page_base() == physical_page.paddr().get());
  566. #ifdef MM_DEBUG
  567. dbg() << "MM: >> quickmap_page " << page_vaddr << " => " << physical_page.paddr() << " @ PTE=" << (void*)pte.raw() << " {" << &pte << "}";
  568. #endif
  569. return page_vaddr.as_ptr();
  570. }
  571. void MemoryManager::unquickmap_page()
  572. {
  573. ASSERT_INTERRUPTS_DISABLED();
  574. ASSERT(m_quickmap_in_use);
  575. auto page_vaddr = m_quickmap_addr;
  576. auto& pte = ensure_pte(kernel_page_directory(), page_vaddr);
  577. #ifdef MM_DEBUG
  578. auto old_physical_address = pte.physical_page_base();
  579. #endif
  580. pte.set_physical_page_base(0);
  581. pte.set_present(false);
  582. pte.set_writable(false);
  583. flush_tlb(page_vaddr);
  584. #ifdef MM_DEBUG
  585. dbg() << "MM: >> unquickmap_page " << page_vaddr << " =/> " << old_physical_address;
  586. #endif
  587. m_quickmap_in_use = false;
  588. }
  589. void MemoryManager::remap_region_page(Region& region, unsigned page_index_in_region)
  590. {
  591. ASSERT(region.page_directory());
  592. InterruptDisabler disabler;
  593. auto page_vaddr = region.vaddr().offset(page_index_in_region * PAGE_SIZE);
  594. auto& pte = ensure_pte(*region.page_directory(), page_vaddr);
  595. auto& physical_page = region.vmobject().physical_pages()[page_index_in_region];
  596. ASSERT(physical_page);
  597. pte.set_physical_page_base(physical_page->paddr().get());
  598. pte.set_present(true); // FIXME: Maybe we should use the is_readable flag here?
  599. if (region.should_cow(page_index_in_region))
  600. pte.set_writable(false);
  601. else
  602. pte.set_writable(region.is_writable());
  603. pte.set_user_allowed(region.is_user_accessible());
  604. region.page_directory()->flush(page_vaddr);
  605. #ifdef MM_DEBUG
  606. dbg() << "MM: >> remap_region_page (PD=" << region.page_directory()->cr3() << ", PTE=" << (void*)pte.raw() << "{" << &pte << "}) " << region.name() << " " << page_vaddr << " => " << physical_page->paddr() << " (@" << physical_page.ptr() << ")";
  607. #endif
  608. }
  609. void MemoryManager::remap_region(PageDirectory& page_directory, Region& region)
  610. {
  611. InterruptDisabler disabler;
  612. ASSERT(region.page_directory() == &page_directory);
  613. map_region_at_address(page_directory, region, region.vaddr());
  614. }
  615. void MemoryManager::map_region_at_address(PageDirectory& page_directory, Region& region, VirtualAddress vaddr)
  616. {
  617. InterruptDisabler disabler;
  618. region.set_page_directory(page_directory);
  619. auto& vmo = region.vmobject();
  620. #ifdef MM_DEBUG
  621. dbgprintf("MM: map_region_at_address will map VMO pages %u - %u (VMO page count: %u)\n", region.first_page_index(), region.last_page_index(), vmo.page_count());
  622. #endif
  623. for (size_t i = 0; i < region.page_count(); ++i) {
  624. auto page_vaddr = vaddr.offset(i * PAGE_SIZE);
  625. auto& pte = ensure_pte(page_directory, page_vaddr);
  626. auto& physical_page = vmo.physical_pages()[region.first_page_index() + i];
  627. if (physical_page) {
  628. pte.set_physical_page_base(physical_page->paddr().get());
  629. pte.set_present(true); // FIXME: Maybe we should use the is_readable flag here?
  630. // FIXME: It seems wrong that the *region* cow map is essentially using *VMO* relative indices.
  631. if (region.should_cow(region.first_page_index() + i))
  632. pte.set_writable(false);
  633. else
  634. pte.set_writable(region.is_writable());
  635. } else {
  636. pte.set_physical_page_base(0);
  637. pte.set_present(false);
  638. pte.set_writable(region.is_writable());
  639. }
  640. pte.set_user_allowed(region.is_user_accessible());
  641. page_directory.flush(page_vaddr);
  642. #ifdef MM_DEBUG
  643. dbgprintf("MM: >> map_region_at_address (PD=%p) '%s' V%p => P%p (@%p)\n", &page_directory, region.name().characters(), page_vaddr, physical_page ? physical_page->paddr().get() : 0, physical_page.ptr());
  644. #endif
  645. }
  646. }
  647. bool MemoryManager::unmap_region(Region& region, bool deallocate_range)
  648. {
  649. ASSERT(region.page_directory());
  650. InterruptDisabler disabler;
  651. for (size_t i = 0; i < region.page_count(); ++i) {
  652. auto vaddr = region.vaddr().offset(i * PAGE_SIZE);
  653. auto& pte = ensure_pte(*region.page_directory(), vaddr);
  654. pte.set_physical_page_base(0);
  655. pte.set_present(false);
  656. pte.set_writable(false);
  657. pte.set_user_allowed(false);
  658. region.page_directory()->flush(vaddr);
  659. #ifdef MM_DEBUG
  660. auto& physical_page = region.vmobject().physical_pages()[region.first_page_index() + i];
  661. dbgprintf("MM: >> Unmapped V%p => P%p <<\n", vaddr, physical_page ? physical_page->paddr().get() : 0);
  662. #endif
  663. }
  664. if (deallocate_range)
  665. region.page_directory()->range_allocator().deallocate(region.range());
  666. region.release_page_directory();
  667. return true;
  668. }
  669. bool MemoryManager::map_region(Process& process, Region& region)
  670. {
  671. map_region_at_address(process.page_directory(), region, region.vaddr());
  672. return true;
  673. }
  674. bool MemoryManager::validate_user_read(const Process& process, VirtualAddress vaddr) const
  675. {
  676. auto* region = region_from_vaddr(process, vaddr);
  677. return region && region->is_readable();
  678. }
  679. bool MemoryManager::validate_user_write(const Process& process, VirtualAddress vaddr) const
  680. {
  681. auto* region = region_from_vaddr(process, vaddr);
  682. return region && region->is_writable();
  683. }
  684. void MemoryManager::register_vmo(VMObject& vmo)
  685. {
  686. InterruptDisabler disabler;
  687. m_vmobjects.append(&vmo);
  688. }
  689. void MemoryManager::unregister_vmo(VMObject& vmo)
  690. {
  691. InterruptDisabler disabler;
  692. m_vmobjects.remove(&vmo);
  693. }
  694. void MemoryManager::register_region(Region& region)
  695. {
  696. InterruptDisabler disabler;
  697. if (region.vaddr().get() >= 0xc0000000)
  698. m_kernel_regions.append(&region);
  699. else
  700. m_user_regions.append(&region);
  701. }
  702. void MemoryManager::unregister_region(Region& region)
  703. {
  704. InterruptDisabler disabler;
  705. if (region.vaddr().get() >= 0xc0000000)
  706. m_kernel_regions.remove(&region);
  707. else
  708. m_user_regions.remove(&region);
  709. }
  710. ProcessPagingScope::ProcessPagingScope(Process& process)
  711. {
  712. ASSERT(current);
  713. MM.enter_process_paging_scope(process);
  714. }
  715. ProcessPagingScope::~ProcessPagingScope()
  716. {
  717. MM.enter_process_paging_scope(current->process());
  718. }