mmap.c 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541
  1. #include "mm.h"
  2. #include "slab.h"
  3. #include "internal.h"
  4. #include <common/compiler.h>
  5. extern uint64_t mm_total_2M_pages;
  6. /**
  7. * @brief 虚拟地址长度所需要的entry数量
  8. *
  9. */
  10. typedef struct
  11. {
  12. int64_t num_PML4E;
  13. int64_t num_PDPTE;
  14. int64_t num_PDE;
  15. int64_t num_PTE;
  16. } mm_pgt_entry_num_t;
  17. /**
  18. * @brief 计算虚拟地址长度对应的页表entry数量
  19. *
  20. * @param length 长度
  21. * @param ent 返回的entry数量结构体
  22. */
  23. static void mm_calculate_entry_num(uint64_t length, mm_pgt_entry_num_t *ent)
  24. {
  25. if (ent == NULL)
  26. return;
  27. ent->num_PML4E = (length + (1UL << PAGE_GDT_SHIFT) - 1) >> PAGE_GDT_SHIFT;
  28. ent->num_PDPTE = (length + PAGE_1G_SIZE - 1) >> PAGE_1G_SHIFT;
  29. ent->num_PDE = (length + PAGE_2M_SIZE - 1) >> PAGE_2M_SHIFT;
  30. ent->num_PTE = (length + PAGE_4K_SIZE - 1) >> PAGE_4K_SHIFT;
  31. }
  32. /**
  33. * @brief 将物理地址映射到页表的函数
  34. *
  35. * @param virt_addr_start 要映射到的虚拟地址的起始位置
  36. * @param phys_addr_start 物理地址的起始位置
  37. * @param length 要映射的区域的长度(字节)
  38. * @param flags 标志位
  39. * @param use4k 是否使用4k页
  40. */
  41. int mm_map_phys_addr(ul virt_addr_start, ul phys_addr_start, ul length, ul flags, bool use4k)
  42. {
  43. uint64_t global_CR3 = (uint64_t)get_CR3();
  44. return mm_map_proc_page_table(global_CR3, true, virt_addr_start, phys_addr_start, length, flags, false, true, use4k);
  45. }
  46. int mm_map_phys_addr_user(ul virt_addr_start, ul phys_addr_start, ul length, ul flags)
  47. {
  48. uint64_t global_CR3 = (uint64_t)get_CR3();
  49. return mm_map_proc_page_table(global_CR3, true, virt_addr_start, phys_addr_start, length, flags, true, true, false);
  50. }
  51. /**
  52. * @brief 将将物理地址填写到进程的页表的函数
  53. *
  54. * @param proc_page_table_addr 页表的基地址
  55. * @param is_phys 页表的基地址是否为物理地址
  56. * @param virt_addr_start 要映射到的虚拟地址的起始位置
  57. * @param phys_addr_start 物理地址的起始位置
  58. * @param length 要映射的区域的长度(字节)
  59. * @param user 用户态是否可访问
  60. * @param flush 是否刷新tlb
  61. * @param use4k 是否使用4k页
  62. */
  63. int mm_map_proc_page_table(ul proc_page_table_addr, bool is_phys, ul virt_addr_start, ul phys_addr_start, ul length, ul flags, bool user, bool flush, bool use4k)
  64. {
  65. // 计算线性地址对应的pml4页表项的地址
  66. mm_pgt_entry_num_t pgt_num;
  67. mm_calculate_entry_num(length, &pgt_num);
  68. // 已映射的内存大小
  69. uint64_t length_mapped = 0;
  70. // 对user标志位进行校正
  71. if ((flags & PAGE_U_S) != 0)
  72. user = true;
  73. else
  74. user = false;
  75. uint64_t pml4e_id = ((virt_addr_start >> PAGE_GDT_SHIFT) & 0x1ff);
  76. uint64_t *pml4_ptr;
  77. if (is_phys)
  78. pml4_ptr = phys_2_virt((ul *)((ul)proc_page_table_addr & (~0xfffUL)));
  79. else
  80. pml4_ptr = (ul *)((ul)proc_page_table_addr & (~0xfffUL));
  81. // 循环填写顶层页表
  82. for (; (pgt_num.num_PML4E > 0) && pml4e_id < 512; ++pml4e_id)
  83. {
  84. // 剩余需要处理的pml4E -1
  85. --(pgt_num.num_PML4E);
  86. ul *pml4e_ptr = pml4_ptr + pml4e_id;
  87. // 创建新的二级页表
  88. if (*pml4e_ptr == 0)
  89. {
  90. ul *virt_addr = kmalloc(PAGE_4K_SIZE, 0);
  91. memset(virt_addr, 0, PAGE_4K_SIZE);
  92. set_pml4t(pml4e_ptr, mk_pml4t(virt_2_phys(virt_addr), (user ? PAGE_USER_PGT : PAGE_KERNEL_PGT)));
  93. }
  94. uint64_t pdpte_id = (((virt_addr_start + length_mapped) >> PAGE_1G_SHIFT) & 0x1ff);
  95. uint64_t *pdpt_ptr = (uint64_t *)phys_2_virt(*pml4e_ptr & (~0xfffUL));
  96. // 循环填写二级页表
  97. for (; (pgt_num.num_PDPTE > 0) && pdpte_id < 512; ++pdpte_id)
  98. {
  99. --pgt_num.num_PDPTE;
  100. uint64_t *pdpte_ptr = (pdpt_ptr + pdpte_id);
  101. // 创建新的三级页表
  102. if (*pdpte_ptr == 0)
  103. {
  104. ul *virt_addr = kmalloc(PAGE_4K_SIZE, 0);
  105. memset(virt_addr, 0, PAGE_4K_SIZE);
  106. set_pdpt(pdpte_ptr, mk_pdpt(virt_2_phys(virt_addr), (user ? PAGE_USER_DIR : PAGE_KERNEL_DIR)));
  107. }
  108. uint64_t pde_id = (((virt_addr_start + length_mapped) >> PAGE_2M_SHIFT) & 0x1ff);
  109. uint64_t *pd_ptr = (uint64_t *)phys_2_virt(*pdpte_ptr & (~0xfffUL));
  110. // 循环填写三级页表,初始化2M物理页
  111. for (; (pgt_num.num_PDE > 0) && pde_id < 512; ++pde_id)
  112. {
  113. --pgt_num.num_PDE;
  114. // 计算当前2M物理页对应的pdt的页表项的物理地址
  115. ul *pde_ptr = pd_ptr + pde_id;
  116. // ====== 使用4k页 =======
  117. if (unlikely(use4k))
  118. {
  119. // kdebug("use 4k");
  120. if (*pde_ptr == 0)
  121. {
  122. // 创建四级页表
  123. uint64_t *vaddr = kmalloc(PAGE_4K_SIZE, 0);
  124. memset(vaddr, 0, PAGE_4K_SIZE);
  125. set_pdt(pde_ptr, mk_pdt(virt_2_phys(vaddr), (user ? PAGE_USER_PDE : PAGE_KERNEL_PDE)));
  126. }
  127. else if (unlikely(*pde_ptr & (1 << 7)))
  128. {
  129. // 当前页表项已经被映射了2MB物理页
  130. goto failed;
  131. }
  132. uint64_t pte_id = (((virt_addr_start + length_mapped) >> PAGE_4K_SHIFT) & 0x1ff);
  133. uint64_t *pt_ptr = (uint64_t *)phys_2_virt(*pde_ptr & (~0xfffUL));
  134. // 循环填写4级页表,初始化4K页
  135. for (; (pgt_num.num_PTE > 0) && pte_id < 512; ++pte_id)
  136. {
  137. --pgt_num.num_PTE;
  138. uint64_t *pte_ptr = pt_ptr + pte_id;
  139. if (unlikely(*pte_ptr != 0))
  140. kwarn("pte already exists.");
  141. else
  142. set_pt(pte_ptr, mk_pt((ul)phys_addr_start + length_mapped, flags | (user ? PAGE_USER_4K_PAGE : PAGE_KERNEL_4K_PAGE)));
  143. length_mapped += PAGE_4K_SIZE;
  144. }
  145. }
  146. // ======= 使用2M页 ========
  147. else
  148. {
  149. if (unlikely((*pde_ptr != 0) && user == true))
  150. {
  151. // 如果是用户态可访问的页,则释放当前新获取的物理页
  152. if (likely((((ul)phys_addr_start + length_mapped) >> PAGE_2M_SHIFT) < mm_total_2M_pages)) // 校验是否为内存中的物理页
  153. free_pages(Phy_to_2M_Page((ul)phys_addr_start + length_mapped), 1);
  154. length_mapped += PAGE_2M_SIZE;
  155. continue;
  156. }
  157. // 页面写穿,禁止缓存
  158. set_pdt(pde_ptr, mk_pdt((ul)phys_addr_start + length_mapped, flags | (user ? PAGE_USER_PAGE : PAGE_KERNEL_PAGE)));
  159. length_mapped += PAGE_2M_SIZE;
  160. }
  161. }
  162. }
  163. }
  164. if (likely(flush))
  165. flush_tlb();
  166. return 0;
  167. failed:;
  168. kerror("Map memory failed. use4k=%d, vaddr=%#018lx, paddr=%#018lx", use4k, virt_addr_start, phys_addr_start);
  169. return -EFAULT;
  170. }
  171. /**
  172. * @brief 从页表中清除虚拟地址的映射
  173. *
  174. * @param proc_page_table_addr 页表的地址
  175. * @param is_phys 页表地址是否为物理地址
  176. * @param virt_addr_start 要清除的虚拟地址的起始地址
  177. * @param length 要清除的区域的长度
  178. */
  179. void mm_unmap_proc_table(ul proc_page_table_addr, bool is_phys, ul virt_addr_start, ul length)
  180. {
  181. // 计算线性地址对应的pml4页表项的地址
  182. mm_pgt_entry_num_t pgt_num;
  183. mm_calculate_entry_num(length, &pgt_num);
  184. // 已取消映射的内存大小
  185. uint64_t length_unmapped = 0;
  186. uint64_t pml4e_id = ((virt_addr_start >> PAGE_GDT_SHIFT) & 0x1ff);
  187. uint64_t *pml4_ptr;
  188. if (is_phys)
  189. pml4_ptr = phys_2_virt((ul *)((ul)proc_page_table_addr & (~0xfffUL)));
  190. else
  191. pml4_ptr = (ul *)((ul)proc_page_table_addr & (~0xfffUL));
  192. // 循环填写顶层页表
  193. for (; (pgt_num.num_PML4E > 0) && pml4e_id < 512; ++pml4e_id)
  194. {
  195. // 剩余需要处理的pml4E -1
  196. --(pgt_num.num_PML4E);
  197. ul *pml4e_ptr = NULL;
  198. pml4e_ptr = pml4_ptr + pml4e_id;
  199. // 二级页表不存在
  200. if (*pml4e_ptr == 0)
  201. {
  202. continue;
  203. }
  204. uint64_t pdpte_id = (((virt_addr_start + length_unmapped) >> PAGE_1G_SHIFT) & 0x1ff);
  205. uint64_t *pdpt_ptr = (uint64_t *)phys_2_virt(*pml4e_ptr & (~0xfffUL));
  206. // kdebug("pdpt_ptr=%#018lx", pdpt_ptr);
  207. // 循环处理二级页表
  208. for (; (pgt_num.num_PDPTE > 0) && pdpte_id < 512; ++pdpte_id)
  209. {
  210. --pgt_num.num_PDPTE;
  211. uint64_t *pdpte_ptr = (pdpt_ptr + pdpte_id);
  212. // kdebug("pgt_num.num_PDPTE=%ld pdpte_ptr=%#018lx", pgt_num.num_PDPTE, pdpte_ptr);
  213. // 三级页表为空
  214. if (*pdpte_ptr == 0)
  215. {
  216. continue;
  217. }
  218. uint64_t pde_id = (((virt_addr_start + length_unmapped) >> PAGE_2M_SHIFT) & 0x1ff);
  219. uint64_t *pd_ptr = (uint64_t *)phys_2_virt(*pdpte_ptr & (~0xfffUL));
  220. // kdebug("pd_ptr=%#018lx, *pd_ptr=%#018lx", pd_ptr, *pd_ptr);
  221. // 循环处理三级页表
  222. for (; (pgt_num.num_PDE > 0) && pde_id < 512; ++pde_id)
  223. {
  224. --pgt_num.num_PDE;
  225. // 计算当前2M物理页对应的pdt的页表项的物理地址
  226. ul *pde_ptr = pd_ptr + pde_id;
  227. // 存在4级页表
  228. if (((*pde_ptr) & (1 << 7)) == 0)
  229. {
  230. // 存在4K页
  231. uint64_t pte_id = (((virt_addr_start + length_unmapped) >> PAGE_4K_SHIFT) & 0x1ff);
  232. uint64_t *pt_ptr = (uint64_t *)phys_2_virt(*pde_ptr & (~0xfffUL));
  233. // 循环处理4K页表
  234. for (; pgt_num.num_PTE > 0 && pte_id < 512; ++pte_id)
  235. {
  236. uint64_t *pte_ptr = pt_ptr + pte_id;
  237. --pgt_num.num_PTE;
  238. *pte_ptr = 0;
  239. length_unmapped += PAGE_4K_SIZE;
  240. }
  241. // 4级页表已经空了,释放页表
  242. if (unlikely(mm_check_page_table(pt_ptr)) == 0)
  243. {
  244. *pde_ptr = 0;
  245. kfree(pt_ptr);
  246. }
  247. }
  248. else
  249. {
  250. *pde_ptr = 0;
  251. length_unmapped += PAGE_2M_SIZE;
  252. pgt_num.num_PTE -= 512;
  253. }
  254. }
  255. // 3级页表已经空了,释放页表
  256. if (unlikely(mm_check_page_table(pd_ptr)) == 0)
  257. {
  258. *pdpte_ptr = 0;
  259. kfree(pd_ptr);
  260. }
  261. }
  262. // 2级页表已经空了,释放页表
  263. if (unlikely(mm_check_page_table(pdpt_ptr)) == 0)
  264. {
  265. *pml4e_ptr = 0;
  266. kfree(pdpt_ptr);
  267. }
  268. }
  269. flush_tlb();
  270. }
  271. /**
  272. * @brief 创建VMA
  273. *
  274. * @param mm 要绑定的内存空间分布结构体
  275. * @param vaddr 起始虚拟地址
  276. * @param length 长度(字节)
  277. * @param vm_flags vma的标志
  278. * @param vm_ops vma的操作接口
  279. * @param res_vma 返回的vma指针
  280. * @return int 错误码
  281. */
  282. int mm_create_vma(struct mm_struct *mm, uint64_t vaddr, uint64_t length, vm_flags_t vm_flags, struct vm_operations_t *vm_ops, struct vm_area_struct **res_vma)
  283. {
  284. int retval = 0;
  285. struct vm_area_struct *vma = vm_area_alloc(mm);
  286. if (unlikely(vma == NULL))
  287. return -ENOMEM;
  288. vma->vm_ops = vm_ops;
  289. vma->vm_flags = vm_flags;
  290. vma->vm_start = vaddr;
  291. vma->vm_end = vaddr + length;
  292. // 将VMA加入mm的链表
  293. retval = vma_insert(mm, vma);
  294. if (retval == -EEXIST) // 之前已经存在了相同的vma,直接返回
  295. {
  296. *res_vma = vma_find(mm, vma->vm_start);
  297. kfree(vma);
  298. return -EEXIST;
  299. }
  300. if (res_vma != NULL)
  301. *res_vma = vma;
  302. return 0;
  303. }
  304. /**
  305. * @brief 将指定的物理地址映射到指定的vma处
  306. *
  307. * @param vma 要进行映射的VMA结构体
  308. * @param paddr 起始物理地址
  309. * @return int 错误码
  310. */
  311. int mm_map_vma(struct vm_area_struct *vma, uint64_t paddr)
  312. {
  313. int retval = 0;
  314. // 获取物理地址对应的页面
  315. struct Page *pg;
  316. if (vma->vm_flags & VM_IO) // 对于mmio的内存,创建新的page结构体
  317. {
  318. if (unlikely(vma->anon_vma == NULL || vma->anon_vma->page == NULL))
  319. pg = __create_mmio_page_struct(paddr);
  320. else
  321. pg = vma->anon_vma->page;
  322. }
  323. else
  324. pg = Phy_to_2M_Page(paddr);
  325. if (unlikely(pg->anon_vma == NULL)) // 若页面不存在anon_vma,则为页面创建anon_vma
  326. {
  327. spin_lock(&pg->op_lock);
  328. if (unlikely(pg->anon_vma == NULL))
  329. __anon_vma_create_alloc(pg, false);
  330. spin_unlock(&pg->op_lock);
  331. }
  332. barrier();
  333. // 将anon vma与vma进行绑定
  334. __anon_vma_add(pg->anon_vma, vma);
  335. barrier();
  336. uint64_t length = vma->vm_end - vma->vm_start;
  337. // ==== 将地址映射到页表 ====
  338. uint64_t len_4k = length % PAGE_2M_SIZE;
  339. uint64_t len_2m = length - len_4k;
  340. /*
  341. todo: 限制页面的读写权限
  342. */
  343. // 先映射2M页
  344. if (likely(len_2m > 0))
  345. {
  346. uint64_t page_flags = 0;
  347. if (vma->vm_flags & VM_USER)
  348. page_flags = PAGE_USER_PAGE;
  349. else
  350. page_flags = PAGE_KERNEL_PAGE;
  351. // 这里直接设置user标志位为false,因为该函数内部会对其进行自动校正
  352. retval = mm_map_proc_page_table((uint64_t)vma->vm_mm->pgd, true, vma->vm_start, paddr, len_2m, page_flags, false, false, false);
  353. if (unlikely(retval != 0))
  354. goto failed;
  355. }
  356. if (likely(len_4k > 0))
  357. {
  358. len_4k = ALIGN(len_4k, PAGE_4K_SIZE);
  359. uint64_t page_flags = 0;
  360. if (vma->vm_flags & VM_USER)
  361. page_flags = PAGE_USER_4K_PAGE;
  362. else
  363. page_flags = PAGE_KERNEL_4K_PAGE;
  364. // 这里直接设置user标志位为false,因为该函数内部会对其进行自动校正
  365. retval = mm_map_proc_page_table((uint64_t)vma->vm_mm->pgd, true, vma->vm_start + len_2m, paddr + len_2m, len_4k, page_flags, false, false, true);
  366. if (unlikely(retval != 0))
  367. goto failed;
  368. }
  369. if (vma->vm_flags & VM_IO)
  370. vma->page_offset = 0;
  371. else
  372. { // 计算当前vma的起始地址在对应的物理页中的偏移量
  373. vma->page_offset = paddr - (paddr & PAGE_2M_MASK);
  374. }
  375. flush_tlb();
  376. return 0;
  377. failed:;
  378. kdebug("map VMA failed.");
  379. return retval;
  380. }
  381. /**
  382. * @brief 在页表中映射物理地址到指定的虚拟地址(需要页表中已存在对应的vma)
  383. *
  384. * @param mm 内存管理结构体
  385. * @param vaddr 虚拟地址
  386. * @param length 长度(字节)
  387. * @param paddr 物理地址
  388. * @return int 返回码
  389. */
  390. int mm_map(struct mm_struct *mm, uint64_t vaddr, uint64_t length, uint64_t paddr)
  391. {
  392. int retval = 0;
  393. for (uint64_t mapped = 0; mapped < length;)
  394. {
  395. struct vm_area_struct *vma = vma_find(mm, vaddr + mapped);
  396. if (unlikely(vma == NULL))
  397. {
  398. kerror("Map addr failed: vma not found. At address: %#018lx, pid=%ld", vaddr + mapped, current_pcb->pid);
  399. return -EINVAL;
  400. }
  401. if (unlikely(vma->vm_start != (vaddr + mapped)))
  402. {
  403. kerror("Map addr failed: addr_start is not equal to current: %#018lx.", vaddr + mapped);
  404. return -EINVAL;
  405. }
  406. retval = mm_map_vma(vma, paddr + mapped);
  407. if (unlikely(retval != 0))
  408. goto failed;
  409. mapped += vma->vm_end - vma->vm_start;
  410. }
  411. return 0;
  412. failed:;
  413. kerror("Map addr failed.");
  414. return retval;
  415. }
  416. /**
  417. * @brief 在页表中取消指定的vma的映射
  418. *
  419. * @param mm 指定的mm
  420. * @param vma 待取消映射的vma
  421. * @param paddr 返回的被取消映射的起始物理地址
  422. * @return int 返回码
  423. */
  424. int mm_unmap_vma(struct mm_struct *mm, struct vm_area_struct *vma, uint64_t *paddr)
  425. {
  426. // 确保vma对应的mm与指定的mm相一致
  427. if (unlikely(vma->vm_mm != mm))
  428. return -EINVAL;
  429. struct anon_vma_t *anon = vma->anon_vma;
  430. if (paddr != NULL)
  431. *paddr = __mm_get_paddr(mm, vma->vm_start);
  432. if (anon == NULL)
  433. kwarn("anon is NULL");
  434. semaphore_down(&anon->sem);
  435. mm_unmap_proc_table((uint64_t)mm->pgd, true, vma->vm_start, vma->vm_end - vma->vm_start);
  436. __anon_vma_del(vma);
  437. /** todo: 这里应该会存在bug,应修复。
  438. * 若anon_vma的等待队列上有其他的进程,由于anon_vma被释放
  439. * 这些在等待队列上的进程将无法被唤醒。
  440. */
  441. list_init(&vma->anon_vma_list);
  442. semaphore_up(&anon->sem);
  443. return 0;
  444. }
  445. /**
  446. * @brief 解除一段虚拟地址的映射(这些地址必须在vma中存在)
  447. *
  448. * @param mm 内存空间结构体
  449. * @param vaddr 起始地址
  450. * @param length 结束地址
  451. * @param destroy 是否释放vma结构体
  452. * @return int 错误码
  453. */
  454. int mm_unmap(struct mm_struct *mm, uint64_t vaddr, uint64_t length, bool destroy)
  455. {
  456. int retval = 0;
  457. for (uint64_t unmapped = 0; unmapped < length;)
  458. {
  459. struct vm_area_struct *vma = vma_find(mm, vaddr + unmapped);
  460. if (unlikely(vma == NULL))
  461. {
  462. kerror("Unmap addr failed: vma not found. At address: %#018lx, pid=%ld", vaddr + unmapped, current_pcb->pid);
  463. return -EINVAL;
  464. }
  465. if (unlikely(vma->vm_start != (vaddr + unmapped)))
  466. {
  467. kerror("Unmap addr failed: addr_start is not equal to current: %#018lx.", vaddr + unmapped);
  468. return -EINVAL;
  469. }
  470. if (vma->anon_vma != NULL)
  471. mm_unmap_vma(mm, vma, NULL);
  472. unmapped += vma->vm_end - vma->vm_start;
  473. // 释放vma结构体
  474. if (destroy)
  475. {
  476. vm_area_del(vma);
  477. vm_area_free(vma);
  478. }
  479. }
  480. return 0;
  481. failed:;
  482. kerror("Unmap addr failed.");
  483. return retval;
  484. }