syscall.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613
  1. #include "syscall.h"
  2. #include <common/errno.h>
  3. #include <common/fcntl.h>
  4. #include <common/string.h>
  5. #include <driver/disk/ahci/ahci.h>
  6. #include <exception/gate.h>
  7. #include <exception/irq.h>
  8. #include <filesystem/VFS/VFS.h>
  9. #include <filesystem/fat32/fat32.h>
  10. #include <mm/slab.h>
  11. #include <process/process.h>
  12. #include <time/sleep.h>
  13. // 导出系统调用入口函数,定义在entry.S中
  14. extern void system_call(void);
  15. extern void syscall_int(void);
  16. extern uint64_t sys_clock(struct pt_regs *regs);
  17. extern uint64_t sys_mstat(struct pt_regs *regs);
  18. extern uint64_t sys_open(struct pt_regs *regs);
  19. extern uint64_t sys_rmdir(struct pt_regs *regs);
  20. /**
  21. * @brief 导出系统调用处理函数的符号
  22. *
  23. */
  24. /**
  25. * @brief 系统调用不存在时的处理函数
  26. *
  27. * @param regs 进程3特权级下的寄存器
  28. * @return ul
  29. */
  30. ul system_call_not_exists(struct pt_regs *regs)
  31. {
  32. kerror("System call [ ID #%d ] not exists.", regs->rax);
  33. return ESYSCALL_NOT_EXISTS;
  34. } // 取消前述宏定义
  35. /**
  36. * @brief 重新定义为:把系统调用函数加入系统调用表
  37. * @param syscall_num 系统调用号
  38. * @param symbol 系统调用处理函数
  39. */
  40. #define SYSCALL_COMMON(syscall_num, symbol) [syscall_num] = symbol,
  41. /**
  42. * @brief sysenter的系统调用函数,从entry.S中跳转到这里
  43. *
  44. * @param regs 3特权级下的寄存器值,rax存储系统调用号
  45. * @return ul 对应的系统调用函数的地址
  46. */
  47. ul system_call_function(struct pt_regs *regs)
  48. {
  49. return system_call_table[regs->rax](regs);
  50. }
  51. /**
  52. * @brief 初始化系统调用模块
  53. *
  54. */
  55. void syscall_init()
  56. {
  57. kinfo("Initializing syscall...");
  58. set_system_trap_gate(0x80, 0, syscall_int); // 系统调用门
  59. }
  60. /**
  61. * @brief 通过中断进入系统调用
  62. *
  63. * @param syscall_id
  64. * @param arg0
  65. * @param arg1
  66. * @param arg2
  67. * @param arg3
  68. * @param arg4
  69. * @param arg5
  70. * @param arg6
  71. * @param arg7
  72. * @return long
  73. */
  74. long enter_syscall_int(ul syscall_id, ul arg0, ul arg1, ul arg2, ul arg3, ul arg4, ul arg5, ul arg6, ul arg7)
  75. {
  76. long err_code;
  77. __asm__ __volatile__("movq %2, %%r8 \n\t"
  78. "movq %3, %%r9 \n\t"
  79. "movq %4, %%r10 \n\t"
  80. "movq %5, %%r11 \n\t"
  81. "movq %6, %%r12 \n\t"
  82. "movq %7, %%r13 \n\t"
  83. "movq %8, %%r14 \n\t"
  84. "movq %9, %%r15 \n\t"
  85. "int $0x80 \n\t"
  86. : "=a"(err_code)
  87. : "a"(syscall_id), "m"(arg0), "m"(arg1), "m"(arg2), "m"(arg3), "m"(arg4), "m"(arg5), "m"(arg6),
  88. "m"(arg7)
  89. : "memory", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15", "rcx", "rdx");
  90. return err_code;
  91. }
  92. /**
  93. * @brief 打印字符串的系统调用
  94. *
  95. * 当arg1和arg2均为0时,打印黑底白字,否则按照指定的前景色和背景色来打印
  96. *
  97. * @param regs 寄存器
  98. * @param arg0 要打印的字符串
  99. * @param arg1 前景色
  100. * @param arg2 背景色
  101. * @return ul 返回值
  102. */
  103. ul sys_put_string(struct pt_regs *regs)
  104. {
  105. printk_color(regs->r9, regs->r10, (char *)regs->r8);
  106. // printk_color(BLACK, WHITE, (char *)regs->r8);
  107. return 0;
  108. }
  109. /**
  110. * @brief 关闭文件系统调用
  111. *
  112. * @param fd_num 文件描述符号
  113. *
  114. * @param regs
  115. * @return uint64_t
  116. */
  117. uint64_t sys_close(struct pt_regs *regs)
  118. {
  119. int fd_num = (int)regs->r8;
  120. // kdebug("sys close: fd=%d", fd_num);
  121. // 校验文件描述符范围
  122. if (fd_num < 0 || fd_num > PROC_MAX_FD_NUM)
  123. return -EBADF;
  124. // 文件描述符不存在
  125. if (current_pcb->fds[fd_num] == NULL)
  126. return -EBADF;
  127. struct vfs_file_t *file_ptr = current_pcb->fds[fd_num];
  128. uint64_t ret;
  129. // If there is a valid close function
  130. if (file_ptr->file_ops && file_ptr->file_ops->close)
  131. ret = file_ptr->file_ops->close(file_ptr->dEntry->dir_inode, file_ptr);
  132. kfree(file_ptr);
  133. current_pcb->fds[fd_num] = NULL;
  134. return 0;
  135. }
  136. /**
  137. * @brief 从文件中读取数据
  138. *
  139. * @param fd_num regs->r8 文件描述符号
  140. * @param buf regs->r9 输出缓冲区
  141. * @param count regs->r10 要读取的字节数
  142. *
  143. * @return uint64_t
  144. */
  145. uint64_t sys_read(struct pt_regs *regs)
  146. {
  147. int fd_num = (int)regs->r8;
  148. void *buf = (void *)regs->r9;
  149. int64_t count = (int64_t)regs->r10;
  150. // 校验buf的空间范围
  151. if (SYSCALL_FROM_USER(regs) && (!verify_area((uint64_t)buf, count)))
  152. return -EPERM;
  153. // kdebug("sys read: fd=%d", fd_num);
  154. // 校验文件描述符范围
  155. if (fd_num < 0 || fd_num > PROC_MAX_FD_NUM)
  156. return -EBADF;
  157. // 文件描述符不存在
  158. if (current_pcb->fds[fd_num] == NULL)
  159. return -EBADF;
  160. if (count < 0)
  161. return -EINVAL;
  162. struct vfs_file_t *file_ptr = current_pcb->fds[fd_num];
  163. uint64_t ret = 0;
  164. if (file_ptr->file_ops && file_ptr->file_ops->read)
  165. ret = file_ptr->file_ops->read(file_ptr, (char *)buf, count, &(file_ptr->position));
  166. return ret;
  167. }
  168. /**
  169. * @brief 向文件写入数据
  170. *
  171. * @param fd_num regs->r8 文件描述符号
  172. * @param buf regs->r9 输入缓冲区
  173. * @param count regs->r10 要写入的字节数
  174. *
  175. * @return uint64_t
  176. */
  177. uint64_t sys_write(struct pt_regs *regs)
  178. {
  179. int fd_num = (int)regs->r8;
  180. void *buf = (void *)regs->r9;
  181. int64_t count = (int64_t)regs->r10;
  182. // 校验buf的空间范围
  183. if (SYSCALL_FROM_USER(regs) && (!verify_area((uint64_t)buf, count)))
  184. return -EPERM;
  185. kdebug("sys write: fd=%d", fd_num);
  186. // 校验文件描述符范围
  187. if (fd_num < 0 || fd_num > PROC_MAX_FD_NUM)
  188. return -EBADF;
  189. // 文件描述符不存在
  190. if (current_pcb->fds[fd_num] == NULL)
  191. return -EBADF;
  192. if (count < 0)
  193. return -EINVAL;
  194. struct vfs_file_t *file_ptr = current_pcb->fds[fd_num];
  195. uint64_t ret = 0;
  196. if (file_ptr->file_ops && file_ptr->file_ops->write)
  197. ret = file_ptr->file_ops->write(file_ptr, (char *)buf, count, &(file_ptr->position));
  198. return ret;
  199. }
  200. /**
  201. * @brief 调整文件的访问位置
  202. *
  203. * @param fd_num 文件描述符号
  204. * @param offset 偏移量
  205. * @param whence 调整模式
  206. * @return uint64_t 调整结束后的文件访问位置
  207. */
  208. uint64_t sys_lseek(struct pt_regs *regs)
  209. {
  210. int fd_num = (int)regs->r8;
  211. long offset = (long)regs->r9;
  212. int whence = (int)regs->r10;
  213. // kdebug("sys_lseek: fd=%d", fd_num);
  214. uint64_t retval = 0;
  215. // 校验文件描述符范围
  216. if (fd_num < 0 || fd_num > PROC_MAX_FD_NUM)
  217. return -EBADF;
  218. // 文件描述符不存在
  219. if (current_pcb->fds[fd_num] == NULL)
  220. return -EBADF;
  221. struct vfs_file_t *file_ptr = current_pcb->fds[fd_num];
  222. if (file_ptr->file_ops && file_ptr->file_ops->lseek)
  223. retval = file_ptr->file_ops->lseek(file_ptr, offset, whence);
  224. return retval;
  225. }
  226. uint64_t sys_fork(struct pt_regs *regs)
  227. {
  228. return do_fork(regs, 0, regs->rsp, 0);
  229. }
  230. uint64_t sys_vfork(struct pt_regs *regs)
  231. {
  232. return do_fork(regs, CLONE_VM | CLONE_FS | CLONE_SIGNAL, regs->rsp, 0);
  233. }
  234. /**
  235. * @brief 将堆内存调整为arg0
  236. *
  237. * @param arg0 新的堆区域的结束地址
  238. * arg0=-1 ===> 返回堆区域的起始地址
  239. * arg0=-2 ===> 返回堆区域的结束地址
  240. * @return uint64_t 错误码
  241. *
  242. */
  243. uint64_t sys_brk(struct pt_regs *regs)
  244. {
  245. uint64_t new_brk = PAGE_2M_ALIGN(regs->r8);
  246. // kdebug("sys_brk input= %#010lx , new_brk= %#010lx bytes current_pcb->mm->brk_start=%#018lx
  247. // current->end_brk=%#018lx", regs->r8, new_brk, current_pcb->mm->brk_start, current_pcb->mm->brk_end);
  248. if ((int64_t)regs->r8 == -1)
  249. {
  250. // kdebug("get brk_start=%#018lx", current_pcb->mm->brk_start);
  251. return current_pcb->mm->brk_start;
  252. }
  253. if ((int64_t)regs->r8 == -2)
  254. {
  255. // kdebug("get brk_end=%#018lx", current_pcb->mm->brk_end);
  256. return current_pcb->mm->brk_end;
  257. }
  258. if (new_brk > current_pcb->addr_limit) // 堆地址空间超过限制
  259. return -ENOMEM;
  260. int64_t offset;
  261. if (new_brk >= current_pcb->mm->brk_end)
  262. offset = (int64_t)(new_brk - current_pcb->mm->brk_end);
  263. else
  264. offset = -(int64_t)(current_pcb->mm->brk_end - new_brk);
  265. new_brk = mm_do_brk(current_pcb->mm->brk_end, offset); // 扩展堆内存空间
  266. current_pcb->mm->brk_end = new_brk;
  267. return 0;
  268. }
  269. /**
  270. * @brief 将堆内存空间加上offset(注意,该系统调用只应在普通进程中调用,而不能是内核线程)
  271. *
  272. * @param arg0 offset偏移量
  273. * @return uint64_t the previous program break
  274. */
  275. uint64_t sys_sbrk(struct pt_regs *regs)
  276. {
  277. uint64_t retval = current_pcb->mm->brk_end;
  278. if ((int64_t)regs->r8 > 0)
  279. {
  280. uint64_t new_brk = PAGE_2M_ALIGN(retval + regs->r8);
  281. if (new_brk > current_pcb->addr_limit) // 堆地址空间超过限制
  282. {
  283. kdebug("exceed mem limit, new_brk = %#018lx", new_brk);
  284. return -ENOMEM;
  285. }
  286. }
  287. else
  288. {
  289. if ((__int128_t)current_pcb->mm->brk_end + (__int128_t)regs->r8 < current_pcb->mm->brk_start)
  290. return retval;
  291. }
  292. // kdebug("do brk");
  293. uint64_t new_brk = mm_do_brk(current_pcb->mm->brk_end, (int64_t)regs->r8); // 调整堆内存空间
  294. // kdebug("do brk done, new_brk = %#018lx", new_brk);
  295. current_pcb->mm->brk_end = new_brk;
  296. return retval;
  297. }
  298. /**
  299. * @brief 重启计算机
  300. *
  301. * @return
  302. */
  303. uint64_t sys_reboot(struct pt_regs *regs)
  304. {
  305. // 重启计算机
  306. io_out8(0x64, 0xfe);
  307. return 0;
  308. }
  309. /**
  310. * @brief 切换工作目录
  311. *
  312. * @param dest_path 目标路径
  313. * @return
  314. +--------------+------------------------+
  315. | 返回码 | 描述 |
  316. +--------------+------------------------+
  317. | 0 | 成功 |
  318. | EACCESS | 权限不足 |
  319. | ELOOP | 解析path时遇到路径循环 |
  320. | ENAMETOOLONG | 路径名过长 |
  321. | ENOENT | 目标文件或目录不存在 |
  322. | ENODIR | 检索期间发现非目录项 |
  323. | ENOMEM | 系统内存不足 |
  324. | EFAULT | 错误的地址 |
  325. | ENAMETOOLONG | 路径过长 |
  326. +--------------+------------------------+
  327. */
  328. uint64_t sys_chdir(struct pt_regs *regs)
  329. {
  330. char *dest_path = (char *)regs->r8;
  331. // kdebug("dest_path=%s", dest_path);
  332. // 检查目标路径是否为NULL
  333. if (dest_path == NULL)
  334. return -EFAULT;
  335. // 计算输入的路径长度
  336. int dest_path_len;
  337. if (regs->cs & USER_CS)
  338. {
  339. dest_path_len = strnlen_user(dest_path, PAGE_4K_SIZE);
  340. }
  341. else
  342. dest_path_len = strnlen(dest_path, PAGE_4K_SIZE);
  343. // 长度小于等于0
  344. if (dest_path_len <= 0)
  345. return -EFAULT;
  346. else if (dest_path_len >= PAGE_4K_SIZE)
  347. return -ENAMETOOLONG;
  348. // 为路径字符串申请空间
  349. char *path = kmalloc(dest_path_len + 1, 0);
  350. // 系统内存不足
  351. if (path == NULL)
  352. return -ENOMEM;
  353. memset(path, 0, dest_path_len + 1);
  354. if (regs->cs & USER_CS)
  355. {
  356. // 将字符串从用户空间拷贝进来, +1是为了拷贝结尾的\0
  357. strncpy_from_user(path, dest_path, dest_path_len + 1);
  358. }
  359. else
  360. strncpy(path, dest_path, dest_path_len + 1);
  361. // kdebug("chdir: path = %s", path);
  362. struct vfs_dir_entry_t *dentry = vfs_path_walk(path, 0);
  363. kfree(path);
  364. if (dentry == NULL)
  365. return -ENOENT;
  366. // kdebug("dentry->name=%s, namelen=%d", dentry->name, dentry->name_length);
  367. // 目标不是目录
  368. if (dentry->dir_inode->attribute != VFS_IF_DIR)
  369. return -ENOTDIR;
  370. return 0;
  371. }
  372. /**
  373. * @brief 获取目录中的数据
  374. *
  375. * @param fd 文件描述符号
  376. * @return uint64_t dirent的总大小
  377. */
  378. uint64_t sys_getdents(struct pt_regs *regs)
  379. {
  380. int fd = (int)regs->r8;
  381. void *dirent = (void *)regs->r9;
  382. long count = (long)regs->r10;
  383. if (fd < 0 || fd > PROC_MAX_FD_NUM)
  384. return -EBADF;
  385. if (count < 0)
  386. return -EINVAL;
  387. struct vfs_file_t *filp = current_pcb->fds[fd];
  388. if (filp == NULL)
  389. return -EBADF;
  390. uint64_t retval = 0;
  391. if (filp->file_ops && filp->file_ops->readdir)
  392. retval = filp->file_ops->readdir(filp, dirent, &vfs_fill_dirent);
  393. return retval;
  394. }
  395. /**
  396. * @brief 执行新的程序
  397. *
  398. * @param user_path(r8寄存器) 文件路径
  399. * @param argv(r9寄存器) 参数列表
  400. * @return uint64_t
  401. */
  402. uint64_t sys_execve(struct pt_regs *regs)
  403. {
  404. // kdebug("sys_execve");
  405. char *user_path = (char *)regs->r8;
  406. char **argv = (char **)regs->r9;
  407. int path_len = strnlen_user(user_path, PAGE_4K_SIZE);
  408. // kdebug("path_len=%d", path_len);
  409. if (path_len >= PAGE_4K_SIZE)
  410. return -ENAMETOOLONG;
  411. else if (path_len <= 0)
  412. return -EFAULT;
  413. char *path = (char *)kmalloc(path_len + 1, 0);
  414. if (path == NULL)
  415. return -ENOMEM;
  416. memset(path, 0, path_len + 1);
  417. // kdebug("before copy file path from user");
  418. // 拷贝文件路径
  419. strncpy_from_user(path, user_path, path_len);
  420. path[path_len] = '\0';
  421. // kdebug("before do_execve, path = %s", path);
  422. // 执行新的程序
  423. uint64_t retval = do_execve(regs, path, argv, NULL);
  424. kfree(path);
  425. return retval;
  426. }
  427. /**
  428. * @brief 等待进程退出
  429. *
  430. * @param pid 目标进程id
  431. * @param status 返回的状态信息
  432. * @param options 等待选项
  433. * @param rusage
  434. * @return uint64_t
  435. */
  436. uint64_t sys_wait4(struct pt_regs *regs)
  437. {
  438. uint64_t pid = regs->r8;
  439. int *status = (int *)regs->r9;
  440. int options = regs->r10;
  441. void *rusage = (void *)regs->r11;
  442. struct process_control_block *proc = NULL;
  443. struct process_control_block *child_proc = NULL;
  444. // 查找pid为指定值的进程
  445. // ps: 这里判断子进程的方法没有按照posix 2008来写。
  446. // todo: 根据进程树判断是否为当前进程的子进程
  447. for (proc = &initial_proc_union.pcb; proc->next_pcb != &initial_proc_union.pcb; proc = proc->next_pcb)
  448. {
  449. if (proc->next_pcb->pid == pid)
  450. {
  451. child_proc = proc->next_pcb;
  452. break;
  453. }
  454. }
  455. if (child_proc == NULL)
  456. return -ECHILD;
  457. // 暂时不支持options选项,该值目前必须为0
  458. if (options != 0)
  459. return -EINVAL;
  460. // 如果子进程没有退出,则等待其退出
  461. while (child_proc->state != PROC_ZOMBIE)
  462. wait_queue_sleep_on_interriptible(&current_pcb->wait_child_proc_exit);
  463. // 拷贝子进程的返回码
  464. if (likely(status != NULL))
  465. *status = child_proc->exit_code;
  466. // copy_to_user(status, (void*)child_proc->exit_code, sizeof(int));
  467. proc->next_pcb = child_proc->next_pcb;
  468. // 释放子进程的页表
  469. process_exit_mm(child_proc);
  470. // 释放子进程的pcb
  471. kfree(child_proc);
  472. return 0;
  473. }
  474. /**
  475. * @brief 进程退出
  476. *
  477. * @param exit_code 退出返回码
  478. * @return uint64_t
  479. */
  480. uint64_t sys_exit(struct pt_regs *regs)
  481. {
  482. return process_do_exit(regs->r8);
  483. }
  484. uint64_t sys_nanosleep(struct pt_regs *regs)
  485. {
  486. const struct timespec *rqtp = (const struct timespec *)regs->r8;
  487. struct timespec *rmtp = (struct timespec *)regs->r9;
  488. return nanosleep(rqtp, rmtp);
  489. }
  490. ul sys_ahci_end_req(struct pt_regs *regs)
  491. {
  492. ahci_end_request();
  493. return 0;
  494. }
  495. // 系统调用的内核入口程序
  496. void do_syscall_int(struct pt_regs *regs, unsigned long error_code)
  497. {
  498. ul ret = system_call_table[regs->rax](regs);
  499. regs->rax = ret; // 返回码
  500. }
  501. system_call_t system_call_table[MAX_SYSTEM_CALL_NUM] = {
  502. [0] = system_call_not_exists,
  503. [1] = sys_put_string,
  504. [2] = sys_open,
  505. [3] = sys_close,
  506. [4] = sys_read,
  507. [5] = sys_write,
  508. [6] = sys_lseek,
  509. [7] = sys_fork,
  510. [8] = sys_vfork,
  511. [9] = sys_brk,
  512. [10] = sys_sbrk,
  513. [11] = sys_reboot,
  514. [12] = sys_chdir,
  515. [13] = sys_getdents,
  516. [14] = sys_execve,
  517. [15] = sys_wait4,
  518. [16] = sys_exit,
  519. [17] = sys_mkdir,
  520. [18] = sys_nanosleep,
  521. [19] = sys_clock,
  522. [20] = sys_pipe,
  523. [21] = sys_mstat,
  524. [22] = sys_rmdir,
  525. [23 ... 254] = system_call_not_exists,
  526. [255] = sys_ahci_end_req,
  527. };