// parser.rs (24 KB)
  1. use std::{
  2. collections::HashMap,
  3. io::ErrorKind,
  4. os::fd::{AsRawFd, FromRawFd},
  5. process::{Child, ChildStdout, Stdio},
  6. sync::{Arc, Mutex},
  7. };
  8. use regex::Regex;
  /// A lexical unit produced by the tokenizer.
  #[derive(Debug)]
  pub enum Token {
      /// An ordinary word: a command name or one of its options/arguments.
      Word(String),
      /// A special symbol (an operator such as `|`, `>` or `&&`).
      Symbol(String),
  }
  14. #[derive(Debug, Clone)]
  15. pub enum CommandType {
  16. Simple, // 简单命令
  17. Redirect {
  18. target: RedirectTarget,
  19. mode: RedirectMode,
  20. }, // 重定向命令
  21. Pipe, // 管道命令
  22. }
  /// How a command is connected to the command that follows it.
  #[derive(Debug, Clone, Copy, PartialEq, Eq)]
  pub enum ConnectType {
      /// Plain connection: the next command does not depend on this one's result.
      Simple,
      /// `&&` connection.
      And,
      /// `||` connection.
      Or,
  }
  29. #[derive(Debug, Clone)]
  30. pub struct Command {
  31. name: String,
  32. args: Vec<String>,
  33. cmd_type: CommandType,
  34. conn_type: ConnectType,
  35. }
  36. impl Command {
  37. pub fn new(
  38. name: &String,
  39. args: &[String],
  40. cmd_type: CommandType,
  41. conn_type: ConnectType,
  42. ) -> Command {
  43. Self {
  44. name: name.clone(),
  45. args: args.to_vec(),
  46. cmd_type,
  47. conn_type,
  48. }
  49. }
  50. pub fn execute(&self) {}
  51. }
  /// Destination of an output redirection.
  #[derive(Debug, Clone)]
  pub enum RedirectTarget {
      /// Redirect into the file at the given path.
      File(String),
      /// Redirect into an already open file descriptor (written `&N`).
      FileDiscriptor(i32),
  }

  impl RedirectTarget {
      /// Parses a redirection target.
      ///
      /// * `&N`, with `N` a non-negative integer, yields [`RedirectTarget::FileDiscriptor`].
      /// * `&` followed by anything else yields `None`.
      /// * Any other text is taken as a file path.
      ///
      /// The parameter is a `&str`; a `&String` argument still works through
      /// deref coercion.
      pub fn from_string(str: &str) -> Option<RedirectTarget> {
          match str.strip_prefix('&') {
              Some(number) => number
                  .parse::<i32>()
                  .ok()
                  // A negative value can never name an open descriptor.
                  .filter(|fd| *fd >= 0)
                  .map(RedirectTarget::FileDiscriptor),
              None => Some(RedirectTarget::File(str.to_owned())),
          }
      }
  }
  /// How a redirection writes to its target.
  #[derive(Debug, PartialEq, Eq, Clone, Copy)]
  pub enum RedirectMode {
      /// Selected by `>`.
      Overwrite,
      /// Selected by `>>`.
      Append,
  }

  impl RedirectMode {
      /// Maps a redirection operator to its mode; any text other than `>` or `>>`
      /// yields `None`.
      ///
      /// The parameter is a `&str`; a `&String` argument still works through
      /// deref coercion.
      pub fn from_string(str: &str) -> Option<RedirectMode> {
          match str {
              ">" => Some(RedirectMode::Overwrite),
              ">>" => Some(RedirectMode::Append),
              _ => None,
          }
      }
  }
  /// Errors reported while turning an input line into pipelines.
  #[derive(Debug, Clone)]
  pub enum ParseError {
      /// Input text that could not be tokenized.
      UnexpectedInput(String),
      /// A token that is recognised but not supported.
      UnsupportedToken(String),
      /// A token that appears where it is not allowed.
      UnexpectedToken(String),
  }

  impl std::fmt::Display for ParseError {
      fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
          match self {
              ParseError::UnexpectedInput(text) => write!(f, "Unexpected input: \"{}\"", text),
              ParseError::UnsupportedToken(text) => write!(f, "Unsupported token: \"{}\"", text),
              ParseError::UnexpectedToken(text) => write!(f, "Unexpected token: \"{}\"", text),
          }
      }
  }

  impl std::error::Error for ParseError {}

  impl ParseError {
      /// Prints the error message, followed by a newline, to standard error.
      pub fn handle(&self) {
          eprintln!("{}", self);
      }
  }
  /// Stateless namespace for the lexing and parsing routines.
  pub struct Parser;
  100. impl Parser {
  /// Returns the value of the environment variable `str`, or an empty string
  /// when `std::env::var` reports an error for it.
  fn parse_env(str: &str) -> String {
      match std::env::var(str) {
          Ok(value) => value,
          Err(_) => String::new(),
      }
  }
  104. fn lexer(input: &str) -> Result<Vec<Token>, ParseError> {
  105. let mut tokens = Vec::new();
  106. // 匹配环境变量的正则表达式
  107. let env_token = Regex::new(r#"\$\{(\w[\w\d_]*)\}"#).unwrap();
  108. // 使用具体的符号组合来匹配
  109. let regex_token =
  110. Regex::new(r#"([^'";|&$\s]+)|(["'].*?["'])|(&&|\|\||<<|>>|[<>|&;])"#).unwrap();
  111. // 预先替换"${}"包围的环境变量
  112. let remaining_input = env_token
  113. .replace_all(input, |captures: &regex::Captures| {
  114. Self::parse_env(&captures[1])
  115. })
  116. .into_owned();
  117. let mut remaining_input = remaining_input.trim();
  118. while !remaining_input.is_empty() {
  119. if let Some(mat) = regex_token.find(remaining_input) {
  120. let token_str = mat.as_str();
  121. if token_str.starts_with('"') || token_str.starts_with('\'') {
  122. tokens.push(Token::Word(token_str[1..token_str.len() - 1].to_string()));
  123. } else if token_str.starts_with('$') {
  124. tokens.push(Token::Word(Self::parse_env(&token_str[1..])));
  125. } else if token_str == ">>"
  126. || token_str == ">"
  127. || token_str == "<<"
  128. || token_str == "<"
  129. || token_str == "|"
  130. || token_str == "&"
  131. || token_str == ";"
  132. || token_str == "&&"
  133. || token_str == "||"
  134. {
  135. if token_str == "<" || token_str == "<<" {
  136. return Err(ParseError::UnsupportedToken(token_str.to_string()));
  137. }
  138. tokens.push(Token::Symbol(token_str.to_string()));
  139. } else {
  140. tokens.push(Token::Word(token_str.to_string()));
  141. }
  142. remaining_input = &remaining_input[mat.end()..].trim();
  143. } else {
  144. return Err(ParseError::UnexpectedInput(remaining_input.to_string()));
  145. }
  146. }
  147. Ok(tokens)
  148. }
  149. fn parser(tokens: Vec<Token>) -> Result<Vec<Pipeline>, ParseError> {
  150. let mut commands = Vec::new();
  151. let mut current_command: Vec<String> = Vec::new();
  152. let mut pipelines = Vec::new();
  153. let mut redirect_object: (Option<RedirectMode>, Option<RedirectTarget>) = (None, None);
  154. for token in tokens {
  155. match token {
  156. Token::Word(ref word) => {
  157. if let (Some(_), None) = redirect_object {
  158. redirect_object.1 = RedirectTarget::from_string(word);
  159. } else {
  160. current_command.push(word.to_string());
  161. }
  162. }
  163. Token::Symbol(symbol) => {
  164. match symbol.as_str() {
  165. ">" | ">>" => {
  166. // 重定向符号不能重复出现
  167. if redirect_object.0.is_some() {
  168. return Err(ParseError::UnexpectedToken(symbol));
  169. } else {
  170. redirect_object.0 = RedirectMode::from_string(&symbol);
  171. }
  172. }
  173. "|" | "&" | "||" | "&&" | ";" => {
  174. if let Some((name, args)) = current_command.split_first() {
  175. let mut cmd_type =
  176. if let (Some(mode), Some(ref target)) = redirect_object {
  177. CommandType::Redirect {
  178. target: target.clone(),
  179. mode,
  180. }
  181. } else {
  182. CommandType::Simple
  183. };
  184. let conn_type = match symbol.as_str() {
  185. "|" => {
  186. // 重定向优先级高于管道
  187. if let CommandType::Simple = cmd_type {
  188. cmd_type = CommandType::Pipe;
  189. }
  190. ConnectType::Simple
  191. }
  192. "&" | ";" => ConnectType::Simple,
  193. "||" => ConnectType::Or,
  194. "&&" => ConnectType::And,
  195. _ => todo!(),
  196. };
  197. commands.push(Command::new(name, args, cmd_type, conn_type));
  198. current_command.clear();
  199. if symbol == "&" {
  200. pipelines.push(Pipeline::new(&commands, true));
  201. commands.clear();
  202. }
  203. } else {
  204. // 这些符号之前必须有word作为命令被分隔,否则这些符号是没有意义的
  205. return Err(ParseError::UnexpectedToken(symbol));
  206. }
  207. }
  208. _ => todo!(),
  209. }
  210. }
  211. }
  212. }
  213. // 处理最后一个命令
  214. if let Some((name, args)) = current_command.split_first() {
  215. commands.push(Command::new(
  216. name,
  217. args,
  218. if let (Some(mode), Some(ref target)) = redirect_object {
  219. CommandType::Redirect {
  220. target: target.clone(),
  221. mode,
  222. }
  223. } else {
  224. CommandType::Simple
  225. },
  226. ConnectType::Simple,
  227. ));
  228. }
  229. if !commands.is_empty() {
  230. pipelines.push(Pipeline::new(&commands, false));
  231. }
  232. Ok(pipelines)
  233. }
  234. pub fn parse(input: &str) -> Result<Vec<Pipeline>, ParseError> {
  235. // 解析输入并生成token列表
  236. let tokens = Self::lexer(input)?;
  237. // println!("tokens: {tokens:?}");
  238. // 解析 tokens 生成命令流水线
  239. Self::parser(tokens)
  240. }
  241. }
  /// An execution failure together with the name of the command that caused it.
  #[allow(dead_code)]
  #[derive(Debug)]
  pub struct ExecuteError {
      name: String,
      err_type: ExecuteErrorType,
  }

  impl ExecuteError {
      /// Prints the error to standard error as `[prompt: ]name: message`.
      ///
      /// The whole line is produced by a single `eprintln!` call.
      pub fn handle(&self, prompt: Option<String>) {
          match prompt {
              Some(prompt) => eprintln!("{}: {}", prompt, self),
              None => eprintln!("{}", self),
          }
      }
  }

  impl std::fmt::Display for ExecuteError {
      fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
          write!(f, "{}: {}", self.name, self.err_type)
      }
  }

  impl std::error::Error for ExecuteError {}

  /// The kinds of failure a command execution can report.
  #[allow(dead_code)]
  #[derive(Debug, Clone)]
  pub enum ExecuteErrorType {
      CommandNotFound,
      FileNotFound(String),
      NotDir(String),
      NotFile(String),
      PermissionDenied(String),
      ExecuteFailed,
      ProcessTerminated,
      ExitWithCode(i32),
      FileOpenFailed(String),
      TooManyArguments,
      TooFewArguments,
      InvalidArgument(String),
  }

  impl std::fmt::Display for ExecuteErrorType {
      fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
          match self {
              ExecuteErrorType::CommandNotFound => write!(f, "Command not found"),
              ExecuteErrorType::FileNotFound(file) => {
                  write!(f, "Not a file or directory: {}", file)
              }
              ExecuteErrorType::NotDir(path) => write!(f, "Not a Directory: {}", path),
              ExecuteErrorType::NotFile(path) => write!(f, "Not a File: {}", path),
              ExecuteErrorType::PermissionDenied(file) => {
                  write!(f, "File open denied: {}", file)
              }
              ExecuteErrorType::ExecuteFailed => write!(f, "Command execute failed"),
              ExecuteErrorType::ProcessTerminated => write!(f, "Process terminated"),
              ExecuteErrorType::ExitWithCode(exit_code) => {
                  write!(f, "Command exit with code: {}", exit_code)
              }
              ExecuteErrorType::FileOpenFailed(file) => write!(f, "File open failed: {}", file),
              ExecuteErrorType::TooManyArguments => write!(f, "Too many arguments"),
              ExecuteErrorType::TooFewArguments => write!(f, "Too few arguments"),
              ExecuteErrorType::InvalidArgument(arg) => write!(f, "Invalid argument: {}", arg),
          }
      }
  }

  impl std::error::Error for ExecuteErrorType {}
  /// The readable end of a command's output, handed to the next command as its input.
  pub enum RedirectStdout {
      /// The captured standard output of a spawned child process.
      Stdout(Option<ChildStdout>),
      /// A raw file descriptor.
      RawPipe(i32),
  }

  impl RedirectStdout {
      /// Returns the underlying file descriptor.
      ///
      /// For the `Stdout` variant the handle is taken out and its descriptor is
      /// *released* (`into_raw_fd`), so it stays open and the caller becomes
      /// responsible for closing it. Reading the number and then dropping the
      /// handle would close the descriptor before the caller could use it.
      ///
      /// # Panics
      /// Panics if the `Stdout` variant holds no handle (e.g. it was already taken).
      pub fn as_raw_fd(&mut self) -> i32 {
          match self {
              RedirectStdout::Stdout(child_stdout) => {
                  let handle = child_stdout
                      .take()
                      .expect("child stdout handle was already taken");
                  std::os::fd::IntoRawFd::into_raw_fd(handle)
              }
              RedirectStdout::RawPipe(fd) => *fd,
          }
      }

      /// Converts the value into a [`Stdio`] suitable for a child's standard input.
      ///
      /// # Panics
      /// Panics if the `Stdout` variant holds no handle (e.g. it was already taken).
      pub fn as_std(&mut self) -> Stdio {
          match self {
              RedirectStdout::Stdout(child_stdout) => Stdio::from(
                  child_stdout
                      .take()
                      .expect("child stdout handle was already taken"),
              ),
              // SAFETY: assumes the stored descriptor is open and not owned by
              // anything else; the returned `Stdio` takes ownership of it.
              RedirectStdout::RawPipe(fd) => unsafe { Stdio::from_raw_fd(*fd) },
          }
      }
  }

  impl From<i32> for RedirectStdout {
      fn from(value: i32) -> Self {
          RedirectStdout::RawPipe(value)
      }
  }

  impl From<Option<ChildStdout>> for RedirectStdout {
      fn from(value: Option<ChildStdout>) -> Self {
          RedirectStdout::Stdout(value)
      }
  }
  318. #[derive(Debug)]
  319. pub struct Pipeline {
  320. commands: Vec<Command>, // 存储一系列命令
  321. backend: bool,
  322. }
  323. type CommandMap = HashMap<String, fn(&Vec<String>) -> Result<(), ExecuteErrorType>>;
  324. impl Pipeline {
  325. pub fn new(commands: &Vec<Command>, backend: bool) -> Pipeline {
  326. Self {
  327. commands: commands.to_vec(),
  328. backend,
  329. }
  330. }
  331. pub fn execute(&self, internal_commands: Option<Arc<Mutex<CommandMap>>>) -> Vec<Child> {
  332. // 前一个命令是否为管道输出
  333. let mut stdout: Option<RedirectStdout> = None;
  334. // 提前推断下条命令的布尔值,为None代表下条命令需要运行
  335. let mut result_next: Option<bool> = None;
  336. let mut children: Vec<Child> = Vec::new();
  337. let mut err: Option<ExecuteErrorType> = None;
  338. for cmd in self.commands.iter() {
  339. if let Some(result) = result_next {
  340. // 如果前面已经推导出本条命令的布尔值,则本条命令不需要执行,并继续推断下条命令
  341. if (result && cmd.conn_type == ConnectType::And)
  342. || (!result && cmd.conn_type == ConnectType::Or)
  343. {
  344. // 如果true遇到||或false遇到&&,则下条命令的布尔值相同
  345. // 如果true遇到&&或false遇到||,继承中断,设为None以执行后续命令
  346. result_next = None;
  347. }
  348. continue;
  349. }
  350. let mut internal = false;
  351. if let Some(ref map) = internal_commands {
  352. let map = map.lock().unwrap();
  353. if let Some(f) = map.get(&cmd.name) {
  354. // 找到内部命令,优先执行,设置标记
  355. internal = true;
  356. // child_fd
  357. let child_fd = if self.backend {
  358. unsafe { libc::fork() }
  359. } else {
  360. 0
  361. };
  362. // 为子进程或前台运行
  363. if child_fd == 0 {
  364. let mut old_stdin: Option<i32> = None;
  365. let mut old_stdout: Option<i32> = None;
  366. // 如果上条命令为管道,将标准输入重定向
  367. if let Some(mut redirect_stdout) = stdout {
  368. unsafe {
  369. old_stdin = Some(libc::dup(libc::STDIN_FILENO));
  370. libc::dup2(redirect_stdout.as_raw_fd(), libc::STDIN_FILENO);
  371. stdout = None;
  372. }
  373. }
  374. // 根据命令类型重定向标准输出
  375. match cmd.cmd_type {
  376. CommandType::Simple => {}
  377. CommandType::Pipe => unsafe {
  378. let mut pipe: [i32; 2] = [0; 2];
  379. libc::pipe2(pipe.as_mut_ptr(), libc::O_CLOEXEC);
  380. stdout = Some(RedirectStdout::from(pipe[0]));
  381. old_stdout = Some(libc::dup(libc::STDOUT_FILENO));
  382. libc::dup2(pipe[1], libc::STDOUT_FILENO);
  383. },
  384. CommandType::Redirect {
  385. ref target,
  386. ref mode,
  387. } => unsafe {
  388. let mut pipe: [i32; 2] = [0; 2];
  389. libc::pipe2(pipe.as_mut_ptr(), libc::O_CLOEXEC);
  390. stdout = Some(RedirectStdout::from(pipe[0]));
  391. old_stdout = Some(libc::dup(libc::STDOUT_FILENO));
  392. let append = match mode {
  393. RedirectMode::Overwrite => false,
  394. RedirectMode::Append => true,
  395. };
  396. match target {
  397. RedirectTarget::File(file) => {
  398. match std::fs::OpenOptions::new()
  399. .write(true)
  400. .append(append)
  401. .create(true)
  402. .open(file)
  403. {
  404. Ok(file) => {
  405. libc::dup2(file.as_raw_fd(), libc::STDIN_FILENO);
  406. }
  407. Err(_) => {
  408. err = Some(ExecuteErrorType::FileOpenFailed(
  409. file.clone(),
  410. ));
  411. }
  412. };
  413. }
  414. RedirectTarget::FileDiscriptor(fd) => {
  415. libc::dup2(*fd, libc::STDIN_FILENO);
  416. }
  417. }
  418. },
  419. }
  420. // 如果之前没有出错,执行命令
  421. if err.is_none() {
  422. match f(&cmd.args) {
  423. Ok(_) => err = None,
  424. Err(err_type) => err = Some(err_type),
  425. }
  426. }
  427. // 还原标准输出
  428. unsafe {
  429. if let Some(old_stdin) = old_stdin {
  430. libc::dup2(old_stdin, libc::STDIN_FILENO);
  431. }
  432. if let Some(old_stdout) = old_stdout {
  433. libc::dup2(old_stdout, libc::STDOUT_FILENO);
  434. }
  435. }
  436. } else if child_fd < 0 {
  437. err = Some(ExecuteErrorType::ExecuteFailed)
  438. }
  439. // 后台命令且当前进程为父进程
  440. if self.backend && !child_fd == 0 {
  441. err = match unsafe { libc::waitpid(child_fd, std::ptr::null_mut(), 0) } {
  442. -1 => Some(ExecuteErrorType::ExecuteFailed),
  443. _ => None,
  444. }
  445. }
  446. }
  447. };
  448. // 没找到执行内部命令的标记,尝试作为外部命令执行
  449. if !internal {
  450. let path = if cmd.name.contains('/') {
  451. // 为路径,获取规范的绝对路径
  452. if let Ok(path) = std::fs::canonicalize(&cmd.name) {
  453. if path.is_file() {
  454. Ok(path)
  455. } else {
  456. // 路径不为文件,返回错误
  457. Err(ExecuteErrorType::NotFile(cmd.name.clone()))
  458. }
  459. } else {
  460. Err(ExecuteErrorType::CommandNotFound)
  461. }
  462. } else {
  463. // 不为路径,从环境变量中查找命令
  464. which::which(&cmd.name).map_err(|_| ExecuteErrorType::CommandNotFound)
  465. };
  466. // println!("path: {:?}", path);
  467. match path {
  468. Err(e) => err = Some(e),
  469. Ok(real_path) => {
  470. let mut child_command = std::process::Command::new(real_path);
  471. child_command.args(cmd.args.clone());
  472. child_command.current_dir(std::env::current_dir().unwrap());
  473. if stdout.is_some() {
  474. child_command.stdin(stdout.take().unwrap().as_std());
  475. }
  476. match &cmd.cmd_type {
  477. CommandType::Simple => {}
  478. CommandType::Redirect { target, mode } => {
  479. let append = match mode {
  480. RedirectMode::Overwrite => false,
  481. RedirectMode::Append => true,
  482. };
  483. match target {
  484. RedirectTarget::File(file) => {
  485. match std::fs::OpenOptions::new()
  486. .write(true)
  487. .append(append)
  488. .create(true)
  489. .open(file)
  490. {
  491. Ok(file) => {
  492. child_command.stdout(file);
  493. }
  494. Err(_) => {
  495. err = Some(ExecuteErrorType::FileOpenFailed(
  496. file.clone(),
  497. ));
  498. }
  499. };
  500. }
  501. RedirectTarget::FileDiscriptor(fd) => {
  502. child_command.stdout(unsafe { Stdio::from_raw_fd(*fd) });
  503. }
  504. }
  505. }
  506. CommandType::Pipe => {
  507. // 标准输出重定向到管道
  508. child_command.stdout(Stdio::piped());
  509. }
  510. }
  511. if err.is_none() {
  512. match child_command.spawn() {
  513. Ok(mut child) => {
  514. // 如果为管道命令,记录下来
  515. if let CommandType::Pipe = cmd.cmd_type {
  516. stdout = Some(RedirectStdout::Stdout(child.stdout.take()));
  517. }
  518. // println!("exec command: {child_command:#?}");
  519. match child.wait() {
  520. Ok(exit_status) => match exit_status.code() {
  521. Some(exit_code) => {
  522. if exit_code != 0 {
  523. err = Some(ExecuteErrorType::ExitWithCode(
  524. exit_code,
  525. ));
  526. }
  527. }
  528. None => err = Some(ExecuteErrorType::ProcessTerminated),
  529. },
  530. Err(_) => err = Some(ExecuteErrorType::ExecuteFailed),
  531. };
  532. children.push(child);
  533. }
  534. Err(e) => match e.kind() {
  535. ErrorKind::PermissionDenied => {
  536. err = Some(ExecuteErrorType::PermissionDenied(
  537. cmd.name.clone(),
  538. ))
  539. }
  540. _ => eprintln!("Error occurred: {}", e.kind()),
  541. },
  542. }
  543. }
  544. }
  545. }
  546. }
  547. // 预计算下条命令的结果
  548. result_next = match err {
  549. Some(ref e) => {
  550. ExecuteError {
  551. name: cmd.name.clone(),
  552. err_type: e.clone(),
  553. }
  554. .handle(if internal {
  555. Some("internal command".to_string())
  556. } else {
  557. None
  558. });
  559. if cmd.conn_type == ConnectType::And {
  560. Some(false)
  561. } else {
  562. None
  563. }
  564. }
  565. None => {
  566. if cmd.conn_type == ConnectType::Or {
  567. Some(true)
  568. } else {
  569. None
  570. }
  571. }
  572. }
  573. }
  574. children
  575. }
  576. pub fn backend(&self) -> bool {
  577. self.backend
  578. }
  579. }