assembler.rs 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546
  1. use core::fmt;
  2. #[derive(Debug, Clone, Copy, PartialEq, Eq)]
  3. pub struct TooManyHolesError;
  4. /// A contiguous chunk of absent data, followed by a contiguous chunk of present data.
  5. #[derive(Debug, Clone, Copy, PartialEq, Eq)]
  6. #[cfg_attr(feature = "defmt", derive(defmt::Format))]
  7. struct Contig {
  8. hole_size: usize,
  9. data_size: usize,
  10. }
  11. impl fmt::Display for Contig {
  12. fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
  13. if self.has_hole() {
  14. write!(f, "({})", self.hole_size)?;
  15. }
  16. if self.has_hole() && self.has_data() {
  17. write!(f, " ")?;
  18. }
  19. if self.has_data() {
  20. write!(f, "{}", self.data_size)?;
  21. }
  22. Ok(())
  23. }
  24. }
  25. impl Contig {
  26. fn empty() -> Contig {
  27. Contig {
  28. hole_size: 0,
  29. data_size: 0,
  30. }
  31. }
  32. fn hole(size: usize) -> Contig {
  33. Contig {
  34. hole_size: size,
  35. data_size: 0,
  36. }
  37. }
  38. fn hole_and_data(hole_size: usize, data_size: usize) -> Contig {
  39. Contig {
  40. hole_size,
  41. data_size,
  42. }
  43. }
  44. fn has_hole(&self) -> bool {
  45. self.hole_size != 0
  46. }
  47. fn has_data(&self) -> bool {
  48. self.data_size != 0
  49. }
  50. fn total_size(&self) -> usize {
  51. self.hole_size + self.data_size
  52. }
  53. fn is_empty(&self) -> bool {
  54. self.total_size() == 0
  55. }
  56. fn expand_data_by(&mut self, size: usize) {
  57. self.data_size += size;
  58. }
  59. fn shrink_hole_by(&mut self, size: usize) {
  60. self.hole_size -= size;
  61. }
  62. fn shrink_hole_to(&mut self, size: usize) {
  63. debug_assert!(self.hole_size >= size);
  64. let total_size = self.total_size();
  65. self.hole_size = size;
  66. self.data_size = total_size - size;
  67. }
  68. }
  69. #[cfg(all(feature = "alloc", not(feature = "std")))]
  70. use alloc::boxed::Box;
  71. #[cfg(feature = "std")]
  72. use std::boxed::Box;
  73. #[cfg(any(feature = "std", feature = "alloc"))]
  74. const CONTIG_COUNT: usize = 32;
  75. #[cfg(not(any(feature = "std", feature = "alloc")))]
  76. const CONTIG_COUNT: usize = 4;
  77. /// A buffer (re)assembler.
  78. ///
  79. /// Currently, up to a hardcoded limit of 4 or 32 holes can be tracked in the buffer.
  80. #[derive(Debug, PartialEq, Eq, Clone)]
  81. #[cfg_attr(feature = "defmt", derive(defmt::Format))]
  82. pub struct Assembler {
  83. #[cfg(not(any(feature = "std", feature = "alloc")))]
  84. contigs: [Contig; CONTIG_COUNT],
  85. #[cfg(any(feature = "std", feature = "alloc"))]
  86. contigs: Box<[Contig; CONTIG_COUNT]>,
  87. }
  88. impl fmt::Display for Assembler {
  89. fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
  90. write!(f, "[ ")?;
  91. for contig in self.contigs.iter() {
  92. if contig.is_empty() {
  93. break;
  94. }
  95. write!(f, "{} ", contig)?;
  96. }
  97. write!(f, "]")?;
  98. Ok(())
  99. }
  100. }
  101. impl Assembler {
  102. /// Create a new buffer assembler for buffers of the given size.
  103. pub fn new(size: usize) -> Assembler {
  104. #[cfg(not(any(feature = "std", feature = "alloc")))]
  105. let mut contigs = [Contig::empty(); CONTIG_COUNT];
  106. #[cfg(any(feature = "std", feature = "alloc"))]
  107. let mut contigs = Box::new([Contig::empty(); CONTIG_COUNT]);
  108. contigs[0] = Contig::hole(size);
  109. Assembler { contigs }
  110. }
  111. /// FIXME(whitequark): remove this once I'm certain enough that the assembler works well.
  112. #[allow(dead_code)]
  113. pub(crate) fn total_size(&self) -> usize {
  114. self.contigs.iter().map(|contig| contig.total_size()).sum()
  115. }
  116. fn front(&self) -> Contig {
  117. self.contigs[0]
  118. }
  119. /// Return length of the front contiguous range without removing it from the assembler
  120. pub fn peek_front(&self) -> Option<usize> {
  121. let front = self.front();
  122. if front.has_hole() {
  123. None
  124. } else {
  125. Some(front.data_size)
  126. }
  127. }
  128. fn back(&self) -> Contig {
  129. self.contigs[self.contigs.len() - 1]
  130. }
  131. /// Return whether the assembler contains no data.
  132. pub fn is_empty(&self) -> bool {
  133. !self.front().has_data()
  134. }
  135. /// Remove a contig at the given index, and return a pointer to the first contig
  136. /// without data.
  137. fn remove_contig_at(&mut self, at: usize) -> &mut Contig {
  138. debug_assert!(!self.contigs[at].is_empty());
  139. for i in at..self.contigs.len() - 1 {
  140. self.contigs[i] = self.contigs[i + 1];
  141. if !self.contigs[i].has_data() {
  142. self.contigs[i + 1] = Contig::empty();
  143. return &mut self.contigs[i];
  144. }
  145. }
  146. // Removing the last one.
  147. self.contigs[at] = Contig::empty();
  148. &mut self.contigs[at]
  149. }
  150. /// Add a contig at the given index, and return a pointer to it.
  151. fn add_contig_at(&mut self, at: usize) -> Result<&mut Contig, TooManyHolesError> {
  152. debug_assert!(!self.contigs[at].is_empty());
  153. if !self.back().is_empty() {
  154. return Err(TooManyHolesError);
  155. }
  156. for i in (at + 1..self.contigs.len()).rev() {
  157. self.contigs[i] = self.contigs[i - 1];
  158. }
  159. self.contigs[at] = Contig::empty();
  160. Ok(&mut self.contigs[at])
  161. }
  162. /// Add a new contiguous range to the assembler, and return `Ok(bool)`,
  163. /// or return `Err(())` if too many discontiguities are already recorded.
  164. /// Returns `Ok(true)` when there was an overlap.
  165. pub fn add(&mut self, mut offset: usize, mut size: usize) -> Result<bool, TooManyHolesError> {
  166. let mut index = 0;
  167. let mut overlap = size;
  168. while index != self.contigs.len() && size != 0 {
  169. let contig = self.contigs[index];
  170. if offset >= contig.total_size() {
  171. // The range being added does not cover this contig, skip it.
  172. index += 1;
  173. } else if offset == 0 && size >= contig.hole_size && index > 0 {
  174. // The range being added covers the entire hole in this contig, merge it
  175. // into the previous config.
  176. self.contigs[index - 1].expand_data_by(contig.total_size());
  177. overlap -= contig.total_size();
  178. self.remove_contig_at(index);
  179. index += 0;
  180. } else if offset == 0 && size < contig.hole_size && index > 0 {
  181. // The range being added covers a part of the hole in this contig starting
  182. // at the beginning, shrink the hole in this contig and expand data in
  183. // the previous contig.
  184. self.contigs[index - 1].expand_data_by(size);
  185. self.contigs[index].shrink_hole_by(size);
  186. overlap -= size;
  187. index += 1;
  188. } else if offset <= contig.hole_size && offset + size >= contig.hole_size {
  189. // The range being added covers both a part of the hole and a part of the data
  190. // in this contig, shrink the hole in this contig.
  191. overlap -= contig.hole_size - offset;
  192. self.contigs[index].shrink_hole_to(offset);
  193. index += 1;
  194. } else if offset + size >= contig.hole_size {
  195. // The range being added covers only a part of the data in this contig, skip it.
  196. index += 1;
  197. } else if offset + size < contig.hole_size {
  198. // The range being added covers a part of the hole but not of the data
  199. // in this contig, add a new contig containing the range.
  200. {
  201. let inserted = self.add_contig_at(index)?;
  202. *inserted = Contig::hole_and_data(offset, size);
  203. overlap -= size;
  204. }
  205. // Previous contigs[index] got moved to contigs[index+1]
  206. self.contigs[index + 1].shrink_hole_by(offset + size);
  207. index += 2;
  208. } else {
  209. unreachable!()
  210. }
  211. // Skip the portion of the range covered by this contig.
  212. if offset >= contig.total_size() {
  213. offset = offset.saturating_sub(contig.total_size());
  214. } else {
  215. size = (offset + size).saturating_sub(contig.total_size());
  216. offset = 0;
  217. }
  218. }
  219. debug_assert!(size == 0);
  220. Ok(overlap != 0)
  221. }
  222. /// Remove a contiguous range from the front of the assembler and `Some(data_size)`,
  223. /// or return `None` if there is no such range.
  224. pub fn remove_front(&mut self) -> Option<usize> {
  225. let front = self.front();
  226. if front.has_hole() {
  227. None
  228. } else {
  229. let last_hole = self.remove_contig_at(0);
  230. last_hole.hole_size += front.data_size;
  231. debug_assert!(front.data_size > 0);
  232. Some(front.data_size)
  233. }
  234. }
  235. /// Iterate over all of the contiguous data ranges.
  236. ///
  237. /// This is used in calculating what data ranges have been received. The offset indicates the
  238. /// number of bytes of contiguous data received before the beginnings of this Assembler.
  239. ///
  240. /// Data Hole Data
  241. /// |--- 100 ---|--- 200 ---|--- 100 ---|
  242. ///
  243. /// An offset of 1500 would return the ranges: ``(1500, 1600), (1800, 1900)``
  244. pub fn iter_data(&self, first_offset: usize) -> AssemblerIter {
  245. AssemblerIter::new(self, first_offset)
  246. }
  247. }
  248. pub struct AssemblerIter<'a> {
  249. assembler: &'a Assembler,
  250. offset: usize,
  251. index: usize,
  252. left: usize,
  253. right: usize,
  254. }
  255. impl<'a> AssemblerIter<'a> {
  256. fn new(assembler: &'a Assembler, offset: usize) -> AssemblerIter<'a> {
  257. AssemblerIter {
  258. assembler,
  259. offset,
  260. index: 0,
  261. left: 0,
  262. right: 0,
  263. }
  264. }
  265. }
  266. impl<'a> Iterator for AssemblerIter<'a> {
  267. type Item = (usize, usize);
  268. fn next(&mut self) -> Option<(usize, usize)> {
  269. let mut data_range = None;
  270. while data_range.is_none() && self.index < self.assembler.contigs.len() {
  271. let contig = self.assembler.contigs[self.index];
  272. self.left += contig.hole_size;
  273. self.right = self.left + contig.data_size;
  274. data_range = if self.left < self.right {
  275. let data_range = (self.left + self.offset, self.right + self.offset);
  276. self.left = self.right;
  277. Some(data_range)
  278. } else {
  279. None
  280. };
  281. self.index += 1;
  282. }
  283. data_range
  284. }
  285. }
  286. #[cfg(test)]
  287. mod test {
  288. use super::*;
  289. use std::vec::Vec;
  290. impl From<Vec<(usize, usize)>> for Assembler {
  291. fn from(vec: Vec<(usize, usize)>) -> Assembler {
  292. #[cfg(not(any(feature = "std", feature = "alloc")))]
  293. let mut contigs = [Contig::empty(); CONTIG_COUNT];
  294. #[cfg(any(feature = "std", feature = "alloc"))]
  295. let mut contigs = Box::new([Contig::empty(); CONTIG_COUNT]);
  296. for (i, &(hole_size, data_size)) in vec.iter().enumerate() {
  297. contigs[i] = Contig {
  298. hole_size,
  299. data_size,
  300. };
  301. }
  302. Assembler { contigs }
  303. }
  304. }
  305. macro_rules! contigs {
  306. [$( $x:expr ),*] => ({
  307. Assembler::from(vec![$( $x ),*])
  308. })
  309. }
  310. #[test]
  311. fn test_new() {
  312. let assr = Assembler::new(16);
  313. assert_eq!(assr.total_size(), 16);
  314. assert_eq!(assr, contigs![(16, 0)]);
  315. }
  316. #[test]
  317. fn test_empty_add_full() {
  318. let mut assr = Assembler::new(16);
  319. assert_eq!(assr.add(0, 16), Ok(false));
  320. assert_eq!(assr, contigs![(0, 16)]);
  321. }
  322. #[test]
  323. fn test_empty_add_front() {
  324. let mut assr = Assembler::new(16);
  325. assert_eq!(assr.add(0, 4), Ok(false));
  326. assert_eq!(assr, contigs![(0, 4), (12, 0)]);
  327. }
  328. #[test]
  329. fn test_empty_add_back() {
  330. let mut assr = Assembler::new(16);
  331. assert_eq!(assr.add(12, 4), Ok(false));
  332. assert_eq!(assr, contigs![(12, 4)]);
  333. }
  334. #[test]
  335. fn test_empty_add_mid() {
  336. let mut assr = Assembler::new(16);
  337. assert_eq!(assr.add(4, 8), Ok(false));
  338. assert_eq!(assr, contigs![(4, 8), (4, 0)]);
  339. }
  340. #[test]
  341. fn test_partial_add_front() {
  342. let mut assr = contigs![(4, 8), (4, 0)];
  343. assert_eq!(assr.add(0, 4), Ok(false));
  344. assert_eq!(assr, contigs![(0, 12), (4, 0)]);
  345. }
  346. #[test]
  347. fn test_partial_add_back() {
  348. let mut assr = contigs![(4, 8), (4, 0)];
  349. assert_eq!(assr.add(12, 4), Ok(false));
  350. assert_eq!(assr, contigs![(4, 12)]);
  351. }
  352. #[test]
  353. fn test_partial_add_front_overlap() {
  354. let mut assr = contigs![(4, 8), (4, 0)];
  355. assert_eq!(assr.add(0, 8), Ok(true));
  356. assert_eq!(assr, contigs![(0, 12), (4, 0)]);
  357. }
  358. #[test]
  359. fn test_partial_add_front_overlap_split() {
  360. let mut assr = contigs![(4, 8), (4, 0)];
  361. assert_eq!(assr.add(2, 6), Ok(true));
  362. assert_eq!(assr, contigs![(2, 10), (4, 0)]);
  363. }
  364. #[test]
  365. fn test_partial_add_back_overlap() {
  366. let mut assr = contigs![(4, 8), (4, 0)];
  367. assert_eq!(assr.add(8, 8), Ok(true));
  368. assert_eq!(assr, contigs![(4, 12)]);
  369. }
  370. #[test]
  371. fn test_partial_add_back_overlap_split() {
  372. let mut assr = contigs![(4, 8), (4, 0)];
  373. assert_eq!(assr.add(10, 4), Ok(true));
  374. assert_eq!(assr, contigs![(4, 10), (2, 0)]);
  375. }
  376. #[test]
  377. fn test_partial_add_both_overlap() {
  378. let mut assr = contigs![(4, 8), (4, 0)];
  379. assert_eq!(assr.add(0, 16), Ok(true));
  380. assert_eq!(assr, contigs![(0, 16)]);
  381. }
  382. #[test]
  383. fn test_partial_add_both_overlap_split() {
  384. let mut assr = contigs![(4, 8), (4, 0)];
  385. assert_eq!(assr.add(2, 12), Ok(true));
  386. assert_eq!(assr, contigs![(2, 12), (2, 0)]);
  387. }
  388. #[test]
  389. fn test_rejected_add_keeps_state() {
  390. let mut assr = Assembler::new(CONTIG_COUNT * 20);
  391. for c in 1..=CONTIG_COUNT - 1 {
  392. assert_eq!(assr.add(c * 10, 3), Ok(false));
  393. }
  394. // Maximum of allowed holes is reached
  395. let assr_before = assr.clone();
  396. assert_eq!(assr.add(1, 3), Err(TooManyHolesError));
  397. assert_eq!(assr_before, assr);
  398. }
  399. #[test]
  400. fn test_empty_remove_front() {
  401. let mut assr = contigs![(12, 0)];
  402. assert_eq!(assr.remove_front(), None);
  403. }
  404. #[test]
  405. fn test_trailing_hole_remove_front() {
  406. let mut assr = contigs![(0, 4), (8, 0)];
  407. assert_eq!(assr.remove_front(), Some(4));
  408. assert_eq!(assr, contigs![(12, 0)]);
  409. }
  410. #[test]
  411. fn test_trailing_data_remove_front() {
  412. let mut assr = contigs![(0, 4), (4, 4)];
  413. assert_eq!(assr.remove_front(), Some(4));
  414. assert_eq!(assr, contigs![(4, 4), (4, 0)]);
  415. }
  416. #[test]
  417. fn test_iter_empty() {
  418. let assr = Assembler::new(16);
  419. let segments: Vec<_> = assr.iter_data(10).collect();
  420. assert_eq!(segments, vec![]);
  421. }
  422. #[test]
  423. fn test_iter_full() {
  424. let mut assr = Assembler::new(16);
  425. assert_eq!(assr.add(0, 16), Ok(false));
  426. let segments: Vec<_> = assr.iter_data(10).collect();
  427. assert_eq!(segments, vec![(10, 26)]);
  428. }
  429. #[test]
  430. fn test_iter_offset() {
  431. let mut assr = Assembler::new(16);
  432. assert_eq!(assr.add(0, 16), Ok(false));
  433. let segments: Vec<_> = assr.iter_data(100).collect();
  434. assert_eq!(segments, vec![(100, 116)]);
  435. }
  436. #[test]
  437. fn test_iter_one_front() {
  438. let mut assr = Assembler::new(16);
  439. assert_eq!(assr.add(0, 4), Ok(false));
  440. let segments: Vec<_> = assr.iter_data(10).collect();
  441. assert_eq!(segments, vec![(10, 14)]);
  442. }
  443. #[test]
  444. fn test_iter_one_back() {
  445. let mut assr = Assembler::new(16);
  446. assert_eq!(assr.add(12, 4), Ok(false));
  447. let segments: Vec<_> = assr.iter_data(10).collect();
  448. assert_eq!(segments, vec![(22, 26)]);
  449. }
  450. #[test]
  451. fn test_iter_one_mid() {
  452. let mut assr = Assembler::new(16);
  453. assert_eq!(assr.add(4, 8), Ok(false));
  454. let segments: Vec<_> = assr.iter_data(10).collect();
  455. assert_eq!(segments, vec![(14, 22)]);
  456. }
  457. #[test]
  458. fn test_iter_one_trailing_gap() {
  459. let assr = contigs![(4, 8), (4, 0)];
  460. let segments: Vec<_> = assr.iter_data(100).collect();
  461. assert_eq!(segments, vec![(104, 112)]);
  462. }
  463. #[test]
  464. fn test_iter_two_split() {
  465. let assr = contigs![(2, 6), (4, 1), (1, 0)];
  466. let segments: Vec<_> = assr.iter_data(100).collect();
  467. assert_eq!(segments, vec![(102, 108), (112, 113)]);
  468. }
  469. #[test]
  470. fn test_iter_three_split() {
  471. let assr = contigs![(2, 6), (2, 1), (2, 2), (1, 0)];
  472. let segments: Vec<_> = assr.iter_data(100).collect();
  473. assert_eq!(segments, vec![(102, 108), (110, 111), (113, 115)]);
  474. }
  475. }