assembler.rs 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350
  1. use core::fmt;
  2. /// A contiguous chunk of absent data, followed by a contiguous chunk of present data.
  3. #[derive(Debug, Clone, Copy, PartialEq, Eq)]
  4. struct Contig {
  5. hole_size: usize,
  6. data_size: usize
  7. }
  8. impl fmt::Display for Contig {
  9. fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
  10. if self.has_hole() { write!(f, "({})", self.hole_size)?; }
  11. if self.has_hole() && self.has_data() { write!(f, " ")?; }
  12. if self.has_data() { write!(f, "{}", self.data_size)?; }
  13. Ok(())
  14. }
  15. }
  16. impl Contig {
  17. fn empty() -> Contig {
  18. Contig { hole_size: 0, data_size: 0 }
  19. }
  20. fn hole(size: usize) -> Contig {
  21. Contig { hole_size: size, data_size: 0 }
  22. }
  23. fn hole_and_data(hole_size: usize, data_size: usize) -> Contig {
  24. Contig { hole_size, data_size }
  25. }
  26. fn has_hole(&self) -> bool {
  27. self.hole_size != 0
  28. }
  29. fn has_data(&self) -> bool {
  30. self.data_size != 0
  31. }
  32. fn total_size(&self) -> usize {
  33. self.hole_size + self.data_size
  34. }
  35. fn is_empty(&self) -> bool {
  36. self.total_size() == 0
  37. }
  38. fn expand_data_by(&mut self, size: usize) {
  39. self.data_size += size;
  40. }
  41. fn shrink_hole_by(&mut self, size: usize) {
  42. self.hole_size -= size;
  43. }
  44. fn shrink_hole_to(&mut self, size: usize) {
  45. assert!(self.hole_size >= size);
  46. let total_size = self.total_size();
  47. self.hole_size = size;
  48. self.data_size = total_size - size;
  49. }
  50. }
  51. const CONTIG_COUNT: usize = 4;
  52. /// A buffer (re)assembler.
  53. ///
  54. /// Currently, up to a hardcoded limit of four holes can be tracked in the buffer.
  55. #[derive(Debug)]
  56. #[cfg_attr(test, derive(PartialEq, Eq))]
  57. pub struct Assembler {
  58. contigs: [Contig; CONTIG_COUNT]
  59. }
  60. impl fmt::Display for Assembler {
  61. fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
  62. write!(f, "[ ")?;
  63. for contig in self.contigs.iter() {
  64. if contig.is_empty() { break }
  65. write!(f, "{} ", contig)?;
  66. }
  67. write!(f, "]")?;
  68. Ok(())
  69. }
  70. }
  71. impl Assembler {
  72. /// Create a new buffer assembler for buffers of the given size.
  73. pub fn new(size: usize) -> Assembler {
  74. let mut contigs = [Contig::empty(); CONTIG_COUNT];
  75. contigs[0] = Contig::hole(size);
  76. Assembler { contigs }
  77. }
  78. pub(crate) fn total_size(&self) -> usize {
  79. self.contigs
  80. .iter()
  81. .map(|contig| contig.total_size())
  82. .sum()
  83. }
  84. fn front(&self) -> Contig {
  85. self.contigs[0]
  86. }
  87. fn back(&self) -> Contig {
  88. self.contigs[self.contigs.len() - 1]
  89. }
  90. /// Return whether the assembler contains no data.
  91. pub fn is_empty(&self) -> bool {
  92. !self.front().has_data()
  93. }
  94. /// Remove a contig at the given index, and return a pointer to the first contig
  95. /// without data.
  96. fn remove_contig_at(&mut self, at: usize) -> &mut Contig {
  97. debug_assert!(!self.contigs[at].is_empty());
  98. for i in at..self.contigs.len() - 1 {
  99. self.contigs[i] = self.contigs[i + 1];
  100. if !self.contigs[i].has_data() {
  101. self.contigs[i + 1] = Contig::empty();
  102. return &mut self.contigs[i]
  103. }
  104. }
  105. // Removing the last one.
  106. self.contigs[at] = Contig::empty();
  107. &mut self.contigs[at]
  108. }
  109. /// Add a contig at the given index, and return a pointer to it.
  110. fn add_contig_at(&mut self, at: usize) -> Result<&mut Contig, ()> {
  111. debug_assert!(!self.contigs[at].is_empty());
  112. if !self.back().is_empty() { return Err(()) }
  113. for i in (at + 1..self.contigs.len()).rev() {
  114. self.contigs[i] = self.contigs[i - 1];
  115. }
  116. self.contigs[at] = Contig::empty();
  117. Ok(&mut self.contigs[at])
  118. }
  119. /// Add a new contiguous range to the assembler, and return `Ok(())`,
  120. /// or return `Err(())` if too many discontiguities are already recorded.
  121. pub fn add(&mut self, mut offset: usize, mut size: usize) -> Result<(), ()> {
  122. let mut index = 0;
  123. while index != self.contigs.len() && size != 0 {
  124. let contig = self.contigs[index];
  125. if let Some(new_offset) = offset.checked_sub(contig.total_size()) {
  126. // The range being added does not cover this contig, skip it.
  127. index += 1;
  128. } else if offset == 0 && size >= contig.hole_size && index > 0 {
  129. // The range being added covers the entire hole in this contig, merge it
  130. // into the previous config.
  131. self.contigs[index - 1].expand_data_by(contig.total_size());
  132. self.remove_contig_at(index);
  133. index += 0;
  134. } else if offset == 0 && size < contig.hole_size && index > 0 {
  135. // The range being added covers a part of the hole in this contig starting
  136. // at the beginning, shrink the hole in this contig and expand data in
  137. // the previous contig.
  138. self.contigs[index - 1].expand_data_by(size);
  139. self.contigs[index].shrink_hole_by(size);
  140. index += 1;
  141. } else if offset <= contig.hole_size && offset + size >= contig.hole_size {
  142. // The range being added covers both a part of the hole and a part of the data
  143. // in this contig, shrink the hole in this contig.
  144. self.contigs[index].shrink_hole_to(offset);
  145. index += 1;
  146. } else if offset + size >= contig.hole_size {
  147. // The range being added covers only a part of the data in this contig, skip it.
  148. index += 1;
  149. } else if offset + size < contig.hole_size {
  150. // The range being added covers a part of the hole but not of the data
  151. // in this contig, add a new contig containing the range.
  152. self.contigs[index].shrink_hole_by(offset + size);
  153. let inserted = self.add_contig_at(index)?;
  154. *inserted = Contig::hole_and_data(offset, size);
  155. index += 2;
  156. } else {
  157. unreachable!()
  158. }
  159. // Skip the portion of the range covered by this contig.
  160. if offset >= contig.total_size() {
  161. offset = offset.saturating_sub(contig.total_size());
  162. } else {
  163. size = (offset + size).saturating_sub(contig.total_size());
  164. offset = 0;
  165. }
  166. }
  167. debug_assert!(size == 0);
  168. Ok(())
  169. }
  170. /// Remove a contiguous range from the front of the assembler and `Some(data_size)`,
  171. /// or return `None` if there is no such range.
  172. pub fn remove_front(&mut self) -> Option<usize> {
  173. let front = self.front();
  174. if front.has_hole() {
  175. None
  176. } else {
  177. let last_hole = self.remove_contig_at(0);
  178. last_hole.hole_size += front.data_size;
  179. debug_assert!(front.data_size > 0);
  180. Some(front.data_size)
  181. }
  182. }
  183. }
  184. #[cfg(test)]
  185. mod test {
  186. use std::vec::Vec;
  187. use super::*;
  188. impl From<Vec<(usize, usize)>> for Assembler {
  189. fn from(vec: Vec<(usize, usize)>) -> Assembler {
  190. let mut contigs = [Contig::empty(); CONTIG_COUNT];
  191. for (i, &(hole_size, data_size)) in vec.iter().enumerate() {
  192. contigs[i] = Contig { hole_size, data_size };
  193. }
  194. Assembler { contigs }
  195. }
  196. }
  197. macro_rules! contigs {
  198. [$( $x:expr ),*] => ({
  199. Assembler::from(vec![$( $x ),*])
  200. })
  201. }
  202. #[test]
  203. fn test_new() {
  204. let assr = Assembler::new(16);
  205. assert_eq!(assr.total_size(), 16);
  206. assert_eq!(assr, contigs![(16, 0)]);
  207. }
  208. #[test]
  209. fn test_empty_add_full() {
  210. let mut assr = Assembler::new(16);
  211. assert_eq!(assr.add(0, 16), Ok(()));
  212. assert_eq!(assr, contigs![(0, 16)]);
  213. }
  214. #[test]
  215. fn test_empty_add_front() {
  216. let mut assr = Assembler::new(16);
  217. assert_eq!(assr.add(0, 4), Ok(()));
  218. assert_eq!(assr, contigs![(0, 4), (12, 0)]);
  219. }
  220. #[test]
  221. fn test_empty_add_back() {
  222. let mut assr = Assembler::new(16);
  223. assert_eq!(assr.add(12, 4), Ok(()));
  224. assert_eq!(assr, contigs![(12, 4)]);
  225. }
  226. #[test]
  227. fn test_empty_add_mid() {
  228. let mut assr = Assembler::new(16);
  229. assert_eq!(assr.add(4, 8), Ok(()));
  230. assert_eq!(assr, contigs![(4, 8), (4, 0)]);
  231. }
  232. #[test]
  233. fn test_partial_add_front() {
  234. let mut assr = contigs![(4, 8), (4, 0)];
  235. assert_eq!(assr.add(0, 4), Ok(()));
  236. assert_eq!(assr, contigs![(0, 12), (4, 0)]);
  237. }
  238. #[test]
  239. fn test_partial_add_back() {
  240. let mut assr = contigs![(4, 8), (4, 0)];
  241. assert_eq!(assr.add(12, 4), Ok(()));
  242. assert_eq!(assr, contigs![(4, 12)]);
  243. }
  244. #[test]
  245. fn test_partial_add_front_overlap() {
  246. let mut assr = contigs![(4, 8), (4, 0)];
  247. assert_eq!(assr.add(0, 8), Ok(()));
  248. assert_eq!(assr, contigs![(0, 12), (4, 0)]);
  249. }
  250. #[test]
  251. fn test_partial_add_front_overlap_split() {
  252. let mut assr = contigs![(4, 8), (4, 0)];
  253. assert_eq!(assr.add(2, 6), Ok(()));
  254. assert_eq!(assr, contigs![(2, 10), (4, 0)]);
  255. }
  256. #[test]
  257. fn test_partial_add_back_overlap() {
  258. let mut assr = contigs![(4, 8), (4, 0)];
  259. assert_eq!(assr.add(8, 8), Ok(()));
  260. assert_eq!(assr, contigs![(4, 12)]);
  261. }
  262. #[test]
  263. fn test_partial_add_back_overlap_split() {
  264. let mut assr = contigs![(4, 8), (4, 0)];
  265. assert_eq!(assr.add(10, 4), Ok(()));
  266. assert_eq!(assr, contigs![(4, 10), (2, 0)]);
  267. }
  268. #[test]
  269. fn test_partial_add_both_overlap() {
  270. let mut assr = contigs![(4, 8), (4, 0)];
  271. assert_eq!(assr.add(0, 16), Ok(()));
  272. assert_eq!(assr, contigs![(0, 16)]);
  273. }
  274. #[test]
  275. fn test_partial_add_both_overlap_split() {
  276. let mut assr = contigs![(4, 8), (4, 0)];
  277. assert_eq!(assr.add(2, 12), Ok(()));
  278. assert_eq!(assr, contigs![(2, 12), (2, 0)]);
  279. }
  280. #[test]
  281. fn test_empty_remove_front() {
  282. let mut assr = contigs![(12, 0)];
  283. assert_eq!(assr.remove_front(), None);
  284. }
  285. #[test]
  286. fn test_trailing_hole_remove_front() {
  287. let mut assr = contigs![(0, 4), (8, 0)];
  288. assert_eq!(assr.remove_front(), Some(4));
  289. assert_eq!(assr, contigs![(12, 0)]);
  290. }
  291. #[test]
  292. fn test_trailing_data_remove_front() {
  293. let mut assr = contigs![(0, 4), (4, 4)];
  294. assert_eq!(assr.remove_front(), Some(4));
  295. assert_eq!(assr, contigs![(4, 4), (4, 0)]);
  296. }
  297. }