xsparse.c 9.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469
  1. /* xsparse - expands compressed sparse file images extracted from GNU tar
  2. archives.
  3. Copyright (C) 2006 Free Software Foundation, Inc.
  4. Written by Sergey Poznyakoff
  5. This program is free software; you can redistribute it and/or modify it
  6. under the terms of the GNU General Public License as published by the
  7. Free Software Foundation; either version 2, or (at your option) any later
  8. version.
  9. This program is distributed in the hope that it will be useful, but
  10. WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
  12. Public License for more details.
  13. You should have received a copy of the GNU General Public License along
  14. with this program; if not, write to the Free Software Foundation, Inc.,
  15. 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
  #include <stdlib.h>
  #include <stdio.h>
  #include <stdarg.h>
  #include <string.h>
  #include <unistd.h>
  #include <getopt.h>
  #include <fcntl.h>
  #include <sys/stat.h>
  #include <limits.h>
  #include <errno.h>
  /* Upper bound on the number of characters in the decimal representation
     of an off_t.  Each bit contributes at most 146/485 of a decimal digit
     (a rational just above log10 (2)).  See INT_STRLEN_BOUND in intprops.h
     for the full explanation.  */
  #define OFF_T_STRLEN_BOUND ((sizeof (off_t) * CHAR_BIT) * 146 / 485 + 1)

  /* Size of the buffers used to read such numbers: one byte more than the
     length bound above.  */
  #define OFF_T_STRSIZE_BOUND (OFF_T_STRLEN_BOUND + 1)

  /* Alignment unit of the input file: after the sparse map has been read,
     the input position is rounded up to a multiple of this value.  */
  #define BLOCKSIZE 512
  /* One entry of the sparse map: a contiguous run of data in the
     expanded file.  */
  struct sp_array
  {
    off_t offset;     /* position of the run in the output file */
    size_t numbytes;  /* number of bytes in the run */
  };
  /* Name this program was invoked under; prefixes every diagnostic and
     appears in the usage text.  */
  char *progname;

  /* Verbosity level: progress messages are printed when non-zero.  */
  int verbose;
  37. void
  38. die (int code, char *fmt, ...)
  39. {
  40. va_list ap;
  41. fprintf (stderr, "%s: ", progname);
  42. va_start (ap, fmt);
  43. vfprintf (stderr, fmt, ap);
  44. va_end (ap);
  45. fprintf (stderr, "\n");
  46. exit (code);
  47. }
  /* Allocate SIZE bytes of memory, terminating the program via die () if
     the allocation fails.  The returned pointer is never NULL and should
     be released with free ().

     A request for zero bytes is rounded up to one byte: malloc (0) is
     allowed to return NULL, which must not be mistaken for memory
     exhaustion (this happens e.g. for an empty sparse map).  */
  void *
  emalloc (size_t size)
  {
    void *p = malloc (size ? size : 1);

    if (!p)
      die (1, "not enough memory");
    return p;
  }
  /* Convert the unsigned decimal number at the start of P to an off_t.

     If ENDP is not NULL, conversion stops at the first non-digit character
     and *ENDP is set to point to it (or to the terminating NUL); an input
     without any digits yields 0.  If ENDP is NULL, the whole string must
     consist of digits, otherwise the program terminates with a parse
     error.

     A value that does not fit in off_t terminates the program.  The range
     check is done BEFORE multiplying and adding, because signed overflow
     is undefined behaviour and cannot be detected reliably afterwards.  */
  off_t
  string_to_off (char *p, char **endp)
  {
    /* Largest off_t value, computed without ever overflowing.  */
    const off_t off_max =
      (((off_t) 1 << (sizeof (off_t) * CHAR_BIT - 2)) - 1) * 2 + 1;
    off_t v = 0;

    for (; *p; p++)
      {
        int digit = *p - '0';

        /* The unsigned comparison rejects both digit < 0 and digit > 9.  */
        if (9 < (unsigned) digit)
          {
            if (endp)
              break;
            die (1, "number parse error near %s", p);
          }

        /* v * 10 + digit <= off_max  <=>  v <= (off_max - digit) / 10  */
        if (v > (off_max - digit) / 10)
          die (1, "number out of allowed range, near %s", p);

        v = v * 10 + digit;
      }

    if (endp)
      *endp = p;
    return v;
  }
  /* Same as string_to_off (), but the result is returned as a size_t.
     The program is terminated if the parsed value is not representable
     in a size_t.  */
  size_t
  string_to_size (char *p, char **endp)
  {
    off_t parsed = string_to_off (p, endp);
    size_t result = parsed;

    /* A round trip through size_t that changes the value means the
       number was truncated.  */
    if (parsed != result)
      die (1, "number too big");

    return result;
  }
  /* Number of entries in sparse_map.  */
  size_t sparse_map_size;

  /* The sparse map itself: sparse_map_size entries, allocated once the
     number of entries is known.  */
  struct sp_array *sparse_map;
  /* Read one newline-terminated line from STREAM into S, a buffer of SIZE
     bytes, and strip the trailing newline.

     Terminates the program on end of file or read error, and when the
     text read does not end in a newline (the line does not fit in S, or
     the input is truncated).  */
  void
  get_line (char *s, int size, FILE *stream)
  {
    size_t len;

    if (!fgets (s, size, stream))
      die (1, "unexpected end of file");

    len = strlen (s);
    /* strlen () is 0 when the data read starts with a NUL byte; without
       this guard s[len - 1] would access the byte before the buffer.  */
    if (len == 0 || s[len - 1] != '\n')
      die (1, "buffer overflow");
    s[len - 1] = 0;
  }
  106. int
  107. get_var (FILE *fp, char **name, char **value)
  108. {
  109. static char *buffer;
  110. static size_t bufsize = OFF_T_STRSIZE_BOUND;
  111. char *p, *q;
  112. buffer = emalloc (bufsize);
  113. do
  114. {
  115. size_t len, s;
  116. if (!fgets (buffer, bufsize, fp))
  117. return 0;
  118. len = strlen (buffer);
  119. if (len == 0)
  120. return 0;
  121. s = string_to_size (buffer, &p);
  122. if (*p != ' ')
  123. die (1, "malformed header: expected space but found %s", p);
  124. if (buffer[len-1] != '\n')
  125. {
  126. if (bufsize < s + 1)
  127. {
  128. bufsize = s + 1;
  129. buffer = realloc (buffer, bufsize);
  130. if (!buffer)
  131. die (1, "not enough memory");
  132. }
  133. if (!fgets (buffer + len, s - len + 1, fp))
  134. die (1, "unexpected end of file or read error");
  135. }
  136. p++;
  137. }
  138. while (memcmp (p, "GNU.sparse.", 11));
  139. p += 11;
  140. q = strchr (p, '=');
  141. if (!q)
  142. die (1, "malformed header: expected `=' not found");
  143. *q++ = 0;
  144. q[strlen (q) - 1] = 0;
  145. *name = p;
  146. *value = q;
  147. return 1;
  148. }
  /* Name of the file the expanded data is written to.  */
  char *outname;

  /* Expected size of the expanded file; 0 means "not known".  */
  off_t outsize;

  /* Sparse format version, as given by the "major" and "minor" variables
     of the extended header.  */
  unsigned version_major;
  unsigned version_minor;
  153. void
  154. read_xheader (char *name)
  155. {
  156. char *kw, *val;
  157. FILE *fp = fopen (name, "r");
  158. char *expect = NULL;
  159. size_t i = 0;
  160. if (verbose)
  161. printf ("Reading extended header file\n");
  162. while (get_var (fp, &kw, &val))
  163. {
  164. if (verbose)
  165. printf ("Found variable GNU.sparse.%s = %s\n", kw, val);
  166. if (expect && strcmp (kw, expect))
  167. die (1, "bad keyword sequence: expected `%s' but found `%s'",
  168. expect, kw);
  169. expect = NULL;
  170. if (strcmp (kw, "name") == 0)
  171. {
  172. outname = emalloc (strlen (val) + 1);
  173. strcpy (outname, val);
  174. }
  175. else if (strcmp (kw, "major") == 0)
  176. {
  177. version_major = string_to_size (val, NULL);
  178. }
  179. else if (strcmp (kw, "minor") == 0)
  180. {
  181. version_minor = string_to_size (val, NULL);
  182. }
  183. else if (strcmp (kw, "realsize") == 0
  184. || strcmp (kw, "size") == 0)
  185. {
  186. outsize = string_to_off (val, NULL);
  187. }
  188. else if (strcmp (kw, "numblocks") == 0)
  189. {
  190. sparse_map_size = string_to_size (val, NULL);
  191. sparse_map = emalloc (sparse_map_size * sizeof *sparse_map);
  192. }
  193. else if (strcmp (kw, "offset") == 0)
  194. {
  195. sparse_map[i].offset = string_to_off (val, NULL);
  196. expect = "numbytes";
  197. }
  198. else if (strcmp (kw, "numbytes") == 0)
  199. {
  200. sparse_map[i++].numbytes = string_to_size (val, NULL);
  201. }
  202. else if (strcmp (kw, "map") == 0)
  203. {
  204. for (i = 0; i < sparse_map_size; i++)
  205. {
  206. sparse_map[i].offset = string_to_off (val, &val);
  207. if (*val != ',')
  208. die (1, "bad GNU.sparse.map: expected `,' but found `%c'",
  209. *val);
  210. sparse_map[i].numbytes = string_to_size (val+1, &val);
  211. if (*val != ',')
  212. {
  213. if (!(*val == 0 && i == sparse_map_size-1))
  214. die (1, "bad GNU.sparse.map: expected `,' but found `%c'",
  215. *val);
  216. }
  217. else
  218. val++;
  219. }
  220. if (*val)
  221. die (1, "bad GNU.sparse.map: garbage at the end");
  222. }
  223. }
  224. if (expect)
  225. die (1, "bad keyword sequence: expected `%s' not found", expect);
  226. if (version_major == 0 && sparse_map_size == 0)
  227. die (1, "size of the sparse map unknown");
  228. if (i != sparse_map_size)
  229. die (1, "not all sparse entries supplied");
  230. fclose (fp);
  231. }
  232. void
  233. read_map (FILE *ifp)
  234. {
  235. size_t i;
  236. char nbuf[OFF_T_STRSIZE_BOUND];
  237. if (verbose)
  238. printf ("Reading v.1.0 sparse map\n");
  239. get_line (nbuf, sizeof nbuf, ifp);
  240. sparse_map_size = string_to_size (nbuf, NULL);
  241. sparse_map = emalloc (sparse_map_size * sizeof *sparse_map);
  242. for (i = 0; i < sparse_map_size; i++)
  243. {
  244. get_line (nbuf, sizeof nbuf, ifp);
  245. sparse_map[i].offset = string_to_off (nbuf, NULL);
  246. get_line (nbuf, sizeof nbuf, ifp);
  247. sparse_map[i].numbytes = string_to_size (nbuf, NULL);
  248. }
  249. fseek (ifp, ((ftell (ifp) + BLOCKSIZE - 1) / BLOCKSIZE) * BLOCKSIZE,
  250. SEEK_SET);
  251. }
  252. void
  253. expand_sparse (FILE *sfp, int ofd)
  254. {
  255. size_t i;
  256. size_t maxbytes = 0;
  257. char *buffer;
  258. for (i = 0; i < sparse_map_size; i++)
  259. if (maxbytes < sparse_map[i].numbytes)
  260. maxbytes = sparse_map[i].numbytes;
  261. for (buffer = malloc (maxbytes); !buffer; maxbytes /= 2)
  262. if (maxbytes == 0)
  263. die (1, "not enough memory");
  264. for (i = 0; i < sparse_map_size; i++)
  265. {
  266. size_t size = sparse_map[i].numbytes;
  267. lseek (ofd, sparse_map[i].offset, SEEK_SET);
  268. while (size)
  269. {
  270. size_t rdsize = (size < maxbytes) ? size : maxbytes;
  271. if (rdsize != fread (buffer, 1, rdsize, sfp))
  272. die (1, "read error (%d)", errno);
  273. if (rdsize != write (ofd, buffer, rdsize))
  274. die (1, "write error (%d)", errno);
  275. size -= rdsize;
  276. }
  277. }
  278. free (buffer);
  279. }
  280. void
  281. usage (int code)
  282. {
  283. printf ("Usage: %s [OPTIONS] infile [outfile]\n", progname);
  284. printf ("%s: expand sparse files extracted from GNU archives\n",
  285. progname);
  286. printf ("\nOPTIONS are:\n\n");
  287. printf (" -h Display this help list\n");
  288. printf (" -n Dry run: do nothing, print what would have been done\n");
  289. printf (" -v Increase verbosity level\n");
  290. printf (" -x FILE Parse extended header FILE\n\n");
  291. exit (code);
  292. }
  293. void
  294. guess_outname (char *name)
  295. {
  296. char *p;
  297. char *s;
  298. if (name[0] == '.' && name[1] == '/')
  299. name += 2;
  300. p = name + strlen (name) - 1;
  301. s = NULL;
  302. for (; p > name && *p != '/'; p--)
  303. ;
  304. if (*p == '/')
  305. s = p + 1;
  306. if (p != name)
  307. {
  308. for (p--; p > name && *p != '/'; p--)
  309. ;
  310. }
  311. if (*p != '/')
  312. {
  313. if (s)
  314. outname = s;
  315. else
  316. {
  317. outname = emalloc (4 + strlen (name));
  318. strcpy (outname, "../");
  319. strcpy (outname + 3, name);
  320. }
  321. }
  322. else
  323. {
  324. size_t len = p - name + 1;
  325. outname = emalloc (len + strlen (s) + 1);
  326. memcpy (outname, name, len);
  327. strcpy (outname + len, s);
  328. }
  329. }
  330. int
  331. main (int argc, char **argv)
  332. {
  333. int c;
  334. int dry_run = 0;
  335. char *xheader_file = NULL;
  336. char *inname;
  337. FILE *ifp;
  338. struct stat st;
  339. int ofd;
  340. progname = argv[0];
  341. while ((c = getopt (argc, argv, "hnvx:")) != EOF)
  342. {
  343. switch (c)
  344. {
  345. case 'h':
  346. usage (0);
  347. break;
  348. case 'x':
  349. xheader_file = optarg;
  350. break;
  351. case 'n':
  352. dry_run = 1;
  353. case 'v':
  354. verbose++;
  355. break;
  356. default:
  357. exit (1);
  358. }
  359. }
  360. argc -= optind;
  361. argv += optind;
  362. if (argc == 0 || argc > 2)
  363. usage (1);
  364. if (xheader_file)
  365. read_xheader (xheader_file);
  366. inname = argv[0];
  367. if (argv[1])
  368. outname = argv[1];
  369. if (stat (inname, &st))
  370. die (1, "cannot stat %s (%d)", inname, errno);
  371. ifp = fopen (inname, "r");
  372. if (ifp == NULL)
  373. die (1, "cannot open file %s (%d)", inname, errno);
  374. if (!xheader_file || version_major == 1)
  375. read_map (ifp);
  376. if (!outname)
  377. guess_outname (inname);
  378. ofd = open (outname, O_RDWR|O_CREAT|O_TRUNC, st.st_mode);
  379. if (ofd == -1)
  380. die (1, "cannot open file %s (%d)", outname, errno);
  381. if (verbose)
  382. printf ("Expanding file `%s' to `%s'\n", inname, outname);
  383. if (dry_run)
  384. {
  385. printf ("Finished dry run\n");
  386. return 0;
  387. }
  388. expand_sparse (ifp, ofd);
  389. fclose (ifp);
  390. close (ofd);
  391. if (verbose)
  392. printf ("Done\n");
  393. if (outsize)
  394. {
  395. if (stat (outname, &st))
  396. die (1, "cannot stat output file %s (%d)", outname, errno);
  397. if (st.st_size != outsize)
  398. die (1, "expanded file has wrong size");
  399. }
  400. return 0;
  401. }