tar.c 42 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307
  1. /* vi: set sw=4 ts=4: */
  2. /*
  3. * Mini tar implementation for busybox
  4. *
  5. * Modified to use common extraction code used by ar, cpio, dpkg-deb, dpkg
  6. * by Glenn McGrath
  7. *
  8. * Note, that as of BusyBox-0.43, tar has been completely rewritten from the
  9. * ground up. It still has remnants of the old code lying about, but it is
  10. * very different now (i.e., cleaner, less global variables, etc.)
  11. *
  12. * Copyright (C) 1999-2004 by Erik Andersen <andersen@codepoet.org>
  13. *
  14. * Based in part in the tar implementation in sash
  15. * Copyright (c) 1999 by David I. Bell
  16. * Permission is granted to use, distribute, or modify this source,
  17. * provided that this copyright notice remains intact.
  18. * Permission to distribute sash derived code under GPL has been granted.
  19. *
  20. * Based in part on the tar implementation from busybox-0.28
  21. * Copyright (C) 1995 Bruce Perens
  22. *
  23. * Licensed under GPLv2 or later, see file LICENSE in this source tree.
  24. */
  25. //config:config TAR
  26. //config: bool "tar (39 kb)"
  27. //config: default y
  28. //config: help
  29. //config: tar is an archiving program. It's commonly used with gzip to
  30. //config: create compressed archives. It's probably the most widely used
  31. //config: UNIX archive program.
  32. //config:
  33. //config:config FEATURE_TAR_LONG_OPTIONS
  34. //config: bool "Enable long options"
  35. //config: default y
  36. //config: depends on TAR && LONG_OPTS
  37. //config:
  38. //config:config FEATURE_TAR_CREATE
  39. //config: bool "Enable -c (archive creation)"
  40. //config: default y
  41. //config: depends on TAR
  42. //config:
  43. //config:config FEATURE_TAR_AUTODETECT
  44. //config: bool "Autodetect compressed tarballs"
  45. //config: default y
  46. //config: depends on TAR && (FEATURE_SEAMLESS_Z || FEATURE_SEAMLESS_GZ || FEATURE_SEAMLESS_BZ2 || FEATURE_SEAMLESS_LZMA || FEATURE_SEAMLESS_XZ)
  47. //config: help
  48. //config: With this option tar can automatically detect compressed
  49. //config: tarballs. Currently it works only on files (not pipes etc).
  50. //config:
  51. //config:config FEATURE_TAR_FROM
  52. //config: bool "Enable -X (exclude from) and -T (include from) options"
  53. //config: default y
  54. //config: depends on TAR
  55. //config: help
  56. //config: If you enable this option you'll be able to specify
  57. //config: a list of files to include or exclude from an archive.
  58. //config:
  59. //config:config FEATURE_TAR_OLDGNU_COMPATIBILITY
  60. //config: bool "Support old tar header format"
  61. //config: default y
  62. //config: depends on TAR || DPKG
  63. //config: help
  64. //config: This option is required to unpack archives created in
  65. //config: the old GNU format; help to kill this old format by
  66. //config: repacking your ancient archives with the new format.
  67. //config:
  68. //config:config FEATURE_TAR_OLDSUN_COMPATIBILITY
  69. //config: bool "Enable untarring of tarballs with checksums produced by buggy Sun tar"
  70. //config: default y
  71. //config: depends on TAR || DPKG
  72. //config: help
  73. //config: This option is required to unpack archives created by some old
  74. //config: version of Sun's tar (it was calculating checksum using signed
  75. //config: arithmetic). It is said to be fixed in newer Sun tar, but "old"
  76. //config: tarballs still exist.
  77. //config:
  78. //config:config FEATURE_TAR_GNU_EXTENSIONS
  79. //config: bool "Support GNU tar extensions (long filenames)"
  80. //config: default y
  81. //config: depends on TAR || DPKG
  82. //config:
  83. //config:config FEATURE_TAR_TO_COMMAND
  84. //config: bool "Support writing to an external program (--to-command)"
  85. //config: default y
  86. //config: depends on TAR && FEATURE_TAR_LONG_OPTIONS
  87. //config: help
  88. //config: If you enable this option you'll be able to instruct tar to send
  89. //config: the contents of each extracted file to the standard input of an
  90. //config: external program.
  91. //config:
  92. //config:config FEATURE_TAR_UNAME_GNAME
  93. //config: bool "Enable use of user and group names"
  94. //config: default y
  95. //config: depends on TAR
  96. //config: help
  97. //config: Enable use of user and group names in tar. This affects contents
  98. //config: listings (-t) and preserving permissions when unpacking (-p).
  99. //config: +200 bytes.
  100. //config:
  101. //config:config FEATURE_TAR_NOPRESERVE_TIME
  102. //config: bool "Enable -m (do not preserve time) GNU option"
  103. //config: default y
  104. //config: depends on TAR
  105. //config:
  106. //config:config FEATURE_TAR_SELINUX
  107. //config: bool "Support extracting SELinux labels"
  108. //config: default n
  109. //config: depends on TAR && SELINUX
  110. //config: help
  111. //config: With this option busybox supports restoring SELinux labels
  112. //config: when extracting files from tar archives.
  113. //applet:IF_TAR(APPLET(tar, BB_DIR_BIN, BB_SUID_DROP))
  114. //kbuild:lib-$(CONFIG_TAR) += tar.o
  115. #include <fnmatch.h>
  116. #include "libbb.h"
  117. #include "common_bufsiz.h"
  118. #include "bb_archive.h"
  /*
   * FNM_LEADING_DIR is a non-standard fnmatch() flag. Where the C library
   * does not define it, define it as 0 so that OR-ing it into a flag set
   * changes nothing.
   * FIXME: stop using this non-standard feature.
   */
  #if !defined(FNM_LEADING_DIR)
  # define FNM_LEADING_DIR 0
  #endif

  /*
   * Debug tracing. Flip the "#if 0" below to "#if 1" to have DBG() report
   * through bb_error_msg() with the calling function's name prepended;
   * in the default configuration DBG() expands to a no-op expression.
   */
  #if 0
  # define DBG(fmt, ...) bb_error_msg("%s: " fmt, __func__, ## __VA_ARGS__)
  #else
  # define DBG(...) ((void)0)
  #endif
  #define DBG_OPTION_PARSING 0

  /* Scratch buffer used for block I/O: an alias for bb_common_bufsiz1 */
  #define block_buf bb_common_bufsiz1
  /* Applet start-up hook: calls setup_common_bufsiz() */
  #define INIT_G() do { setup_common_bufsiz(); } while (0)
  131. #if ENABLE_FEATURE_TAR_CREATE
  /*
   * One node of the singly linked list that remembers files having more
   * than one hard link. writeTarFile(), writeFileToTarball() and
   * writeTarHeader() are the only functions that deal with this structure;
   * nodes are created, searched and released through the xxxHardLinkInfo()
   * helpers.
   */
  typedef struct HardLinkInfo {
      struct HardLinkInfo *next;  /* following node; NULL ends the list */
      dev_t dev;                  /* device number of the file */
      ino_t ino;                  /* inode number of the file */
      char name[1];               /* start of the NUL-terminated file name;
                                   * the rest is stored past the struct,
                                   * so this member must stay last */
  } HardLinkInfo;
  144. /* Some info to be carried along when creating a new tarball */
  145. typedef struct TarBallInfo {
  146. int tarFd; /* Open-for-write file descriptor
  147. * for the tarball */
  148. int verboseFlag; /* Whether to print extra stuff or not */
  149. # if ENABLE_FEATURE_TAR_FROM
  150. const llist_t *excludeList; /* List of files to not include */
  151. # endif
  152. HardLinkInfo *hlInfoHead; /* Hard Link Tracking Information */
  153. HardLinkInfo *hlInfo; /* Hard Link Info for the current file */
  154. //TODO: save only st_dev + st_ino
  155. struct stat tarFileStatBuf; /* Stat info for the tarball, letting
  156. * us know the inode and device that the
  157. * tarball lives, so we can avoid trying
  158. * to include the tarball into itself */
  159. } TarBallInfo;
  /* Values of the tar header "typeflag" byte, one per kind of archive member */
  enum {
      /* plain files */
      REGTYPE     = '0',   /* regular file */
      REGTYPE0    = '\0',  /* regular file (ancient bug compat) */
      /* links */
      LNKTYPE     = '1',   /* hard link */
      SYMTYPE     = '2',   /* symbolic link */
      /* special files */
      CHRTYPE     = '3',   /* character special */
      BLKTYPE     = '4',   /* block special */
      DIRTYPE     = '5',   /* directory */
      FIFOTYPE    = '6',   /* FIFO special */
      CONTTYPE    = '7',   /* reserved */
      /* GNU extensions carrying names longer than 100 chars */
      GNULONGLINK = 'K',   /* long link name */
      GNULONGNAME = 'L',   /* long file name */
  };
  174. /* Might be faster (and bigger) if the dev/ino were stored in numeric order;) */
  175. static void addHardLinkInfo(HardLinkInfo **hlInfoHeadPtr,
  176. struct stat *statbuf,
  177. const char *fileName)
  178. {
  179. /* Note: hlInfoHeadPtr can never be NULL! */
  180. HardLinkInfo *hlInfo;
  181. hlInfo = xmalloc(sizeof(HardLinkInfo) + strlen(fileName));
  182. hlInfo->next = *hlInfoHeadPtr;
  183. *hlInfoHeadPtr = hlInfo;
  184. hlInfo->dev = statbuf->st_dev;
  185. hlInfo->ino = statbuf->st_ino;
  186. // hlInfo->linkCount = statbuf->st_nlink;
  187. strcpy(hlInfo->name, fileName);
  188. }
  189. static void freeHardLinkInfo(HardLinkInfo **hlInfoHeadPtr)
  190. {
  191. HardLinkInfo *hlInfo;
  192. HardLinkInfo *hlInfoNext;
  193. if (hlInfoHeadPtr) {
  194. hlInfo = *hlInfoHeadPtr;
  195. while (hlInfo) {
  196. hlInfoNext = hlInfo->next;
  197. free(hlInfo);
  198. hlInfo = hlInfoNext;
  199. }
  200. *hlInfoHeadPtr = NULL;
  201. }
  202. }
  203. /* Might be faster (and bigger) if the dev/ino were stored in numeric order ;) */
  204. static HardLinkInfo *findHardLinkInfo(HardLinkInfo *hlInfo, struct stat *statbuf)
  205. {
  206. while (hlInfo) {
  207. if (statbuf->st_ino == hlInfo->ino
  208. && statbuf->st_dev == hlInfo->dev
  209. ) {
  210. DBG("found hardlink:'%s'", hlInfo->name);
  211. break;
  212. }
  213. hlInfo = hlInfo->next;
  214. }
  215. return hlInfo;
  216. }
  217. /* Put an octal string into the specified buffer.
  218. * The number is zero padded and possibly NUL terminated.
  219. * Stores low-order bits only if whole value does not fit. */
  220. static void putOctal(char *cp, int len, off_t value)
  221. {
  222. char tempBuffer[sizeof(off_t)*3 + 1];
  223. char *tempString = tempBuffer;
  224. int width;
  225. width = sprintf(tempBuffer, "%0*"OFF_FMT"o", len, value);
  226. tempString += (width - len);
  227. /* If string has leading zeroes, we can drop one */
  228. /* and field will have trailing '\0' */
  229. /* (increases chances of compat with other tars) */
  230. if (tempString[0] == '0')
  231. tempString++;
  232. /* Copy the string to the field */
  233. memcpy(cp, tempString, len);
  234. }
  235. #define PUT_OCTAL(a, b) putOctal((a), sizeof(a), (b))
  236. static void chksum_and_xwrite(int fd, struct tar_header_t* hp)
  237. {
  238. /* POSIX says that checksum is done on unsigned bytes
  239. * (Sun and HP-UX gets it wrong... more details in
  240. * GNU tar source) */
  241. const unsigned char *cp;
  242. int chksum, size;
  243. strcpy(hp->magic, "ustar ");
  244. /* Calculate and store the checksum (i.e., the sum of all of the bytes of
  245. * the header). The checksum field must be filled with blanks for the
  246. * calculation. The checksum field is formatted differently from the
  247. * other fields: it has 6 digits, a null, then a space -- rather than
  248. * digits, followed by a null like the other fields... */
  249. memset(hp->chksum, ' ', sizeof(hp->chksum));
  250. cp = (const unsigned char *) hp;
  251. chksum = 0;
  252. size = sizeof(*hp);
  253. do { chksum += *cp++; } while (--size);
  254. putOctal(hp->chksum, sizeof(hp->chksum)-1, chksum);
  255. /* Now write the header out to disk */
  256. xwrite(fd, hp, sizeof(*hp));
  257. }
  258. # if ENABLE_FEATURE_TAR_GNU_EXTENSIONS
  259. static void writeLongname(int fd, int type, const char *name, int dir)
  260. {
  261. struct prefilled {
  262. char mode[8]; /* 100-107 */
  263. char uid[8]; /* 108-115 */
  264. char gid[8]; /* 116-123 */
  265. char size[12]; /* 124-135 */
  266. char mtime[12]; /* 136-147 */
  267. };
  268. struct tar_header_t header;
  269. int size;
  270. memset(&header, 0, sizeof(header));
  271. header.typeflag = type;
  272. strcpy(header.name, "././@LongLink");
  273. /* This sets mode/uid/gid/mtime to "00...00<NUL>" strings */
  274. memset((char*)&header + offsetof(struct tar_header_t, mode), /* make gcc-9.x happy */
  275. '0', sizeof(struct prefilled));
  276. header.mode [sizeof(header.mode ) - 1] = '\0';
  277. header.uid [sizeof(header.uid ) - 1] = '\0';
  278. header.gid [sizeof(header.gid ) - 1] = '\0';
  279. /* header.size is filled by '0' now, will be corrected below */
  280. header.mtime[sizeof(header.mtime) - 1] = '\0';
  281. dir = !!dir; /* normalize: 0/1 */
  282. size = strlen(name) + 1 + dir; /* GNU tar uses strlen+1 */
  283. /* + dir: account for possible '/' */
  284. PUT_OCTAL(header.size, size);
  285. chksum_and_xwrite(fd, &header);
  286. /* Write filename[/] and pad the block. */
  287. /* dir=0: writes 'name<NUL>', pads */
  288. /* dir=1: writes 'name', writes '/<NUL>', pads */
  289. dir *= 2;
  290. xwrite(fd, name, size - dir);
  291. xwrite(fd, "/", dir);
  292. size = (-size) & (TAR_BLOCK_SIZE-1);
  293. memset(&header, 0, size);
  294. xwrite(fd, &header, size);
  295. }
  296. # endif
  297. /* Write out a tar header for the specified file/directory/whatever */
  298. static int writeTarHeader(struct TarBallInfo *tbInfo,
  299. const char *header_name, const char *fileName, struct stat *statbuf)
  300. {
  301. struct tar_header_t header;
  302. memset(&header, 0, sizeof(header));
  303. strncpy(header.name, header_name, sizeof(header.name));
  304. /* POSIX says to mask mode with 07777. */
  305. PUT_OCTAL(header.mode, statbuf->st_mode & 07777);
  306. PUT_OCTAL(header.uid, statbuf->st_uid);
  307. PUT_OCTAL(header.gid, statbuf->st_gid);
  308. memset(header.size, '0', sizeof(header.size)-1); /* Regular file size is handled later */
  309. /* users report that files with negative st_mtime cause trouble, so: */
  310. PUT_OCTAL(header.mtime, statbuf->st_mtime >= 0 ? statbuf->st_mtime : 0);
  311. /* Enter the user and group names */
  312. safe_strncpy(header.uname, get_cached_username(statbuf->st_uid), sizeof(header.uname));
  313. safe_strncpy(header.gname, get_cached_groupname(statbuf->st_gid), sizeof(header.gname));
  314. if (tbInfo->hlInfo) {
  315. /* This is a hard link */
  316. header.typeflag = LNKTYPE;
  317. strncpy(header.linkname, tbInfo->hlInfo->name,
  318. sizeof(header.linkname));
  319. # if ENABLE_FEATURE_TAR_GNU_EXTENSIONS
  320. /* Write out long linkname if needed */
  321. if (header.linkname[sizeof(header.linkname)-1])
  322. writeLongname(tbInfo->tarFd, GNULONGLINK,
  323. tbInfo->hlInfo->name, 0);
  324. # endif
  325. } else if (S_ISLNK(statbuf->st_mode)) {
  326. char *lpath = xmalloc_readlink_or_warn(fileName);
  327. if (!lpath)
  328. return FALSE;
  329. header.typeflag = SYMTYPE;
  330. strncpy(header.linkname, lpath, sizeof(header.linkname));
  331. # if ENABLE_FEATURE_TAR_GNU_EXTENSIONS
  332. /* Write out long linkname if needed */
  333. if (header.linkname[sizeof(header.linkname)-1])
  334. writeLongname(tbInfo->tarFd, GNULONGLINK, lpath, 0);
  335. # else
  336. /* If it is larger than 100 bytes, bail out */
  337. if (header.linkname[sizeof(header.linkname)-1]) {
  338. free(lpath);
  339. bb_simple_error_msg("names longer than "NAME_SIZE_STR" chars not supported");
  340. return FALSE;
  341. }
  342. # endif
  343. free(lpath);
  344. } else if (S_ISDIR(statbuf->st_mode)) {
  345. header.typeflag = DIRTYPE;
  346. /* Append '/' only if there is a space for it */
  347. if (!header.name[sizeof(header.name)-1])
  348. header.name[strlen(header.name)] = '/';
  349. } else if (S_ISCHR(statbuf->st_mode)) {
  350. header.typeflag = CHRTYPE;
  351. PUT_OCTAL(header.devmajor, major(statbuf->st_rdev));
  352. PUT_OCTAL(header.devminor, minor(statbuf->st_rdev));
  353. } else if (S_ISBLK(statbuf->st_mode)) {
  354. header.typeflag = BLKTYPE;
  355. PUT_OCTAL(header.devmajor, major(statbuf->st_rdev));
  356. PUT_OCTAL(header.devminor, minor(statbuf->st_rdev));
  357. } else if (S_ISFIFO(statbuf->st_mode)) {
  358. header.typeflag = FIFOTYPE;
  359. } else if (S_ISREG(statbuf->st_mode)) {
  360. /* header.size field is 12 bytes long */
  361. /* Does octal-encoded size fit? */
  362. uoff_t filesize = statbuf->st_size;
  363. if (sizeof(filesize) <= 4
  364. || filesize <= (uoff_t)0777777777777LL
  365. ) {
  366. PUT_OCTAL(header.size, filesize);
  367. }
  368. /* Does base256-encoded size fit?
  369. * It always does unless off_t is wider than 64 bits.
  370. */
  371. else if (ENABLE_FEATURE_TAR_GNU_EXTENSIONS
  372. # if ULLONG_MAX > 0xffffffffffffffffLL /* 2^64-1 */
  373. && (filesize <= 0x3fffffffffffffffffffffffLL)
  374. # endif
  375. ) {
  376. /* GNU tar uses "base-256 encoding" for very large numbers.
  377. * Encoding is binary, with highest bit always set as a marker
  378. * and sign in next-highest bit:
  379. * 80 00 .. 00 - zero
  380. * bf ff .. ff - largest positive number
  381. * ff ff .. ff - minus 1
  382. * c0 00 .. 00 - smallest negative number
  383. */
  384. char *p8 = header.size + sizeof(header.size);
  385. do {
  386. *--p8 = (uint8_t)filesize;
  387. filesize >>= 8;
  388. } while (p8 != header.size);
  389. *p8 |= 0x80;
  390. } else {
  391. bb_error_msg_and_die("can't store file '%s' "
  392. "of size %"OFF_FMT"u, aborting",
  393. fileName, statbuf->st_size);
  394. }
  395. header.typeflag = REGTYPE;
  396. } else {
  397. bb_error_msg("%s: unknown file type", fileName);
  398. return FALSE;
  399. }
  400. # if ENABLE_FEATURE_TAR_GNU_EXTENSIONS
  401. /* Write out long name if needed */
  402. /* (we, like GNU tar, output long linkname *before* long name) */
  403. if (header.name[sizeof(header.name)-1])
  404. writeLongname(tbInfo->tarFd, GNULONGNAME,
  405. header_name, S_ISDIR(statbuf->st_mode));
  406. # endif
  407. /* Now write the header out to disk */
  408. chksum_and_xwrite(tbInfo->tarFd, &header);
  409. /* Now do the verbose thing (or not) */
  410. if (tbInfo->verboseFlag) {
  411. FILE *vbFd = stdout;
  412. /* If archive goes to stdout, verbose goes to stderr */
  413. if (tbInfo->tarFd == STDOUT_FILENO)
  414. vbFd = stderr;
  415. /* GNU "tar cvvf" prints "extended" listing a-la "ls -l" */
  416. /* We don't have such excesses here: for us "v" == "vv" */
  417. /* '/' is probably a GNUism */
  418. fprintf(vbFd, "%s%s\n", header_name,
  419. S_ISDIR(statbuf->st_mode) ? "/" : "");
  420. }
  421. return TRUE;
  422. }
  423. # if ENABLE_FEATURE_TAR_FROM
  424. static int exclude_file(const llist_t *excluded_files, const char *file)
  425. {
  426. while (excluded_files) {
  427. if (excluded_files->data[0] == '/') {
  428. if (fnmatch(excluded_files->data, file,
  429. FNM_PATHNAME | FNM_LEADING_DIR) == 0)
  430. return 1;
  431. } else {
  432. const char *p;
  433. for (p = file; p[0] != '\0'; p++) {
  434. if ((p == file || p[-1] == '/')
  435. && p[0] != '/'
  436. && fnmatch(excluded_files->data, p,
  437. FNM_PATHNAME | FNM_LEADING_DIR) == 0
  438. ) {
  439. return 1;
  440. }
  441. }
  442. }
  443. excluded_files = excluded_files->link;
  444. }
  445. return 0;
  446. }
  447. # else
  448. # define exclude_file(excluded_files, file) 0
  449. # endif
  450. static int FAST_FUNC writeFileToTarball(struct recursive_state *state,
  451. const char *fileName,
  452. struct stat *statbuf)
  453. {
  454. struct TarBallInfo *tbInfo = (struct TarBallInfo *) state->userData;
  455. const char *header_name;
  456. int inputFileFd = -1;
  457. DBG("writeFileToTarball('%s')", fileName);
  458. /* Strip leading '/' and such (must be before memorizing hardlink's name) */
  459. header_name = strip_unsafe_prefix(fileName);
  460. if (header_name[0] == '\0')
  461. return TRUE;
  462. /* It is against the rules to archive a socket */
  463. if (S_ISSOCK(statbuf->st_mode)) {
  464. bb_error_msg("%s: socket ignored", fileName);
  465. return TRUE;
  466. }
  467. /*
  468. * Check to see if we are dealing with a hard link.
  469. * If so -
  470. * Treat the first occurrence of a given dev/inode as a file while
  471. * treating any additional occurrences as hard links. This is done
  472. * by adding the file information to the HardLinkInfo linked list.
  473. */
  474. tbInfo->hlInfo = NULL;
  475. if (!S_ISDIR(statbuf->st_mode) && statbuf->st_nlink > 1) {
  476. DBG("'%s': st_nlink > 1", header_name);
  477. tbInfo->hlInfo = findHardLinkInfo(tbInfo->hlInfoHead, statbuf);
  478. if (tbInfo->hlInfo == NULL) {
  479. DBG("'%s': addHardLinkInfo", header_name);
  480. addHardLinkInfo(&tbInfo->hlInfoHead, statbuf, header_name);
  481. }
  482. }
  483. /* It is a bad idea to store the archive we are in the process of creating,
  484. * so check the device and inode to be sure that this particular file isn't
  485. * the new tarball */
  486. if (tbInfo->tarFileStatBuf.st_dev == statbuf->st_dev
  487. && tbInfo->tarFileStatBuf.st_ino == statbuf->st_ino
  488. ) {
  489. bb_error_msg("%s: file is the archive; skipping", fileName);
  490. return TRUE;
  491. }
  492. if (exclude_file(tbInfo->excludeList, header_name))
  493. return SKIP;
  494. # if !ENABLE_FEATURE_TAR_GNU_EXTENSIONS
  495. if (strlen(header_name) >= NAME_SIZE) {
  496. bb_simple_error_msg("names longer than "NAME_SIZE_STR" chars not supported");
  497. return TRUE;
  498. }
  499. # endif
  500. /* Is this a regular file? */
  501. if (tbInfo->hlInfo == NULL && S_ISREG(statbuf->st_mode)) {
  502. /* open the file we want to archive, and make sure all is well */
  503. inputFileFd = open_or_warn(fileName, O_RDONLY);
  504. if (inputFileFd < 0) {
  505. return FALSE;
  506. }
  507. }
  508. /* Add an entry to the tarball */
  509. if (writeTarHeader(tbInfo, header_name, fileName, statbuf) == FALSE) {
  510. return FALSE;
  511. }
  512. /* If it was a regular file, write out the body */
  513. if (inputFileFd >= 0) {
  514. size_t readSize;
  515. /* Write the file to the archive. */
  516. /* We record size into header first, */
  517. /* and then write out file. If file shrinks in between, */
  518. /* tar will be corrupted. So we don't allow for that. */
  519. /* NB: GNU tar 1.16 warns and pads with zeroes */
  520. /* or even seeks back and updates header */
  521. bb_copyfd_exact_size(inputFileFd, tbInfo->tarFd, statbuf->st_size);
  522. ////off_t readSize;
  523. ////readSize = bb_copyfd_size(inputFileFd, tbInfo->tarFd, statbuf->st_size);
  524. ////if (readSize != statbuf->st_size && readSize >= 0) {
  525. //// bb_error_msg_and_die("short read from %s, aborting", fileName);
  526. ////}
  527. /* Check that file did not grow in between? */
  528. /* if (safe_read(inputFileFd, 1) == 1) warn but continue? */
  529. close(inputFileFd);
  530. /* Pad the file up to the tar block size */
  531. /* (a few tricks here in the name of code size) */
  532. readSize = (-(int)statbuf->st_size) & (TAR_BLOCK_SIZE-1);
  533. memset(block_buf, 0, readSize);
  534. xwrite(tbInfo->tarFd, block_buf, readSize);
  535. }
  536. return TRUE;
  537. }
  538. # if SEAMLESS_COMPRESSION
  539. /* Don't inline: vfork scares gcc and pessimizes code */
  540. static void NOINLINE vfork_compressor(int tar_fd, const char *gzip)
  541. {
  542. // On Linux, vfork never unpauses parent early, although standard
  543. // allows for that. Do we want to waste bytes checking for it?
  544. # define WAIT_FOR_CHILD 0
  545. volatile int vfork_exec_errno = 0;
  546. struct fd_pair data;
  547. # if WAIT_FOR_CHILD
  548. struct fd_pair status;
  549. xpiped_pair(status);
  550. # endif
  551. xpiped_pair(data);
  552. signal(SIGPIPE, SIG_IGN); /* we only want EPIPE on errors */
  553. if (xvfork() == 0) {
  554. /* child */
  555. int tfd;
  556. /* NB: close _first_, then move fds! */
  557. close(data.wr);
  558. # if WAIT_FOR_CHILD
  559. close(status.rd);
  560. /* status.wr will close only on exec -
  561. * parent waits for this close to happen */
  562. fcntl(status.wr, F_SETFD, FD_CLOEXEC);
  563. # endif
  564. /* copy it: parent's tar_fd variable must not change */
  565. tfd = tar_fd;
  566. if (tfd == 0) {
  567. /* Output tar fd may be zero.
  568. * xmove_fd(data.rd, 0) would destroy it.
  569. * Reproducer:
  570. * exec 0>&-
  571. * exec 1>&-
  572. * tar czf Z.tar.gz FILE
  573. * Swapping move_fd's order wouldn't work:
  574. * data.rd is 1 and _it_ would be destroyed.
  575. */
  576. tfd = dup(tfd);
  577. }
  578. xmove_fd(data.rd, 0);
  579. xmove_fd(tfd, 1);
  580. /* exec gzip/bzip2/... program */
  581. //BB_EXECLP(gzip, gzip, "-f", (char *)0); - WRONG for "xz",
  582. // if xz is an enabled applet, it'll be a version which
  583. // can only decompress. We do need to execute external
  584. // program, not applet.
  585. execlp(gzip, gzip, "-f", (char *)0);
  586. vfork_exec_errno = errno;
  587. _exit(EXIT_FAILURE);
  588. }
  589. /* parent */
  590. xmove_fd(data.wr, tar_fd);
  591. close(data.rd);
  592. # if WAIT_FOR_CHILD
  593. close(status.wr);
  594. while (1) {
  595. /* Wait until child execs (or fails to) */
  596. char buf;
  597. int n = full_read(status.rd, &buf, 1);
  598. if (n < 0 /* && errno == EAGAIN */)
  599. continue; /* try it again */
  600. }
  601. close(status.rd);
  602. # endif
  603. if (vfork_exec_errno) {
  604. errno = vfork_exec_errno;
  605. bb_perror_msg_and_die("can't execute '%s'", gzip);
  606. }
  607. }
  608. # endif /* SEAMLESS_COMPRESSION */
  609. # if !SEAMLESS_COMPRESSION
  610. /* Do not pass gzip flag to writeTarFile() */
  611. #define writeTarFile(tbInfo, recurseFlags, filelist, gzip) \
  612. writeTarFile(tbInfo, recurseFlags, filelist)
  613. # endif
  614. /* gcc 4.2.1 inlines it, making code bigger */
  615. static NOINLINE int writeTarFile(
  616. struct TarBallInfo *tbInfo,
  617. int recurseFlags,
  618. const llist_t *filelist,
  619. const char *gzip)
  620. {
  621. int errorFlag = FALSE;
  622. /*tbInfo->hlInfoHead = NULL; - already is */
  623. /* Store the stat info for the tarball's file, so
  624. * can avoid including the tarball into itself.... */
  625. xfstat(tbInfo->tarFd, &tbInfo->tarFileStatBuf, "can't stat tar file");
  626. # if SEAMLESS_COMPRESSION
  627. if (gzip)
  628. vfork_compressor(tbInfo->tarFd, gzip);
  629. # endif
  630. /* Read the directory/files and iterate over them one at a time */
  631. while (filelist) {
  632. if (!recursive_action(filelist->data, recurseFlags,
  633. writeFileToTarball, writeFileToTarball, tbInfo)
  634. ) {
  635. errorFlag = TRUE;
  636. }
  637. filelist = filelist->link;
  638. }
  639. /* Write two empty blocks to the end of the archive */
  640. memset(block_buf, 0, 2*TAR_BLOCK_SIZE);
  641. xwrite(tbInfo->tarFd, block_buf, 2*TAR_BLOCK_SIZE);
  642. /* To be pedantically correct, we would check if the tarball
  643. * is smaller than 20 tar blocks, and pad it if it was smaller,
  644. * but that isn't necessary for GNU tar interoperability, and
  645. * so is considered a waste of space */
  646. /* Close so the child process (if any) will exit */
  647. close(tbInfo->tarFd);
  648. /* Hang up the tools, close up shop, head home */
  649. if (ENABLE_FEATURE_CLEAN_UP)
  650. freeHardLinkInfo(&tbInfo->hlInfoHead);
  651. if (errorFlag)
  652. bb_simple_error_msg("error exit delayed from previous errors");
  653. # if SEAMLESS_COMPRESSION
  654. if (gzip) {
  655. int status;
  656. if (safe_waitpid(-1, &status, 0) == -1)
  657. bb_simple_perror_msg("waitpid");
  658. else if (!WIFEXITED(status) || WEXITSTATUS(status))
  659. /* gzip was killed or has exited with nonzero! */
  660. errorFlag = TRUE;
  661. }
  662. # endif
  663. return errorFlag;
  664. }
  665. #endif /* FEATURE_TAR_CREATE */
  666. #if ENABLE_FEATURE_TAR_FROM
  667. static llist_t *append_file_list_to_list(llist_t *list)
  668. {
  669. llist_t *newlist = NULL;
  670. while (list) {
  671. FILE *src_stream;
  672. char *line;
  673. src_stream = xfopen_stdin(llist_pop(&list));
  674. while ((line = xmalloc_fgetline(src_stream)) != NULL) {
  675. /* kill trailing '/' unless the string is just "/" */
  676. char *cp = last_char_is(line, '/');
  677. if (cp > line)
  678. *cp = '\0';
  679. llist_add_to_end(&newlist, line);
  680. }
  681. fclose(src_stream);
  682. }
  683. return newlist;
  684. }
  685. #endif
  686. //usage:#define tar_trivial_usage
  687. //usage: IF_FEATURE_TAR_CREATE("c|") "x|t [-"
  688. //usage: IF_FEATURE_SEAMLESS_Z("Z")
  689. //usage: IF_FEATURE_SEAMLESS_GZ("z")
  690. //usage: IF_FEATURE_SEAMLESS_XZ("J")
  691. //usage: IF_FEATURE_SEAMLESS_BZ2("j")
  692. //usage: "a"
  693. //usage: IF_FEATURE_TAR_CREATE("h")
  694. //usage: IF_FEATURE_TAR_NOPRESERVE_TIME("m")
  695. //usage: "vokO] "
  696. //usage: "[-f TARFILE] [-C DIR] "
  697. //usage: IF_FEATURE_TAR_FROM("[-T FILE] [-X FILE] "IF_FEATURE_TAR_LONG_OPTIONS("[--exclude PATTERN]... "))
  698. //usage: "[FILE]..."
  699. //usage:#define tar_full_usage "\n\n"
  700. //usage: IF_FEATURE_TAR_CREATE("Create, extract, ")
  701. //usage: IF_NOT_FEATURE_TAR_CREATE("Extract ")
  702. //usage: "or list files from a tar file"
  703. //usage: "\n"
  704. //usage: IF_FEATURE_TAR_CREATE(
  705. //usage: "\n c Create"
  706. //usage: )
  707. //usage: "\n x Extract"
  708. //usage: "\n t List"
  709. //usage: "\n -f FILE Name of TARFILE ('-' for stdin/out)"
  710. //usage: "\n -C DIR Change to DIR before operation"
  711. //usage: "\n -v Verbose"
  712. //usage: "\n -O Extract to stdout"
  713. //usage: IF_FEATURE_TAR_NOPRESERVE_TIME(
  714. //usage: "\n -m Don't restore mtime"
  715. //usage: )
  716. //usage: "\n -o Don't restore user:group"
  717. ///////:-p - accepted but ignored, restores mode (aliases in GNU tar: --preserve-permissions, --same-permissions)
  718. //usage: "\n -k Don't replace existing files"
  719. //usage: IF_FEATURE_SEAMLESS_Z(
  720. //usage: "\n -Z (De)compress using compress"
  721. //usage: )
  722. //usage: IF_FEATURE_SEAMLESS_GZ(
  723. //usage: "\n -z (De)compress using gzip"
  724. //usage: )
  725. //usage: IF_FEATURE_SEAMLESS_XZ(
  726. //usage: "\n -J (De)compress using xz"
  727. //usage: )
  728. //usage: IF_FEATURE_SEAMLESS_BZ2(
  729. //usage: "\n -j (De)compress using bzip2"
  730. //usage: )
  731. //usage: "\n -a (De)compress based on extension"
  732. //usage: IF_FEATURE_TAR_CREATE(
  733. //usage: "\n -h Follow symlinks"
  734. //usage: )
  735. //usage: IF_FEATURE_TAR_FROM(
  736. //usage: "\n -T FILE File with names to include"
  737. //usage: "\n -X FILE File with glob patterns to exclude"
  738. //usage: IF_FEATURE_TAR_LONG_OPTIONS(
  739. //usage: "\n --exclude PATTERN Glob pattern to exclude"
  740. //usage: )
  741. //usage: )
  742. //usage:
  743. //usage:#define tar_example_usage
  744. //usage: "$ zcat /tmp/tarball.tar.gz | tar -xf -\n"
  745. //usage: "$ tar -cf /tmp/tarball.tar /usr/local\n"
  746. // Supported but aren't in --help:
  747. // lzma
  748. // no-recursion
  749. // numeric-owner
  750. // no-same-permissions
  751. // overwrite
  752. //IF_FEATURE_TAR_TO_COMMAND(
  753. // to-command
  754. //)
  /*
   * Option bits for the mask that tar_main() keeps in `opt`.
   *
   * The first half of the enum assigns bit POSITIONS (OPTBIT_*) to the
   * options whose presence depends on the build configuration; the second
   * half turns positions into bit MASKS (OPT_*) that the code tests with
   * `opt & OPT_xxx`.
   *
   * Positions 0..8 belong to the always-present short options and match the
   * leading "txC:f:Oopvk" of the option string given to GETOPT32 in
   * tar_main(); the OPTBIT_* entries continue in the same order as the rest
   * of that string and as the "\xf8".."\xfe" entries of tar_longopts.
   * Entries therefore must not be reordered independently of those two.
   *
   * Masks written as `IF_FEATURE_x(...) + 0` are compared against 0
   * elsewhere in this file ("at least one is config-enabled"), i.e. a mask
   * is expected to be 0 when its feature is configured out.
   */
  755. enum {
  /* Bit positions of the configuration-dependent options (bit 8 is -k) */
  756. OPTBIT_KEEP_OLD = 8,
  757. IF_FEATURE_TAR_CREATE( OPTBIT_CREATE ,)
  758. IF_FEATURE_TAR_CREATE( OPTBIT_DEREFERENCE ,)
  759. IF_FEATURE_SEAMLESS_BZ2( OPTBIT_BZIP2 ,)
  760. IF_FEATURE_TAR_FROM( OPTBIT_INCLUDE_FROM,)
  761. IF_FEATURE_TAR_FROM( OPTBIT_EXCLUDE_FROM,)
  762. IF_FEATURE_SEAMLESS_GZ( OPTBIT_GZIP ,)
  763. IF_FEATURE_SEAMLESS_XZ( OPTBIT_XZ ,)
  764. IF_FEATURE_SEAMLESS_Z( OPTBIT_COMPRESS ,) // 16th bit
  765. OPTBIT_AUTOCOMPRESS_BY_EXT,
  766. IF_FEATURE_TAR_NOPRESERVE_TIME(OPTBIT_NOPRESERVE_TIME,)
  /* Positions of the options that exist only as long options */
  767. #if ENABLE_FEATURE_TAR_LONG_OPTIONS
  768. OPTBIT_STRIP_COMPONENTS,
  769. IF_FEATURE_SEAMLESS_LZMA(OPTBIT_LZMA ,)
  770. OPTBIT_NORECURSION,
  771. IF_FEATURE_TAR_TO_COMMAND(OPTBIT_2COMMAND ,)
  772. OPTBIT_NUMERIC_OWNER,
  773. OPTBIT_NOPRESERVE_PERM,
  774. OPTBIT_OVERWRITE,
  775. #endif
  /* Masks of the always-present short options (fixed positions 0..8) */
  776. OPT_TEST = 1 << 0, // t
  777. OPT_EXTRACT = 1 << 1, // x
  778. OPT_BASEDIR = 1 << 2, // C
  779. OPT_TARNAME = 1 << 3, // f
  780. OPT_2STDOUT = 1 << 4, // O
  781. OPT_NOPRESERVE_OWNER = 1 << 5, // o == no-same-owner
  782. OPT_P = 1 << 6, // p
  783. OPT_VERBOSE = 1 << 7, // v
  784. OPT_KEEP_OLD = 1 << 8, // k
  /* Masks of the optional features: (1 << position), with "+ 0" as the fallback term */
  785. OPT_CREATE = IF_FEATURE_TAR_CREATE( (1 << OPTBIT_CREATE )) + 0, // c
  786. OPT_DEREFERENCE = IF_FEATURE_TAR_CREATE( (1 << OPTBIT_DEREFERENCE )) + 0, // h
  787. OPT_BZIP2 = IF_FEATURE_SEAMLESS_BZ2( (1 << OPTBIT_BZIP2 )) + 0, // j
  788. OPT_INCLUDE_FROM = IF_FEATURE_TAR_FROM( (1 << OPTBIT_INCLUDE_FROM)) + 0, // T
  789. OPT_EXCLUDE_FROM = IF_FEATURE_TAR_FROM( (1 << OPTBIT_EXCLUDE_FROM)) + 0, // X
  790. OPT_GZIP = IF_FEATURE_SEAMLESS_GZ( (1 << OPTBIT_GZIP )) + 0, // z
  791. OPT_XZ = IF_FEATURE_SEAMLESS_XZ( (1 << OPTBIT_XZ )) + 0, // J
  792. OPT_COMPRESS = IF_FEATURE_SEAMLESS_Z( (1 << OPTBIT_COMPRESS )) + 0, // Z
  793. OPT_AUTOCOMPRESS_BY_EXT = 1 << OPTBIT_AUTOCOMPRESS_BY_EXT, // a
  794. OPT_NOPRESERVE_TIME = IF_FEATURE_TAR_NOPRESERVE_TIME((1 << OPTBIT_NOPRESERVE_TIME)) + 0, // m
  795. OPT_STRIP_COMPONENTS = IF_FEATURE_TAR_LONG_OPTIONS((1 << OPTBIT_STRIP_COMPONENTS)) + 0, // strip-components
  796. OPT_LZMA = IF_FEATURE_TAR_LONG_OPTIONS(IF_FEATURE_SEAMLESS_LZMA((1 << OPTBIT_LZMA))) + 0, // lzma
  797. OPT_NORECURSION = IF_FEATURE_TAR_LONG_OPTIONS((1 << OPTBIT_NORECURSION )) + 0, // no-recursion
  /* NOTE(review): OPTBIT_2COMMAND is declared only inside the LONG_OPTIONS
   * section above, while this mask is guarded by TAR_TO_COMMAND alone -
   * presumably the build config makes TO_COMMAND depend on LONG_OPTIONS; confirm. */
  798. OPT_2COMMAND = IF_FEATURE_TAR_TO_COMMAND( (1 << OPTBIT_2COMMAND )) + 0, // to-command
  799. OPT_NUMERIC_OWNER = IF_FEATURE_TAR_LONG_OPTIONS((1 << OPTBIT_NUMERIC_OWNER )) + 0, // numeric-owner
  800. OPT_NOPRESERVE_PERM = IF_FEATURE_TAR_LONG_OPTIONS((1 << OPTBIT_NOPRESERVE_PERM)) + 0, // no-same-permissions
  801. OPT_OVERWRITE = IF_FEATURE_TAR_LONG_OPTIONS((1 << OPTBIT_OVERWRITE )) + 0, // overwrite
  /* Any explicitly requested compressor (-a alone is not part of this set) */
  802. OPT_ANY_COMPRESS = (OPT_BZIP2 | OPT_LZMA | OPT_GZIP | OPT_XZ | OPT_COMPRESS),
  803. };
  /*
   * Long-option support.
   *
   * With ENABLE_FEATURE_TAR_LONG_OPTIONS, tar_longopts is the table that
   * tar_main() hands to getopt32long() through the LONGOPTS macro.  Each
   * entry is "name\0", an argument-kind marker (No_argument or
   * Required_argument) and the one-character option the name maps to.
   * Long options without a short form map to "\xf8".."\xff".
   * The entries are listed in the same order as the option bits in the
   * OPT enum; keep the two in sync.
   *
   * Without long options, GETOPT32 is plain getopt32() and LONGOPTS expands
   * to nothing, so the call in tar_main() is written only once.
   */
  804. #if ENABLE_FEATURE_TAR_LONG_OPTIONS
  805. static const char tar_longopts[] ALIGN1 =
  806. "list\0" No_argument "t"
  807. "extract\0" No_argument "x"
  808. "directory\0" Required_argument "C"
  809. "file\0" Required_argument "f"
  810. "to-stdout\0" No_argument "O"
  811. /* do not restore owner */
  812. /* Note: GNU tar handles 'o' as no-same-owner only on extract,
  813. * on create, 'o' is --old-archive. We do not support --old-archive. */
  814. "no-same-owner\0" No_argument "o"
  815. "same-permissions\0" No_argument "p"
  816. "verbose\0" No_argument "v"
  817. "keep-old\0" No_argument "k"
  818. # if ENABLE_FEATURE_TAR_CREATE
  819. "create\0" No_argument "c"
  820. "dereference\0" No_argument "h"
  821. # endif
  822. # if ENABLE_FEATURE_SEAMLESS_BZ2
  823. "bzip2\0" No_argument "j"
  824. # endif
  825. # if ENABLE_FEATURE_TAR_FROM
  826. "files-from\0" Required_argument "T"
  827. "exclude-from\0" Required_argument "X"
  828. # endif
  829. # if ENABLE_FEATURE_SEAMLESS_GZ
  830. "gzip\0" No_argument "z"
  831. # endif
  832. # if ENABLE_FEATURE_SEAMLESS_XZ
  833. "xz\0" No_argument "J"
  834. # endif
  835. # if ENABLE_FEATURE_SEAMLESS_Z
  836. "compress\0" No_argument "Z"
  837. # endif
  838. "auto-compress\0" No_argument "a"
  839. # if ENABLE_FEATURE_TAR_NOPRESERVE_TIME
  840. "touch\0" No_argument "m"
  841. # endif
  /* From here on: options that have no short-option letter */
  842. "strip-components\0" Required_argument "\xf8"
  843. # if ENABLE_FEATURE_SEAMLESS_LZMA
  844. "lzma\0" No_argument "\xf9"
  845. # endif
  846. "no-recursion\0" No_argument "\xfa"
  847. # if ENABLE_FEATURE_TAR_TO_COMMAND
  848. "to-command\0" Required_argument "\xfb"
  849. # endif
  850. /* use numeric uid/gid from tar header, not textual */
  851. "numeric-owner\0" No_argument "\xfc"
  852. /* do not restore mode */
  853. "no-same-permissions\0" No_argument "\xfd"
  854. /* on unpack, open with O_TRUNC and !O_EXCL */
  855. "overwrite\0" No_argument "\xfe"
  856. /* --exclude takes next bit position in option mask, */
  857. /* therefore we have to put it _after_ every other long-only option (currently --overwrite) */
  858. # if ENABLE_FEATURE_TAR_FROM
  859. "exclude\0" Required_argument "\xff"
  860. # endif
  861. ;
  862. # define GETOPT32 getopt32long
  863. # define LONGOPTS ,tar_longopts
  864. #else
  865. # define GETOPT32 getopt32
  866. # define LONGOPTS
  867. #endif
  /*
   * tar applet entry point.
   *
   * Steps, in order:
   *  1. set default archive_handle flags,
   *  2. rewrite a dash-less first argument ("tar xf FILE") into dashed form,
   *  3. parse options with GETOPT32,
   *  4. translate option bits into handle flags / callbacks,
   *  5. build the accept and reject name lists,
   *  6. open the archive ("-" means stdin, or stdout when creating),
   *  7. either create an archive through writeTarFile() (-c), or walk the
   *     archive with get_header_tar() (-t / -x).
   *
   * Return value:
   *  - for -c: whatever writeTarFile() returns;
   *  - otherwise bb_got_signal, which is preset to EXIT_FAILURE, set to
   *    EXIT_SUCCESS once at least one header was processed, and may then be
   *    changed again by check_errors_in_children();
   *  - 0 for "--version" (ENABLE_DESKTOP) and for DBG_OPTION_PARSING builds.
   * Several failure paths do not return at all but exit through the
   * *_and_die() helpers.
   */
  868. int tar_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
  869. int tar_main(int argc UNUSED_PARAM, char **argv)
  870. {
  871. archive_handle_t *tar_handle;
  872. char *base_dir = NULL;
  873. const char *tar_filename = "-";
  874. unsigned opt;
  875. int verboseFlag = 0;
  876. #if ENABLE_FEATURE_TAR_LONG_OPTIONS && ENABLE_FEATURE_TAR_FROM
  877. llist_t *excludes = NULL;
  878. #endif
  879. INIT_G();
  880. /* Initialise default values */
  881. tar_handle = init_handle();
  882. tar_handle->ah_flags = ARCHIVE_CREATE_LEADING_DIRS
  883. | ARCHIVE_RESTORE_DATE
  884. | ARCHIVE_UNLINK_OLD;
  885. /* Apparently only root's tar preserves perms (see bug 3844) */
  886. if (getuid() != 0)
  887. tar_handle->ah_flags |= ARCHIVE_DONT_RESTORE_PERM;
  888. #if ENABLE_DESKTOP
  889. /* Lie to buildroot when it starts asking stupid questions. */
  890. if (argv[1] && strcmp(argv[1], "--version") == 0) {
  891. // Output of 'tar --version' examples:
  892. // tar (GNU tar) 1.15.1
  893. // tar (GNU tar) 1.25
  894. // bsdtar 2.8.3 - libarchive 2.8.3
  895. puts("tar (busybox) " BB_VER);
  896. return 0;
  897. }
  898. #endif
  899. if (argv[1] && argv[1][0] != '-' && argv[1][0] != '\0') {
  900. /* Compat:
  901. * 1st argument without dash handles options with parameters
  902. * differently from dashed one: it takes *next argv[i]*
  903. * as parameter even if there are more chars in 1st argument:
  904. * "tar fx TARFILE" - "x" is not taken as f's param
  905. * but is interpreted as -x option
  906. * "tar -xf TARFILE" - dashed equivalent of the above
  907. * "tar -fx ..." - "x" is taken as f's param
  908. * getopt32 wouldn't handle 1st command correctly.
  909. * Unfortunately, people do use such commands.
  910. * We massage argv[1] to work around it by moving 'f'
  911. * to the end of the string.
  912. * More contrived "tar fCx TARFILE DIR" still fails,
  913. * but such commands are much less likely to be used.
  914. */
  915. char *f = strchr(argv[1], 'f');
  916. if (f) {
  /* Shift every character after the first 'f' one place left, in place */
  917. while (f[1] != '\0') {
  918. *f = f[1];
  919. f++;
  920. }
  921. *f = 'f';
  922. }
  923. /* Prepend '-' to the first argument */
  924. argv[1] = xasprintf("-%s", argv[1]);
  925. }
  /*
   * Parse the options.  The part of the spec after the embedded "\0"
   * carries the constraints noted inline: -t and -v are counted, one of
   * c/t/x is required, and c/t/x exclude each other.
   */
  926. opt = GETOPT32(argv, "^"
  927. "txC:f:Oopvk"
  928. IF_FEATURE_TAR_CREATE( "ch" )
  929. IF_FEATURE_SEAMLESS_BZ2( "j" )
  930. IF_FEATURE_TAR_FROM( "T:*X:*")
  931. IF_FEATURE_SEAMLESS_GZ( "z" )
  932. IF_FEATURE_SEAMLESS_XZ( "J" )
  933. IF_FEATURE_SEAMLESS_Z( "Z" )
  934. "a"
  935. IF_FEATURE_TAR_NOPRESERVE_TIME("m")
  936. IF_FEATURE_TAR_LONG_OPTIONS("\xf8:") // --strip-components
  937. "\0"
  938. "tt:vv:" // count -t,-v
  939. #if ENABLE_FEATURE_TAR_LONG_OPTIONS && ENABLE_FEATURE_TAR_FROM
  940. "\xff::" // --exclude=PATTERN is a list
  941. #endif
  942. IF_FEATURE_TAR_CREATE("c:") "t:x:" // at least one of these is reqd
  943. IF_FEATURE_TAR_CREATE("c--tx:t--cx:x--ct") // mutually exclusive
  944. IF_NOT_FEATURE_TAR_CREATE("t--x:x--t") // mutually exclusive
  945. #if ENABLE_FEATURE_TAR_LONG_OPTIONS
  946. ":\xf8+" // --strip-components=NUM
  947. #endif
  948. LONGOPTS
  949. , &base_dir // -C dir
  950. , &tar_filename // -f filename
  951. IF_FEATURE_TAR_FROM(, &(tar_handle->accept)) // T
  952. IF_FEATURE_TAR_FROM(, &(tar_handle->reject)) // X
  953. #if ENABLE_FEATURE_TAR_LONG_OPTIONS
  954. , &tar_handle->tar__strip_components // --strip-components
  955. #endif
  956. IF_FEATURE_TAR_TO_COMMAND(, &(tar_handle->tar__to_command)) // --to-command
  957. #if ENABLE_FEATURE_TAR_LONG_OPTIONS && ENABLE_FEATURE_TAR_FROM
  958. , &excludes // --exclude
  959. #endif
  960. , &verboseFlag // combined count for -t and -v
  961. , &verboseFlag // combined count for -t and -v
  962. );
  /* Debug builds only: dump the parsed state and return without touching any archive */
  963. #if DBG_OPTION_PARSING
  964. bb_error_msg("opt: 0x%08x", opt);
  965. # define showopt(o) bb_error_msg("opt & %s(%x):\t%x", #o, o, opt & o);
  966. showopt(OPT_TEST );
  967. showopt(OPT_EXTRACT );
  968. showopt(OPT_BASEDIR );
  969. showopt(OPT_TARNAME );
  970. showopt(OPT_2STDOUT );
  971. showopt(OPT_NOPRESERVE_OWNER);
  972. showopt(OPT_P );
  973. showopt(OPT_VERBOSE );
  974. showopt(OPT_KEEP_OLD );
  975. showopt(OPT_CREATE );
  976. showopt(OPT_DEREFERENCE );
  977. showopt(OPT_BZIP2 );
  978. showopt(OPT_INCLUDE_FROM );
  979. showopt(OPT_EXCLUDE_FROM );
  980. showopt(OPT_GZIP );
  981. showopt(OPT_XZ );
  982. showopt(OPT_COMPRESS );
  983. showopt(OPT_AUTOCOMPRESS_BY_EXT);
  984. showopt(OPT_NOPRESERVE_TIME );
  985. showopt(OPT_STRIP_COMPONENTS);
  986. showopt(OPT_LZMA );
  987. showopt(OPT_NORECURSION );
  988. showopt(OPT_2COMMAND );
  989. showopt(OPT_NUMERIC_OWNER );
  990. showopt(OPT_NOPRESERVE_PERM );
  991. showopt(OPT_OVERWRITE );
  992. showopt(OPT_ANY_COMPRESS );
  993. bb_error_msg("base_dir:'%s'", base_dir);
  994. bb_error_msg("tar_filename:'%s'", tar_filename);
  995. bb_error_msg("verboseFlag:%d", verboseFlag);
  996. bb_error_msg("tar_handle->tar__to_command:'%s'", tar_handle->tar__to_command);
  997. bb_error_msg("tar_handle->tar__strip_components:%u", tar_handle->tar__strip_components);
  998. return 0;
  999. # undef showopt
  1000. #endif
  /* Skip the parsed options; what is left in argv is added to the accept list further down */
  1001. argv += optind;
  /* verboseFlag counts -t and -v together: a total of exactly one selects
   * header_list, two or more select header_verbose_list */
  1002. if (verboseFlag)
  1003. tar_handle->action_header = header_verbose_list;
  1004. if (verboseFlag == 1)
  1005. tar_handle->action_header = header_list;
  /* The data action is assigned in sequence, so a later match overrides an
   * earlier one: -O replaces -x, --to-command replaces both */
  1006. if (opt & OPT_EXTRACT)
  1007. tar_handle->action_data = data_extract_all;
  1008. if (opt & OPT_2STDOUT)
  1009. tar_handle->action_data = data_extract_to_stdout;
  1010. if (opt & OPT_2COMMAND) {
  1011. putenv((char*)"TAR_FILETYPE=f");
  1012. signal(SIGPIPE, SIG_IGN);
  1013. tar_handle->action_data = data_extract_to_command;
  1014. IF_FEATURE_TAR_TO_COMMAND(tar_handle->tar__to_command_shell = xstrdup(get_shell_name());)
  1015. }
  /* Adjust the default ah_flags set at the top according to the options */
  1016. if (opt & OPT_KEEP_OLD)
  1017. tar_handle->ah_flags &= ~ARCHIVE_UNLINK_OLD;
  1018. if (opt & OPT_NUMERIC_OWNER)
  1019. tar_handle->ah_flags |= ARCHIVE_NUMERIC_OWNER;
  1020. if (opt & OPT_NOPRESERVE_OWNER)
  1021. tar_handle->ah_flags |= ARCHIVE_DONT_RESTORE_OWNER;
  1022. if (opt & OPT_NOPRESERVE_PERM)
  1023. tar_handle->ah_flags |= ARCHIVE_DONT_RESTORE_PERM;
  1024. if (opt & OPT_OVERWRITE) {
  1025. tar_handle->ah_flags &= ~ARCHIVE_UNLINK_OLD;
  1026. tar_handle->ah_flags |= ARCHIVE_O_TRUNC;
  1027. }
  1028. if (opt & OPT_NOPRESERVE_TIME)
  1029. tar_handle->ah_flags &= ~ARCHIVE_RESTORE_DATE;
  /* The -X and -T arguments are file names: replace each list by the lines
   * read from those files */
  1030. #if ENABLE_FEATURE_TAR_FROM
  1031. tar_handle->reject = append_file_list_to_list(tar_handle->reject);
  1032. # if ENABLE_FEATURE_TAR_LONG_OPTIONS
  1033. /* Push each --exclude node onto the front of the reject list */
  1034. while (excludes) {
  1035. llist_t *next = excludes->link;
  1036. excludes->link = tar_handle->reject;
  1037. tar_handle->reject = excludes;
  1038. excludes = next;
  1039. }
  1040. # endif
  1041. tar_handle->accept = append_file_list_to_list(tar_handle->accept);
  1042. #endif
  1043. /* Setup an array of filenames to work with */
  1044. /* TODO: This is the same as in ar, make a separate function? */
  1045. while (*argv) {
  1046. /* kill trailing '/' unless the string is just "/" */
  1047. char *cp = last_char_is(*argv, '/');
  1048. if (cp > *argv)
  1049. *cp = '\0';
  1050. llist_add_to_end(&tar_handle->accept, *argv);
  1051. argv++;
  1052. }
  /* Install the name filter only when there is something to filter on */
  1053. if (tar_handle->accept || tar_handle->reject)
  1054. tar_handle->filter = filter_accept_reject_list;
  1055. /* Open the tar file */
  1056. {
  /* Defaults describe reading from stdin; -c switches to writing to stdout */
  1057. int tar_fd = STDIN_FILENO;
  1058. int flags = O_RDONLY;
  1059. if (opt & OPT_CREATE) {
  1060. /* Make sure there is at least one file to tar up */
  1061. if (tar_handle->accept == NULL)
  1062. bb_simple_error_msg_and_die("empty archive");
  1063. tar_fd = STDOUT_FILENO;
  1064. /* Mimicking GNU tar 1.15.1: */
  1065. flags = O_WRONLY | O_CREAT | O_TRUNC;
  1066. }
  1067. if (LONE_DASH(tar_filename)) {
  1068. tar_handle->src_fd = tar_fd;
  1069. tar_handle->seek = seek_by_read;
  1070. } else
  1071. if (ENABLE_FEATURE_TAR_AUTODETECT
  1072. && ENABLE_FEATURE_SEAMLESS_LZMA
  1073. && flags == O_RDONLY
  1074. && !(opt & OPT_ANY_COMPRESS)
  1075. && is_suffixed_with(tar_filename, ".lzma")
  1076. /* We do this only for .lzma files, they have no signature.
  1077. * All other compression formats are recognized in
  1078. * get_header_tar() when first tar block has invalid format.
  1079. * Doing it here for all filenames would falsely trigger
  1080. * on e.g. tarball with 1st file named "BZh5".
  1081. */
  1082. ) {
  1083. tar_handle->src_fd = open_zipped(tar_filename, /*fail_if_not_compressed:*/ 0);
  1084. if (tar_handle->src_fd < 0)
  1085. bb_perror_msg_and_die("can't open '%s'", tar_filename);
  1086. } else {
  1087. tar_handle->src_fd = xopen(tar_filename, flags);
  1088. #if ENABLE_FEATURE_TAR_CREATE
  /* -a while creating: pick the compressor from the archive name's
   * suffix (the suffixes are given without a leading dot) */
  1089. if ((OPT_GZIP | OPT_BZIP2 | OPT_XZ | OPT_LZMA) != 0 /* at least one is config-enabled */
  1090. && (opt & OPT_AUTOCOMPRESS_BY_EXT)
  1091. && flags != O_RDONLY
  1092. ) {
  1093. if (OPT_GZIP != 0 && is_suffixed_with(tar_filename, "gz"))
  1094. opt |= OPT_GZIP;
  1095. if (OPT_BZIP2 != 0 && is_suffixed_with(tar_filename, "bz2"))
  1096. opt |= OPT_BZIP2;
  1097. if (OPT_XZ != 0 && is_suffixed_with(tar_filename, "xz"))
  1098. opt |= OPT_XZ;
  1099. if (OPT_LZMA != 0 && is_suffixed_with(tar_filename, "lzma"))
  1100. opt |= OPT_LZMA;
  1101. }
  1102. #endif
  1103. }
  1104. }
  /* -C takes effect only here, i.e. after the archive itself has been opened */
  1105. if (base_dir)
  1106. xchdir(base_dir);
  1107. #if ENABLE_FEATURE_TAR_CREATE
  1108. /* Create an archive */
  1109. if (opt & OPT_CREATE) {
  1110. struct TarBallInfo *tbInfo;
  1111. # if SEAMLESS_COMPRESSION
  /* If several compression bits are set, the last matching test wins */
  1112. const char *zipMode = NULL;
  1113. if (opt & OPT_COMPRESS)
  1114. zipMode = "compress";
  1115. if (opt & OPT_GZIP)
  1116. zipMode = "gzip";
  1117. if (opt & OPT_BZIP2)
  1118. zipMode = "bzip2";
  1119. if (opt & OPT_LZMA)
  1120. zipMode = "lzma";
  1121. if (opt & OPT_XZ)
  1122. zipMode = "xz";
  1123. # endif
  1124. tbInfo = xzalloc(sizeof(*tbInfo));
  1125. tbInfo->tarFd = tar_handle->src_fd;
  1126. tbInfo->verboseFlag = verboseFlag;
  1127. # if ENABLE_FEATURE_TAR_FROM
  1128. tbInfo->excludeList = tar_handle->reject;
  1129. # endif
  1130. /* NB: writeTarFile() closes tar_handle->src_fd */
  1131. return writeTarFile(tbInfo,
  1132. (opt & OPT_DEREFERENCE ? ACTION_FOLLOWLINKS : 0)
  1133. | (opt & OPT_NORECURSION ? 0 : ACTION_RECURSE),
  1134. tar_handle->accept,
  1135. zipMode);
  1136. }
  1137. #endif
  /* List / extract with an explicit compression option: route the input
   * through the matching decompressor (as above, the last matching test wins) */
  1138. if (opt & OPT_ANY_COMPRESS) {
  1139. USE_FOR_MMU(IF_DESKTOP(long long) int FAST_FUNC (*xformer)(transformer_state_t *xstate);)
  1140. USE_FOR_NOMMU(const char *xformer_prog;)
  1141. if (opt & OPT_COMPRESS) {
  1142. USE_FOR_MMU(IF_FEATURE_SEAMLESS_Z(xformer = unpack_Z_stream;))
  1143. USE_FOR_NOMMU(xformer_prog = "uncompress";)
  1144. }
  1145. if (opt & OPT_GZIP) {
  1146. USE_FOR_MMU(IF_FEATURE_SEAMLESS_GZ(xformer = unpack_gz_stream;))
  1147. USE_FOR_NOMMU(xformer_prog = "gunzip";)
  1148. }
  1149. if (opt & OPT_BZIP2) {
  1150. USE_FOR_MMU(IF_FEATURE_SEAMLESS_BZ2(xformer = unpack_bz2_stream;))
  1151. USE_FOR_NOMMU(xformer_prog = "bunzip2";)
  1152. }
  1153. if (opt & OPT_LZMA) {
  1154. USE_FOR_MMU(IF_FEATURE_SEAMLESS_LZMA(xformer = unpack_lzma_stream;))
  1155. USE_FOR_NOMMU(xformer_prog = "unlzma";)
  1156. }
  1157. if (opt & OPT_XZ) {
  1158. USE_FOR_MMU(IF_FEATURE_SEAMLESS_XZ(xformer = unpack_xz_stream;))
  1159. USE_FOR_NOMMU(xformer_prog = "unxz";)
  1160. }
  1161. fork_transformer_with_sig(tar_handle->src_fd, xformer, xformer_prog);
  1162. /* Can't lseek over pipes */
  1163. tar_handle->seek = seek_by_read;
  1164. /*tar_handle->offset = 0; - already is */
  1165. }
  1166. /* Zero processed headers (== empty file) is not a valid tarball.
  1167. * We (ab)use bb_got_signal as exitcode here,
  1168. * because check_errors_in_children() uses _it_ as error indicator.
  1169. */
  1170. bb_got_signal = EXIT_FAILURE;
  1171. while (get_header_tar(tar_handle) == EXIT_SUCCESS)
  1172. bb_got_signal = EXIT_SUCCESS; /* saw at least one header, good */
  1173. create_links_from_list(tar_handle->link_placeholders);
  1174. /* Check that every file that should have been extracted was */
  /* (dies on the first accepted name that is found neither in the reject
   * list nor in tar_handle->passed) */
  1175. while (tar_handle->accept) {
  1176. if (!find_list_entry(tar_handle->reject, tar_handle->accept->data)
  1177. && !find_list_entry(tar_handle->passed, tar_handle->accept->data)
  1178. ) {
  1179. bb_error_msg_and_die("%s: not found in archive",
  1180. tar_handle->accept->data);
  1181. }
  1182. tar_handle->accept = tar_handle->accept->link;
  1183. }
  1184. if (ENABLE_FEATURE_CLEAN_UP /* && tar_handle->src_fd != STDIN_FILENO */)
  1185. close(tar_handle->src_fd);
  1186. if (SEAMLESS_COMPRESSION || OPT_COMPRESS) {
  1187. /* Set bb_got_signal to 1 if a child died with !0 exitcode */
  1188. check_errors_in_children(0);
  1189. }
  1190. return bb_got_signal;
  1191. }