ecp.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617
/*
 * ecp - copy a file fast (in big blocks), cope with errors, optionally verify.
 *
 * Transfers a block at a time.  On error, retries one sector at a time,
 * and reports all errors on the retry.
 * Unlike dd, ecp ignores EOF, since it is sometimes reported on error.
 * Also unlike `dd conv=noerror,sync', ecp doesn't get stuck nor give up.
 *
 * Written by Geoff Collyer, originally to run on RSX-11M(!) in 1979.
 * Later simplified for UNIX and ultimately Plan 9.
 */
  12. #include <u.h>
  13. #include <libc.h>
  14. #include <ctype.h>
  15. /* fundamental constants */
  16. enum {
  17. No = 0,
  18. Yes,
  19. Noseek = 0, /* need not seek, may seek on seekable files */
  20. Mustseek,
  21. Enone = 0,
  22. Eio,
  23. };
  24. /* tunable parameters */
  25. enum {
  26. Defsectsz = 512, /* default sector size */
  27. /* 10K is a good size for HP WORM drives */
  28. Defblksz = 16*1024, /* default block (big-transfer) size */
  29. Mingoodblks = 3, /* after this many, go back to fast mode */
  30. };
  31. #define TTY "/dev/cons" /* plan 9 */
  32. #define badsect(errno) ((errno) != Enone) /* was last transfer in error? */
  33. /* disk address (in bytes or sectors), also type of 2nd arg. to seek */
  34. typedef uvlong Daddr;
  35. typedef vlong Sdaddr; /* signed disk address */
  36. typedef long Rdwrfn(int, void *, long); /* plan 9 read or write */
  37. typedef struct {
  38. char *name;
  39. int fd;
  40. Daddr startsect;
  41. int fast;
  42. int seekable;
  43. ulong maxconerrs; /* maximum consecutive errors */
  44. ulong conerrs; /* current consecutive errors */
  45. Daddr congoodblks;
  46. Daddr harderrs;
  47. Daddr lasterr; /* sector #s */
  48. Daddr lastgood;
  49. } File;
  50. /* exports */
  51. char *argv0;
  52. /* privates */
  53. static int reblock = No, progress = No, swizzle = No;
  54. static int reverse = No;
  55. static ulong sectsz = Defsectsz;
  56. static ulong blocksize = Defblksz;
  57. static char *buf, *vfybuf;
  58. static int blksects;
  59. /*
  60. * warning - print best error message possible and clear errno
  61. */
  62. void
  63. warning(char *s1, char *s2)
  64. {
  65. char err[100], msg[256];
  66. char *np, *ep = msg + sizeof msg - 1;
  67. errstr(err, sizeof err); /* save error string */
  68. np = seprint(msg, ep, "%s: ", argv0);
  69. np = seprint(np, ep, s1, s2);
  70. errstr(err, sizeof err); /* restore error string */
  71. seprint(np, ep, ": %r\n");
  72. fprint(2, "%s", msg);
  73. }
  74. int
  75. eopen(char *file, int mode)
  76. {
  77. int fd = open(file, mode);
  78. if (fd < 0)
  79. sysfatal("can't open %s: %r", file);
  80. return fd;
  81. }
  82. static int /* boolean */
  83. confirm(File *src, File *dest)
  84. {
  85. int absent, n, tty = eopen(TTY, 2);
  86. char c, junk;
  87. Dir *stp;
  88. if ((stp = dirstat(src->name)) == nil)
  89. sysfatal("no input file %s: %r", src->name);
  90. free(stp);
  91. stp = dirstat(dest->name);
  92. absent = (stp == nil);
  93. free(stp);
  94. fprint(2, "%s: copy %s to %s%s? ", argv0, src->name, dest->name,
  95. (absent? " (missing)": ""));
  96. n = read(tty, &c, 1);
  97. junk = c;
  98. if (n < 1)
  99. c = 'n';
  100. while (n > 0 && junk != '\n')
  101. n = read(tty, &junk, 1);
  102. close(tty);
  103. if (isascii(c) && isupper(c))
  104. c = tolower(c);
  105. return c == 'y';
  106. }
  107. static char *
  108. sectid(File *fp, Daddr sect)
  109. {
  110. static char sectname[256];
  111. if (fp->startsect == 0)
  112. snprint(sectname, sizeof sectname, "%s sector %llud",
  113. fp->name, sect);
  114. else
  115. snprint(sectname, sizeof sectname,
  116. "%s sector %llud (relative %llud)",
  117. fp->name, sect + fp->startsect, sect);
  118. return sectname;
  119. }
  120. static void
  121. io_expl(File *fp, char *rw, Daddr sect) /* explain an i/o error */
  122. {
  123. /* print only first 2 bad sectors in a range, if going forward */
  124. if (reverse || fp->conerrs == 0) {
  125. char msg[128];
  126. snprint(msg, sizeof msg, "%s %s", rw, sectid(fp, sect));
  127. warning("%s", msg);
  128. } else if (fp->conerrs == 1)
  129. fprint(2, "%s: ...\n", argv0);
  130. }
  131. static void
  132. repos(File *fp, Daddr sect)
  133. {
  134. if (!fp->seekable)
  135. sysfatal("%s: trying to seek on unseekable file", fp->name);
  136. if (seek(fp->fd, (sect+fp->startsect)*sectsz, 0) == -1)
  137. sysfatal("can't seek on %s: %r", fp->name);
  138. }
  139. static void
  140. rewind(File *fp)
  141. {
  142. repos(fp, 0);
  143. }
  144. /*
  145. * transfer (many) sectors. reblock input as needed.
  146. * returns Enone if no failures, others on failure with errstr set.
  147. */
  148. static int
  149. bio(File *fp, Rdwrfn *rdwr, char *buff, Daddr stsect, int sects, int mustseek)
  150. {
  151. int xfered;
  152. ulong toread, bytes = sects * sectsz;
  153. static int reblocked = 0;
  154. if (mustseek) {
  155. if (!fp->seekable)
  156. sysfatal("%s: need to seek on unseekable file",
  157. fp->name);
  158. repos(fp, stsect);
  159. }
  160. if ((long)blocksize != blocksize || (long)bytes != bytes)
  161. sysfatal("i/o count too big: %lud", bytes);
  162. werrstr("");
  163. xfered = (*rdwr)(fp->fd, buff, bytes);
  164. if (xfered == bytes)
  165. return Enone; /* did as we asked */
  166. if (xfered < 0)
  167. return Eio; /* out-and-out i/o error */
  168. /*
  169. * Kernel transferred less than asked. Shouldn't happen;
  170. * probably indicates disk driver error or trying to
  171. * transfer past the end of a disk partition. Treat as an
  172. * I/O error that reads zeros past the point of error,
  173. * unless reblocking input and this is a read.
  174. */
  175. if (rdwr == write)
  176. return Eio;
  177. if (!reblock) {
  178. memset(buff+xfered, '\0', bytes-xfered);
  179. return Eio; /* short read */
  180. }
  181. /* for pipes that return less than asked */
  182. if (progress && !reblocked) {
  183. fprint(2, "%s: reblocking input\n", argv0);
  184. reblocked++;
  185. }
  186. for (toread = bytes - xfered; toread != 0; toread -= xfered) {
  187. xfered = (*rdwr)(fp->fd, buff+bytes-toread, toread);
  188. if (xfered <= 0)
  189. break;
  190. }
  191. if (xfered < 0)
  192. return Eio; /* out-and-out i/o error */
  193. if (toread != 0) /* early EOF? */
  194. memset(buff+bytes-toread, '\0', toread);
  195. return Enone;
  196. }
  197. /* called only after a single-sector transfer */
  198. static int
  199. toomanyerrs(File *fp, Daddr sect)
  200. {
  201. if (sect == fp->lasterr+1)
  202. fp->conerrs++;
  203. else
  204. fp->conerrs = 0;
  205. fp->lasterr = sect;
  206. return fp->maxconerrs != 0 && fp->conerrs >= fp->maxconerrs &&
  207. fp->lastgood == -1;
  208. }
  209. static void
  210. ckendrange(File *fp)
  211. {
  212. if (!reverse && fp->conerrs > 0)
  213. fprint(2, "%s: %lld: ... last bad sector in range\n",
  214. argv0, fp->lasterr);
  215. }
  216. static int
  217. transfer(File *fp, Rdwrfn *rdwr, char *buff, Daddr stsect, int sects,
  218. int mustseek)
  219. {
  220. int res = bio(fp, rdwr, buff, stsect, sects, mustseek);
  221. if (badsect(res)) {
  222. fp->fast = 0; /* read single sectors for a while */
  223. fp->congoodblks = 0;
  224. } else
  225. fp->lastgood = stsect + sects - 1;
  226. return res;
  227. }
  228. /*
  229. * Read or write many sectors at once.
  230. * If it fails, retry the individual sectors and report errors.
  231. */
  232. static void
  233. bigxfer(File *fp, Rdwrfn *rdwr, char *buff, Daddr stsect, int sects,
  234. int mustseek)
  235. {
  236. int i, badsects = 0, wasfast = fp->fast;
  237. char *rw = (rdwr == read? "read": "write");
  238. if (fp->fast) {
  239. if (!badsect(transfer(fp, rdwr, buff, stsect, sects, mustseek)))
  240. return;
  241. if (progress)
  242. fprint(2, "%s: breaking up big transfer on %s error "
  243. "`%r' on %s\n", argv0, rw, sectid(fp, stsect));
  244. }
  245. for (i = 0; i < sects; i++)
  246. if (badsect(transfer(fp, rdwr, buff+i*sectsz, stsect+i, 1,
  247. Mustseek))) {
  248. io_expl(fp, rw, stsect+i);
  249. badsects++;
  250. fp->harderrs++;
  251. if (toomanyerrs(fp, stsect+i))
  252. sysfatal("more than %lud consecutive I/O errors",
  253. fp->maxconerrs);
  254. } else {
  255. ckendrange(fp);
  256. fp->conerrs = 0;
  257. }
  258. if (badsects == 0) {
  259. ckendrange(fp);
  260. fp->conerrs = 0;
  261. if (wasfast)
  262. fprint(2, "%s: %s error on big transfer at %s but none "
  263. "on retries!\n", argv0, rw, sectid(fp, stsect));
  264. ++fp->congoodblks;
  265. if (fp->congoodblks >= Mingoodblks) {
  266. fprint(2, "%s: %s: back to big transfers\n", argv0,
  267. fp->name);
  268. fp->fast = 1;
  269. }
  270. } else
  271. /*
  272. * the last sector could have been in error, so the seek pointer
  273. * may need to be corrected.
  274. */
  275. repos(fp, stsect + sects);
  276. }
  277. static void
  278. vrfyfailed(File *src, File *dest, Daddr stsect)
  279. {
  280. char *srcsect = strdup(sectid(src, stsect));
  281. fprint(2, "%s: verify failed at %s (%s)\n", argv0, srcsect,
  282. sectid(dest, stsect));
  283. free(srcsect);
  284. }
  285. /*
  286. * I've seen SCSI read errors that the kernel printed but then didn't
  287. * report to the program doing the read, so if a big verify fails,
  288. * break it up and verify each sector separately to isolate the bad sector(s).
  289. */
  290. int /* error count */
  291. verify(File *src, File *dest, char *buff, char *buft, Daddr stsect,
  292. int sectors)
  293. {
  294. int i, errors = 0;
  295. for (i = 0; i < sectors; i++)
  296. if (memcmp(buff + i*sectsz, buft + i*sectsz, sectsz) != 0)
  297. errors++;
  298. if (errors == 0)
  299. return errors; /* normal case */
  300. if (sectors == 1) {
  301. vrfyfailed(src, dest, stsect);
  302. return errors;
  303. }
  304. /* re-read and verify each sector individually */
  305. errors = 0;
  306. for (i = 0; i < sectors; i++) {
  307. int thissect = stsect + i;
  308. if (badsect(bio(src, read, buff, thissect, 1, Mustseek)))
  309. io_expl(src, "read", thissect);
  310. if (badsect(bio(dest, read, buft, thissect, 1, Mustseek)))
  311. io_expl(dest, "write", thissect);
  312. if (memcmp(buff, buft, sectsz) != 0) {
  313. vrfyfailed(src, dest, thissect);
  314. ++errors;
  315. }
  316. }
  317. if (errors == 0) {
  318. char *srcsect = strdup(sectid(src, stsect));
  319. fprint(2, "%s: verification failed on big read at %s (%s) "
  320. "but not on retries!\n", argv0, srcsect,
  321. sectid(dest, stsect));
  322. free(srcsect);
  323. }
  324. /*
  325. * the last sector of each could have been in error, so the seek
  326. * pointers may need to be corrected.
  327. */
  328. repos(src, stsect + sectors);
  329. repos(dest, stsect + sectors);
  330. return errors;
  331. }
  332. /*
  333. * start is starting sector of proposed transfer;
  334. * nsects is the total number of sectors being copied;
  335. * maxxfr is the block size in sectors.
  336. */
  337. int
  338. sectsleft(Daddr start, Daddr nsects, int maxxfr)
  339. {
  340. /* nsects-start is sectors to the end */
  341. if (start + maxxfr <= nsects - 1)
  342. return maxxfr;
  343. else
  344. return nsects - start;
  345. }
  346. enum {
  347. Rotbits = 3,
  348. };
  349. void
  350. swizzlebits(char *buff, int sects)
  351. {
  352. uchar *bp, *endbp;
  353. endbp = (uchar *)(buff+sects*sectsz);
  354. for (bp = (uchar *)buff; bp < endbp; bp++)
  355. *bp = ~(*bp>>Rotbits | *bp<<(8-Rotbits));
  356. }
  357. /*
  358. * copy at most blksects sectors, with error retries.
  359. * stsect is relative to the start of the copy; 0 is the first sector.
  360. * to get actual sector numbers, add e.g. dest->startsect.
  361. */
  362. static int
  363. copysects(File *src, File *dest, Daddr stsect, Daddr nsects, int mustseek)
  364. {
  365. int xfrsects = sectsleft(stsect, nsects, blksects);
  366. if (xfrsects > blksects) {
  367. fprint(2, "%s: block size of %d is too big.\n", argv0, xfrsects);
  368. exits("block size too big");
  369. }
  370. bigxfer(src, read, buf, stsect, xfrsects, mustseek);
  371. if (swizzle)
  372. swizzlebits(buf, xfrsects);
  373. bigxfer(dest, write, buf, stsect, xfrsects, mustseek);
  374. /* give a few reassurances at the start, then every 10MB */
  375. if (progress &&
  376. (stsect < blksects*10 || stsect%(10*1024*1024/sectsz) == 0))
  377. fprint(2, "%s: copied%s to relative sector %llud\n", argv0,
  378. (swizzle? " swizzled": ""), stsect + xfrsects - 1);
  379. return 0;
  380. }
  381. /*
  382. * verify at most blksects sectors, with error retries.
  383. * return error count.
  384. */
  385. static int
  386. vrfysects(File *src, File *dest, Daddr stsect, Daddr nsects, int mustseek)
  387. {
  388. int xfrsects = sectsleft(stsect, nsects, blksects);
  389. if (xfrsects > blksects) {
  390. fprint(2, "%s: block size of %d is too big.\n", argv0, xfrsects);
  391. exits("block size too big");
  392. }
  393. bigxfer(src, read, buf, stsect, xfrsects, mustseek);
  394. bigxfer(dest, read, vfybuf, stsect, xfrsects, mustseek);
  395. return verify(src, dest, buf, vfybuf, stsect, xfrsects);
  396. }
  397. static void
  398. setupfile(File *fp, int mode)
  399. {
  400. fp->fd = open(fp->name, mode);
  401. if (fp->fd < 0)
  402. sysfatal("can't open %s: %r", fp->name);
  403. fp->seekable = (seek(fp->fd, 0, 1) >= 0);
  404. if (fp->startsect != 0)
  405. rewind(fp);
  406. }
  407. static Daddr
  408. copyfile(File *src, File *dest, Daddr nsects, int plsverify)
  409. {
  410. Sdaddr stsect, vererrs = 0;
  411. Dir *stp;
  412. setupfile(src, OREAD);
  413. if ((stp = dirstat(dest->name)) == nil) {
  414. int fd = create(dest->name, ORDWR, 0666);
  415. if (fd >= 0)
  416. close(fd);
  417. }
  418. free(stp);
  419. setupfile(dest, ORDWR);
  420. if (progress)
  421. fprint(2, "%s: copying first sectors\n", argv0);
  422. if (reverse)
  423. for (stsect = (nsects/blksects)*blksects; stsect >= 0;
  424. stsect -= blksects)
  425. vererrs += copysects(src, dest, stsect, nsects, Mustseek);
  426. else {
  427. for (stsect = 0; stsect < nsects; stsect += blksects)
  428. vererrs += copysects(src, dest, stsect, nsects, Noseek);
  429. ckendrange(src);
  430. ckendrange(dest);
  431. }
  432. /*
  433. * verification is done as a separate pass rather than immediately after
  434. * writing, in part to defeat caching in clever disk controllers.
  435. * we really want to see the bits that hit the disk.
  436. */
  437. if (plsverify) {
  438. fprint(2, "%s: copy done; verifying...\n", argv0);
  439. rewind(src);
  440. rewind(dest);
  441. for (stsect = 0; stsect < nsects; stsect += blksects) /* forward */
  442. vererrs += vrfysects(src, dest, stsect, nsects, Noseek);
  443. if (vererrs <= 0)
  444. fprint(2, "%s: no", argv0);
  445. else
  446. fprint(2, "%s: %llud", argv0, vererrs);
  447. fprint(2, " error%s during verification\n",
  448. (vererrs != 1? "s": ""));
  449. }
  450. close(src->fd);
  451. close(dest->fd);
  452. return vererrs;
  453. }
  454. static void
  455. usage(void)
  456. {
  457. fprint(2, "usage: %s [-bcprvZ][-B blocksz][-e errs][-s sectsz]"
  458. "[-i issect][-o ossect] sectors from to\n", argv0);
  459. exits("usage");
  460. }
  461. void
  462. initfile(File *fp)
  463. {
  464. memset(fp, 0, sizeof *fp);
  465. fp->fast = 1;
  466. fp->lasterr = -1;
  467. fp->lastgood = -1;
  468. }
  469. void
  470. main(int argc, char **argv)
  471. {
  472. int errflg = 0, plsconfirm = No, plsverify = No;
  473. long lval;
  474. File src, dest;
  475. Sdaddr sect;
  476. initfile(&src);
  477. initfile(&dest);
  478. ARGBEGIN {
  479. case 'b':
  480. reblock = Yes;
  481. break;
  482. case 'B':
  483. lval = atol(EARGF(usage()));
  484. if (lval < 0)
  485. usage();
  486. blocksize = lval;
  487. break;
  488. case 'c':
  489. plsconfirm = Yes;
  490. break;
  491. case 'e':
  492. lval = atol(EARGF(usage()));
  493. if (lval < 0)
  494. usage();
  495. src.maxconerrs = lval;
  496. dest.maxconerrs = lval;
  497. break;
  498. case 'i':
  499. sect = atoll(EARGF(usage()));
  500. if (sect < 0)
  501. usage();
  502. src.startsect = sect;
  503. break;
  504. case 'o':
  505. sect = atoll(EARGF(usage()));
  506. if (sect < 0)
  507. usage();
  508. dest.startsect = sect;
  509. break;
  510. case 'p':
  511. progress = Yes;
  512. break;
  513. case 'r':
  514. reverse = Yes;
  515. break;
  516. case 's':
  517. sectsz = atol(EARGF(usage()));
  518. if (sectsz <= 0 || sectsz % 512 != 0)
  519. usage();
  520. break;
  521. case 'v':
  522. plsverify = Yes;
  523. break;
  524. case 'Z':
  525. swizzle = Yes;
  526. break;
  527. default:
  528. errflg++;
  529. break;
  530. } ARGEND
  531. if (errflg || argc != 3)
  532. usage();
  533. if (blocksize <= 0 || blocksize % sectsz != 0)
  534. sysfatal("block size not a multiple of sector size");
  535. if (!isascii(argv[0][0]) || !isdigit(argv[0][0])) {
  536. fprint(2, "%s: %s is not numeric\n", argv0, argv[0]);
  537. exits("non-numeric sector count");
  538. }
  539. src.name = argv[1];
  540. dest.name = argv[2];
  541. blksects = blocksize / sectsz;
  542. if (blksects < 1)
  543. blksects = 1;
  544. buf = malloc(blocksize);
  545. vfybuf = malloc(blocksize);
  546. if (buf == nil || vfybuf == nil)
  547. sysfatal("out of memory: %r");
  548. if (plsconfirm? confirm(&src, &dest): Yes)
  549. copyfile(&src, &dest, atoll(argv[0]), plsverify);
  550. exits(src.harderrs || dest.harderrs? "hard errors": 0);
  551. }