Subversion Repositories planix.SVN

Rev

Go to most recent revision | Blame | Compare with Previous | Last modification | View Log | RSS feed

/*
 * ecp - copy a file fast (in big blocks), cope with errors, optionally verify.
 *
 * Transfers a block at a time.  On error, retries one sector at a time,
 * and reports all errors on the retry.
 * Unlike dd, ecp ignores EOF, since it is sometimes reported on error.
 * Also unlike `dd conv=noerror,sync', ecp doesn't get stuck nor give up.
 *
 * Written by Geoff Collyer, originally to run on RSX-11M(!) in 1979.
 * Later simplified for UNIX and ultimately Plan 9.
 */
#include <u.h>
#include <libc.h>
#include <ctype.h>

/*
 * fundamental constants.  three independent groups share this enum,
 * each restarting at zero:
 *      No/Yes          - values for the boolean option flags.
 *      Noseek/Mustseek - values for the `mustseek' argument of the
 *                        transfer routines.
 *      Enone/Eio       - transfer result codes; badsect() treats anything
 *                        other than Enone as a failure.
 */
enum {
        No = 0,
        Yes,

        Noseek = 0,             /* need not seek, may seek on seekable files */
        Mustseek,

        Enone = 0,
        Eio,
};

/*
 * tunable parameters.  the two sizes are in bytes and are only defaults;
 * main() lets -s and -B override them.
 */
enum {
        Defsectsz = 512,        /* default sector size */
        /* 10K is a good size for HP WORM drives */
        Defblksz = 16*1024,     /* default block (big-transfer) size */
        /* counted in blocks retried sector-by-sector without any bad sector */
        Mingoodblks = 3,        /* after this many, go back to fast mode */
};

/* file that confirm() opens to read the user's answer */
#define TTY "/dev/cons"                 /* plan 9 */

/* takes a transfer result code (Enone or Eio), not a system errno */
#define badsect(errno) ((errno) != Enone)  /* was last transfer in error? */

/* disk address (in bytes or sectors), also type of 2nd arg. to seek */
typedef uvlong Daddr;
typedef vlong Sdaddr;                           /* signed disk address */
/* common shape of read and write: (fd, buffer, byte count) -> bytes moved */
typedef long Rdwrfn(int, void *, long);         /* plan 9 read or write */

/*
 * per-file state: one for the source, one for the destination.
 * sector numbers kept here are relative to the start of the copy;
 * startsect is added to them when seeking or reporting.
 */
typedef struct {
        char    *name;                  /* name passed to open, used in messages */
        int     fd;                     /* descriptor, set by setupfile */
        Daddr   startsect;              /* sector offset of the copy (-i or -o) */
        int     fast;                   /* non-zero: try whole-block transfers */
        int     seekable;               /* non-zero if seek worked in setupfile */

        /* maxconerrs comes from -e; zero disables the limit */
        ulong   maxconerrs;             /* maximum consecutive errors */
        ulong   conerrs;                /* current consecutive errors */
        /* consecutive blocks retried by sector with no bad sector found */
        Daddr   congoodblks;

        Daddr   harderrs;               /* count of sectors that failed on retry */
        /* both start at -1 (see initfile), i.e. none seen yet */
        Daddr   lasterr;                /* sector #s */
        Daddr   lastgood;               /* last sector of last good transfer */
} File;

/* exports */
char *argv0;                            /* program name, prefixes every message */

/* privates */
/* option flags set in main: -b, -p and -Z respectively */
static int reblock = No, progress = No, swizzle = No;
static int reverse = No;                /* -r: copy from the last block backward */
static ulong sectsz = Defsectsz;        /* sector size in bytes (-s) */
static ulong blocksize = Defblksz;      /* big-transfer size in bytes (-B) */

/* both are blocksize bytes; vfybuf holds dest's data during verification */
static char *buf, *vfybuf;
static int blksects;                    /* blocksize / sectsz */

/*
 * warning - print best error message possible and clear errno
 */
void
warning(char *s1, char *s2)
{
        char err[100], msg[256];
        char *np, *ep = msg + sizeof msg - 1;

        errstr(err, sizeof err);                /* save error string */
        np = seprint(msg, ep, "%s: ", argv0);
        np = seprint(np, ep, s1, s2);
        errstr(err, sizeof err);                /* restore error string */
        seprint(np, ep, ": %r\n");

        fprint(2, "%s", msg);
}

/* open file in the given mode; exit with a diagnostic if that fails. */
int
eopen(char *file, int mode)
{
        int fd;

        fd = open(file, mode);
        if (fd >= 0)
                return fd;
        sysfatal("can't open %s: %r", file);
        return fd;
}

/*
 * ask on standard error whether to copy src to dest and read the answer
 * from TTY.  exits if src doesn't exist; notes when dest is missing.
 * returns true only if the first character of the reply is `y' or `Y'.
 */
static int                                      /* boolean */
confirm(File *src, File *dest)
{
        int nread, missing, cons;
        char answer, ch;
        Dir *d;

        cons = eopen(TTY, 2);

        d = dirstat(src->name);
        if (d == nil)
                sysfatal("no input file %s: %r", src->name);
        free(d);

        d = dirstat(dest->name);
        missing = (d == nil);
        free(d);

        fprint(2, "%s: copy %s to %s%s? ", argv0, src->name, dest->name,
                (missing? " (missing)": ""));
        nread = read(cons, &answer, 1);
        if (nread < 1)
                answer = 'n';                   /* no reply means no */

        /* discard the rest of the reply line */
        for (ch = answer; nread > 0 && ch != '\n'; )
                nread = read(cons, &ch, 1);
        close(cons);

        if (isascii(answer) && isupper(answer))
                answer = tolower(answer);
        return answer == 'y';
}

/*
 * describe relative sector sect of fp for messages.  when fp has a
 * non-zero starting sector, both the absolute and relative numbers are
 * given.  the result lives in a static buffer that the next call overwrites.
 */
static char *
sectid(File *fp, Daddr sect)
{
        static char id[256];

        if (fp->startsect != 0) {
                snprint(id, sizeof id, "%s sector %llud (relative %llud)",
                        fp->name, sect + fp->startsect, sect);
                return id;
        }
        snprint(id, sizeof id, "%s sector %llud", fp->name, sect);
        return id;
}

/*
 * explain an i/o error on sector sect of fp; rw names the operation.
 * going forward, only the first bad sector of a consecutive run gets a full
 * message, the second gets "..." and the rest are silent.
 * in reverse, every bad sector gets a full message.
 */
static void
io_expl(File *fp, char *rw, Daddr sect)
{
        char msg[128];

        if (!reverse && fp->conerrs != 0) {
                if (fp->conerrs == 1)
                        fprint(2, "%s: ...\n", argv0);
                return;
        }
        snprint(msg, sizeof msg, "%s %s", rw, sectid(fp, sect));
        warning("%s", msg);
}

/*
 * position fp at relative sector sect (fp->startsect is added in).
 * exits if fp can't be seeked or the seek fails.
 */
static void
repos(File *fp, Daddr sect)
{
        Daddr byteoff;

        if (fp->seekable == 0)
                sysfatal("%s: trying to seek on unseekable file", fp->name);
        byteoff = (sect + fp->startsect) * sectsz;
        if (seek(fp->fd, byteoff, 0) == -1)
                sysfatal("can't seek on %s: %r", fp->name);
}

/* position fp at the first sector of the copy (relative sector 0). */
static void
rewind(File *fp)
{
        Daddr first = 0;

        repos(fp, first);
}

/*
 * magic is a fixed marker.  uniq is the stamp that addmagic() builds from
 * it: the magic text with its terminating NUL overwritten by two numbers
 * (the time and a sequence count) stored by putbe().
 */
static char magic[] = "\235any old ☺ rubbish\173";
static char uniq[sizeof magic + 2*sizeof(ulong)];

/*
 * store the low 32 bits of ul at p, most significant byte first.
 * returns the address just past the four bytes written.
 */
static char *
putbe(char *p, ulong ul)
{
        int shift;

        for (shift = 24; shift >= 0; shift -= 8)
                *p++ = ul >> shift;
        return p;
}

/*
 * generate magic + unique string, add to start & end of buff.
 * return tail pointer.
 *
 * buff holds `bytes' bytes about to be read into.  the stamp (uniq) is
 * rebuilt on every call from magic, the current time and a sequence
 * number, so a later ismagicok() can tell whether the read changed
 * either end of the buffer.
 *
 * if buff is too short to hold a stamp (e.g. a zero-length transfer),
 * nothing is written and buff itself is returned: stamping would run
 * past the end of buff and put the tail copy before its start.
 */
static char *
addmagic(char *buff, int bytes)
{
        char *p, *tail;
        static ulong seq;

        strcpy(uniq, magic);
        /* the two numbers start on top of magic's terminating NUL */
        p = putbe(uniq + sizeof magic - 1, time(0));
        putbe(p, ++seq);

        if (bytes < (int)sizeof uniq)
                return buff;

        memcpy(buff, uniq, sizeof uniq);
        tail = buff + bytes - sizeof uniq;
        memcpy(tail, uniq, sizeof uniq);
        return tail;
}

/*
 * check for the current stamp (uniq) in buff.
 * returns true if it is still intact at the start of buff or at tail,
 * i.e. if at least one end of the buffer was left unchanged.
 */
static int
ismagicok(char *buff, char *tail)
{
        if (memcmp(buff, uniq, sizeof uniq) == 0)
                return 1;
        return memcmp(tail, uniq, sizeof uniq) == 0;
}

/*
 * transfer (many) sectors.  reblock input as needed.
 * returns Enone if no failures, others on failure with errstr set.
 *
 * rdwr is read or write; buff holds sects*sectsz bytes; stsect is the
 * starting sector relative to the start of the copy and is only used
 * when mustseek is set.  exits if a required seek is impossible or the
 * byte count won't fit the signed long count that rdwr takes.
 */
static int
bio(File *fp, Rdwrfn *rdwr, char *buff, Daddr stsect, int sects, int mustseek)
{
        int xfered;
        char *tail;
        ulong toread, bytes = sects * sectsz;
        ulong maxcount = ~(ulong)0 >> 1;        /* largest positive long */
        static int reblocked = 0;

        if (mustseek) {
                if (!fp->seekable)
                        sysfatal("%s: need to seek on unseekable file",
                                fp->name);
                repos(fp, stsect);
        }
        /*
         * comparing (long)x with x converts both sides to unsigned, so
         * that form can never differ; test the range explicitly instead.
         */
        if (blocksize > maxcount || bytes > maxcount)
                sysfatal("i/o count too big: %lud", bytes);

        SET(tail);
        if (rdwr == read)
                tail = addmagic(buff, bytes);   /* stamp both ends first */
        werrstr("");
        xfered = (*rdwr)(fp->fd, buff, bytes);
        if (xfered == bytes) {
                /* don't trust the hardware; it may lie */
                if (rdwr == read && ismagicok(buff, tail))
                        fprint(2, "%s: `good' read didn't change buffer\n",
                                argv0);
                return Enone;                   /* did as we asked */
        }
        if (xfered < 0)
                return Eio;                     /* out-and-out i/o error */

        /*
         * Kernel transferred less than asked.  Shouldn't happen;
         * probably indicates disk driver error or trying to
         * transfer past the end of a disk partition.  Treat as an
         * I/O error that reads zeros past the point of error,
         * unless reblocking input and this is a read.
         */

        if (rdwr == write)
                return Eio;
        if (!reblock) {
                memset(buff+xfered, '\0', bytes-xfered);
                return Eio;                     /* short read */
        }

        /* for pipes that return less than asked */
        if (progress && !reblocked) {
                fprint(2, "%s: reblocking input\n", argv0);
                reblocked++;                    /* announce only once */
        }
        /* keep reading until the buffer is full, or EOF or an error stops us */
        for (toread = bytes - xfered; toread != 0; toread -= xfered) {
                xfered = (*rdwr)(fp->fd, buff+bytes-toread, toread);
                if (xfered <= 0)
                        break;
        }
        if (xfered < 0)
                return Eio;                     /* out-and-out i/o error */
        if (toread != 0)                        /* early EOF? */
                memset(buff+bytes-toread, '\0', toread);
        return Enone;
}

/*
 * called only after a single-sector transfer has failed.
 * extends the run of consecutive bad sectors if sect directly follows the
 * previous bad one, otherwise starts a new run, and records sect as the
 * latest error.  returns true if a limit is set, the run has reached it
 * and no transfer on fp has succeeded yet.
 */
static int
toomanyerrs(File *fp, Daddr sect)
{
        int adjacent;

        adjacent = (sect == fp->lasterr+1);
        fp->conerrs = adjacent? fp->conerrs + 1: 0;
        fp->lasterr = sect;

        if (fp->maxconerrs == 0 || fp->conerrs < fp->maxconerrs)
                return 0;
        return fp->lastgood == -1;
}

/*
 * when copying forward and a run of consecutive bad sectors is open,
 * report the last bad sector of that run.
 */
static void
ckendrange(File *fp)
{
        if (reverse || fp->conerrs == 0)
                return;
        fprint(2, "%s: %lld: ... last bad sector in range\n",
                argv0, fp->lasterr);
}

/*
 * do one bio() transfer and update fp's bookkeeping: on success note the
 * last good sector; on failure drop out of fast mode and restart the count
 * of good blocks.  returns bio's result.
 */
static int
transfer(File *fp, Rdwrfn *rdwr, char *buff, Daddr stsect, int sects,
        int mustseek)
{
        int status;

        status = bio(fp, rdwr, buff, stsect, sects, mustseek);
        if (!badsect(status)) {
                fp->lastgood = stsect + sects - 1;
                return status;
        }
        fp->fast = 0;           /* read single sectors for a while */
        fp->congoodblks = 0;
        return status;
}

/*
 * Read or write many sectors at once.
 * If it fails, retry the individual sectors and report errors.
 *
 * In fast mode the whole block is tried first.  Otherwise, or if that
 * fails, each sector is transferred separately with an explicit seek.
 * Enough consecutive blocks without a bad sector switch fast mode back on.
 */
static void
bigxfer(File *fp, Rdwrfn *rdwr, char *buff, Daddr stsect, int sects,
        int mustseek)
{
        int n, nbad, startedfast;
        char *op, *p;
        Daddr sect;

        startedfast = fp->fast;
        op = "write";
        if (rdwr == read)
                op = "read";

        if (fp->fast) {
                if (transfer(fp, rdwr, buff, stsect, sects, mustseek) == Enone)
                        return;
                if (progress)
                        fprint(2, "%s: breaking up big transfer on %s error "
                                "`%r' on %s\n", argv0, op, sectid(fp, stsect));
        }

        /* one sector at a time */
        nbad = 0;
        p = buff;
        for (n = 0; n < sects; n++, p += sectsz) {
                sect = stsect + n;
                if (!badsect(transfer(fp, rdwr, p, sect, 1, Mustseek))) {
                        /* a good sector closes any open run of bad ones */
                        ckendrange(fp);
                        fp->conerrs = 0;
                        continue;
                }
                io_expl(fp, op, sect);
                nbad++;
                fp->harderrs++;
                if (toomanyerrs(fp, sect))
                        sysfatal("more than %lud consecutive I/O errors",
                                fp->maxconerrs);
        }

        if (nbad != 0) {
                /*
                 * the last sector could have been in error, so the seek pointer
                 * may need to be corrected.
                 */
                repos(fp, stsect + sects);
                return;
        }

        ckendrange(fp);
        fp->conerrs = 0;
        if (startedfast)
                fprint(2, "%s: %s error on big transfer at %s but none "
                        "on retries!\n", argv0, op, sectid(fp, stsect));
        if (++fp->congoodblks >= Mingoodblks) {
                fprint(2, "%s: %s: back to big transfers\n", argv0,
                        fp->name);
                fp->fast = 1;
        }
}

/* report a verification mismatch at relative sector stsect of src and dest. */
static void
vrfyfailed(File *src, File *dest, Daddr stsect)
{
        char *srcid;

        /* sectid() reuses one static buffer, so copy the first result */
        srcid = strdup(sectid(src, stsect));
        fprint(2, "%s: verify failed at %s (%s)\n", argv0, srcid,
                sectid(dest, stsect));
        free(srcid);
}

/*
 * I've seen SCSI read errors that the kernel printed but then didn't
 * report to the program doing the read, so if a big verify fails,
 * break it up and verify each sector separately to isolate the bad sector(s).
 *
 * buff and buft hold `sectors' sectors just read from src and dest,
 * starting at relative sector stsect.  returns the number of sectors
 * that differ.  when a multi-sector comparison fails, the count returned
 * comes from the sector-by-sector re-read, which overwrites the first
 * sector's worth of both buffers and repositions both files just past
 * the block.
 */
int                                             /* error count */
verify(File *src, File *dest, char *buff, char *buft, Daddr stsect,
        int sectors)
{
        int i, errors = 0;

        for (i = 0; i < sectors; i++)
                if (memcmp(buff + i*sectsz, buft + i*sectsz, sectsz) != 0)
                        errors++;
        if (errors == 0)
                return errors;                  /* normal case */

        if (sectors == 1) {
                vrfyfailed(src, dest, stsect);
                return errors;
        }

        /* re-read and verify each sector individually */
        errors = 0;
        for (i = 0; i < sectors; i++) {
                /* a Daddr, so large sector numbers aren't truncated */
                Daddr thissect = stsect + i;

                if (badsect(bio(src,  read, buff, thissect, 1, Mustseek)))
                        io_expl(src,  "read",  thissect);
                /*
                 * NOTE(review): this is a read of dest but is reported as
                 * "write"; presumably it marks dest as the written side.
                 * confirm before changing the message.
                 */
                if (badsect(bio(dest, read, buft, thissect, 1, Mustseek)))
                        io_expl(dest, "write", thissect);
                if (memcmp(buff, buft, sectsz) != 0) {
                        vrfyfailed(src, dest, thissect);
                        ++errors;
                }
        }
        if (errors == 0) {
                /* sectid() reuses one static buffer, so copy the first result */
                char *srcsect = strdup(sectid(src, stsect));

                fprint(2, "%s: verification failed on big read at %s (%s) "
                        "but not on retries!\n", argv0, srcsect,
                        sectid(dest, stsect));
                free(srcsect);
        }
        /*
         * the last sector of each could have been in error, so the seek
         * pointers may need to be corrected.
         */
        repos(src,  stsect + sectors);
        repos(dest, stsect + sectors);
        return errors;
}

/*
 * start is starting sector of proposed transfer;
 * nsects is the total number of sectors being copied;
 * maxxfr is the block size in sectors.
 *
 * returns how many sectors to transfer at start: maxxfr, or fewer if
 * fewer remain before nsects.  returns 0 when nothing remains (start at
 * or beyond nsects, including nsects == 0) or maxxfr isn't positive.
 * the arithmetic is unsigned, so it must never subtract past zero.
 */
int
sectsleft(Daddr start, Daddr nsects, int maxxfr)
{
        Daddr remaining;

        if (maxxfr <= 0 || start >= nsects)
                return 0;
        remaining = nsects - start;             /* sectors to the end */
        if (remaining < (Daddr)maxxfr)
                return remaining;
        return maxxfr;
}

enum {
        Rotbits = 3,
};

void
swizzlebits(char *buff, int sects)
{
        uchar *bp, *endbp;

        endbp = (uchar *)(buff+sects*sectsz);
        for (bp = (uchar *)buff; bp < endbp; bp++)
                *bp = ~(*bp>>Rotbits | *bp<<(8-Rotbits));
}

/*
 * copy at most blksects sectors, with error retries.
 * stsect is relative to the start of the copy; 0 is the first sector.
 * to get actual sector numbers, add e.g. dest->startsect.
 * always returns 0; i/o errors are counted in the File structures.
 */
static int
copysects(File *src, File *dest, Daddr stsect, Daddr nsects, int mustseek)
{
        int n;

        n = sectsleft(stsect, nsects, blksects);
        if (n > blksects) {
                fprint(2, "%s: block size of %d is too big.\n", argv0, n);
                exits("block size too big");
        }

        bigxfer(src,  read,  buf, stsect, n, mustseek);
        if (swizzle)
                swizzlebits(buf, n);
        bigxfer(dest, write, buf, stsect, n, mustseek);

        if (!progress)
                return 0;
        /* give a few reassurances at the start, then every 10MB */
        if (stsect < blksects*10 || stsect%(10*1024*1024/sectsz) == 0)
                fprint(2, "%s: copied%s to relative sector %llud\n", argv0,
                        (swizzle? " swizzled": ""), stsect + n - 1);
        return 0;
}

/*
 * verify at most blksects sectors, with error retries: read the same
 * sectors of src and dest into buf and vfybuf and compare them.
 * return error count.
 */
static int
vrfysects(File *src, File *dest, Daddr stsect, Daddr nsects, int mustseek)
{
        int n;

        n = sectsleft(stsect, nsects, blksects);
        if (n > blksects) {
                fprint(2, "%s: block size of %d is too big.\n", argv0, n);
                exits("block size too big");
        }

        bigxfer(src,  read, buf,    stsect, n, mustseek);
        bigxfer(dest, read, vfybuf, stsect, n, mustseek);
        return verify(src, dest, buf, vfybuf, stsect, n);
}

/*
 * open fp->name in the given mode (exiting on failure), note whether the
 * descriptor can be seeked, and seek to the starting sector if one was given.
 */
static void
setupfile(File *fp, int mode)
{
        int fd;

        fd = open(fp->name, mode);
        fp->fd = fd;
        if (fd < 0)
                sysfatal("can't open %s: %r", fp->name);

        fp->seekable = (seek(fd, 0, 1) >= 0);
        if (fp->startsect == 0)
                return;
        rewind(fp);
}

/*
 * copy nsects sectors from src to dest, a block at a time, forward or
 * (if `reverse' is set) from the last block back to the first; then, if
 * plsverify is set, re-read both files and compare them.
 * opens both files, creating dest if it doesn't exist, and closes them.
 * returns the number of verification errors.
 */
static Daddr
copyfile(File *src, File *dest, Daddr nsects, int plsverify)
{
        Sdaddr stsect, vererrs = 0;
        Dir *stp;

        setupfile(src, OREAD);
        /* a failed create is caught by setupfile's open just below */
        if ((stp = dirstat(dest->name)) == nil) {
                int fd = create(dest->name, ORDWR, 0666);

                if (fd >= 0)
                        close(fd);
        }
        free(stp);
        setupfile(dest, ORDWR);

        if (progress)
                fprint(2, "%s: copying first sectors\n", argv0);
        if (reverse) {
                /*
                 * start at the block holding the last sector.  rounding
                 * nsects itself down would begin at nsects, an empty
                 * transfer past the end, whenever nsects is an exact
                 * multiple of blksects (or zero).
                 */
                if (nsects > 0)
                        for (stsect = ((nsects-1)/blksects)*blksects;
                             stsect >= 0; stsect -= blksects)
                                vererrs += copysects(src, dest, stsect, nsects,
                                        Mustseek);
        } else {
                for (stsect = 0; stsect < nsects; stsect += blksects)
                        vererrs += copysects(src, dest, stsect, nsects, Noseek);
                /* close off any run of bad sectors still being reported */
                ckendrange(src);
                ckendrange(dest);
        }

        /*
         * verification is done as a separate pass rather than immediately after
         * writing, in part to defeat caching in clever disk controllers.
         * we really want to see the bits that hit the disk.
         */
        if (plsverify) {
                fprint(2, "%s: copy done; verifying...\n", argv0);
                rewind(src);
                rewind(dest);
                for (stsect = 0; stsect < nsects; stsect += blksects) /* forward */
                        vererrs += vrfysects(src, dest, stsect, nsects, Noseek);
                if (vererrs <= 0)
                        fprint(2, "%s: no", argv0);
                else
                        fprint(2, "%s: %llud", argv0, vererrs);
                fprint(2, " error%s during verification\n",
                        (vererrs != 1? "s": ""));
        }
        close(src->fd);
        close(dest->fd);
        return vererrs;
}

/* print the command synopsis on standard error and exit with status "usage". */
static void
usage(void)
{
        fprint(2, "usage: %s [-bcprvZ][-B blocksz][-e errs][-s sectsz][-i issect]"
                "[-o ossect] sectors from to\n", argv0);
        exits("usage");
}

/*
 * reset *fp to its starting state: everything zero, except that fast
 * (big-transfer) mode is on and no bad or good sector has been seen yet.
 */
void
initfile(File *fp)
{
        memset(fp, 0, sizeof *fp);
        fp->lastgood = -1;
        fp->lasterr = -1;
        fp->fast = 1;
}

/*
 * usage: ecp [-bcprvZ][-B blocksz][-e errs][-s sectsz][-i issect][-o ossect]
 *      sectors from to
 *
 * parse the options, check the sizes, allocate the two block buffers and
 * copy `sectors' sectors from `from' to `to' (after confirmation if -c).
 * the exit status is "hard errors" if any sector of either file failed
 * on retry, otherwise success.
 */
void
main(int argc, char **argv)
{
        int errflg = 0, plsconfirm = No, plsverify = No;
        long lval;
        File src, dest;
        Sdaddr sect;

        initfile(&src);
        initfile(&dest);
        ARGBEGIN {
        case 'b':
                reblock = Yes;
                break;
        case 'B':
                lval = atol(EARGF(usage()));
                if (lval < 0)
                        usage();
                blocksize = lval;
                break;
        case 'c':
                plsconfirm = Yes;
                break;
        case 'e':
                lval = atol(EARGF(usage()));
                if (lval < 0)
                        usage();
                src.maxconerrs = lval;
                dest.maxconerrs = lval;
                break;
        case 'i':
                sect = atoll(EARGF(usage()));
                if (sect < 0)
                        usage();
                src.startsect = sect;
                break;
        case 'o':
                sect = atoll(EARGF(usage()));
                if (sect < 0)
                        usage();
                dest.startsect = sect;
                break;
        case 'p':
                progress = Yes;
                break;
        case 'r':
                reverse = Yes;
                break;
        case 's':
                /*
                 * check the signed value before storing it: sectsz is
                 * unsigned, so a negative size would otherwise pass the
                 * range test as a huge positive one.
                 */
                lval = atol(EARGF(usage()));
                if (lval <= 0 || lval % 512 != 0)
                        usage();
                sectsz = lval;
                break;
        case 'v':
                plsverify = Yes;
                break;
        case 'Z':
                swizzle = Yes;
                break;
        default:
                errflg++;
                break;
        } ARGEND
        if (errflg || argc != 3)
                usage();
        if (blocksize <= 0 || blocksize % sectsz != 0)
                sysfatal("block size not a multiple of sector size");

        /* only the first character of the sector count is checked */
        if (!isascii(argv[0][0]) || !isdigit(argv[0][0])) {
                fprint(2, "%s: %s is not numeric\n", argv0, argv[0]);
                exits("non-numeric sector count");
        }
        src.name =  argv[1];
        dest.name = argv[2];

        blksects = blocksize / sectsz;
        if (blksects < 1)
                blksects = 1;
        buf = malloc(blocksize);
        vfybuf = malloc(blocksize);
        if (buf == nil || vfybuf == nil)
                sysfatal("out of memory: %r");

        /*
         * NOTE(review): copyfile's verification error count is discarded,
         * so a failed verify doesn't affect the exit status - confirm
         * that this is intended.
         */
        if (plsconfirm? confirm(&src, &dest): Yes)
                copyfile(&src, &dest, atoll(argv[0]), plsverify);
        exits(src.harderrs || dest.harderrs? "hard errors": 0);
}