diff options
author | dillon <dillon@FreeBSD.org> | 2003-01-13 19:42:41 +0000 |
---|---|---|
committer | dillon <dillon@FreeBSD.org> | 2003-01-13 19:42:41 +0000 |
commit | 5b697ad7ba32cd4546d0a6a44b4ef2a58cc6f9e9 (patch) | |
tree | af69e0b4486eed6e705fe04be584e57921195acb /sbin/dump | |
parent | d0082e294ce62cf63d5aa4738b8f999e18b04fff (diff) | |
download | FreeBSD-src-5b697ad7ba32cd4546d0a6a44b4ef2a58cc6f9e9.zip FreeBSD-src-5b697ad7ba32cd4546d0a6a44b4ef2a58cc6f9e9.tar.gz |
Add a caching option to dump. Use -C. Note that NetBSD has a caching option
called -r but it takes 512 byte blocks instead of megabytes, and I felt a
megabytes specification would be far more useful so I did not use the same
option character.
This will *greatly* improve dump performance at the cost of possibly
missing filesystem changes that occur between passes, and does a fairly
good job making up for the loss of buffered block devices. Caching is disabled
by default to retain historical behavior.
In tests, dump performance improved by about 40% when dumping / or /usr.
Beware that dump forks and the cache may wind up being larger then you
specify, but a more complex shared memory implementation would not produce
results that are all that much better so I kept it simple for now.
MFC after: 3 days
Diffstat (limited to 'sbin/dump')
-rw-r--r-- | sbin/dump/Makefile | 2 | ||||
-rw-r--r-- | sbin/dump/cache.c | 151 | ||||
-rw-r--r-- | sbin/dump/dump.8 | 11 | ||||
-rw-r--r-- | sbin/dump/dump.h | 1 | ||||
-rw-r--r-- | sbin/dump/main.c | 9 | ||||
-rw-r--r-- | sbin/dump/traverse.c | 7 |
6 files changed, 175 insertions, 6 deletions
diff --git a/sbin/dump/Makefile b/sbin/dump/Makefile index 1148d8f..58b5951 100644 --- a/sbin/dump/Makefile +++ b/sbin/dump/Makefile @@ -18,7 +18,7 @@ LINKS= ${BINDIR}/dump ${BINDIR}/rdump CFLAGS+=-DRDUMP CFLAGS+=-I${.CURDIR}/../../libexec/rlogind WARNS= 0 -SRCS= itime.c main.c optr.c dumprmt.c tape.c traverse.c unctime.c +SRCS= itime.c main.c optr.c dumprmt.c tape.c traverse.c unctime.c cache.c MAN= dump.8 MLINKS+=dump.8 rdump.8 diff --git a/sbin/dump/cache.c b/sbin/dump/cache.c new file mode 100644 index 0000000..c049466 --- /dev/null +++ b/sbin/dump/cache.c @@ -0,0 +1,151 @@ +/* + * CACHE.C + * + * Block cache for dump + * + * $FreeBSD$ + */ + +#include <sys/param.h> +#include <sys/stat.h> +#include <sys/mman.h> + +#ifdef sunos +#include <sys/vnode.h> + +#include <ufs/fs.h> +#include <ufs/fsdir.h> +#include <ufs/inode.h> +#else +#include <ufs/ufs/dir.h> +#include <ufs/ufs/dinode.h> +#include <ufs/ffs/fs.h> +#endif + +#include <protocols/dumprestore.h> + +#include <ctype.h> +#include <stdio.h> +#ifdef __STDC__ +#include <errno.h> +#include <string.h> +#include <stdlib.h> +#include <unistd.h> +#endif +#include "dump.h" + +typedef struct Block { + struct Block *b_HNext; /* must be first field */ + off_t b_Offset; + char *b_Data; +} Block; + +#define HFACTOR 4 +#define BLKFACTOR 4 + +static char *DataBase; +static Block **BlockHash; +static int BlockSize; +static int HSize; +static int NBlocks; + +static void +cinit(void) +{ + int i; + int hi; + Block *base; + + if ((BlockSize = sblock->fs_bsize * BLKFACTOR) > MAXBSIZE) + BlockSize = MAXBSIZE; + NBlocks = cachesize / BlockSize; + HSize = NBlocks / HFACTOR; + + msg("Cache %d MB, blocksize = %d\n", + NBlocks * BlockSize / (1024 * 1024), BlockSize); + + base = calloc(sizeof(Block), NBlocks); + BlockHash = calloc(sizeof(Block *), HSize); + DataBase = mmap(NULL, NBlocks * BlockSize, + PROT_READ|PROT_WRITE, MAP_ANON, -1, 0); + for (i = 0; i < NBlocks; ++i) { + base[i].b_Data = DataBase + i * BlockSize; + base[i].b_Offset = (off_t)-1; + hi = i / HFACTOR; + base[i].b_HNext = BlockHash[hi]; + BlockHash[hi] = &base[i]; + } +} + +ssize_t +cread(int fd, void *buf, size_t nbytes, off_t offset) +{ + Block *blk; + Block **pblk; + Block **ppblk; + int hi; + int n; + off_t mask; + + /* + * If the cache is disabled, revert to pread. If the + * cache has not been initialized, initialize the cache. + */ + if (sblock->fs_bsize && DataBase == NULL) { + if (cachesize <= 0) + return(pread(fd, buf, nbytes, offset)); + cinit(); + } + + /* + * If the request crosses a cache block boundary, or the + * request is larger or equal to the cache block size, + * revert to pread(). Full-block-reads are typically + * one-time calls and caching would be detrimental. + */ + mask = ~(off_t)(BlockSize - 1); + if (nbytes >= BlockSize || + ((offset ^ (offset + nbytes - 1)) & mask) != 0) { + return(pread(fd, buf, nbytes, offset)); + } + + /* + * Obtain and access the cache block. Cache a successful + * result. If an error occurs, revert to pread() (this might + * occur near the end of the media). + */ + hi = (offset / BlockSize) % HSize; + pblk = &BlockHash[hi]; + ppblk = NULL; + while ((blk = *pblk) != NULL) { + if (((blk->b_Offset ^ offset) & mask) == 0) { +#if 0 + fprintf(stderr, "%08llx %d (%08x)\n", offset, nbytes, + sblock->fs_size * sblock->fs_fsize); +#endif + break; + } + ppblk = pblk; + pblk = &blk->b_HNext; + } + if (blk == NULL) { + blk = *ppblk; + pblk = ppblk; + blk->b_Offset = offset & mask; + n = pread(fd, blk->b_Data, BlockSize, blk->b_Offset); + if (n != BlockSize) { + blk->b_Offset = (off_t)-1; + blk = NULL; + } + } + if (blk) { + bcopy(blk->b_Data + (offset - blk->b_Offset), buf, nbytes); + *pblk = blk->b_HNext; + blk->b_HNext = BlockHash[hi]; + BlockHash[hi] = blk; + return(nbytes); + } else { + return(pread(fd, buf, nbytes, offset)); + } +} + diff --git a/sbin/dump/dump.8 b/sbin/dump/dump.8 index 23beca3..424e4b3 100644 --- a/sbin/dump/dump.8 +++ b/sbin/dump/dump.8 @@ -46,6 +46,7 @@ .Op Fl B Ar records .Op Fl b Ar blocksize .Op Fl D Ar dumpdates +.Op Fl C Ar cachesize .Op Fl d Ar density .Op Fl f Ar file .Op Fl h Ar level @@ -142,6 +143,16 @@ Specify an alternate path to the file. The default is .Pa /etc/dumpdates . +.It Fl C Ar cachesize +Specify the cache size in megabytes. This will greatly improve performance +at the cost of +.Nm +possibly not noticing changes in the filesystem between passes. It is +recommended that you always use this option when dumping a snapshot. +Beware that +.Nm +forks, and the actual memory use may be larger then the specified cache +size. The recommended cache size is between 8 and 32 (megabytes). .It Fl d Ar density Set tape density to .Ar density . diff --git a/sbin/dump/dump.h b/sbin/dump/dump.h index eb04b0c..feb5913 100644 --- a/sbin/dump/dump.h +++ b/sbin/dump/dump.h @@ -77,6 +77,7 @@ long asize; /* number of 0.1" units written on current tape */ int etapes; /* estimated number of tapes */ int nonodump; /* if set, do not honor UF_NODUMP user flags */ int unlimited; /* if set, write to end of medium */ +int cachesize; /* size of block cache in bytes */ int notify; /* notify operator flag */ int blockswritten; /* number of blocks written on current tape */ diff --git a/sbin/dump/main.c b/sbin/dump/main.c index 34223b1..7fcf112 100644 --- a/sbin/dump/main.c +++ b/sbin/dump/main.c @@ -82,6 +82,7 @@ int density = 0; /* density in bytes/0.1" " <- this is for hilit19 */ int ntrec = NTREC; /* # tape blocks in each tape record */ int cartridge = 0; /* Assume non-cartridge tape */ int dokerberos = 0; /* Use Kerberos authentication */ +int cachesize = 0; /* block cache size (in bytes), defaults to 0 */ long dev_bsize = 1; /* recalculated below */ long blocksperfile; /* output blocks per file */ char *host = NULL; /* remote host (if any) */ @@ -127,9 +128,9 @@ main(int argc, char *argv[]) obsolete(&argc, &argv); #ifdef KERBEROS -#define optstring "0123456789aB:b:cd:f:h:kLns:ST:uWwD:" +#define optstring "0123456789aB:b:cd:f:h:kLns:ST:uWwD:C:" #else -#define optstring "0123456789aB:b:cd:f:h:Lns:ST:uWwD:" +#define optstring "0123456789aB:b:cd:f:h:Lns:ST:uWwD:C:" #endif while ((ch = getopt(argc, argv, optstring)) != -1) #undef optstring @@ -172,6 +173,10 @@ main(int argc, char *argv[]) dumpdates = optarg; break; + case 'C': + cachesize = numarg("cachesize", 0, 0) * 1024 * 1024; + break; + case 'h': honorlevel = numarg("honor level", 0L, 10L); break; diff --git a/sbin/dump/traverse.c b/sbin/dump/traverse.c index ab2ee71..ec0d56e 100644 --- a/sbin/dump/traverse.c +++ b/sbin/dump/traverse.c @@ -739,8 +739,8 @@ bread(ufs2_daddr_t blkno, char *buf, int size) int cnt, i; loop: - if ((cnt = pread(diskfd, buf, size, ((off_t)blkno << dev_bshift))) == - size) + cnt = cread(diskfd, buf, size, ((off_t)blkno << dev_bshift)); + if (cnt == size) return; if (blkno + (size / dev_bsize) > fsbtodb(sblock, sblock->fs_size)) { /* @@ -774,7 +774,8 @@ loop: breaderrors = 0; } /* - * Zero buffer, then try to read each sector of buffer separately. + * Zero buffer, then try to read each sector of buffer separately, + * and bypass the cache. */ memset(buf, 0, size); for (i = 0; i < size; i += dev_bsize, buf += dev_bsize, blkno++) { |