summaryrefslogtreecommitdiffstats
path: root/lib/libarchive
diff options
context:
space:
mode:
authorkientzle <kientzle@FreeBSD.org>2009-12-29 06:34:23 +0000
committerkientzle <kientzle@FreeBSD.org>2009-12-29 06:34:23 +0000
commit3558b2ba52622dd4e0eda72c0c72f47833bd10f1 (patch)
tree3228817baf52ddd62cd9fffc201588e2a5cac4fc /lib/libarchive
parent4ccc9e75ff010d31203e12692e41602a144f55be (diff)
downloadFreeBSD-src-3558b2ba52622dd4e0eda72c0c72f47833bd10f1.zip
FreeBSD-src-3558b2ba52622dd4e0eda72c0c72f47833bd10f1.tar.gz
Essentially eliminate problems with false hardlinks in POSIX cpio
archives by generating synthetic ino values and mapping values from disk into the new values.
Diffstat (limited to 'lib/libarchive')
-rw-r--r--lib/libarchive/archive_write_set_format_cpio.c107
1 files changed, 91 insertions, 16 deletions
diff --git a/lib/libarchive/archive_write_set_format_cpio.c b/lib/libarchive/archive_write_set_format_cpio.c
index fd7e8a9..a0bccc5 100644
--- a/lib/libarchive/archive_write_set_format_cpio.c
+++ b/lib/libarchive/archive_write_set_format_cpio.c
@@ -54,6 +54,12 @@ static int64_t format_octal_recursive(int64_t, char *, int);
struct cpio {
uint64_t entry_bytes_remaining;
+
+ int64_t ino_next;
+
+ struct { int64_t old; int new;} *ino_list;
+ size_t ino_list_size;
+ size_t ino_list_next;
};
struct cpio_header {
@@ -103,35 +109,102 @@ archive_write_set_format_cpio(struct archive *_a)
return (ARCHIVE_OK);
}
+/*
+ * Ino values are as long as 64 bits on some systems; cpio format
+ * only allows 18 bits and relies on the ino values to identify hardlinked
+ * files. So, we can't merely "hash" the ino numbers since collisions
+ * would corrupt the archive. Instead, we generate synthetic ino values
+ * to store in the archive and maintain a map of original ino values to
+ * synthetic ones so we can preserve hardlink information.
+ *
+ * TODO: Make this more efficient. It's not as bad as it looks (most
+ * files don't have any hardlinks and we don't do any work here for those),
+ * but it wouldn't be hard to do better.
+ *
+ * TODO: Work with dev/ino pairs here instead of just ino values.
+ */
+static int
+synthesize_ino_value(struct cpio *cpio, struct archive_entry *entry)
+{
+ int64_t ino = archive_entry_ino64(entry);
+ int ino_new;
+ size_t i;
+
+ /*
+ * If no index number was given, don't assign one. In
+ * particular, this handles the end-of-archive marker
+ * correctly by giving it a zero index value. (This is also
+ * why we start our synthetic index numbers with one below.)
+ */
+ if (ino == 0)
+ return (0);
+
+ /* Don't store a mapping if we don't need to. */
+ if (archive_entry_nlink(entry) < 2) {
+ return ++cpio->ino_next;
+ }
+
+ /* Look up old ino; if we have it, this is a hardlink
+ * and we reuse the same value. */
+ for (i = 0; i < cpio->ino_list_next; ++i) {
+ if (cpio->ino_list[i].old == ino)
+ return (cpio->ino_list[i].new);
+ }
+
+ /* Assign a new index number. */
+ ino_new = ++cpio->ino_next;
+
+ /* Ensure space for the new mapping. */
+ if (cpio->ino_list_size <= cpio->ino_list_next) {
+ size_t newsize = cpio->ino_list_size < 512
+ ? 512 : cpio->ino_list_size * 2;
+ void *newlist = realloc(cpio->ino_list,
+ sizeof(cpio->ino_list[0]) * newsize);
+ if (newlist == NULL)
+ return (-1);
+
+ cpio->ino_list_size = newsize;
+ cpio->ino_list = newlist;
+ }
+
+ /* Record and return the new value. */
+ cpio->ino_list[cpio->ino_list_next].old = ino;
+ cpio->ino_list[cpio->ino_list_next].new = ino_new;
+ ++cpio->ino_list_next;
+ return (ino_new);
+}
+
static int
archive_write_cpio_header(struct archive_write *a, struct archive_entry *entry)
{
struct cpio *cpio;
const char *p, *path;
- int pathlength, ret;
+ int pathlength, ret, ret2;
+ int64_t ino;
struct cpio_header h;
cpio = (struct cpio *)a->format_data;
- ret = 0;
+ ret2 = ARCHIVE_OK;
path = archive_entry_pathname(entry);
- pathlength = strlen(path) + 1; /* Include trailing null. */
+ pathlength = (int)strlen(path) + 1; /* Include trailing null. */
memset(&h, 0, sizeof(h));
format_octal(070707, &h.c_magic, sizeof(h.c_magic));
format_octal(archive_entry_dev(entry), &h.c_dev, sizeof(h.c_dev));
- /*
- * TODO: Generate artificial inode numbers rather than just
- * re-using the ones off the disk. That way, the 18-bit c_ino
- * field only limits the number of files in the archive.
- */
- if ((int)archive_entry_ino(entry) > 0777777) {
+
+ ino = synthesize_ino_value(cpio, entry);
+ if (ino < 0) {
+ archive_set_error(&a->archive, ENOMEM,
+ "No memory for ino translation table");
+ return (ARCHIVE_FATAL);
+ } else if (ino > 0777777) {
archive_set_error(&a->archive, ERANGE,
- "large inode number truncated");
- ret = ARCHIVE_WARN;
+ "Too many files for this cpio format");
+ return (ARCHIVE_FATAL);
}
+ format_octal(ino & 0777777, &h.c_ino, sizeof(h.c_ino));
- format_octal(archive_entry_ino(entry) & 0777777, &h.c_ino, sizeof(h.c_ino));
format_octal(archive_entry_mode(entry), &h.c_mode, sizeof(h.c_mode));
format_octal(archive_entry_uid(entry), &h.c_uid, sizeof(h.c_uid));
format_octal(archive_entry_gid(entry), &h.c_gid, sizeof(h.c_gid));
@@ -170,6 +243,8 @@ archive_write_cpio_header(struct archive_write *a, struct archive_entry *entry)
if (p != NULL && *p != '\0')
ret = (a->compressor.write)(a, p, strlen(p));
+ if (ret == ARCHIVE_OK)
+ ret = ret2;
return (ret);
}
@@ -218,17 +293,15 @@ format_octal_recursive(int64_t v, char *p, int s)
return (v);
v = format_octal_recursive(v, p+1, s-1);
*p = '0' + (v & 7);
- return (v >>= 3);
+ return (v >> 3);
}
static int
archive_write_cpio_finish(struct archive_write *a)
{
- struct cpio *cpio;
int er;
struct archive_entry *trailer;
- cpio = (struct cpio *)a->format_data;
trailer = archive_entry_new();
/* nlink = 1 here for GNU cpio compat. */
archive_entry_set_nlink(trailer, 1);
@@ -244,6 +317,7 @@ archive_write_cpio_destroy(struct archive_write *a)
struct cpio *cpio;
cpio = (struct cpio *)a->format_data;
+ free(cpio->ino_list);
free(cpio);
a->format_data = NULL;
return (ARCHIVE_OK);
@@ -253,7 +327,8 @@ static int
archive_write_cpio_finish_entry(struct archive_write *a)
{
struct cpio *cpio;
- int to_write, ret;
+ size_t to_write;
+ int ret;
cpio = (struct cpio *)a->format_data;
ret = ARCHIVE_OK;
OpenPOWER on IntegriCloud