parent
9a815f30f7
commit
1b6d5bbf07
189
0001-When-exporting-use-hardlinks-for-duplicated-files.patch
Normal file
189
0001-When-exporting-use-hardlinks-for-duplicated-files.patch
Normal file
@ -0,0 +1,189 @@
|
|||||||
|
From 3b2fd6e9ff0a3a91a2b72f524492e4f198069dec Mon Sep 17 00:00:00 2001
|
||||||
|
From: "Owen W. Taylor" <otaylor@fishsoup.net>
|
||||||
|
Date: Fri, 29 Sep 2023 12:09:04 -0400
|
||||||
|
Subject: [PATCH] When exporting, use hardlinks for duplicated files
|
||||||
|
|
||||||
|
For ostree_repo_export_tree_to_archive(), and 'ostree export', when the
|
||||||
|
exported tree contains multiple files with the same checksum, write an
|
||||||
|
archive with hard links.
|
||||||
|
|
||||||
|
Without this, importing a tree, then exporting it again breaks
|
||||||
|
hardlinks.
|
||||||
|
|
||||||
|
As an example of savings: this reduces the (compressed) size of the
|
||||||
|
Fedora Flatpak Runtime image from 1345MiB to 712MiB.
|
||||||
|
|
||||||
|
Resolves: #2925
|
||||||
|
---
|
||||||
|
src/libostree/ostree-repo-libarchive.c | 50 ++++++++++++++++++++------
|
||||||
|
tests/archive-test.sh | 4 +--
|
||||||
|
tests/libtest.sh | 7 ++++
|
||||||
|
tests/test-composefs.sh | 2 +-
|
||||||
|
tests/test-export.sh | 10 +++++-
|
||||||
|
5 files changed, 58 insertions(+), 15 deletions(-)
|
||||||
|
|
||||||
|
diff --git a/src/libostree/ostree-repo-libarchive.c b/src/libostree/ostree-repo-libarchive.c
|
||||||
|
index d0f46883..65a30933 100644
|
||||||
|
--- a/src/libostree/ostree-repo-libarchive.c
|
||||||
|
+++ b/src/libostree/ostree-repo-libarchive.c
|
||||||
|
@@ -943,15 +943,10 @@ ostree_repo_write_archive_to_mtree_from_fd (OstreeRepo *self, int fd, OstreeMuta
|
||||||
|
|
||||||
|
#ifdef HAVE_LIBARCHIVE
|
||||||
|
|
||||||
|
-static gboolean
|
||||||
|
-file_to_archive_entry_common (GFile *root, OstreeRepoExportArchiveOptions *opts, GFile *path,
|
||||||
|
- GFileInfo *file_info, struct archive_entry *entry, GError **error)
|
||||||
|
+static char *
|
||||||
|
+file_to_pathstr (GFile *root, OstreeRepoExportArchiveOptions *opts, GFile *path)
|
||||||
|
{
|
||||||
|
- gboolean ret = FALSE;
|
||||||
|
g_autofree char *pathstr = g_file_get_relative_path (root, path);
|
||||||
|
- g_autoptr (GVariant) xattrs = NULL;
|
||||||
|
- time_t ts = (time_t)opts->timestamp_secs;
|
||||||
|
-
|
||||||
|
if (opts->path_prefix && opts->path_prefix[0])
|
||||||
|
{
|
||||||
|
g_autofree char *old_pathstr = pathstr;
|
||||||
|
@@ -964,6 +959,18 @@ file_to_archive_entry_common (GFile *root, OstreeRepoExportArchiveOptions *opts,
|
||||||
|
pathstr = g_strdup (".");
|
||||||
|
}
|
||||||
|
|
||||||
|
+ return g_steal_pointer (&pathstr);
|
||||||
|
+}
|
||||||
|
+
|
||||||
|
+static gboolean
|
||||||
|
+file_to_archive_entry_common (GFile *root, OstreeRepoExportArchiveOptions *opts, GFile *path,
|
||||||
|
+ GFileInfo *file_info, struct archive_entry *entry, GError **error)
|
||||||
|
+{
|
||||||
|
+ gboolean ret = FALSE;
|
||||||
|
+ g_autofree char *pathstr = file_to_pathstr (root, opts, path);
|
||||||
|
+ g_autoptr (GVariant) xattrs = NULL;
|
||||||
|
+ time_t ts = (time_t)opts->timestamp_secs;
|
||||||
|
+
|
||||||
|
archive_entry_update_pathname_utf8 (entry, pathstr);
|
||||||
|
archive_entry_set_ctime (entry, ts, OSTREE_TIMESTAMP);
|
||||||
|
archive_entry_set_mtime (entry, ts, OSTREE_TIMESTAMP);
|
||||||
|
@@ -1021,7 +1028,8 @@ out:
|
||||||
|
static gboolean
|
||||||
|
write_directory_to_libarchive_recurse (OstreeRepo *self, OstreeRepoExportArchiveOptions *opts,
|
||||||
|
GFile *root, GFile *dir, struct archive *a,
|
||||||
|
- GCancellable *cancellable, GError **error)
|
||||||
|
+ GHashTable *seen_checksums, GCancellable *cancellable,
|
||||||
|
+ GError **error)
|
||||||
|
{
|
||||||
|
gboolean ret = FALSE;
|
||||||
|
g_autoptr (GFileInfo) dir_info = NULL;
|
||||||
|
@@ -1057,8 +1065,8 @@ write_directory_to_libarchive_recurse (OstreeRepo *self, OstreeRepoExportArchive
|
||||||
|
/* First, handle directories recursively */
|
||||||
|
if (g_file_info_get_file_type (file_info) == G_FILE_TYPE_DIRECTORY)
|
||||||
|
{
|
||||||
|
- if (!write_directory_to_libarchive_recurse (self, opts, root, path, a, cancellable,
|
||||||
|
- error))
|
||||||
|
+ if (!write_directory_to_libarchive_recurse (self, opts, root, path, a, seen_checksums,
|
||||||
|
+ cancellable, error))
|
||||||
|
goto out;
|
||||||
|
|
||||||
|
/* Go to the next entry */
|
||||||
|
@@ -1086,9 +1094,27 @@ write_directory_to_libarchive_recurse (OstreeRepo *self, OstreeRepoExportArchive
|
||||||
|
g_autoptr (GInputStream) file_in = NULL;
|
||||||
|
g_autoptr (GFileInfo) regular_file_info = NULL;
|
||||||
|
const char *checksum;
|
||||||
|
+ GFile *old_path;
|
||||||
|
|
||||||
|
checksum = ostree_repo_file_get_checksum ((OstreeRepoFile *)path);
|
||||||
|
|
||||||
|
+ old_path = g_hash_table_lookup (seen_checksums, checksum);
|
||||||
|
+ if (old_path)
|
||||||
|
+ {
|
||||||
|
+ g_autofree char *old_pathstr = file_to_pathstr (root, opts, old_path);
|
||||||
|
+
|
||||||
|
+ archive_entry_set_hardlink (entry, old_pathstr);
|
||||||
|
+ if (!write_header_free_entry (a, &entry, error))
|
||||||
|
+ goto out;
|
||||||
|
+
|
||||||
|
+ break;
|
||||||
|
+ }
|
||||||
|
+ else
|
||||||
|
+ {
|
||||||
|
+ /* The checksum is owned by path (an OstreeRepoFile) */
|
||||||
|
+ g_hash_table_insert (seen_checksums, (char *)checksum, g_object_ref (path));
|
||||||
|
+ }
|
||||||
|
+
|
||||||
|
if (!ostree_repo_load_file (self, checksum, &file_in, ®ular_file_info, NULL,
|
||||||
|
cancellable, error))
|
||||||
|
goto out;
|
||||||
|
@@ -1168,9 +1194,11 @@ ostree_repo_export_tree_to_archive (OstreeRepo *self, OstreeRepoExportArchiveOpt
|
||||||
|
#ifdef HAVE_LIBARCHIVE
|
||||||
|
gboolean ret = FALSE;
|
||||||
|
struct archive *a = archive;
|
||||||
|
+ g_autoptr (GHashTable) seen_checksums
|
||||||
|
+ = g_hash_table_new_full (g_str_hash, g_str_equal, NULL, g_object_unref);
|
||||||
|
|
||||||
|
if (!write_directory_to_libarchive_recurse (self, opts, (GFile *)root, (GFile *)root, a,
|
||||||
|
- cancellable, error))
|
||||||
|
+ seen_checksums, cancellable, error))
|
||||||
|
goto out;
|
||||||
|
|
||||||
|
ret = TRUE;
|
||||||
|
diff --git a/tests/archive-test.sh b/tests/archive-test.sh
|
||||||
|
index 6b45790e..f6bfd5fb 100644
|
||||||
|
--- a/tests/archive-test.sh
|
||||||
|
+++ b/tests/archive-test.sh
|
||||||
|
@@ -72,9 +72,9 @@ date > test-overlays/overlaid-file
|
||||||
|
$OSTREE commit ${COMMIT_ARGS} -b test-base --base test2 --owner-uid 42 --owner-gid 42 test-overlays/
|
||||||
|
$OSTREE ls -R test-base > ls.txt
|
||||||
|
if can_create_whiteout_devices; then
|
||||||
|
- assert_streq "$(wc -l < ls.txt)" 17
|
||||||
|
+ assert_streq "$(wc -l < ls.txt)" 22
|
||||||
|
else
|
||||||
|
- assert_streq "$(wc -l < ls.txt)" 14
|
||||||
|
+ assert_streq "$(wc -l < ls.txt)" 19
|
||||||
|
fi
|
||||||
|
|
||||||
|
assert_streq "$(grep '42.*42' ls.txt | wc -l)" 2
|
||||||
|
diff --git a/tests/libtest.sh b/tests/libtest.sh
|
||||||
|
index fa937827..d1c99eab 100755
|
||||||
|
--- a/tests/libtest.sh
|
||||||
|
+++ b/tests/libtest.sh
|
||||||
|
@@ -249,6 +249,13 @@ setup_test_repository () {
|
||||||
|
mkdir baz/another/
|
||||||
|
echo x > baz/another/y
|
||||||
|
|
||||||
|
+ mkdir baz/sub1
|
||||||
|
+ echo SAME_CONTENT > baz/sub1/duplicate_a
|
||||||
|
+ echo SAME_CONTENT > baz/sub1/duplicate_b
|
||||||
|
+
|
||||||
|
+ mkdir baz/sub2
|
||||||
|
+ echo SAME_CONTENT > baz/sub2/duplicate_c
|
||||||
|
+
|
||||||
|
# if we are running inside a container we cannot test
|
||||||
|
# the overlayfs whiteout marker passthrough
|
||||||
|
if ! test -n "${OSTREE_NO_WHITEOUTS:-}"; then
|
||||||
|
diff --git a/tests/test-export.sh b/tests/test-export.sh
|
||||||
|
index e490ae40..6b8de94c 100755
|
||||||
|
--- a/tests/test-export.sh
|
||||||
|
+++ b/tests/test-export.sh
|
||||||
|
@@ -28,7 +28,7 @@ fi
|
||||||
|
|
||||||
|
setup_test_repository "archive"
|
||||||
|
|
||||||
|
-echo '1..5'
|
||||||
|
+echo '1..6'
|
||||||
|
|
||||||
|
$OSTREE checkout test2 test2-co
|
||||||
|
$OSTREE commit --no-xattrs -b test2-noxattrs -s "test2 without xattrs" --tree=dir=test2-co
|
||||||
|
@@ -81,3 +81,11 @@ assert_file_empty diff.txt
|
||||||
|
rm test2.tar diff.txt t -rf
|
||||||
|
|
||||||
|
echo 'ok export import'
|
||||||
|
+
|
||||||
|
+cd ${test_tmpdir}
|
||||||
|
+${OSTREE} 'export' test2 -o test2.tar
|
||||||
|
+tar tvf test2.tar > test2.manifest
|
||||||
|
+assert_file_has_content test2.manifest 'baz/sub1/duplicate_b link to baz/sub1/duplicate_a'
|
||||||
|
+assert_file_has_content test2.manifest 'baz/sub2/duplicate_c link to baz/sub1/duplicate_a'
|
||||||
|
+
|
||||||
|
+echo 'ok export hard links'
|
||||||
|
--
|
||||||
|
2.41.0
|
||||||
|
|
@ -8,11 +8,13 @@
|
|||||||
Summary: Tool for managing bootable, immutable filesystem trees
|
Summary: Tool for managing bootable, immutable filesystem trees
|
||||||
Name: ostree
|
Name: ostree
|
||||||
Version: 2023.6
|
Version: 2023.6
|
||||||
Release: 1%{?dist}
|
Release: 2%{?dist}
|
||||||
Source0: https://github.com/ostreedev/%{name}/releases/download/v%{version}/libostree-%{version}.tar.xz
|
Source0: https://github.com/ostreedev/%{name}/releases/download/v%{version}/libostree-%{version}.tar.xz
|
||||||
License: LGPL-2.0-or-later
|
License: LGPL-2.0-or-later
|
||||||
URL: https://ostree.readthedocs.io/en/latest/
|
URL: https://ostree.readthedocs.io/en/latest/
|
||||||
|
|
||||||
|
Patch0: 0001-When-exporting-use-hardlinks-for-duplicated-files.patch
|
||||||
|
|
||||||
BuildRequires: make
|
BuildRequires: make
|
||||||
BuildRequires: git
|
BuildRequires: git
|
||||||
# We always run autogen.sh
|
# We always run autogen.sh
|
||||||
@ -170,6 +172,10 @@ find %{buildroot} -name '*.la' -delete
|
|||||||
%endif
|
%endif
|
||||||
|
|
||||||
%changelog
|
%changelog
|
||||||
|
* Fri Oct 06 2023 Colin Walters <walters@verbum.org> - 2023.6-2
|
||||||
|
- Cherry pick
|
||||||
|
https://github.com/ostreedev/ostree/pull/3060/commits/3b2fd6e9ff0a3a91a2b72f524492e4f198069dec
|
||||||
|
|
||||||
* Fri Aug 25 2023 Colin Walters <walters@verbum.org> - 2023.6-1
|
* Fri Aug 25 2023 Colin Walters <walters@verbum.org> - 2023.6-1
|
||||||
- https://github.com/ostreedev/ostree/releases/tag/v2023.6
|
- https://github.com/ostreedev/ostree/releases/tag/v2023.6
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user