summaryrefslogtreecommitdiffstats
path: root/Source
diff options
context:
space:
mode:
authorAtılhan Emre Dursunoğlu <atilhan.dursunoglu@sparsetechnology.com>2023-10-09 10:13:23 (GMT)
committerAtılhan Emre Dursunoğlu <atilhan.dursunoglu@sparsetechnology.com>2023-10-26 15:20:48 (GMT)
commit770efceccb6f1e9ea1e452b7c79227f94996a751 (patch)
treedeee65838232dee921373c8f6377be264466d78d /Source
parent35424aab2e35ae5e4e3762feae26a0c305c73b9d (diff)
downloadCMake-770efceccb6f1e9ea1e452b7c79227f94996a751.zip
CMake-770efceccb6f1e9ea1e452b7c79227f94996a751.tar.gz
CMake-770efceccb6f1e9ea1e452b7c79227f94996a751.tar.bz2
CPack: Avoid adding duplicate files to archive when combining components
Fixes: #25280
Diffstat (limited to 'Source')
-rw-r--r--Source/CPack/cmCPackArchiveGenerator.cxx153
-rw-r--r--Source/CPack/cmCPackArchiveGenerator.h6
2 files changed, 151 insertions, 8 deletions
diff --git a/Source/CPack/cmCPackArchiveGenerator.cxx b/Source/CPack/cmCPackArchiveGenerator.cxx
index c9c069c..b7b6785 100644
--- a/Source/CPack/cmCPackArchiveGenerator.cxx
+++ b/Source/CPack/cmCPackArchiveGenerator.cxx
@@ -5,6 +5,8 @@
#include <cstring>
#include <map>
#include <ostream>
+#include <unordered_map>
+#include <unordered_set>
#include <utility>
#include <vector>
@@ -17,6 +19,121 @@
#include "cmValue.h"
#include "cmWorkingDirectory.h"
+enum class DeduplicateStatus
+{
+ Skip,
+ Add,
+ Error
+};
+
+/**
+ * @class cmCPackArchiveGenerator::Deduplicator
+ * @brief A utility class for deduplicating files, folders, and symlinks.
+ *
+ * This class is responsible for identifying duplicate files, folders, and
+ * symlinks when generating an archive. It keeps track of the paths that have
+ * been processed and helps in deciding whether a new path should be added,
+ * skipped, or flagged as an error.
+ */
+class cmCPackArchiveGenerator::Deduplicator
+{
+private:
+ /**
+ * @brief Compares a file with already processed files.
+ *
+ * @param path The path of the file to compare.
+ * @param localTopLevel The top-level directory for the file.
+ * @return DeduplicateStatus indicating whether to add, skip, or flag an
+ * error for the file.
+ */
+ DeduplicateStatus CompareFile(const std::string& path,
+ const std::string& localTopLevel)
+ {
+ auto fileItr = this->Files.find(path);
+ if (fileItr != this->Files.end()) {
+ return cmSystemTools::FilesDiffer(path, fileItr->second)
+ ? DeduplicateStatus::Error
+ : DeduplicateStatus::Skip;
+ }
+
+ this->Files[path] = cmStrCat(localTopLevel, "/", path);
+ return DeduplicateStatus::Add;
+ }
+
+ /**
+ * @brief Compares a folder with already processed folders.
+ *
+ * @param path The path of the folder to compare.
+ * @return DeduplicateStatus indicating whether to add or skip the folder.
+ */
+ DeduplicateStatus CompareFolder(const std::string& path)
+ {
+ if (this->Folders.find(path) != this->Folders.end()) {
+ return DeduplicateStatus::Skip;
+ }
+
+ this->Folders.emplace(path);
+ return DeduplicateStatus::Add;
+ }
+
+ /**
+ * @brief Compares a symlink with already processed symlinks.
+ *
+ * @param path The path of the symlink to compare.
+ * @return DeduplicateStatus indicating whether to add, skip, or flag an
+ * error for the symlink.
+ */
+ DeduplicateStatus CompareSymlink(const std::string& path)
+ {
+ auto symlinkItr = this->Symlink.find(path);
+ std::string symlinkValue;
+ auto status = cmSystemTools::ReadSymlink(path, symlinkValue);
+ if (!status.IsSuccess()) {
+ return DeduplicateStatus::Error;
+ }
+
+ if (symlinkItr != this->Symlink.end()) {
+ return symlinkValue == symlinkItr->second ? DeduplicateStatus::Skip
+ : DeduplicateStatus::Error;
+ }
+
+ this->Symlink[path] = symlinkValue;
+ return DeduplicateStatus::Add;
+ }
+
+public:
+ /**
+ * @brief Determines the deduplication status of a given path.
+ *
+ * This method identifies whether the given path is a file, folder, or
+ * symlink and then delegates to the appropriate comparison method.
+ *
+ * @param path The path to check for deduplication.
+ * @param localTopLevel The top-level directory for the path.
+ * @return DeduplicateStatus indicating the action to take for the given
+ * path.
+ */
+ DeduplicateStatus IsDeduplicate(const std::string& path,
+ const std::string& localTopLevel)
+ {
+ DeduplicateStatus status;
+ if (cmSystemTools::FileIsDirectory(path)) {
+ status = this->CompareFolder(path);
+ } else if (cmSystemTools::FileIsSymlink(path)) {
+ status = this->CompareSymlink(path);
+ } else {
+ status = this->CompareFile(path, localTopLevel);
+ }
+
+ return status;
+ }
+
+private:
+ std::unordered_map<std::string, std::string> Symlink;
+ std::unordered_set<std::string> Folders;
+ std::unordered_map<std::string, std::string> Files;
+};
+
cmCPackGenerator* cmCPackArchiveGenerator::Create7ZGenerator()
{
return new cmCPackArchiveGenerator(cmArchiveWrite::CompressNone, "7zip",
@@ -110,7 +227,8 @@ int cmCPackArchiveGenerator::InitializeInternal()
}
int cmCPackArchiveGenerator::addOneComponentToArchive(
- cmArchiveWrite& archive, cmCPackComponent* component)
+ cmArchiveWrite& archive, cmCPackComponent* component,
+ Deduplicator* deduplicator)
{
cmCPackLogger(cmCPackLog::LOG_VERBOSE,
" - packaging component: " << component->Name << std::endl);
@@ -139,8 +257,25 @@ int cmCPackArchiveGenerator::addOneComponentToArchive(
}
for (std::string const& file : component->Files) {
std::string rp = filePrefix + file;
- cmCPackLogger(cmCPackLog::LOG_DEBUG, "Adding file: " << rp << std::endl);
- archive.Add(rp, 0, nullptr, false);
+
+ DeduplicateStatus status = DeduplicateStatus::Add;
+ if (deduplicator != nullptr) {
+ status = deduplicator->IsDeduplicate(rp, localToplevel);
+ }
+
+ if (deduplicator == nullptr || status == DeduplicateStatus::Add) {
+ cmCPackLogger(cmCPackLog::LOG_DEBUG, "Adding file: " << rp << std::endl);
+ archive.Add(rp, 0, nullptr, false);
+ } else if (status == DeduplicateStatus::Error) {
+ cmCPackLogger(cmCPackLog::LOG_ERROR,
+ "ERROR The data in files with the "
+ "same filename is different.");
+ return 0;
+ } else {
+ cmCPackLogger(cmCPackLog::LOG_DEBUG,
+ "Passing file: " << rp << std::endl);
+ }
+
if (!archive) {
cmCPackLogger(cmCPackLog::LOG_ERROR,
"ERROR while packaging files: " << archive.GetError()
@@ -197,6 +332,8 @@ int cmCPackArchiveGenerator::PackageComponents(bool ignoreGroup)
std::string packageFileName = std::string(this->toplevel) + "/" +
this->GetArchiveComponentFileName(compG.first, true);
+ Deduplicator deduplicator;
+
// open a block in order to automatically close archive
// at the end of the block
{
@@ -204,7 +341,7 @@ int cmCPackArchiveGenerator::PackageComponents(bool ignoreGroup)
// now iterate over the component of this group
for (cmCPackComponent* comp : (compG.second).Components) {
// Add the files of this component to the archive
- this->addOneComponentToArchive(archive, comp);
+ this->addOneComponentToArchive(archive, comp, &deduplicator);
}
}
// add the generated package to package file names list
@@ -231,7 +368,7 @@ int cmCPackArchiveGenerator::PackageComponents(bool ignoreGroup)
{
DECLARE_AND_OPEN_ARCHIVE(packageFileName, archive);
// Add the files of this component to the archive
- this->addOneComponentToArchive(archive, &(comp.second));
+ this->addOneComponentToArchive(archive, &(comp.second), nullptr);
}
// add the generated package to package file names list
this->packageFileNames.push_back(std::move(packageFileName));
@@ -252,7 +389,7 @@ int cmCPackArchiveGenerator::PackageComponents(bool ignoreGroup)
{
DECLARE_AND_OPEN_ARCHIVE(packageFileName, archive);
// Add the files of this component to the archive
- this->addOneComponentToArchive(archive, &(comp.second));
+ this->addOneComponentToArchive(archive, &(comp.second), nullptr);
}
// add the generated package to package file names list
this->packageFileNames.push_back(std::move(packageFileName));
@@ -282,10 +419,12 @@ int cmCPackArchiveGenerator::PackageComponentsAllInOne()
<< std::endl);
DECLARE_AND_OPEN_ARCHIVE(packageFileNames[0], archive);
+ Deduplicator deduplicator;
+
// The ALL COMPONENTS in ONE package case
for (auto& comp : this->Components) {
// Add the files of this component to the archive
- this->addOneComponentToArchive(archive, &(comp.second));
+ this->addOneComponentToArchive(archive, &(comp.second), &deduplicator);
}
// archive goes out of scope so it will finalized and closed.
diff --git a/Source/CPack/cmCPackArchiveGenerator.h b/Source/CPack/cmCPackArchiveGenerator.h
index 8a9bbc6..b8a1afa 100644
--- a/Source/CPack/cmCPackArchiveGenerator.h
+++ b/Source/CPack/cmCPackArchiveGenerator.h
@@ -47,6 +47,8 @@ private:
std::string GetArchiveComponentFileName(const std::string& component,
bool isGroupName);
+ class Deduplicator;
+
protected:
int InitializeInternal() override;
/**
@@ -54,9 +56,11 @@ protected:
* to the provided (already opened) archive.
* @param[in,out] archive the archive object
* @param[in] component the component whose file will be added to archive
+ * @param[in] deduplicator file deduplicator utility.
*/
int addOneComponentToArchive(cmArchiveWrite& archive,
- cmCPackComponent* component);
+ cmCPackComponent* component,
+ Deduplicator* deduplicator);
/**
* The main package file method.